diff --git "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" --- "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" +++ "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.3805, "train/learning_rate": 2.3942992874109263e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 114636, "_timestamp": 1647488913, "_step": 16510, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 9.0, 7.0, 20.0, 30344.0, 81.0, 11.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.125, -147.578125, -143.03125, -138.484375, -133.9375, -129.390625, -124.84375, -120.296875, -115.75, -111.203125, -106.65625, -102.109375, -97.5625, -93.015625, -88.46875, -83.921875, -79.375, -74.828125, -70.28125, -65.734375, -61.1875, -56.640625, -52.09375, -47.546875, -43.0, -38.453125, -33.90625, -29.359375, -24.8125, -20.265625, -15.71875, -11.171875, -6.625, -2.078125, 2.46875, 7.015625, 11.5625, 16.109375, 20.65625, 25.203125, 29.75, 34.296875, 38.84375, 43.390625, 47.9375, 52.484375, 57.03125, 61.578125, 66.125, 70.671875, 75.21875, 79.765625, 84.3125, 88.859375, 93.40625, 97.953125, 102.5, 107.046875, 111.59375, 116.140625, 120.6875, 125.234375, 129.78125, 134.328125, 138.875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 4.0, 9.0, 12.0, 12.0, 13.0, 11.0, 20.0, 23.0, 14.0, 29.0, 32.0, 36.0, 41.0, 35.0, 33.0, 38.0, 43.0, 49.0, 44.0, 43.0, 52.0, 61.0, 42.0, 49.0, 32.0, 35.0, 22.0, 23.0, 24.0, 28.0, 19.0, 13.0, 15.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-63.42264175415039, -62.10611343383789, -60.789588928222656, -59.473060607910156, -58.156532287597656, -56.84000778198242, -55.52347946166992, -54.20695495605469, -52.89042663574219, -51.57389831542969, -50.25737380981445, -48.94084548950195, -47.62432098388672, -46.30779266357422, -44.99126434326172, -43.67473602294922, -42.358211517333984, -41.041683197021484, -39.72515869140625, -38.40863037109375, -37.09210205078125, -35.775577545166016, -34.459049224853516, -33.14252471923828, -31.82599639892578, -30.509469985961914, -29.192943572998047, -27.876415252685547, -26.55988883972168, -25.243362426757812, -23.926834106445312, -22.610307693481445, -21.293785095214844, -19.977258682250977, -18.66073226928711, -17.34420394897461, -16.027677536010742, -14.711151123046875, -13.394623756408691, -12.078096389770508, -10.76156997680664, -9.445043563842773, -8.12851619720459, -6.8119893074035645, -5.495462417602539, -4.178935527801514, -2.8624086380004883, -1.5458812713623047, -0.2293548583984375, 1.087172031402588, 2.4036989212036133, 3.7202258110046387, 5.036752700805664, 6.3532795906066895, 7.669806480407715, 8.986333847045898, 10.302860260009766, 11.619386672973633, 12.935914039611816, 14.25244140625, 15.568967819213867, 16.885494232177734, 18.202022552490234, 19.5185489654541, 20.83507537841797]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 10.0, 3.0, 15.0, 23.0, 19.0, 23.0, 35.0, 27.0, 29.0, 26.0, 41.0, 28.0, 43.0, 47.0, 51.0, 57.0, 34.0, 48.0, 46.0, 47.0, 50.0, 33.0, 34.0, 29.0, 20.0, 28.0, 31.0, 24.0, 20.0, 11.0, 10.0, 11.0, 8.0, 8.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.79653549194336, -35.52540969848633, -34.2542839050293, -32.983158111572266, -31.712034225463867, -30.440908432006836, -29.169784545898438, -27.898658752441406, -26.627532958984375, -25.356407165527344, -24.085281372070312, -22.814157485961914, -21.543031692504883, -20.27190589904785, -19.000782012939453, -17.729656219482422, -16.45853042602539, -15.18740463256836, -13.916279792785645, -12.64515495300293, -11.374029159545898, -10.102903366088867, -8.831778526306152, -7.5606536865234375, -6.289527893066406, -5.018402576446533, -3.74727725982666, -2.476151943206787, -1.205026626586914, 0.06609869003295898, 1.337224006652832, 2.608348846435547, 3.8794784545898438, 5.150603771209717, 6.42172908782959, 7.692854404449463, 8.963979721069336, 10.235105514526367, 11.506230354309082, 12.777355194091797, 14.048480987548828, 15.31960678100586, 16.59073257446289, 17.86185646057129, 19.13298225402832, 20.40410804748535, 21.67523193359375, 22.94635772705078, 24.217483520507812, 25.488609313964844, 26.759735107421875, 28.030858993530273, 29.301984786987305, 30.573110580444336, 31.844234466552734, 33.115360260009766, 34.3864860534668, 35.65761184692383, 36.92873764038086, 38.19986343383789, 39.470985412597656, 40.74211120605469, 42.01323699951172, 43.28436279296875, 44.55548858642578]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 8.0, 18.0, 40.0, 36.0, 64.0, 110.0, 149.0, 225.0, 356.0, 517.0, 791.0, 1178.0, 1786.0, 2775.0, 4168.0, 6169.0, 9284.0, 13129.0, 19126.0, 27131.0, 37481.0, 50007.0, 64518.0, 79362.0, 92999.0, 113192.0, 112222.0, 93945.0, 79706.0, 64437.0, 49698.0, 37285.0, 26728.0, 19286.0, 13274.0, 9185.0, 6051.0, 4034.0, 2686.0, 1851.0, 1217.0, 741.0, 526.0, 325.0, 297.0, 138.0, 112.0, 61.0, 48.0, 25.0, 16.0, 20.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-129.375, -125.4541015625, -121.533203125, -117.6123046875, -113.69140625, -109.7705078125, -105.849609375, -101.9287109375, -98.0078125, -94.0869140625, -90.166015625, -86.2451171875, -82.32421875, -78.4033203125, -74.482421875, -70.5615234375, -66.640625, -62.7197265625, -58.798828125, -54.8779296875, -50.95703125, -47.0361328125, -43.115234375, -39.1943359375, -35.2734375, -31.3525390625, -27.431640625, -23.5107421875, -19.58984375, -15.6689453125, -11.748046875, -7.8271484375, -3.90625, 0.0146484375, 3.935546875, 7.8564453125, 11.77734375, 15.6982421875, 19.619140625, 23.5400390625, 27.4609375, 31.3818359375, 35.302734375, 39.2236328125, 43.14453125, 47.0654296875, 50.986328125, 54.9072265625, 58.828125, 62.7490234375, 66.669921875, 70.5908203125, 74.51171875, 78.4326171875, 82.353515625, 86.2744140625, 90.1953125, 94.1162109375, 98.037109375, 101.9580078125, 105.87890625, 109.7998046875, 113.720703125, 117.6416015625, 121.5625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 14.0, 9.0, 14.0, 18.0, 21.0, 38.0, 33.0, 28.0, 30.0, 43.0, 42.0, 40.0, 41.0, 53.0, 69.0, 54.0, 51.0, 50.0, 31.0, 41.0, 27.0, 43.0, 31.0, 29.0, 14.0, 21.0, 15.0, 18.0, 13.0, 14.0, 6.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.90625, -61.88623046875, -59.8662109375, -57.84619140625, -55.826171875, -53.80615234375, -51.7861328125, -49.76611328125, -47.74609375, -45.72607421875, -43.7060546875, -41.68603515625, -39.666015625, -37.64599609375, -35.6259765625, -33.60595703125, -31.5859375, -29.56591796875, -27.5458984375, -25.52587890625, -23.505859375, -21.48583984375, -19.4658203125, -17.44580078125, -15.42578125, -13.40576171875, -11.3857421875, -9.36572265625, -7.345703125, -5.32568359375, -3.3056640625, -1.28564453125, 0.734375, 2.75439453125, 4.7744140625, 6.79443359375, 8.814453125, 10.83447265625, 12.8544921875, 14.87451171875, 16.89453125, 18.91455078125, 20.9345703125, 22.95458984375, 24.974609375, 26.99462890625, 29.0146484375, 31.03466796875, 33.0546875, 35.07470703125, 37.0947265625, 39.11474609375, 41.134765625, 43.15478515625, 45.1748046875, 47.19482421875, 49.21484375, 51.23486328125, 53.2548828125, 55.27490234375, 57.294921875, 59.31494140625, 61.3349609375, 63.35498046875, 65.375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 14.0, 11.0, 18.0, 23.0, 25.0, 29.0, 28.0, 35.0, 26.0, 38.0, 33.0, 42.0, 54.0, 56.0, 72.0, 56.0, 54.0, 55.0, 42.0, 40.0, 45.0, 33.0, 23.0, 31.0, 17.0, 9.0, 11.0, 12.0, 9.0, 13.0, 10.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.490638732910156, -42.03007888793945, -40.56951904296875, -39.10895919799805, -37.648399353027344, -36.18783950805664, -34.72727966308594, -33.26671600341797, -31.8061580657959, -30.345598220825195, -28.885038375854492, -27.424476623535156, -25.963916778564453, -24.50335693359375, -23.042797088623047, -21.582237243652344, -20.12167739868164, -18.661117553710938, -17.200557708740234, -15.739996910095215, -14.279437065124512, -12.818877220153809, -11.358316421508789, -9.897756576538086, -8.437196731567383, -6.97663688659668, -5.516076564788818, -4.055516242980957, -2.594956398010254, -1.1343965530395508, 0.32616424560546875, 1.7867240905761719, 3.247283935546875, 4.707843780517578, 6.1684041023254395, 7.628964424133301, 9.089524269104004, 10.550084114074707, 12.010644912719727, 13.47120475769043, 14.931764602661133, 16.392324447631836, 17.85288429260254, 19.313446044921875, 20.774005889892578, 22.23456573486328, 23.695125579833984, 25.155685424804688, 26.61624526977539, 28.076805114746094, 29.537364959716797, 30.9979248046875, 32.4584846496582, 33.919044494628906, 35.379608154296875, 36.84016418457031, 38.30072784423828, 39.761287689208984, 41.22184753417969, 42.68240737915039, 44.142967224121094, 45.6035270690918, 47.0640869140625, 48.52465057373047, 49.985206604003906]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 5.0, 9.0, 11.0, 13.0, 8.0, 19.0, 22.0, 26.0, 21.0, 28.0, 28.0, 35.0, 37.0, 39.0, 45.0, 28.0, 43.0, 37.0, 39.0, 43.0, 44.0, 38.0, 46.0, 31.0, 37.0, 27.0, 24.0, 24.0, 24.0, 28.0, 19.0, 19.0, 21.0, 14.0, 10.0, 11.0, 7.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.70409393310547, -34.49701690673828, -33.289939880371094, -32.082862854003906, -30.87578582763672, -29.66870880126953, -28.461631774902344, -27.254554748535156, -26.04747772216797, -24.84040069580078, -23.633323669433594, -22.426246643066406, -21.21916961669922, -20.01209259033203, -18.805015563964844, -17.597938537597656, -16.39086151123047, -15.183784484863281, -13.976707458496094, -12.769630432128906, -11.562553405761719, -10.355476379394531, -9.148399353027344, -7.941322326660156, -6.734245300292969, -5.527168273925781, -4.320091247558594, -3.1130142211914062, -1.9059371948242188, -0.6988601684570312, 0.5082168579101562, 1.7152938842773438, 2.9223709106445312, 4.129447937011719, 5.336524963378906, 6.543601989746094, 7.750679016113281, 8.957756042480469, 10.164833068847656, 11.371910095214844, 12.578987121582031, 13.786064147949219, 14.993141174316406, 16.200218200683594, 17.40729522705078, 18.61437225341797, 19.821449279785156, 21.028526306152344, 22.23560333251953, 23.44268035888672, 24.649757385253906, 25.856834411621094, 27.06391143798828, 28.27098846435547, 29.478065490722656, 30.685142517089844, 31.89221954345703, 33.09929656982422, 34.306373596191406, 35.513450622558594, 36.72052764892578, 37.92760467529297, 39.134681701660156, 40.341758728027344, 41.54883575439453]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 8.0, 12.0, 22.0, 26.0, 31.0, 64.0, 92.0, 149.0, 267.0, 453.0, 685.0, 1115.0, 1799.0, 2812.0, 4686.0, 7410.0, 11981.0, 19643.0, 32215.0, 52192.0, 87367.0, 142774.0, 235755.0, 391251.0, 642794.0, 845113.0, 667734.0, 411125.0, 248148.0, 150716.0, 91502.0, 55878.0, 33992.0, 20831.0, 12831.0, 7851.0, 4932.0, 2954.0, 1842.0, 1240.0, 717.0, 477.0, 300.0, 203.0, 112.0, 84.0, 45.0, 21.0, 20.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0625, -57.0634765625, -55.064453125, -53.0654296875, -51.06640625, -49.0673828125, -47.068359375, -45.0693359375, -43.0703125, -41.0712890625, -39.072265625, -37.0732421875, -35.07421875, -33.0751953125, -31.076171875, -29.0771484375, -27.078125, -25.0791015625, -23.080078125, -21.0810546875, -19.08203125, -17.0830078125, -15.083984375, -13.0849609375, -11.0859375, -9.0869140625, -7.087890625, -5.0888671875, -3.08984375, -1.0908203125, 0.908203125, 2.9072265625, 4.90625, 6.9052734375, 8.904296875, 10.9033203125, 12.90234375, 14.9013671875, 16.900390625, 18.8994140625, 20.8984375, 22.8974609375, 24.896484375, 26.8955078125, 28.89453125, 30.8935546875, 32.892578125, 34.8916015625, 36.890625, 38.8896484375, 40.888671875, 42.8876953125, 44.88671875, 46.8857421875, 48.884765625, 50.8837890625, 52.8828125, 54.8818359375, 56.880859375, 58.8798828125, 60.87890625, 62.8779296875, 64.876953125, 66.8759765625, 68.875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 10.0, 13.0, 10.0, 6.0, 10.0, 20.0, 15.0, 18.0, 30.0, 37.0, 29.0, 37.0, 41.0, 36.0, 38.0, 43.0, 39.0, 30.0, 32.0, 44.0, 34.0, 41.0, 36.0, 36.0, 34.0, 34.0, 28.0, 29.0, 31.0, 18.0, 27.0, 11.0, 17.0, 9.0, 16.0, 10.0, 7.0, 11.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.1875, -30.12646484375, -29.0654296875, -28.00439453125, -26.943359375, -25.88232421875, -24.8212890625, -23.76025390625, -22.69921875, -21.63818359375, -20.5771484375, -19.51611328125, -18.455078125, -17.39404296875, -16.3330078125, -15.27197265625, -14.2109375, -13.14990234375, -12.0888671875, -11.02783203125, -9.966796875, -8.90576171875, -7.8447265625, -6.78369140625, -5.72265625, -4.66162109375, -3.6005859375, -2.53955078125, -1.478515625, -0.41748046875, 0.6435546875, 1.70458984375, 2.765625, 3.82666015625, 4.8876953125, 5.94873046875, 7.009765625, 8.07080078125, 9.1318359375, 10.19287109375, 11.25390625, 12.31494140625, 13.3759765625, 14.43701171875, 15.498046875, 16.55908203125, 17.6201171875, 18.68115234375, 19.7421875, 20.80322265625, 21.8642578125, 22.92529296875, 23.986328125, 25.04736328125, 26.1083984375, 27.16943359375, 28.23046875, 29.29150390625, 30.3525390625, 31.41357421875, 32.474609375, 33.53564453125, 34.5966796875, 35.65771484375, 36.71875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 7.0, 11.0, 12.0, 26.0, 49.0, 54.0, 92.0, 140.0, 180.0, 313.0, 525.0, 795.0, 1176.0, 1946.0, 2977.0, 4800.0, 7550.0, 11961.0, 19577.0, 31342.0, 50626.0, 82832.0, 131337.0, 209190.0, 323936.0, 487916.0, 665310.0, 686852.0, 520390.0, 349876.0, 225004.0, 142641.0, 88389.0, 55849.0, 34026.0, 20930.0, 13179.0, 8315.0, 5175.0, 3280.0, 2007.0, 1388.0, 829.0, 517.0, 320.0, 236.0, 134.0, 89.0, 62.0, 42.0, 32.0, 15.0, 16.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-40.90625, -39.59033203125, -38.2744140625, -36.95849609375, -35.642578125, -34.32666015625, -33.0107421875, -31.69482421875, -30.37890625, -29.06298828125, -27.7470703125, -26.43115234375, -25.115234375, -23.79931640625, -22.4833984375, -21.16748046875, -19.8515625, -18.53564453125, -17.2197265625, -15.90380859375, -14.587890625, -13.27197265625, -11.9560546875, -10.64013671875, -9.32421875, -8.00830078125, -6.6923828125, -5.37646484375, -4.060546875, -2.74462890625, -1.4287109375, -0.11279296875, 1.203125, 2.51904296875, 3.8349609375, 5.15087890625, 6.466796875, 7.78271484375, 9.0986328125, 10.41455078125, 11.73046875, 13.04638671875, 14.3623046875, 15.67822265625, 16.994140625, 18.31005859375, 19.6259765625, 20.94189453125, 22.2578125, 23.57373046875, 24.8896484375, 26.20556640625, 27.521484375, 28.83740234375, 30.1533203125, 31.46923828125, 32.78515625, 34.10107421875, 35.4169921875, 36.73291015625, 38.048828125, 39.36474609375, 40.6806640625, 41.99658203125, 43.3125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 9.0, 10.0, 17.0, 22.0, 22.0, 36.0, 37.0, 40.0, 65.0, 65.0, 72.0, 93.0, 110.0, 143.0, 152.0, 171.0, 195.0, 206.0, 239.0, 232.0, 259.0, 276.0, 224.0, 204.0, 183.0, 162.0, 120.0, 128.0, 101.0, 73.0, 91.0, 56.0, 50.0, 33.0, 29.0, 24.0, 26.0, 26.0, 10.0, 8.0, 12.0, 13.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.25, -15.69677734375, -15.1435546875, -14.59033203125, -14.037109375, -13.48388671875, -12.9306640625, -12.37744140625, -11.82421875, -11.27099609375, -10.7177734375, -10.16455078125, -9.611328125, -9.05810546875, -8.5048828125, -7.95166015625, -7.3984375, -6.84521484375, -6.2919921875, -5.73876953125, -5.185546875, -4.63232421875, -4.0791015625, -3.52587890625, -2.97265625, -2.41943359375, -1.8662109375, -1.31298828125, -0.759765625, -0.20654296875, 0.3466796875, 0.89990234375, 1.453125, 2.00634765625, 2.5595703125, 3.11279296875, 3.666015625, 4.21923828125, 4.7724609375, 5.32568359375, 5.87890625, 6.43212890625, 6.9853515625, 7.53857421875, 8.091796875, 8.64501953125, 9.1982421875, 9.75146484375, 10.3046875, 10.85791015625, 11.4111328125, 11.96435546875, 12.517578125, 13.07080078125, 13.6240234375, 14.17724609375, 14.73046875, 15.28369140625, 15.8369140625, 16.39013671875, 16.943359375, 17.49658203125, 18.0498046875, 18.60302734375, 19.15625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 5.0, 16.0, 20.0, 14.0, 11.0, 25.0, 30.0, 35.0, 30.0, 42.0, 39.0, 36.0, 47.0, 49.0, 46.0, 41.0, 52.0, 57.0, 47.0, 59.0, 43.0, 31.0, 29.0, 30.0, 24.0, 22.0, 16.0, 21.0, 15.0, 14.0, 15.0, 5.0, 4.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.07200622558594, -41.729984283447266, -40.38795852661133, -39.045936584472656, -37.703914642333984, -36.36189270019531, -35.019866943359375, -33.6778450012207, -32.33582305908203, -30.993799209594727, -29.651777267456055, -28.30975341796875, -26.967731475830078, -25.625707626342773, -24.28368377685547, -22.941661834716797, -21.59963607788086, -20.257612228393555, -18.915590286254883, -17.573566436767578, -16.231544494628906, -14.889520645141602, -13.547496795654297, -12.205473899841309, -10.86345100402832, -9.521428108215332, -8.179405212402344, -6.837381362915039, -5.495358467102051, -4.1533355712890625, -2.811311721801758, -1.4692888259887695, -0.12726593017578125, 1.2147572040557861, 2.5567803382873535, 3.8988037109375, 5.240826606750488, 6.582849502563477, 7.924873352050781, 9.26689624786377, 10.608919143676758, 11.950942039489746, 13.292964935302734, 14.634988784790039, 15.977011680603027, 17.319034576416016, 18.66105842590332, 20.003082275390625, 21.345104217529297, 22.6871280670166, 24.029150009155273, 25.371173858642578, 26.71319580078125, 28.055219650268555, 29.39724349975586, 30.73926544189453, 32.08129119873047, 33.42331314086914, 34.76533889770508, 36.10736083984375, 37.44938278198242, 38.791404724121094, 40.13343048095703, 41.4754524230957, 42.817474365234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 7.0, 13.0, 11.0, 16.0, 17.0, 22.0, 16.0, 21.0, 22.0, 32.0, 34.0, 34.0, 39.0, 55.0, 43.0, 41.0, 41.0, 43.0, 41.0, 39.0, 36.0, 43.0, 37.0, 36.0, 31.0, 29.0, 27.0, 31.0, 24.0, 15.0, 8.0, 13.0, 10.0, 12.0, 8.0, 10.0, 6.0, 8.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.21171569824219, -36.03618240356445, -34.86064910888672, -33.685115814208984, -32.50958251953125, -31.33405113220215, -30.158517837524414, -28.982986450195312, -27.807453155517578, -26.631919860839844, -25.45638656616211, -24.280853271484375, -23.105321884155273, -21.92978858947754, -20.754255294799805, -19.578723907470703, -18.403188705444336, -17.2276554107666, -16.052122116088867, -14.87658977508545, -13.701057434082031, -12.525524139404297, -11.349990844726562, -10.174458503723145, -8.99892520904541, -7.823392391204834, -6.647859573364258, -5.472326278686523, -4.296793460845947, -3.121260643005371, -1.9457273483276367, -0.7701950073242188, 0.4053382873535156, 1.5808712244033813, 2.756404161453247, 3.9319372177124023, 5.1074700355529785, 6.283002853393555, 7.458536148071289, 8.634068489074707, 9.809601783752441, 10.985135078430176, 12.160667419433594, 13.336200714111328, 14.511734008789062, 15.68726634979248, 16.86280059814453, 18.038331985473633, 19.213865280151367, 20.3893985748291, 21.564931869506836, 22.740463256835938, 23.915996551513672, 25.091529846191406, 26.26706314086914, 27.442596435546875, 28.61812973022461, 29.793663024902344, 30.969196319580078, 32.14472961425781, 33.32026290893555, 34.49579620361328, 35.67132568359375, 36.846858978271484, 38.02239227294922]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 19.0, 21.0, 43.0, 61.0, 80.0, 147.0, 214.0, 311.0, 518.0, 757.0, 1224.0, 1809.0, 2852.0, 4059.0, 6032.0, 8954.0, 13558.0, 19716.0, 28509.0, 40976.0, 57994.0, 78775.0, 101592.0, 121690.0, 126974.0, 113257.0, 91196.0, 68419.0, 49711.0, 34709.0, 24181.0, 16235.0, 11070.0, 7562.0, 5132.0, 3501.0, 2344.0, 1520.0, 1030.0, 605.0, 438.0, 279.0, 177.0, 96.0, 84.0, 34.0, 28.0, 31.0, 7.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.59375, -18.986572265625, -18.37939453125, -17.772216796875, -17.1650390625, -16.557861328125, -15.95068359375, -15.343505859375, -14.736328125, -14.129150390625, -13.52197265625, -12.914794921875, -12.3076171875, -11.700439453125, -11.09326171875, -10.486083984375, -9.87890625, -9.271728515625, -8.66455078125, -8.057373046875, -7.4501953125, -6.843017578125, -6.23583984375, -5.628662109375, -5.021484375, -4.414306640625, -3.80712890625, -3.199951171875, -2.5927734375, -1.985595703125, -1.37841796875, -0.771240234375, -0.1640625, 0.443115234375, 1.05029296875, 1.657470703125, 2.2646484375, 2.871826171875, 3.47900390625, 4.086181640625, 4.693359375, 5.300537109375, 5.90771484375, 6.514892578125, 7.1220703125, 7.729248046875, 8.33642578125, 8.943603515625, 9.55078125, 10.157958984375, 10.76513671875, 11.372314453125, 11.9794921875, 12.586669921875, 13.19384765625, 13.801025390625, 14.408203125, 15.015380859375, 15.62255859375, 16.229736328125, 16.8369140625, 17.444091796875, 18.05126953125, 18.658447265625, 19.265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 10.0, 5.0, 2.0, 9.0, 16.0, 13.0, 18.0, 19.0, 9.0, 27.0, 19.0, 31.0, 34.0, 34.0, 39.0, 52.0, 41.0, 42.0, 49.0, 34.0, 42.0, 41.0, 34.0, 31.0, 42.0, 28.0, 36.0, 33.0, 37.0, 28.0, 22.0, 20.0, 19.0, 19.0, 10.0, 17.0, 9.0, 9.0, 4.0, 3.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.1787109375, -31.076171875, -29.9736328125, -28.87109375, -27.7685546875, -26.666015625, -25.5634765625, -24.4609375, -23.3583984375, -22.255859375, -21.1533203125, -20.05078125, -18.9482421875, -17.845703125, -16.7431640625, -15.640625, -14.5380859375, -13.435546875, -12.3330078125, -11.23046875, -10.1279296875, -9.025390625, -7.9228515625, -6.8203125, -5.7177734375, -4.615234375, -3.5126953125, -2.41015625, -1.3076171875, -0.205078125, 0.8974609375, 2.0, 3.1025390625, 4.205078125, 5.3076171875, 6.41015625, 7.5126953125, 8.615234375, 9.7177734375, 10.8203125, 11.9228515625, 13.025390625, 14.1279296875, 15.23046875, 16.3330078125, 17.435546875, 18.5380859375, 19.640625, 20.7431640625, 21.845703125, 22.9482421875, 24.05078125, 25.1533203125, 26.255859375, 27.3583984375, 28.4609375, 29.5634765625, 30.666015625, 31.7685546875, 32.87109375, 33.9736328125, 35.076171875, 36.1787109375, 37.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 8.0, 11.0, 20.0, 17.0, 33.0, 62.0, 90.0, 156.0, 233.0, 372.0, 505.0, 849.0, 1423.0, 2293.0, 3850.0, 6659.0, 11993.0, 24140.0, 157020.0, 770624.0, 33396.0, 15163.0, 8097.0, 4563.0, 2552.0, 1603.0, 1014.0, 644.0, 375.0, 262.0, 168.0, 123.0, 76.0, 49.0, 39.0, 23.0, 13.0, 10.0, 8.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -45.7236328125, -44.041015625, -42.3583984375, -40.67578125, -38.9931640625, -37.310546875, -35.6279296875, -33.9453125, -32.2626953125, -30.580078125, -28.8974609375, -27.21484375, -25.5322265625, -23.849609375, -22.1669921875, -20.484375, -18.8017578125, -17.119140625, -15.4365234375, -13.75390625, -12.0712890625, -10.388671875, -8.7060546875, -7.0234375, -5.3408203125, -3.658203125, -1.9755859375, -0.29296875, 1.3896484375, 3.072265625, 4.7548828125, 6.4375, 8.1201171875, 9.802734375, 11.4853515625, 13.16796875, 14.8505859375, 16.533203125, 18.2158203125, 19.8984375, 21.5810546875, 23.263671875, 24.9462890625, 26.62890625, 28.3115234375, 29.994140625, 31.6767578125, 33.359375, 35.0419921875, 36.724609375, 38.4072265625, 40.08984375, 41.7724609375, 43.455078125, 45.1376953125, 46.8203125, 48.5029296875, 50.185546875, 51.8681640625, 53.55078125, 55.2333984375, 56.916015625, 58.5986328125, 60.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 4.0, 6.0, 12.0, 13.0, 22.0, 25.0, 17.0, 28.0, 40.0, 41.0, 29.0, 40.0, 40.0, 60.0, 41.0, 61.0, 36.0, 42.0, 46.0, 54.0, 36.0, 43.0, 38.0, 36.0, 29.0, 21.0, 27.0, 18.0, 25.0, 12.0, 13.0, 9.0, 5.0, 4.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.21875, -31.0625, -29.90625, -28.75, -27.59375, -26.4375, -25.28125, -24.125, -22.96875, -21.8125, -20.65625, -19.5, -18.34375, -17.1875, -16.03125, -14.875, -13.71875, -12.5625, -11.40625, -10.25, -9.09375, -7.9375, -6.78125, -5.625, -4.46875, -3.3125, -2.15625, -1.0, 0.15625, 1.3125, 2.46875, 3.625, 4.78125, 5.9375, 7.09375, 8.25, 9.40625, 10.5625, 11.71875, 12.875, 14.03125, 15.1875, 16.34375, 17.5, 18.65625, 19.8125, 20.96875, 22.125, 23.28125, 24.4375, 25.59375, 26.75, 27.90625, 29.0625, 30.21875, 31.375, 32.53125, 33.6875, 34.84375, 36.0, 37.15625, 38.3125, 39.46875, 40.625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 14.0, 8.0, 18.0, 23.0, 24.0, 34.0, 47.0, 51.0, 80.0, 121.0, 190.0, 311.0, 523.0, 921.0, 1622.0, 3272.0, 6696.0, 15026.0, 41884.0, 871756.0, 70167.0, 18833.0, 8177.0, 3855.0, 2039.0, 1061.0, 645.0, 374.0, 228.0, 166.0, 99.0, 62.0, 56.0, 38.0, 36.0, 18.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.522705078125, -12.10009765625, -11.677490234375, -11.2548828125, -10.832275390625, -10.40966796875, -9.987060546875, -9.564453125, -9.141845703125, -8.71923828125, -8.296630859375, -7.8740234375, -7.451416015625, -7.02880859375, -6.606201171875, -6.18359375, -5.760986328125, -5.33837890625, -4.915771484375, -4.4931640625, -4.070556640625, -3.64794921875, -3.225341796875, -2.802734375, -2.380126953125, -1.95751953125, -1.534912109375, -1.1123046875, -0.689697265625, -0.26708984375, 0.155517578125, 0.578125, 1.000732421875, 1.42333984375, 1.845947265625, 2.2685546875, 2.691162109375, 3.11376953125, 3.536376953125, 3.958984375, 4.381591796875, 4.80419921875, 5.226806640625, 5.6494140625, 6.072021484375, 6.49462890625, 6.917236328125, 7.33984375, 7.762451171875, 8.18505859375, 8.607666015625, 9.0302734375, 9.452880859375, 9.87548828125, 10.298095703125, 10.720703125, 11.143310546875, 11.56591796875, 11.988525390625, 12.4111328125, 12.833740234375, 13.25634765625, 13.678955078125, 14.1015625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 4.0, 7.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 5.0, 17.0, 19.0, 30.0, 41.0, 63.0, 64.0, 97.0, 91.0, 126.0, 86.0, 72.0, 53.0, 45.0, 28.0, 20.0, 21.0, 19.0, 11.0, 5.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015010833740234375, -0.0014482289552688599, -0.0013953745365142822, -0.0013425201177597046, -0.001289665699005127, -0.0012368112802505493, -0.0011839568614959717, -0.001131102442741394, -0.0010782480239868164, -0.0010253936052322388, -0.0009725391864776611, -0.0009196847677230835, -0.0008668303489685059, -0.0008139759302139282, -0.0007611215114593506, -0.000708267092704773, -0.0006554126739501953, -0.0006025582551956177, -0.00054970383644104, -0.0004968494176864624, -0.00044399499893188477, -0.00039114058017730713, -0.0003382861614227295, -0.00028543174266815186, -0.00023257732391357422, -0.00017972290515899658, -0.00012686848640441895, -7.401406764984131e-05, -2.1159648895263672e-05, 3.1694769859313965e-05, 8.45491886138916e-05, 0.00013740360736846924, 0.00019025802612304688, 0.0002431124448776245, 0.00029596686363220215, 0.0003488212823867798, 0.0004016757011413574, 0.00045453011989593506, 0.0005073845386505127, 0.0005602389574050903, 0.000613093376159668, 0.0006659477949142456, 0.0007188022136688232, 0.0007716566324234009, 0.0008245110511779785, 0.0008773654699325562, 0.0009302198886871338, 0.0009830743074417114, 0.001035928726196289, 0.0010887831449508667, 0.0011416375637054443, 0.001194491982460022, 0.0012473464012145996, 0.0013002008199691772, 0.0013530552387237549, 0.0014059096574783325, 0.0014587640762329102, 0.0015116184949874878, 0.0015644729137420654, 0.001617327332496643, 0.0016701817512512207, 0.0017230361700057983, 0.001775890588760376, 0.0018287450075149536, 0.0018815994262695312]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 14.0, 22.0, 25.0, 27.0, 37.0, 69.0, 87.0, 131.0, 145.0, 251.0, 364.0, 653.0, 937.0, 1596.0, 2798.0, 5413.0, 11576.0, 27677.0, 69170.0, 169132.0, 305637.0, 252204.0, 117053.0, 46951.0, 18698.0, 8132.0, 3970.0, 2218.0, 1268.0, 770.0, 481.0, 318.0, 206.0, 145.0, 98.0, 77.0, 67.0, 32.0, 31.0, 18.0, 14.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.3385009765625, -8.067626953125, -7.7967529296875, -7.52587890625, -7.2550048828125, -6.984130859375, -6.7132568359375, -6.4423828125, -6.1715087890625, -5.900634765625, -5.6297607421875, -5.35888671875, -5.0880126953125, -4.817138671875, -4.5462646484375, -4.275390625, -4.0045166015625, -3.733642578125, -3.4627685546875, -3.19189453125, -2.9210205078125, -2.650146484375, -2.3792724609375, -2.1083984375, -1.8375244140625, -1.566650390625, -1.2957763671875, -1.02490234375, -0.7540283203125, -0.483154296875, -0.2122802734375, 0.05859375, 0.3294677734375, 0.600341796875, 0.8712158203125, 1.14208984375, 1.4129638671875, 1.683837890625, 1.9547119140625, 2.2255859375, 2.4964599609375, 2.767333984375, 3.0382080078125, 3.30908203125, 3.5799560546875, 3.850830078125, 4.1217041015625, 4.392578125, 4.6634521484375, 4.934326171875, 5.2052001953125, 5.47607421875, 5.7469482421875, 6.017822265625, 6.2886962890625, 6.5595703125, 6.8304443359375, 7.101318359375, 7.3721923828125, 7.64306640625, 7.9139404296875, 8.184814453125, 8.4556884765625, 8.7265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 14.0, 7.0, 17.0, 11.0, 26.0, 29.0, 39.0, 43.0, 43.0, 59.0, 67.0, 76.0, 65.0, 77.0, 71.0, 64.0, 60.0, 37.0, 44.0, 46.0, 18.0, 15.0, 13.0, 7.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5625, -2.487884521484375, -2.41326904296875, -2.338653564453125, -2.2640380859375, -2.189422607421875, -2.11480712890625, -2.040191650390625, -1.965576171875, -1.890960693359375, -1.81634521484375, -1.741729736328125, -1.6671142578125, -1.592498779296875, -1.51788330078125, -1.443267822265625, -1.36865234375, -1.294036865234375, -1.21942138671875, -1.144805908203125, -1.0701904296875, -0.995574951171875, -0.92095947265625, -0.846343994140625, -0.771728515625, -0.697113037109375, -0.62249755859375, -0.547882080078125, -0.4732666015625, -0.398651123046875, -0.32403564453125, -0.249420166015625, -0.1748046875, -0.100189208984375, -0.02557373046875, 0.049041748046875, 0.1236572265625, 0.198272705078125, 0.27288818359375, 0.347503662109375, 0.422119140625, 0.496734619140625, 0.57135009765625, 0.645965576171875, 0.7205810546875, 0.795196533203125, 0.86981201171875, 0.944427490234375, 1.01904296875, 1.093658447265625, 1.16827392578125, 1.242889404296875, 1.3175048828125, 1.392120361328125, 1.46673583984375, 1.541351318359375, 1.615966796875, 1.690582275390625, 1.76519775390625, 1.839813232421875, 1.9144287109375, 1.989044189453125, 2.06365966796875, 2.138275146484375, 2.212890625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 12.0, 6.0, 17.0, 17.0, 18.0, 32.0, 31.0, 35.0, 43.0, 44.0, 51.0, 46.0, 44.0, 55.0, 62.0, 59.0, 59.0, 63.0, 63.0, 30.0, 37.0, 22.0, 32.0, 28.0, 17.0, 9.0, 16.0, 15.0, 10.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6795768737793, -42.33344268798828, -40.987308502197266, -39.64117431640625, -38.295040130615234, -36.94890594482422, -35.60277557373047, -34.25663757324219, -32.91050720214844, -31.564373016357422, -30.218238830566406, -28.87210464477539, -27.525970458984375, -26.17983627319336, -24.833703994750977, -23.48756980895996, -22.141433715820312, -20.795299530029297, -19.44916534423828, -18.103031158447266, -16.75689697265625, -15.41076374053955, -14.064630508422852, -12.718496322631836, -11.37236213684082, -10.026227951049805, -8.680093765258789, -7.33396053314209, -5.987826347351074, -4.641692161560059, -3.2955589294433594, -1.9494247436523438, -0.6032943725585938, 0.7428395748138428, 2.0889735221862793, 3.4351072311401367, 4.781241416931152, 6.127375602722168, 7.473508834838867, 8.819643020629883, 10.165777206420898, 11.511911392211914, 12.85804557800293, 14.204178810119629, 15.550312995910645, 16.896446228027344, 18.24258041381836, 19.588714599609375, 20.93484878540039, 22.280982971191406, 23.627117156982422, 24.973251342773438, 26.319385528564453, 27.66551971435547, 29.01165199279785, 30.357786178588867, 31.703920364379883, 33.050052642822266, 34.39618682861328, 35.7423210144043, 37.08845520019531, 38.43458938598633, 39.780723571777344, 41.12685775756836, 42.472991943359375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 12.0, 8.0, 14.0, 15.0, 22.0, 14.0, 17.0, 23.0, 23.0, 26.0, 36.0, 45.0, 37.0, 50.0, 45.0, 44.0, 37.0, 40.0, 50.0, 38.0, 36.0, 37.0, 31.0, 38.0, 37.0, 35.0, 24.0, 31.0, 22.0, 13.0, 11.0, 10.0, 10.0, 10.0, 13.0, 10.0, 11.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.06751251220703, -32.019248962402344, -30.970985412597656, -29.92272186279297, -28.87445831298828, -27.826194763183594, -26.77793312072754, -25.72966957092285, -24.681406021118164, -23.633142471313477, -22.58487892150879, -21.5366153717041, -20.488353729248047, -19.44009017944336, -18.391826629638672, -17.343563079833984, -16.295299530029297, -15.24703598022461, -14.198772430419922, -13.15050983428955, -12.102246284484863, -11.053982734680176, -10.005720138549805, -8.957456588745117, -7.90919303894043, -6.860929489135742, -5.812666416168213, -4.764403343200684, -3.716139793395996, -2.6678762435913086, -1.6196131706237793, -0.57135009765625, 0.4769134521484375, 1.525176763534546, 2.5734400749206543, 3.6217033863067627, 4.669966697692871, 5.718230247497559, 6.766493320465088, 7.814756393432617, 8.863019943237305, 9.911283493041992, 10.95954704284668, 12.00780963897705, 13.056073188781738, 14.104336738586426, 15.152599334716797, 16.200862884521484, 17.249126434326172, 18.29738998413086, 19.345653533935547, 20.393917083740234, 21.442180633544922, 22.49044418334961, 23.538705825805664, 24.58696937561035, 25.63523292541504, 26.683496475219727, 27.731760025024414, 28.7800235748291, 29.828285217285156, 30.876548767089844, 31.92481231689453, 32.97307586669922, 34.021339416503906]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 10.0, 7.0, 9.0, 26.0, 36.0, 65.0, 84.0, 150.0, 266.0, 435.0, 626.0, 1034.0, 1545.0, 2758.0, 4381.0, 7177.0, 11724.0, 19783.0, 32302.0, 52482.0, 82212.0, 119950.0, 153634.0, 160014.0, 134926.0, 97701.0, 63941.0, 39833.0, 24007.0, 14620.0, 8879.0, 5327.0, 3328.0, 2001.0, 1187.0, 825.0, 426.0, 293.0, 215.0, 116.0, 97.0, 47.0, 29.0, 17.0, 18.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.353515625, -43.80078125, -42.248046875, -40.6953125, -39.142578125, -37.58984375, -36.037109375, -34.484375, -32.931640625, -31.37890625, -29.826171875, -28.2734375, -26.720703125, -25.16796875, -23.615234375, -22.0625, -20.509765625, -18.95703125, -17.404296875, -15.8515625, -14.298828125, -12.74609375, -11.193359375, -9.640625, -8.087890625, -6.53515625, -4.982421875, -3.4296875, -1.876953125, -0.32421875, 1.228515625, 2.78125, 4.333984375, 5.88671875, 7.439453125, 8.9921875, 10.544921875, 12.09765625, 13.650390625, 15.203125, 16.755859375, 18.30859375, 19.861328125, 21.4140625, 22.966796875, 24.51953125, 26.072265625, 27.625, 29.177734375, 30.73046875, 32.283203125, 33.8359375, 35.388671875, 36.94140625, 38.494140625, 40.046875, 41.599609375, 43.15234375, 44.705078125, 46.2578125, 47.810546875, 49.36328125, 50.916015625, 52.46875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 5.0, 19.0, 23.0, 18.0, 24.0, 24.0, 22.0, 31.0, 48.0, 39.0, 42.0, 49.0, 32.0, 40.0, 55.0, 44.0, 33.0, 44.0, 42.0, 33.0, 40.0, 31.0, 40.0, 31.0, 27.0, 21.0, 24.0, 13.0, 14.0, 11.0, 10.0, 11.0, 12.0, 4.0, 4.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.125, -34.06884765625, -33.0126953125, -31.95654296875, -30.900390625, -29.84423828125, -28.7880859375, -27.73193359375, -26.67578125, -25.61962890625, -24.5634765625, -23.50732421875, -22.451171875, -21.39501953125, -20.3388671875, -19.28271484375, -18.2265625, -17.17041015625, -16.1142578125, -15.05810546875, -14.001953125, -12.94580078125, -11.8896484375, -10.83349609375, -9.77734375, -8.72119140625, -7.6650390625, -6.60888671875, -5.552734375, -4.49658203125, -3.4404296875, -2.38427734375, -1.328125, -0.27197265625, 0.7841796875, 1.84033203125, 2.896484375, 3.95263671875, 5.0087890625, 6.06494140625, 7.12109375, 8.17724609375, 9.2333984375, 10.28955078125, 11.345703125, 12.40185546875, 13.4580078125, 14.51416015625, 15.5703125, 16.62646484375, 17.6826171875, 18.73876953125, 19.794921875, 20.85107421875, 21.9072265625, 22.96337890625, 24.01953125, 25.07568359375, 26.1318359375, 27.18798828125, 28.244140625, 29.30029296875, 30.3564453125, 31.41259765625, 32.46875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 11.0, 22.0, 22.0, 26.0, 55.0, 74.0, 140.0, 205.0, 331.0, 444.0, 694.0, 1046.0, 1694.0, 2612.0, 4080.0, 6458.0, 10088.0, 15876.0, 24345.0, 36531.0, 53850.0, 74753.0, 98237.0, 119230.0, 127979.0, 120742.0, 101367.0, 78924.0, 56674.0, 39229.0, 25906.0, 16806.0, 10826.0, 6882.0, 4419.0, 2897.0, 1827.0, 1155.0, 699.0, 485.0, 337.0, 202.0, 122.0, 87.0, 51.0, 34.0, 25.0, 18.0, 7.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-38.46875, -37.25048828125, -36.0322265625, -34.81396484375, -33.595703125, -32.37744140625, -31.1591796875, -29.94091796875, -28.72265625, -27.50439453125, -26.2861328125, -25.06787109375, -23.849609375, -22.63134765625, -21.4130859375, -20.19482421875, -18.9765625, -17.75830078125, -16.5400390625, -15.32177734375, -14.103515625, -12.88525390625, -11.6669921875, -10.44873046875, -9.23046875, -8.01220703125, -6.7939453125, -5.57568359375, -4.357421875, -3.13916015625, -1.9208984375, -0.70263671875, 0.515625, 1.73388671875, 2.9521484375, 4.17041015625, 5.388671875, 6.60693359375, 7.8251953125, 9.04345703125, 10.26171875, 11.47998046875, 12.6982421875, 13.91650390625, 15.134765625, 16.35302734375, 17.5712890625, 18.78955078125, 20.0078125, 21.22607421875, 22.4443359375, 23.66259765625, 24.880859375, 26.09912109375, 27.3173828125, 28.53564453125, 29.75390625, 30.97216796875, 32.1904296875, 33.40869140625, 34.626953125, 35.84521484375, 37.0634765625, 38.28173828125, 39.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 4.0, 4.0, 8.0, 18.0, 17.0, 19.0, 15.0, 22.0, 30.0, 23.0, 30.0, 41.0, 34.0, 38.0, 38.0, 23.0, 49.0, 40.0, 44.0, 37.0, 49.0, 41.0, 43.0, 38.0, 40.0, 33.0, 34.0, 22.0, 27.0, 34.0, 22.0, 20.0, 6.0, 15.0, 7.0, 5.0, 6.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.59375, -20.906982421875, -20.22021484375, -19.533447265625, -18.8466796875, -18.159912109375, -17.47314453125, -16.786376953125, -16.099609375, -15.412841796875, -14.72607421875, -14.039306640625, -13.3525390625, -12.665771484375, -11.97900390625, -11.292236328125, -10.60546875, -9.918701171875, -9.23193359375, -8.545166015625, -7.8583984375, -7.171630859375, -6.48486328125, -5.798095703125, -5.111328125, -4.424560546875, -3.73779296875, -3.051025390625, -2.3642578125, -1.677490234375, -0.99072265625, -0.303955078125, 0.3828125, 1.069580078125, 1.75634765625, 2.443115234375, 3.1298828125, 3.816650390625, 4.50341796875, 5.190185546875, 5.876953125, 6.563720703125, 7.25048828125, 7.937255859375, 8.6240234375, 9.310791015625, 9.99755859375, 10.684326171875, 11.37109375, 12.057861328125, 12.74462890625, 13.431396484375, 14.1181640625, 14.804931640625, 15.49169921875, 16.178466796875, 16.865234375, 17.552001953125, 18.23876953125, 18.925537109375, 19.6123046875, 20.299072265625, 20.98583984375, 21.672607421875, 22.359375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 9.0, 10.0, 28.0, 35.0, 54.0, 58.0, 92.0, 121.0, 148.0, 250.0, 298.0, 426.0, 634.0, 845.0, 1316.0, 1972.0, 3060.0, 4913.0, 8636.0, 15645.0, 30174.0, 63290.0, 132167.0, 237114.0, 249854.0, 148872.0, 71605.0, 34504.0, 17297.0, 9475.0, 5503.0, 3328.0, 2136.0, 1469.0, 926.0, 640.0, 463.0, 309.0, 258.0, 188.0, 108.0, 86.0, 71.0, 57.0, 31.0, 21.0, 20.0, 15.0, 11.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-27.84375, -27.002197265625, -26.16064453125, -25.319091796875, -24.4775390625, -23.635986328125, -22.79443359375, -21.952880859375, -21.111328125, -20.269775390625, -19.42822265625, -18.586669921875, -17.7451171875, -16.903564453125, -16.06201171875, -15.220458984375, -14.37890625, -13.537353515625, -12.69580078125, -11.854248046875, -11.0126953125, -10.171142578125, -9.32958984375, -8.488037109375, -7.646484375, -6.804931640625, -5.96337890625, -5.121826171875, -4.2802734375, -3.438720703125, -2.59716796875, -1.755615234375, -0.9140625, -0.072509765625, 0.76904296875, 1.610595703125, 2.4521484375, 3.293701171875, 4.13525390625, 4.976806640625, 5.818359375, 6.659912109375, 7.50146484375, 8.343017578125, 9.1845703125, 10.026123046875, 10.86767578125, 11.709228515625, 12.55078125, 13.392333984375, 14.23388671875, 15.075439453125, 15.9169921875, 16.758544921875, 17.60009765625, 18.441650390625, 19.283203125, 20.124755859375, 20.96630859375, 21.807861328125, 22.6494140625, 23.490966796875, 24.33251953125, 25.174072265625, 26.015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 18.0, 13.0, 29.0, 30.0, 65.0, 81.0, 116.0, 144.0, 139.0, 92.0, 82.0, 57.0, 32.0, 19.0, 24.0, 14.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00426483154296875, -0.004131019115447998, -0.003997206687927246, -0.003863394260406494, -0.003729581832885742, -0.0035957694053649902, -0.0034619569778442383, -0.0033281445503234863, -0.0031943321228027344, -0.0030605196952819824, -0.0029267072677612305, -0.0027928948402404785, -0.0026590824127197266, -0.0025252699851989746, -0.0023914575576782227, -0.0022576451301574707, -0.0021238327026367188, -0.001990020275115967, -0.0018562078475952148, -0.0017223954200744629, -0.001588582992553711, -0.001454770565032959, -0.001320958137512207, -0.001187145709991455, -0.0010533332824707031, -0.0009195208549499512, -0.0007857084274291992, -0.0006518959999084473, -0.0005180835723876953, -0.00038427114486694336, -0.0002504587173461914, -0.00011664628982543945, 1.71661376953125e-05, 0.00015097856521606445, 0.0002847909927368164, 0.00041860342025756836, 0.0005524158477783203, 0.0006862282752990723, 0.0008200407028198242, 0.0009538531303405762, 0.0010876655578613281, 0.00122147798538208, 0.001355290412902832, 0.001489102840423584, 0.001622915267944336, 0.0017567276954650879, 0.0018905401229858398, 0.002024352550506592, 0.0021581649780273438, 0.0022919774055480957, 0.0024257898330688477, 0.0025596022605895996, 0.0026934146881103516, 0.0028272271156311035, 0.0029610395431518555, 0.0030948519706726074, 0.0032286643981933594, 0.0033624768257141113, 0.0034962892532348633, 0.0036301016807556152, 0.003763914108276367, 0.003897726535797119, 0.004031538963317871, 0.004165351390838623, 0.004299163818359375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 12.0, 21.0, 21.0, 22.0, 32.0, 74.0, 95.0, 139.0, 203.0, 286.0, 487.0, 715.0, 1245.0, 1940.0, 3362.0, 6063.0, 11646.0, 22713.0, 47580.0, 98558.0, 182236.0, 247010.0, 200390.0, 113167.0, 54637.0, 26401.0, 13086.0, 6899.0, 3773.0, 2164.0, 1277.0, 775.0, 478.0, 321.0, 232.0, 142.0, 114.0, 68.0, 44.0, 45.0, 27.0, 19.0, 15.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-24.65625, -23.963623046875, -23.27099609375, -22.578369140625, -21.8857421875, -21.193115234375, -20.50048828125, -19.807861328125, -19.115234375, -18.422607421875, -17.72998046875, -17.037353515625, -16.3447265625, -15.652099609375, -14.95947265625, -14.266845703125, -13.57421875, -12.881591796875, -12.18896484375, -11.496337890625, -10.8037109375, -10.111083984375, -9.41845703125, -8.725830078125, -8.033203125, -7.340576171875, -6.64794921875, -5.955322265625, -5.2626953125, -4.570068359375, -3.87744140625, -3.184814453125, -2.4921875, -1.799560546875, -1.10693359375, -0.414306640625, 0.2783203125, 0.970947265625, 1.66357421875, 2.356201171875, 3.048828125, 3.741455078125, 4.43408203125, 5.126708984375, 5.8193359375, 6.511962890625, 7.20458984375, 7.897216796875, 8.58984375, 9.282470703125, 9.97509765625, 10.667724609375, 11.3603515625, 12.052978515625, 12.74560546875, 13.438232421875, 14.130859375, 14.823486328125, 15.51611328125, 16.208740234375, 16.9013671875, 17.593994140625, 18.28662109375, 18.979248046875, 19.671875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 14.0, 20.0, 19.0, 34.0, 33.0, 44.0, 48.0, 69.0, 52.0, 82.0, 62.0, 61.0, 64.0, 62.0, 59.0, 52.0, 32.0, 33.0, 30.0, 20.0, 17.0, 13.0, 16.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.289306640625, -8.06298828125, -7.836669921875, -7.6103515625, -7.384033203125, -7.15771484375, -6.931396484375, -6.705078125, -6.478759765625, -6.25244140625, -6.026123046875, -5.7998046875, -5.573486328125, -5.34716796875, -5.120849609375, -4.89453125, -4.668212890625, -4.44189453125, -4.215576171875, -3.9892578125, -3.762939453125, -3.53662109375, -3.310302734375, -3.083984375, -2.857666015625, -2.63134765625, -2.405029296875, -2.1787109375, -1.952392578125, -1.72607421875, -1.499755859375, -1.2734375, -1.047119140625, -0.82080078125, -0.594482421875, -0.3681640625, -0.141845703125, 0.08447265625, 0.310791015625, 0.537109375, 0.763427734375, 0.98974609375, 1.216064453125, 1.4423828125, 1.668701171875, 1.89501953125, 2.121337890625, 2.34765625, 2.573974609375, 2.80029296875, 3.026611328125, 3.2529296875, 3.479248046875, 3.70556640625, 3.931884765625, 4.158203125, 4.384521484375, 4.61083984375, 4.837158203125, 5.0634765625, 5.289794921875, 5.51611328125, 5.742431640625, 5.96875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 13.0, 15.0, 16.0, 23.0, 27.0, 32.0, 38.0, 41.0, 34.0, 45.0, 40.0, 62.0, 62.0, 43.0, 44.0, 47.0, 50.0, 56.0, 41.0, 37.0, 28.0, 31.0, 18.0, 21.0, 15.0, 18.0, 18.0, 18.0, 8.0, 7.0, 9.0, 8.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.633331298828125, -33.47809600830078, -32.32286071777344, -31.167621612548828, -30.012386322021484, -28.85715103149414, -27.701913833618164, -26.546676635742188, -25.391441345214844, -24.2362060546875, -23.080968856811523, -21.925731658935547, -20.770496368408203, -19.61526107788086, -18.460023880004883, -17.304786682128906, -16.149551391601562, -14.994315147399902, -13.839078903198242, -12.683842658996582, -11.528606414794922, -10.373370170593262, -9.218133926391602, -8.062897682189941, -6.907661437988281, -5.752425193786621, -4.597188949584961, -3.441952705383301, -2.2867164611816406, -1.1314802169799805, 0.023756027221679688, 1.1789922714233398, 2.3342247009277344, 3.4894609451293945, 4.644697189331055, 5.799933433532715, 6.955169677734375, 8.110405921936035, 9.265642166137695, 10.420878410339355, 11.576114654541016, 12.731350898742676, 13.886587142944336, 15.041823387145996, 16.197059631347656, 17.352294921875, 18.507532119750977, 19.662769317626953, 20.818004608154297, 21.97323989868164, 23.128477096557617, 24.283714294433594, 25.438949584960938, 26.59418487548828, 27.749422073364258, 28.904659271240234, 30.059894561767578, 31.215129852294922, 32.37036895751953, 33.525604248046875, 34.68083953857422, 35.83607482910156, 36.991310119628906, 38.146549224853516, 39.30178451538086]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 4.0, 14.0, 12.0, 5.0, 11.0, 17.0, 21.0, 28.0, 28.0, 34.0, 25.0, 43.0, 46.0, 37.0, 38.0, 45.0, 43.0, 44.0, 34.0, 45.0, 34.0, 43.0, 39.0, 46.0, 39.0, 30.0, 28.0, 14.0, 28.0, 19.0, 15.0, 13.0, 14.0, 9.0, 14.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.706998825073242, -30.668437957763672, -29.6298770904541, -28.59131622314453, -27.552757263183594, -26.514196395874023, -25.475635528564453, -24.437074661254883, -23.398513793945312, -22.359952926635742, -21.321392059326172, -20.282833099365234, -19.244272232055664, -18.205711364746094, -17.167150497436523, -16.128589630126953, -15.090030670166016, -14.051469802856445, -13.012909889221191, -11.974349021911621, -10.935789108276367, -9.897228240966797, -8.858667373657227, -7.8201069831848145, -6.781546592712402, -5.74298620223999, -4.704425811767578, -3.665864944458008, -2.6273045539855957, -1.5887441635131836, -0.5501832962036133, 0.48837709426879883, 1.5269393920898438, 2.565499782562256, 3.604060411453247, 4.642621040344238, 5.68118143081665, 6.7197418212890625, 7.758302688598633, 8.796863555908203, 9.835423469543457, 10.873984336853027, 11.912544250488281, 12.951105117797852, 13.989665985107422, 15.028225898742676, 16.066787719726562, 17.1053466796875, 18.14390754699707, 19.18246841430664, 20.22102928161621, 21.25959014892578, 22.29814910888672, 23.33670997619629, 24.37527084350586, 25.41383171081543, 26.452392578125, 27.49095344543457, 28.52951431274414, 29.568073272705078, 30.60663414001465, 31.64519500732422, 32.683753967285156, 33.72231674194336, 34.7608757019043]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 17.0, 23.0, 39.0, 47.0, 63.0, 121.0, 213.0, 325.0, 594.0, 895.0, 1604.0, 2829.0, 5014.0, 9416.0, 18376.0, 36398.0, 73236.0, 155542.0, 342569.0, 757604.0, 1179749.0, 857405.0, 400112.0, 179642.0, 85275.0, 41617.0, 20869.0, 10897.0, 5859.0, 3313.0, 1841.0, 1096.0, 645.0, 404.0, 233.0, 135.0, 90.0, 64.0, 35.0, 32.0, 15.0, 15.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.66064453125, -46.1025390625, -44.54443359375, -42.986328125, -41.42822265625, -39.8701171875, -38.31201171875, -36.75390625, -35.19580078125, -33.6376953125, -32.07958984375, -30.521484375, -28.96337890625, -27.4052734375, -25.84716796875, -24.2890625, -22.73095703125, -21.1728515625, -19.61474609375, -18.056640625, -16.49853515625, -14.9404296875, -13.38232421875, -11.82421875, -10.26611328125, -8.7080078125, -7.14990234375, -5.591796875, -4.03369140625, -2.4755859375, -0.91748046875, 0.640625, 2.19873046875, 3.7568359375, 5.31494140625, 6.873046875, 8.43115234375, 9.9892578125, 11.54736328125, 13.10546875, 14.66357421875, 16.2216796875, 17.77978515625, 19.337890625, 20.89599609375, 22.4541015625, 24.01220703125, 25.5703125, 27.12841796875, 28.6865234375, 30.24462890625, 31.802734375, 33.36083984375, 34.9189453125, 36.47705078125, 38.03515625, 39.59326171875, 41.1513671875, 42.70947265625, 44.267578125, 45.82568359375, 47.3837890625, 48.94189453125, 50.5]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 11.0, 8.0, 10.0, 7.0, 14.0, 14.0, 23.0, 20.0, 29.0, 30.0, 24.0, 31.0, 45.0, 38.0, 40.0, 43.0, 45.0, 40.0, 39.0, 35.0, 44.0, 40.0, 44.0, 46.0, 35.0, 35.0, 30.0, 21.0, 17.0, 19.0, 22.0, 13.0, 17.0, 11.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.484375, -21.7109375, -20.9375, -20.1640625, -19.390625, -18.6171875, -17.84375, -17.0703125, -16.296875, -15.5234375, -14.75, -13.9765625, -13.203125, -12.4296875, -11.65625, -10.8828125, -10.109375, -9.3359375, -8.5625, -7.7890625, -7.015625, -6.2421875, -5.46875, -4.6953125, -3.921875, -3.1484375, -2.375, -1.6015625, -0.828125, -0.0546875, 0.71875, 1.4921875, 2.265625, 3.0390625, 3.8125, 4.5859375, 5.359375, 6.1328125, 6.90625, 7.6796875, 8.453125, 9.2265625, 10.0, 10.7734375, 11.546875, 12.3203125, 13.09375, 13.8671875, 14.640625, 15.4140625, 16.1875, 16.9609375, 17.734375, 18.5078125, 19.28125, 20.0546875, 20.828125, 21.6015625, 22.375, 23.1484375, 23.921875, 24.6953125, 25.46875, 26.2421875, 27.015625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 10.0, 20.0, 33.0, 38.0, 66.0, 95.0, 144.0, 234.0, 389.0, 560.0, 828.0, 1441.0, 2280.0, 3597.0, 5825.0, 9619.0, 15725.0, 26692.0, 45326.0, 77868.0, 135858.0, 237061.0, 407247.0, 657065.0, 834209.0, 690841.0, 435566.0, 254270.0, 146333.0, 83795.0, 48738.0, 28605.0, 16974.0, 10215.0, 6262.0, 3863.0, 2273.0, 1558.0, 956.0, 644.0, 384.0, 255.0, 144.0, 132.0, 79.0, 56.0, 33.0, 18.0, 10.0, 17.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-31.234375, -30.244873046875, -29.25537109375, -28.265869140625, -27.2763671875, -26.286865234375, -25.29736328125, -24.307861328125, -23.318359375, -22.328857421875, -21.33935546875, -20.349853515625, -19.3603515625, -18.370849609375, -17.38134765625, -16.391845703125, -15.40234375, -14.412841796875, -13.42333984375, -12.433837890625, -11.4443359375, -10.454833984375, -9.46533203125, -8.475830078125, -7.486328125, -6.496826171875, -5.50732421875, -4.517822265625, -3.5283203125, -2.538818359375, -1.54931640625, -0.559814453125, 0.4296875, 1.419189453125, 2.40869140625, 3.398193359375, 4.3876953125, 5.377197265625, 6.36669921875, 7.356201171875, 8.345703125, 9.335205078125, 10.32470703125, 11.314208984375, 12.3037109375, 13.293212890625, 14.28271484375, 15.272216796875, 16.26171875, 17.251220703125, 18.24072265625, 19.230224609375, 20.2197265625, 21.209228515625, 22.19873046875, 23.188232421875, 24.177734375, 25.167236328125, 26.15673828125, 27.146240234375, 28.1357421875, 29.125244140625, 30.11474609375, 31.104248046875, 32.09375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 9.0, 7.0, 17.0, 19.0, 20.0, 42.0, 51.0, 54.0, 62.0, 79.0, 96.0, 132.0, 154.0, 209.0, 240.0, 303.0, 299.0, 334.0, 322.0, 293.0, 245.0, 221.0, 191.0, 140.0, 112.0, 89.0, 70.0, 54.0, 53.0, 47.0, 21.0, 19.0, 19.0, 16.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.6328125, -15.19384765625, -14.7548828125, -14.31591796875, -13.876953125, -13.43798828125, -12.9990234375, -12.56005859375, -12.12109375, -11.68212890625, -11.2431640625, -10.80419921875, -10.365234375, -9.92626953125, -9.4873046875, -9.04833984375, -8.609375, -8.17041015625, -7.7314453125, -7.29248046875, -6.853515625, -6.41455078125, -5.9755859375, -5.53662109375, -5.09765625, -4.65869140625, -4.2197265625, -3.78076171875, -3.341796875, -2.90283203125, -2.4638671875, -2.02490234375, -1.5859375, -1.14697265625, -0.7080078125, -0.26904296875, 0.169921875, 0.60888671875, 1.0478515625, 1.48681640625, 1.92578125, 2.36474609375, 2.8037109375, 3.24267578125, 3.681640625, 4.12060546875, 4.5595703125, 4.99853515625, 5.4375, 5.87646484375, 6.3154296875, 6.75439453125, 7.193359375, 7.63232421875, 8.0712890625, 8.51025390625, 8.94921875, 9.38818359375, 9.8271484375, 10.26611328125, 10.705078125, 11.14404296875, 11.5830078125, 12.02197265625, 12.4609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 4.0, 11.0, 9.0, 22.0, 22.0, 32.0, 27.0, 37.0, 43.0, 49.0, 49.0, 55.0, 49.0, 54.0, 37.0, 61.0, 58.0, 44.0, 50.0, 42.0, 35.0, 30.0, 22.0, 22.0, 24.0, 21.0, 11.0, 12.0, 8.0, 11.0, 10.0, 9.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.513519287109375, -31.45552635192871, -30.397533416748047, -29.339542388916016, -28.28154945373535, -27.223556518554688, -26.165565490722656, -25.107572555541992, -24.049579620361328, -22.991586685180664, -21.93359375, -20.87560272216797, -19.817609786987305, -18.75961685180664, -17.70162582397461, -16.643632888793945, -15.585639953613281, -14.527647018432617, -13.46965503692627, -12.411663055419922, -11.353670120239258, -10.295677185058594, -9.237685203552246, -8.179693222045898, -7.121700286865234, -6.0637078285217285, -5.005715370178223, -3.947722911834717, -2.889730453491211, -1.831737995147705, -0.7737455368041992, 0.28424692153930664, 1.3422393798828125, 2.4002318382263184, 3.458224296569824, 4.51621675491333, 5.574209213256836, 6.632201671600342, 7.690194129943848, 8.748186111450195, 9.80617904663086, 10.864171981811523, 11.922163963317871, 12.980155944824219, 14.038148880004883, 15.096141815185547, 16.154132843017578, 17.212125778198242, 18.270118713378906, 19.32811164855957, 20.386104583740234, 21.444095611572266, 22.50208854675293, 23.560081481933594, 24.618072509765625, 25.67606544494629, 26.734058380126953, 27.792051315307617, 28.85004425048828, 29.908035278320312, 30.966028213500977, 32.02402114868164, 33.08201217651367, 34.14000701904297, 35.197998046875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 9.0, 11.0, 10.0, 9.0, 15.0, 20.0, 20.0, 21.0, 25.0, 36.0, 23.0, 34.0, 44.0, 61.0, 41.0, 64.0, 49.0, 58.0, 49.0, 41.0, 45.0, 44.0, 37.0, 36.0, 27.0, 34.0, 21.0, 19.0, 18.0, 16.0, 8.0, 12.0, 9.0, 7.0, 9.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.375486373901367, -27.36140251159668, -26.347320556640625, -25.333236694335938, -24.31915283203125, -23.305070877075195, -22.290987014770508, -21.276905059814453, -20.262821197509766, -19.248737335205078, -18.234655380249023, -17.220571517944336, -16.20648956298828, -15.192405700683594, -14.178321838378906, -13.164238929748535, -12.150156021118164, -11.136073112487793, -10.121990203857422, -9.107906341552734, -8.093823432922363, -7.079740524291992, -6.065657138824463, -5.051573753356934, -4.0374908447265625, -3.0234076976776123, -2.009324550628662, -0.9952414035797119, 0.01884174346923828, 1.0329246520996094, 2.0470080375671387, 3.061091423034668, 4.075172424316406, 5.089255332946777, 6.103338718414307, 7.117422103881836, 8.131505012512207, 9.145587921142578, 10.159671783447266, 11.173754692077637, 12.187837600708008, 13.201920509338379, 14.21600341796875, 15.230087280273438, 16.244171142578125, 17.25825309753418, 18.272336959838867, 19.286418914794922, 20.30050277709961, 21.314586639404297, 22.32866859436035, 23.34275245666504, 24.356834411621094, 25.37091827392578, 26.38500213623047, 27.399085998535156, 28.41316795349121, 29.4272518157959, 30.441333770751953, 31.45541763305664, 32.46950149536133, 33.48358154296875, 34.49766540527344, 35.511749267578125, 36.52583312988281]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 11.0, 19.0, 30.0, 46.0, 73.0, 104.0, 175.0, 248.0, 413.0, 663.0, 983.0, 1461.0, 2387.0, 3757.0, 5858.0, 8732.0, 13332.0, 19894.0, 28808.0, 41133.0, 56461.0, 74338.0, 92917.0, 108226.0, 116060.0, 109573.0, 94669.0, 76198.0, 58117.0, 42635.0, 30058.0, 20673.0, 14024.0, 9170.0, 6191.0, 3905.0, 2564.0, 1742.0, 1007.0, 674.0, 409.0, 269.0, 201.0, 118.0, 67.0, 60.0, 36.0, 27.0, 10.0, 12.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-16.453125, -15.94775390625, -15.4423828125, -14.93701171875, -14.431640625, -13.92626953125, -13.4208984375, -12.91552734375, -12.41015625, -11.90478515625, -11.3994140625, -10.89404296875, -10.388671875, -9.88330078125, -9.3779296875, -8.87255859375, -8.3671875, -7.86181640625, -7.3564453125, -6.85107421875, -6.345703125, -5.84033203125, -5.3349609375, -4.82958984375, -4.32421875, -3.81884765625, -3.3134765625, -2.80810546875, -2.302734375, -1.79736328125, -1.2919921875, -0.78662109375, -0.28125, 0.22412109375, 0.7294921875, 1.23486328125, 1.740234375, 2.24560546875, 2.7509765625, 3.25634765625, 3.76171875, 4.26708984375, 4.7724609375, 5.27783203125, 5.783203125, 6.28857421875, 6.7939453125, 7.29931640625, 7.8046875, 8.31005859375, 8.8154296875, 9.32080078125, 9.826171875, 10.33154296875, 10.8369140625, 11.34228515625, 11.84765625, 12.35302734375, 12.8583984375, 13.36376953125, 13.869140625, 14.37451171875, 14.8798828125, 15.38525390625, 15.890625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 11.0, 3.0, 8.0, 9.0, 9.0, 17.0, 17.0, 21.0, 19.0, 16.0, 25.0, 28.0, 33.0, 33.0, 47.0, 38.0, 48.0, 53.0, 48.0, 48.0, 40.0, 42.0, 47.0, 49.0, 43.0, 44.0, 29.0, 22.0, 23.0, 20.0, 23.0, 16.0, 15.0, 15.0, 8.0, 5.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.375, -21.609375, -20.84375, -20.078125, -19.3125, -18.546875, -17.78125, -17.015625, -16.25, -15.484375, -14.71875, -13.953125, -13.1875, -12.421875, -11.65625, -10.890625, -10.125, -9.359375, -8.59375, -7.828125, -7.0625, -6.296875, -5.53125, -4.765625, -4.0, -3.234375, -2.46875, -1.703125, -0.9375, -0.171875, 0.59375, 1.359375, 2.125, 2.890625, 3.65625, 4.421875, 5.1875, 5.953125, 6.71875, 7.484375, 8.25, 9.015625, 9.78125, 10.546875, 11.3125, 12.078125, 12.84375, 13.609375, 14.375, 15.140625, 15.90625, 16.671875, 17.4375, 18.203125, 18.96875, 19.734375, 20.5, 21.265625, 22.03125, 22.796875, 23.5625, 24.328125, 25.09375, 25.859375, 26.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 3.0, 8.0, 16.0, 20.0, 23.0, 32.0, 47.0, 65.0, 103.0, 152.0, 189.0, 308.0, 422.0, 617.0, 918.0, 1594.0, 2143.0, 3373.0, 5210.0, 8223.0, 13000.0, 22547.0, 87186.0, 804089.0, 46583.0, 19393.0, 11493.0, 7163.0, 4642.0, 2945.0, 1981.0, 1297.0, 855.0, 613.0, 399.0, 261.0, 194.0, 125.0, 103.0, 70.0, 34.0, 28.0, 30.0, 16.0, 14.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.84375, -50.2421875, -48.640625, -47.0390625, -45.4375, -43.8359375, -42.234375, -40.6328125, -39.03125, -37.4296875, -35.828125, -34.2265625, -32.625, -31.0234375, -29.421875, -27.8203125, -26.21875, -24.6171875, -23.015625, -21.4140625, -19.8125, -18.2109375, -16.609375, -15.0078125, -13.40625, -11.8046875, -10.203125, -8.6015625, -7.0, -5.3984375, -3.796875, -2.1953125, -0.59375, 1.0078125, 2.609375, 4.2109375, 5.8125, 7.4140625, 9.015625, 10.6171875, 12.21875, 13.8203125, 15.421875, 17.0234375, 18.625, 20.2265625, 21.828125, 23.4296875, 25.03125, 26.6328125, 28.234375, 29.8359375, 31.4375, 33.0390625, 34.640625, 36.2421875, 37.84375, 39.4453125, 41.046875, 42.6484375, 44.25, 45.8515625, 47.453125, 49.0546875, 50.65625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 7.0, 6.0, 5.0, 10.0, 6.0, 11.0, 14.0, 23.0, 25.0, 31.0, 35.0, 41.0, 46.0, 43.0, 47.0, 53.0, 58.0, 55.0, 63.0, 44.0, 47.0, 48.0, 38.0, 35.0, 20.0, 26.0, 31.0, 22.0, 20.0, 19.0, 13.0, 8.0, 9.0, 9.0, 3.0, 8.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-47.65625, -46.3984375, -45.140625, -43.8828125, -42.625, -41.3671875, -40.109375, -38.8515625, -37.59375, -36.3359375, -35.078125, -33.8203125, -32.5625, -31.3046875, -30.046875, -28.7890625, -27.53125, -26.2734375, -25.015625, -23.7578125, -22.5, -21.2421875, -19.984375, -18.7265625, -17.46875, -16.2109375, -14.953125, -13.6953125, -12.4375, -11.1796875, -9.921875, -8.6640625, -7.40625, -6.1484375, -4.890625, -3.6328125, -2.375, -1.1171875, 0.140625, 1.3984375, 2.65625, 3.9140625, 5.171875, 6.4296875, 7.6875, 8.9453125, 10.203125, 11.4609375, 12.71875, 13.9765625, 15.234375, 16.4921875, 17.75, 19.0078125, 20.265625, 21.5234375, 22.78125, 24.0390625, 25.296875, 26.5546875, 27.8125, 29.0703125, 30.328125, 31.5859375, 32.84375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 10.0, 12.0, 17.0, 18.0, 31.0, 32.0, 54.0, 69.0, 93.0, 165.0, 234.0, 369.0, 581.0, 930.0, 1781.0, 3296.0, 7160.0, 18895.0, 124629.0, 837984.0, 31502.0, 10398.0, 4657.0, 2320.0, 1254.0, 708.0, 481.0, 284.0, 182.0, 129.0, 89.0, 44.0, 43.0, 32.0, 18.0, 16.0, 4.0, 6.0, 6.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-32.25, -31.333984375, -30.41796875, -29.501953125, -28.5859375, -27.669921875, -26.75390625, -25.837890625, -24.921875, -24.005859375, -23.08984375, -22.173828125, -21.2578125, -20.341796875, -19.42578125, -18.509765625, -17.59375, -16.677734375, -15.76171875, -14.845703125, -13.9296875, -13.013671875, -12.09765625, -11.181640625, -10.265625, -9.349609375, -8.43359375, -7.517578125, -6.6015625, -5.685546875, -4.76953125, -3.853515625, -2.9375, -2.021484375, -1.10546875, -0.189453125, 0.7265625, 1.642578125, 2.55859375, 3.474609375, 4.390625, 5.306640625, 6.22265625, 7.138671875, 8.0546875, 8.970703125, 9.88671875, 10.802734375, 11.71875, 12.634765625, 13.55078125, 14.466796875, 15.3828125, 16.298828125, 17.21484375, 18.130859375, 19.046875, 19.962890625, 20.87890625, 21.794921875, 22.7109375, 23.626953125, 24.54296875, 25.458984375, 26.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 15.0, 37.0, 38.0, 33.0, 58.0, 61.0, 80.0, 104.0, 117.0, 90.0, 55.0, 53.0, 38.0, 43.0, 31.0, 27.0, 10.0, 12.0, 13.0, 8.0, 6.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006221771240234375, -0.006039679050445557, -0.005857586860656738, -0.00567549467086792, -0.0054934024810791016, -0.005311310291290283, -0.005129218101501465, -0.0049471259117126465, -0.004765033721923828, -0.00458294153213501, -0.004400849342346191, -0.004218757152557373, -0.004036664962768555, -0.0038545727729797363, -0.003672480583190918, -0.0034903883934020996, -0.0033082962036132812, -0.003126204013824463, -0.0029441118240356445, -0.002762019634246826, -0.002579927444458008, -0.0023978352546691895, -0.002215743064880371, -0.0020336508750915527, -0.0018515586853027344, -0.001669466495513916, -0.0014873743057250977, -0.0013052821159362793, -0.001123189926147461, -0.0009410977363586426, -0.0007590055465698242, -0.0005769133567810059, -0.0003948211669921875, -0.00021272897720336914, -3.063678741455078e-05, 0.00015145540237426758, 0.00033354759216308594, 0.0005156397819519043, 0.0006977319717407227, 0.000879824161529541, 0.0010619163513183594, 0.0012440085411071777, 0.001426100730895996, 0.0016081929206848145, 0.0017902851104736328, 0.001972377300262451, 0.0021544694900512695, 0.002336561679840088, 0.0025186538696289062, 0.0027007460594177246, 0.002882838249206543, 0.0030649304389953613, 0.0032470226287841797, 0.003429114818572998, 0.0036112070083618164, 0.0037932991981506348, 0.003975391387939453, 0.0041574835777282715, 0.00433957576751709, 0.004521667957305908, 0.0047037601470947266, 0.004885852336883545, 0.005067944526672363, 0.005250036716461182, 0.00543212890625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 20.0, 12.0, 27.0, 42.0, 65.0, 121.0, 124.0, 190.0, 287.0, 409.0, 519.0, 810.0, 1174.0, 1634.0, 2608.0, 3965.0, 6219.0, 10402.0, 18369.0, 34876.0, 70600.0, 151308.0, 278254.0, 234171.0, 112728.0, 53422.0, 27331.0, 14805.0, 8623.0, 5292.0, 3303.0, 2115.0, 1517.0, 994.0, 676.0, 488.0, 319.0, 202.0, 167.0, 111.0, 72.0, 44.0, 45.0, 23.0, 13.0, 17.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0], "bins": [-5.0625, -4.908203125, -4.75390625, -4.599609375, -4.4453125, -4.291015625, -4.13671875, -3.982421875, -3.828125, -3.673828125, -3.51953125, -3.365234375, -3.2109375, -3.056640625, -2.90234375, -2.748046875, -2.59375, -2.439453125, -2.28515625, -2.130859375, -1.9765625, -1.822265625, -1.66796875, -1.513671875, -1.359375, -1.205078125, -1.05078125, -0.896484375, -0.7421875, -0.587890625, -0.43359375, -0.279296875, -0.125, 0.029296875, 0.18359375, 0.337890625, 0.4921875, 0.646484375, 0.80078125, 0.955078125, 1.109375, 1.263671875, 1.41796875, 1.572265625, 1.7265625, 1.880859375, 2.03515625, 2.189453125, 2.34375, 2.498046875, 2.65234375, 2.806640625, 2.9609375, 3.115234375, 3.26953125, 3.423828125, 3.578125, 3.732421875, 3.88671875, 4.041015625, 4.1953125, 4.349609375, 4.50390625, 4.658203125, 4.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 12.0, 12.0, 13.0, 16.0, 21.0, 16.0, 32.0, 37.0, 33.0, 54.0, 61.0, 72.0, 65.0, 55.0, 60.0, 54.0, 61.0, 44.0, 47.0, 41.0, 37.0, 15.0, 23.0, 17.0, 14.0, 16.0, 16.0, 16.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4208984375, -1.376434326171875, -1.33197021484375, -1.287506103515625, -1.2430419921875, -1.198577880859375, -1.15411376953125, -1.109649658203125, -1.065185546875, -1.020721435546875, -0.97625732421875, -0.931793212890625, -0.8873291015625, -0.842864990234375, -0.79840087890625, -0.753936767578125, -0.70947265625, -0.665008544921875, -0.62054443359375, -0.576080322265625, -0.5316162109375, -0.487152099609375, -0.44268798828125, -0.398223876953125, -0.353759765625, -0.309295654296875, -0.26483154296875, -0.220367431640625, -0.1759033203125, -0.131439208984375, -0.08697509765625, -0.042510986328125, 0.001953125, 0.046417236328125, 0.09088134765625, 0.135345458984375, 0.1798095703125, 0.224273681640625, 0.26873779296875, 0.313201904296875, 0.357666015625, 0.402130126953125, 0.44659423828125, 0.491058349609375, 0.5355224609375, 0.579986572265625, 0.62445068359375, 0.668914794921875, 0.71337890625, 0.757843017578125, 0.80230712890625, 0.846771240234375, 0.8912353515625, 0.935699462890625, 0.98016357421875, 1.024627685546875, 1.069091796875, 1.113555908203125, 1.15802001953125, 1.202484130859375, 1.2469482421875, 1.291412353515625, 1.33587646484375, 1.380340576171875, 1.4248046875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 10.0, 12.0, 12.0, 24.0, 18.0, 18.0, 30.0, 32.0, 25.0, 31.0, 41.0, 37.0, 36.0, 44.0, 42.0, 53.0, 58.0, 49.0, 46.0, 53.0, 39.0, 34.0, 35.0, 20.0, 24.0, 17.0, 18.0, 20.0, 21.0, 9.0, 17.0, 9.0, 6.0, 11.0, 7.0, 4.0, 4.0, 4.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-22.74522590637207, -22.057628631591797, -21.370033264160156, -20.682435989379883, -19.994840621948242, -19.30724334716797, -18.619647979736328, -17.932050704956055, -17.24445343017578, -16.556856155395508, -15.869260787963867, -15.181663513183594, -14.494067192077637, -13.80647087097168, -13.118874549865723, -12.431278228759766, -11.743681907653809, -11.056085586547852, -10.368489265441895, -9.680892944335938, -8.993295669555664, -8.305699348449707, -7.61810302734375, -6.930506229400635, -6.242909908294678, -5.555313587188721, -4.8677167892456055, -4.180120468139648, -3.4925239086151123, -2.804927349090576, -2.117331027984619, -1.429734230041504, -0.7421379089355469, -0.05454140901565552, 0.6330550909042358, 1.3206515312194824, 2.0082480907440186, 2.6958446502685547, 3.3834409713745117, 4.071037769317627, 4.758634090423584, 5.446230411529541, 6.133827209472656, 6.821423530578613, 7.50901985168457, 8.196617126464844, 8.884212493896484, 9.571809768676758, 10.259406089782715, 10.947002410888672, 11.634598731994629, 12.322195053100586, 13.00979232788086, 13.697388648986816, 14.384984970092773, 15.072582244873047, 15.760177612304688, 16.44777488708496, 17.1353702545166, 17.822967529296875, 18.510562896728516, 19.19816017150879, 19.885757446289062, 20.573352813720703, 21.260950088500977]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 9.0, 9.0, 15.0, 10.0, 19.0, 16.0, 15.0, 28.0, 27.0, 26.0, 25.0, 44.0, 40.0, 56.0, 55.0, 45.0, 56.0, 56.0, 47.0, 47.0, 48.0, 50.0, 33.0, 35.0, 29.0, 31.0, 22.0, 18.0, 8.0, 18.0, 14.0, 14.0, 3.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.978113174438477, -21.186697006225586, -20.395280838012695, -19.603862762451172, -18.81244659423828, -18.02103042602539, -17.2296142578125, -16.43819808959961, -15.646780014038086, -14.855363845825195, -14.063946723937988, -13.272530555725098, -12.48111343383789, -11.689697265625, -10.89828109741211, -10.106863975524902, -9.315447807312012, -8.524031639099121, -7.732614517211914, -6.941198348999023, -6.149781227111816, -5.358365058898926, -4.566948413848877, -3.775531768798828, -2.9841151237487793, -2.1926984786987305, -1.4012819528579712, -0.6098654270172119, 0.18155121803283691, 0.9729678630828857, 1.7643842697143555, 2.5558009147644043, 3.347217559814453, 4.138634204864502, 4.930050849914551, 5.721467018127441, 6.512884140014648, 7.304300308227539, 8.09571647644043, 8.887133598327637, 9.678550720214844, 10.469966888427734, 11.261384010314941, 12.052800178527832, 12.844217300415039, 13.63563346862793, 14.42704963684082, 15.218466758728027, 16.009883880615234, 16.801300048828125, 17.592716217041016, 18.38413429260254, 19.17555046081543, 19.96696662902832, 20.75838279724121, 21.549800872802734, 22.341215133666992, 23.132631301879883, 23.924047470092773, 24.715465545654297, 25.506881713867188, 26.298297882080078, 27.08971405029297, 27.88113021850586, 28.672548294067383]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 10.0, 9.0, 12.0, 29.0, 46.0, 81.0, 154.0, 200.0, 317.0, 478.0, 782.0, 1330.0, 2203.0, 3617.0, 6190.0, 10600.0, 18706.0, 32420.0, 56630.0, 94623.0, 145399.0, 182610.0, 174167.0, 127292.0, 80172.0, 46965.0, 26696.0, 15235.0, 8767.0, 5090.0, 2962.0, 1837.0, 1113.0, 706.0, 407.0, 266.0, 154.0, 102.0, 61.0, 48.0, 28.0, 13.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-25.453125, -24.677734375, -23.90234375, -23.126953125, -22.3515625, -21.576171875, -20.80078125, -20.025390625, -19.25, -18.474609375, -17.69921875, -16.923828125, -16.1484375, -15.373046875, -14.59765625, -13.822265625, -13.046875, -12.271484375, -11.49609375, -10.720703125, -9.9453125, -9.169921875, -8.39453125, -7.619140625, -6.84375, -6.068359375, -5.29296875, -4.517578125, -3.7421875, -2.966796875, -2.19140625, -1.416015625, -0.640625, 0.134765625, 0.91015625, 1.685546875, 2.4609375, 3.236328125, 4.01171875, 4.787109375, 5.5625, 6.337890625, 7.11328125, 7.888671875, 8.6640625, 9.439453125, 10.21484375, 10.990234375, 11.765625, 12.541015625, 13.31640625, 14.091796875, 14.8671875, 15.642578125, 16.41796875, 17.193359375, 17.96875, 18.744140625, 19.51953125, 20.294921875, 21.0703125, 21.845703125, 22.62109375, 23.396484375, 24.171875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 12.0, 14.0, 13.0, 12.0, 17.0, 24.0, 28.0, 26.0, 32.0, 38.0, 38.0, 42.0, 55.0, 43.0, 62.0, 47.0, 50.0, 49.0, 45.0, 48.0, 47.0, 41.0, 25.0, 29.0, 31.0, 29.0, 11.0, 12.0, 12.0, 11.0, 14.0, 6.0, 6.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.62109375, -17.9140625, -17.20703125, -16.5, -15.79296875, -15.0859375, -14.37890625, -13.671875, -12.96484375, -12.2578125, -11.55078125, -10.84375, -10.13671875, -9.4296875, -8.72265625, -8.015625, -7.30859375, -6.6015625, -5.89453125, -5.1875, -4.48046875, -3.7734375, -3.06640625, -2.359375, -1.65234375, -0.9453125, -0.23828125, 0.46875, 1.17578125, 1.8828125, 2.58984375, 3.296875, 4.00390625, 4.7109375, 5.41796875, 6.125, 6.83203125, 7.5390625, 8.24609375, 8.953125, 9.66015625, 10.3671875, 11.07421875, 11.78125, 12.48828125, 13.1953125, 13.90234375, 14.609375, 15.31640625, 16.0234375, 16.73046875, 17.4375, 18.14453125, 18.8515625, 19.55859375, 20.265625, 20.97265625, 21.6796875, 22.38671875, 23.09375, 23.80078125, 24.5078125, 25.21484375, 25.921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 7.0, 13.0, 25.0, 21.0, 30.0, 58.0, 65.0, 124.0, 161.0, 243.0, 379.0, 579.0, 881.0, 1368.0, 2143.0, 3465.0, 5558.0, 9051.0, 14691.0, 25013.0, 41479.0, 68713.0, 107776.0, 152215.0, 172837.0, 153377.0, 110547.0, 70126.0, 42529.0, 25337.0, 15040.0, 9124.0, 5682.0, 3516.0, 2210.0, 1507.0, 874.0, 653.0, 376.0, 266.0, 172.0, 116.0, 75.0, 43.0, 37.0, 25.0, 9.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.9677734375, -21.248046875, -20.5283203125, -19.80859375, -19.0888671875, -18.369140625, -17.6494140625, -16.9296875, -16.2099609375, -15.490234375, -14.7705078125, -14.05078125, -13.3310546875, -12.611328125, -11.8916015625, -11.171875, -10.4521484375, -9.732421875, -9.0126953125, -8.29296875, -7.5732421875, -6.853515625, -6.1337890625, -5.4140625, -4.6943359375, -3.974609375, -3.2548828125, -2.53515625, -1.8154296875, -1.095703125, -0.3759765625, 0.34375, 1.0634765625, 1.783203125, 2.5029296875, 3.22265625, 3.9423828125, 4.662109375, 5.3818359375, 6.1015625, 6.8212890625, 7.541015625, 8.2607421875, 8.98046875, 9.7001953125, 10.419921875, 11.1396484375, 11.859375, 12.5791015625, 13.298828125, 14.0185546875, 14.73828125, 15.4580078125, 16.177734375, 16.8974609375, 17.6171875, 18.3369140625, 19.056640625, 19.7763671875, 20.49609375, 21.2158203125, 21.935546875, 22.6552734375, 23.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 11.0, 9.0, 14.0, 10.0, 18.0, 17.0, 18.0, 24.0, 31.0, 35.0, 33.0, 28.0, 27.0, 25.0, 33.0, 51.0, 38.0, 45.0, 45.0, 45.0, 39.0, 39.0, 41.0, 39.0, 33.0, 30.0, 25.0, 37.0, 26.0, 23.0, 16.0, 16.0, 9.0, 9.0, 13.0, 5.0, 7.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.3125, -12.9288330078125, -12.545166015625, -12.1614990234375, -11.77783203125, -11.3941650390625, -11.010498046875, -10.6268310546875, -10.2431640625, -9.8594970703125, -9.475830078125, -9.0921630859375, -8.70849609375, -8.3248291015625, -7.941162109375, -7.5574951171875, -7.173828125, -6.7901611328125, -6.406494140625, -6.0228271484375, -5.63916015625, -5.2554931640625, -4.871826171875, -4.4881591796875, -4.1044921875, -3.7208251953125, -3.337158203125, -2.9534912109375, -2.56982421875, -2.1861572265625, -1.802490234375, -1.4188232421875, -1.03515625, -0.6514892578125, -0.267822265625, 0.1158447265625, 0.49951171875, 0.8831787109375, 1.266845703125, 1.6505126953125, 2.0341796875, 2.4178466796875, 2.801513671875, 3.1851806640625, 3.56884765625, 3.9525146484375, 4.336181640625, 4.7198486328125, 5.103515625, 5.4871826171875, 5.870849609375, 6.2545166015625, 6.63818359375, 7.0218505859375, 7.405517578125, 7.7891845703125, 8.1728515625, 8.5565185546875, 8.940185546875, 9.3238525390625, 9.70751953125, 10.0911865234375, 10.474853515625, 10.8585205078125, 11.2421875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 13.0, 12.0, 27.0, 59.0, 73.0, 116.0, 171.0, 312.0, 489.0, 851.0, 1506.0, 2725.0, 5612.0, 11750.0, 26949.0, 63640.0, 147311.0, 279906.0, 267112.0, 135746.0, 57281.0, 24796.0, 10887.0, 5201.0, 2632.0, 1386.0, 773.0, 438.0, 274.0, 185.0, 105.0, 77.0, 48.0, 25.0, 18.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-22.0, -21.404541015625, -20.80908203125, -20.213623046875, -19.6181640625, -19.022705078125, -18.42724609375, -17.831787109375, -17.236328125, -16.640869140625, -16.04541015625, -15.449951171875, -14.8544921875, -14.259033203125, -13.66357421875, -13.068115234375, -12.47265625, -11.877197265625, -11.28173828125, -10.686279296875, -10.0908203125, -9.495361328125, -8.89990234375, -8.304443359375, -7.708984375, -7.113525390625, -6.51806640625, -5.922607421875, -5.3271484375, -4.731689453125, -4.13623046875, -3.540771484375, -2.9453125, -2.349853515625, -1.75439453125, -1.158935546875, -0.5634765625, 0.031982421875, 0.62744140625, 1.222900390625, 1.818359375, 2.413818359375, 3.00927734375, 3.604736328125, 4.2001953125, 4.795654296875, 5.39111328125, 5.986572265625, 6.58203125, 7.177490234375, 7.77294921875, 8.368408203125, 8.9638671875, 9.559326171875, 10.15478515625, 10.750244140625, 11.345703125, 11.941162109375, 12.53662109375, 13.132080078125, 13.7275390625, 14.322998046875, 14.91845703125, 15.513916015625, 16.109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 4.0, 19.0, 15.0, 15.0, 20.0, 30.0, 22.0, 31.0, 34.0, 60.0, 48.0, 54.0, 57.0, 61.0, 52.0, 73.0, 44.0, 61.0, 57.0, 41.0, 24.0, 27.0, 20.0, 21.0, 13.0, 14.0, 5.0, 8.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001247406005859375, -0.0012114793062210083, -0.0011755526065826416, -0.001139625906944275, -0.0011036992073059082, -0.0010677725076675415, -0.0010318458080291748, -0.000995919108390808, -0.0009599924087524414, -0.0009240657091140747, -0.000888139009475708, -0.0008522123098373413, -0.0008162856101989746, -0.0007803589105606079, -0.0007444322109222412, -0.0007085055112838745, -0.0006725788116455078, -0.0006366521120071411, -0.0006007254123687744, -0.0005647987127304077, -0.000528872013092041, -0.0004929453134536743, -0.0004570186138153076, -0.0004210919141769409, -0.0003851652145385742, -0.0003492385149002075, -0.0003133118152618408, -0.0002773851156234741, -0.00024145841598510742, -0.00020553171634674072, -0.00016960501670837402, -0.00013367831707000732, -9.775161743164062e-05, -6.182491779327393e-05, -2.5898218154907227e-05, 1.0028481483459473e-05, 4.595518112182617e-05, 8.188188076019287e-05, 0.00011780858039855957, 0.00015373528003692627, 0.00018966197967529297, 0.00022558867931365967, 0.00026151537895202637, 0.00029744207859039307, 0.00033336877822875977, 0.00036929547786712646, 0.00040522217750549316, 0.00044114887714385986, 0.00047707557678222656, 0.0005130022764205933, 0.00054892897605896, 0.0005848556756973267, 0.0006207823753356934, 0.0006567090749740601, 0.0006926357746124268, 0.0007285624742507935, 0.0007644891738891602, 0.0008004158735275269, 0.0008363425731658936, 0.0008722692728042603, 0.000908195972442627, 0.0009441226720809937, 0.0009800493717193604, 0.001015976071357727, 0.0010519027709960938]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 10.0, 6.0, 20.0, 17.0, 28.0, 49.0, 58.0, 69.0, 129.0, 160.0, 243.0, 366.0, 521.0, 701.0, 1102.0, 1540.0, 2556.0, 3864.0, 6431.0, 10888.0, 18612.0, 31528.0, 53958.0, 90389.0, 137580.0, 178413.0, 174479.0, 129889.0, 82915.0, 49614.0, 28934.0, 16885.0, 9912.0, 5928.0, 3632.0, 2308.0, 1559.0, 1000.0, 680.0, 463.0, 353.0, 227.0, 150.0, 138.0, 86.0, 50.0, 48.0, 17.0, 18.0, 11.0, 13.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.7265625, -10.3905029296875, -10.054443359375, -9.7183837890625, -9.38232421875, -9.0462646484375, -8.710205078125, -8.3741455078125, -8.0380859375, -7.7020263671875, -7.365966796875, -7.0299072265625, -6.69384765625, -6.3577880859375, -6.021728515625, -5.6856689453125, -5.349609375, -5.0135498046875, -4.677490234375, -4.3414306640625, -4.00537109375, -3.6693115234375, -3.333251953125, -2.9971923828125, -2.6611328125, -2.3250732421875, -1.989013671875, -1.6529541015625, -1.31689453125, -0.9808349609375, -0.644775390625, -0.3087158203125, 0.02734375, 0.3634033203125, 0.699462890625, 1.0355224609375, 1.37158203125, 1.7076416015625, 2.043701171875, 2.3797607421875, 2.7158203125, 3.0518798828125, 3.387939453125, 3.7239990234375, 4.06005859375, 4.3961181640625, 4.732177734375, 5.0682373046875, 5.404296875, 5.7403564453125, 6.076416015625, 6.4124755859375, 6.74853515625, 7.0845947265625, 7.420654296875, 7.7567138671875, 8.0927734375, 8.4288330078125, 8.764892578125, 9.1009521484375, 9.43701171875, 9.7730712890625, 10.109130859375, 10.4451904296875, 10.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 11.0, 23.0, 37.0, 46.0, 45.0, 57.0, 73.0, 70.0, 84.0, 76.0, 77.0, 61.0, 63.0, 50.0, 53.0, 34.0, 29.0, 17.0, 15.0, 17.0, 7.0, 5.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.281005859375, -5.11279296875, -4.944580078125, -4.7763671875, -4.608154296875, -4.43994140625, -4.271728515625, -4.103515625, -3.935302734375, -3.76708984375, -3.598876953125, -3.4306640625, -3.262451171875, -3.09423828125, -2.926025390625, -2.7578125, -2.589599609375, -2.42138671875, -2.253173828125, -2.0849609375, -1.916748046875, -1.74853515625, -1.580322265625, -1.412109375, -1.243896484375, -1.07568359375, -0.907470703125, -0.7392578125, -0.571044921875, -0.40283203125, -0.234619140625, -0.06640625, 0.101806640625, 0.27001953125, 0.438232421875, 0.6064453125, 0.774658203125, 0.94287109375, 1.111083984375, 1.279296875, 1.447509765625, 1.61572265625, 1.783935546875, 1.9521484375, 2.120361328125, 2.28857421875, 2.456787109375, 2.625, 2.793212890625, 2.96142578125, 3.129638671875, 3.2978515625, 3.466064453125, 3.63427734375, 3.802490234375, 3.970703125, 4.138916015625, 4.30712890625, 4.475341796875, 4.6435546875, 4.811767578125, 4.97998046875, 5.148193359375, 5.31640625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 9.0, 8.0, 9.0, 10.0, 8.0, 22.0, 16.0, 24.0, 27.0, 25.0, 26.0, 28.0, 31.0, 29.0, 41.0, 42.0, 43.0, 61.0, 34.0, 38.0, 57.0, 33.0, 41.0, 28.0, 30.0, 24.0, 38.0, 30.0, 22.0, 17.0, 18.0, 15.0, 18.0, 10.0, 10.0, 11.0, 9.0, 5.0, 6.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-17.20762825012207, -16.64251708984375, -16.07740592956543, -15.512295722961426, -14.947185516357422, -14.382074356079102, -13.816963195800781, -13.251852989196777, -12.686742782592773, -12.121631622314453, -11.55652141571045, -10.991410255432129, -10.426300048828125, -9.861188888549805, -9.296077728271484, -8.73096752166748, -8.16585636138916, -7.600745677947998, -7.035634994506836, -6.470523834228516, -5.905413627624512, -5.340302467346191, -4.775191783905029, -4.210081100463867, -3.644970417022705, -3.079859733581543, -2.514749050140381, -1.9496381282806396, -1.3845274448394775, -0.8194167613983154, -0.2543058395385742, 0.3108048439025879, 0.87591552734375, 1.441026210784912, 2.006136894226074, 2.5712478160858154, 3.1363584995269775, 3.7014691829681396, 4.266580104827881, 4.831690788269043, 5.396801471710205, 5.961912155151367, 6.527022838592529, 7.092133522033691, 7.657244682312012, 8.222354888916016, 8.787466049194336, 9.352577209472656, 9.91768741607666, 10.48279857635498, 11.047908782958984, 11.613019943237305, 12.178130149841309, 12.743241310119629, 13.308351516723633, 13.873462677001953, 14.438573837280273, 15.003684997558594, 15.568795204162598, 16.1339054107666, 16.699016571044922, 17.264127731323242, 17.829238891601562, 18.39434814453125, 18.95945930480957]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 2.0, 13.0, 13.0, 14.0, 14.0, 24.0, 21.0, 20.0, 19.0, 42.0, 37.0, 46.0, 41.0, 53.0, 50.0, 43.0, 36.0, 50.0, 38.0, 43.0, 52.0, 32.0, 37.0, 39.0, 26.0, 28.0, 35.0, 20.0, 18.0, 15.0, 13.0, 12.0, 9.0, 1.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-22.352792739868164, -21.680479049682617, -21.008163452148438, -20.33584976196289, -19.66353416442871, -18.991220474243164, -18.318904876708984, -17.646591186523438, -16.97427749633789, -16.301963806152344, -15.629648208618164, -14.957334518432617, -14.285019874572754, -13.61270523071289, -12.940390586853027, -12.268075942993164, -11.5957612991333, -10.923446655273438, -10.251132011413574, -9.578817367553711, -8.906503677368164, -8.2341890335083, -7.5618743896484375, -6.889560222625732, -6.217245578765869, -5.544930934906006, -4.872616767883301, -4.2003021240234375, -3.5279877185821533, -2.855673313140869, -2.183358669281006, -1.5110445022583008, -0.8387298583984375, -0.16641539335250854, 0.5058990716934204, 1.1782135963439941, 1.8505280017852783, 2.5228424072265625, 3.195157051086426, 3.867471218109131, 4.539785861968994, 5.212100505828857, 5.8844146728515625, 6.556729316711426, 7.229043960571289, 7.901358127593994, 8.573673248291016, 9.245986938476562, 9.918301582336426, 10.590616226196289, 11.262930870056152, 11.935245513916016, 12.607559204101562, 13.279873847961426, 13.952188491821289, 14.624502182006836, 15.296817779541016, 15.969132423400879, 16.641447067260742, 17.31376075744629, 17.98607635498047, 18.658390045166016, 19.330703735351562, 20.003019332885742, 20.67533302307129]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 5.0, 11.0, 24.0, 26.0, 52.0, 70.0, 90.0, 152.0, 242.0, 293.0, 512.0, 748.0, 1169.0, 1998.0, 3155.0, 5156.0, 8613.0, 14795.0, 25667.0, 47165.0, 89235.0, 180639.0, 393046.0, 773413.0, 1025428.0, 796832.0, 419607.0, 196073.0, 94633.0, 49915.0, 26986.0, 15454.0, 9007.0, 5427.0, 3273.0, 1977.0, 1198.0, 780.0, 486.0, 308.0, 182.0, 125.0, 85.0, 71.0, 44.0, 32.0, 24.0, 9.0, 16.0, 10.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-17.953125, -17.3837890625, -16.814453125, -16.2451171875, -15.67578125, -15.1064453125, -14.537109375, -13.9677734375, -13.3984375, -12.8291015625, -12.259765625, -11.6904296875, -11.12109375, -10.5517578125, -9.982421875, -9.4130859375, -8.84375, -8.2744140625, -7.705078125, -7.1357421875, -6.56640625, -5.9970703125, -5.427734375, -4.8583984375, -4.2890625, -3.7197265625, -3.150390625, -2.5810546875, -2.01171875, -1.4423828125, -0.873046875, -0.3037109375, 0.265625, 0.8349609375, 1.404296875, 1.9736328125, 2.54296875, 3.1123046875, 3.681640625, 4.2509765625, 4.8203125, 5.3896484375, 5.958984375, 6.5283203125, 7.09765625, 7.6669921875, 8.236328125, 8.8056640625, 9.375, 9.9443359375, 10.513671875, 11.0830078125, 11.65234375, 12.2216796875, 12.791015625, 13.3603515625, 13.9296875, 14.4990234375, 15.068359375, 15.6376953125, 16.20703125, 16.7763671875, 17.345703125, 17.9150390625, 18.484375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 12.0, 9.0, 16.0, 18.0, 14.0, 18.0, 25.0, 31.0, 44.0, 36.0, 50.0, 39.0, 61.0, 56.0, 55.0, 34.0, 46.0, 59.0, 40.0, 52.0, 36.0, 42.0, 31.0, 26.0, 30.0, 25.0, 12.0, 18.0, 14.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.071044921875, -15.51708984375, -14.963134765625, -14.4091796875, -13.855224609375, -13.30126953125, -12.747314453125, -12.193359375, -11.639404296875, -11.08544921875, -10.531494140625, -9.9775390625, -9.423583984375, -8.86962890625, -8.315673828125, -7.76171875, -7.207763671875, -6.65380859375, -6.099853515625, -5.5458984375, -4.991943359375, -4.43798828125, -3.884033203125, -3.330078125, -2.776123046875, -2.22216796875, -1.668212890625, -1.1142578125, -0.560302734375, -0.00634765625, 0.547607421875, 1.1015625, 1.655517578125, 2.20947265625, 2.763427734375, 3.3173828125, 3.871337890625, 4.42529296875, 4.979248046875, 5.533203125, 6.087158203125, 6.64111328125, 7.195068359375, 7.7490234375, 8.302978515625, 8.85693359375, 9.410888671875, 9.96484375, 10.518798828125, 11.07275390625, 11.626708984375, 12.1806640625, 12.734619140625, 13.28857421875, 13.842529296875, 14.396484375, 14.950439453125, 15.50439453125, 16.058349609375, 16.6123046875, 17.166259765625, 17.72021484375, 18.274169921875, 18.828125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 7.0, 9.0, 16.0, 22.0, 29.0, 39.0, 62.0, 90.0, 166.0, 225.0, 365.0, 519.0, 783.0, 1131.0, 1688.0, 2735.0, 3928.0, 6195.0, 9583.0, 15369.0, 24140.0, 38971.0, 63281.0, 104201.0, 172145.0, 284770.0, 460346.0, 685588.0, 769707.0, 586512.0, 374505.0, 228442.0, 138198.0, 83148.0, 51046.0, 31477.0, 19457.0, 12462.0, 7913.0, 4969.0, 3449.0, 2211.0, 1451.0, 973.0, 670.0, 454.0, 280.0, 174.0, 132.0, 88.0, 63.0, 26.0, 32.0, 22.0, 13.0, 10.0, 2.0, 4.0, 1.0, 2.0], "bins": [-14.8984375, -14.4368896484375, -13.975341796875, -13.5137939453125, -13.05224609375, -12.5906982421875, -12.129150390625, -11.6676025390625, -11.2060546875, -10.7445068359375, -10.282958984375, -9.8214111328125, -9.35986328125, -8.8983154296875, -8.436767578125, -7.9752197265625, -7.513671875, -7.0521240234375, -6.590576171875, -6.1290283203125, -5.66748046875, -5.2059326171875, -4.744384765625, -4.2828369140625, -3.8212890625, -3.3597412109375, -2.898193359375, -2.4366455078125, -1.97509765625, -1.5135498046875, -1.052001953125, -0.5904541015625, -0.12890625, 0.3326416015625, 0.794189453125, 1.2557373046875, 1.71728515625, 2.1788330078125, 2.640380859375, 3.1019287109375, 3.5634765625, 4.0250244140625, 4.486572265625, 4.9481201171875, 5.40966796875, 5.8712158203125, 6.332763671875, 6.7943115234375, 7.255859375, 7.7174072265625, 8.178955078125, 8.6405029296875, 9.10205078125, 9.5635986328125, 10.025146484375, 10.4866943359375, 10.9482421875, 11.4097900390625, 11.871337890625, 12.3328857421875, 12.79443359375, 13.2559814453125, 13.717529296875, 14.1790771484375, 14.640625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 7.0, 8.0, 15.0, 22.0, 37.0, 30.0, 51.0, 52.0, 68.0, 92.0, 88.0, 124.0, 157.0, 169.0, 206.0, 207.0, 254.0, 280.0, 265.0, 266.0, 264.0, 220.0, 218.0, 168.0, 143.0, 122.0, 135.0, 87.0, 66.0, 45.0, 38.0, 27.0, 31.0, 17.0, 17.0, 10.0, 9.0, 12.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0], "bins": [-7.32421875, -7.1240234375, -6.923828125, -6.7236328125, -6.5234375, -6.3232421875, -6.123046875, -5.9228515625, -5.72265625, -5.5224609375, -5.322265625, -5.1220703125, -4.921875, -4.7216796875, -4.521484375, -4.3212890625, -4.12109375, -3.9208984375, -3.720703125, -3.5205078125, -3.3203125, -3.1201171875, -2.919921875, -2.7197265625, -2.51953125, -2.3193359375, -2.119140625, -1.9189453125, -1.71875, -1.5185546875, -1.318359375, -1.1181640625, -0.91796875, -0.7177734375, -0.517578125, -0.3173828125, -0.1171875, 0.0830078125, 0.283203125, 0.4833984375, 0.68359375, 0.8837890625, 1.083984375, 1.2841796875, 1.484375, 1.6845703125, 1.884765625, 2.0849609375, 2.28515625, 2.4853515625, 2.685546875, 2.8857421875, 3.0859375, 3.2861328125, 3.486328125, 3.6865234375, 3.88671875, 4.0869140625, 4.287109375, 4.4873046875, 4.6875, 4.8876953125, 5.087890625, 5.2880859375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 7.0, 6.0, 18.0, 10.0, 13.0, 21.0, 16.0, 25.0, 21.0, 36.0, 37.0, 36.0, 48.0, 43.0, 62.0, 50.0, 50.0, 49.0, 47.0, 50.0, 43.0, 45.0, 38.0, 33.0, 38.0, 25.0, 24.0, 12.0, 24.0, 14.0, 12.0, 6.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0], "bins": [-18.966812133789062, -18.42782211303711, -17.888830184936523, -17.34984016418457, -16.810850143432617, -16.27185821533203, -15.732868194580078, -15.193878173828125, -14.654887199401855, -14.115896224975586, -13.576906204223633, -13.037915229797363, -12.498924255371094, -11.95993423461914, -11.420943260192871, -10.881952285766602, -10.342962265014648, -9.803971290588379, -9.264981269836426, -8.725990295410156, -8.187000274658203, -7.648009300231934, -7.109018325805664, -6.570027828216553, -6.031037330627441, -5.49204683303833, -4.953056335449219, -4.414065361022949, -3.875074863433838, -3.3360843658447266, -2.797093629837036, -2.2581028938293457, -1.7191104888916016, -1.1801198720932007, -0.6411292552947998, -0.10213863849639893, 0.43685197830200195, 0.9758424758911133, 1.5148332118988037, 2.053823947906494, 2.5928144454956055, 3.131804943084717, 3.6707956790924072, 4.209786415100098, 4.748776912689209, 5.28776741027832, 5.82675838470459, 6.365748882293701, 6.9047393798828125, 7.443729877471924, 7.982720375061035, 8.521711349487305, 9.060701370239258, 9.599692344665527, 10.138683319091797, 10.67767333984375, 11.21666431427002, 11.755655288696289, 12.294645309448242, 12.833636283874512, 13.372627258300781, 13.911617279052734, 14.450608253479004, 14.989599227905273, 15.528589248657227]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 11.0, 13.0, 7.0, 7.0, 12.0, 15.0, 29.0, 21.0, 27.0, 25.0, 32.0, 31.0, 36.0, 40.0, 56.0, 37.0, 44.0, 39.0, 28.0, 35.0, 44.0, 36.0, 44.0, 34.0, 26.0, 27.0, 36.0, 28.0, 18.0, 28.0, 16.0, 24.0, 10.0, 13.0, 9.0, 6.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.486700057983398, -14.01639461517334, -13.546089172363281, -13.075783729553223, -12.605478286743164, -12.135173797607422, -11.664867401123047, -11.194562911987305, -10.724257469177246, -10.253952026367188, -9.783646583557129, -9.31334114074707, -8.843035697937012, -8.372730255126953, -7.902425289154053, -7.432120323181152, -6.9618144035339355, -6.491508960723877, -6.021203517913818, -5.550898551940918, -5.080593109130859, -4.610287666320801, -4.139982223510742, -3.6696770191192627, -3.199371576309204, -2.7290661334991455, -2.258760929107666, -1.7884554862976074, -1.3181501626968384, -0.8478448390960693, -0.37753939628601074, 0.09276580810546875, 0.5630712509155273, 1.0333765745162964, 1.5036818981170654, 1.973987340927124, 2.4442925453186035, 2.914597988128662, 3.3849034309387207, 3.8552086353302, 4.32551383972168, 4.795819282531738, 5.266124725341797, 5.7364301681518555, 6.206735134124756, 6.6770405769348145, 7.147346019744873, 7.617650985717773, 8.087957382202148, 8.558262825012207, 9.028568267822266, 9.498873710632324, 9.969179153442383, 10.439483642578125, 10.9097900390625, 11.380094528198242, 11.8503999710083, 12.32070541381836, 12.791010856628418, 13.261316299438477, 13.731621742248535, 14.201927185058594, 14.672231674194336, 15.142537117004395, 15.612842559814453]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 9.0, 9.0, 14.0, 17.0, 37.0, 47.0, 73.0, 90.0, 128.0, 235.0, 351.0, 488.0, 704.0, 1026.0, 1531.0, 2329.0, 3397.0, 4955.0, 7190.0, 10510.0, 15307.0, 22284.0, 32208.0, 46645.0, 68102.0, 97434.0, 130269.0, 148200.0, 132756.0, 99201.0, 69726.0, 48239.0, 32846.0, 22666.0, 15681.0, 10738.0, 7372.0, 4915.0, 3421.0, 2386.0, 1616.0, 1093.0, 763.0, 499.0, 325.0, 214.0, 170.0, 117.0, 71.0, 53.0, 41.0, 20.0, 14.0, 16.0, 7.0, 8.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-9.8046875, -9.47265625, -9.140625, -8.80859375, -8.4765625, -8.14453125, -7.8125, -7.48046875, -7.1484375, -6.81640625, -6.484375, -6.15234375, -5.8203125, -5.48828125, -5.15625, -4.82421875, -4.4921875, -4.16015625, -3.828125, -3.49609375, -3.1640625, -2.83203125, -2.5, -2.16796875, -1.8359375, -1.50390625, -1.171875, -0.83984375, -0.5078125, -0.17578125, 0.15625, 0.48828125, 0.8203125, 1.15234375, 1.484375, 1.81640625, 2.1484375, 2.48046875, 2.8125, 3.14453125, 3.4765625, 3.80859375, 4.140625, 4.47265625, 4.8046875, 5.13671875, 5.46875, 5.80078125, 6.1328125, 6.46484375, 6.796875, 7.12890625, 7.4609375, 7.79296875, 8.125, 8.45703125, 8.7890625, 9.12109375, 9.453125, 9.78515625, 10.1171875, 10.44921875, 10.78125, 11.11328125, 11.4453125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 7.0, 9.0, 11.0, 12.0, 10.0, 11.0, 19.0, 17.0, 16.0, 31.0, 34.0, 24.0, 28.0, 39.0, 38.0, 39.0, 44.0, 36.0, 38.0, 47.0, 36.0, 38.0, 44.0, 39.0, 32.0, 32.0, 33.0, 30.0, 35.0, 15.0, 22.0, 17.0, 22.0, 16.0, 8.0, 15.0, 7.0, 9.0, 7.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3359375, -13.8780517578125, -13.420166015625, -12.9622802734375, -12.50439453125, -12.0465087890625, -11.588623046875, -11.1307373046875, -10.6728515625, -10.2149658203125, -9.757080078125, -9.2991943359375, -8.84130859375, -8.3834228515625, -7.925537109375, -7.4676513671875, -7.009765625, -6.5518798828125, -6.093994140625, -5.6361083984375, -5.17822265625, -4.7203369140625, -4.262451171875, -3.8045654296875, -3.3466796875, -2.8887939453125, -2.430908203125, -1.9730224609375, -1.51513671875, -1.0572509765625, -0.599365234375, -0.1414794921875, 0.31640625, 0.7742919921875, 1.232177734375, 1.6900634765625, 2.14794921875, 2.6058349609375, 3.063720703125, 3.5216064453125, 3.9794921875, 4.4373779296875, 4.895263671875, 5.3531494140625, 5.81103515625, 6.2689208984375, 6.726806640625, 7.1846923828125, 7.642578125, 8.1004638671875, 8.558349609375, 9.0162353515625, 9.47412109375, 9.9320068359375, 10.389892578125, 10.8477783203125, 11.3056640625, 11.7635498046875, 12.221435546875, 12.6793212890625, 13.13720703125, 13.5950927734375, 14.052978515625, 14.5108642578125, 14.96875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 14.0, 16.0, 27.0, 36.0, 46.0, 79.0, 87.0, 143.0, 185.0, 277.0, 398.0, 591.0, 894.0, 1408.0, 2235.0, 3553.0, 5878.0, 10156.0, 18988.0, 50498.0, 854299.0, 53733.0, 18714.0, 9996.0, 5898.0, 3657.0, 2219.0, 1472.0, 965.0, 656.0, 425.0, 316.0, 200.0, 156.0, 101.0, 53.0, 48.0, 54.0, 36.0, 20.0, 14.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671875, -21.876708984375, -21.08154296875, -20.286376953125, -19.4912109375, -18.696044921875, -17.90087890625, -17.105712890625, -16.310546875, -15.515380859375, -14.72021484375, -13.925048828125, -13.1298828125, -12.334716796875, -11.53955078125, -10.744384765625, -9.94921875, -9.154052734375, -8.35888671875, -7.563720703125, -6.7685546875, -5.973388671875, -5.17822265625, -4.383056640625, -3.587890625, -2.792724609375, -1.99755859375, -1.202392578125, -0.4072265625, 0.387939453125, 1.18310546875, 1.978271484375, 2.7734375, 3.568603515625, 4.36376953125, 5.158935546875, 5.9541015625, 6.749267578125, 7.54443359375, 8.339599609375, 9.134765625, 9.929931640625, 10.72509765625, 11.520263671875, 12.3154296875, 13.110595703125, 13.90576171875, 14.700927734375, 15.49609375, 16.291259765625, 17.08642578125, 17.881591796875, 18.6767578125, 19.471923828125, 20.26708984375, 21.062255859375, 21.857421875, 22.652587890625, 23.44775390625, 24.242919921875, 25.0380859375, 25.833251953125, 26.62841796875, 27.423583984375, 28.21875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 13.0, 13.0, 14.0, 21.0, 19.0, 27.0, 27.0, 42.0, 39.0, 38.0, 42.0, 56.0, 53.0, 53.0, 50.0, 46.0, 52.0, 57.0, 42.0, 43.0, 47.0, 34.0, 30.0, 23.0, 13.0, 12.0, 18.0, 9.0, 9.0, 7.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.0, -17.43115234375, -16.8623046875, -16.29345703125, -15.724609375, -15.15576171875, -14.5869140625, -14.01806640625, -13.44921875, -12.88037109375, -12.3115234375, -11.74267578125, -11.173828125, -10.60498046875, -10.0361328125, -9.46728515625, -8.8984375, -8.32958984375, -7.7607421875, -7.19189453125, -6.623046875, -6.05419921875, -5.4853515625, -4.91650390625, -4.34765625, -3.77880859375, -3.2099609375, -2.64111328125, -2.072265625, -1.50341796875, -0.9345703125, -0.36572265625, 0.203125, 0.77197265625, 1.3408203125, 1.90966796875, 2.478515625, 3.04736328125, 3.6162109375, 4.18505859375, 4.75390625, 5.32275390625, 5.8916015625, 6.46044921875, 7.029296875, 7.59814453125, 8.1669921875, 8.73583984375, 9.3046875, 9.87353515625, 10.4423828125, 11.01123046875, 11.580078125, 12.14892578125, 12.7177734375, 13.28662109375, 13.85546875, 14.42431640625, 14.9931640625, 15.56201171875, 16.130859375, 16.69970703125, 17.2685546875, 17.83740234375, 18.40625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 12.0, 23.0, 24.0, 28.0, 28.0, 46.0, 63.0, 92.0, 142.0, 172.0, 305.0, 454.0, 691.0, 1103.0, 1891.0, 3433.0, 6872.0, 15940.0, 60170.0, 888292.0, 41538.0, 13352.0, 6096.0, 3053.0, 1688.0, 1044.0, 650.0, 423.0, 267.0, 166.0, 130.0, 89.0, 55.0, 52.0, 41.0, 28.0, 19.0, 13.0, 8.0, 7.0, 14.0, 6.0, 3.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.3984375, -14.9080810546875, -14.417724609375, -13.9273681640625, -13.43701171875, -12.9466552734375, -12.456298828125, -11.9659423828125, -11.4755859375, -10.9852294921875, -10.494873046875, -10.0045166015625, -9.51416015625, -9.0238037109375, -8.533447265625, -8.0430908203125, -7.552734375, -7.0623779296875, -6.572021484375, -6.0816650390625, -5.59130859375, -5.1009521484375, -4.610595703125, -4.1202392578125, -3.6298828125, -3.1395263671875, -2.649169921875, -2.1588134765625, -1.66845703125, -1.1781005859375, -0.687744140625, -0.1973876953125, 0.29296875, 0.7833251953125, 1.273681640625, 1.7640380859375, 2.25439453125, 2.7447509765625, 3.235107421875, 3.7254638671875, 4.2158203125, 4.7061767578125, 5.196533203125, 5.6868896484375, 6.17724609375, 6.6676025390625, 7.157958984375, 7.6483154296875, 8.138671875, 8.6290283203125, 9.119384765625, 9.6097412109375, 10.10009765625, 10.5904541015625, 11.080810546875, 11.5711669921875, 12.0615234375, 12.5518798828125, 13.042236328125, 13.5325927734375, 14.02294921875, 14.5133056640625, 15.003662109375, 15.4940185546875, 15.984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 9.0, 8.0, 16.0, 10.0, 28.0, 36.0, 47.0, 88.0, 175.0, 214.0, 107.0, 80.0, 41.0, 29.0, 29.0, 18.0, 11.0, 12.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002223968505859375, -0.0021390914916992188, -0.0020542144775390625, -0.0019693374633789062, -0.00188446044921875, -0.0017995834350585938, -0.0017147064208984375, -0.0016298294067382812, -0.001544952392578125, -0.0014600753784179688, -0.0013751983642578125, -0.0012903213500976562, -0.0012054443359375, -0.0011205673217773438, -0.0010356903076171875, -0.0009508132934570312, -0.000865936279296875, -0.0007810592651367188, -0.0006961822509765625, -0.0006113052368164062, -0.00052642822265625, -0.00044155120849609375, -0.0003566741943359375, -0.00027179718017578125, -0.000186920166015625, -0.00010204315185546875, -1.71661376953125e-05, 6.771087646484375e-05, 0.000152587890625, 0.00023746490478515625, 0.0003223419189453125, 0.00040721893310546875, 0.000492095947265625, 0.0005769729614257812, 0.0006618499755859375, 0.0007467269897460938, 0.00083160400390625, 0.0009164810180664062, 0.0010013580322265625, 0.0010862350463867188, 0.001171112060546875, 0.0012559890747070312, 0.0013408660888671875, 0.0014257431030273438, 0.0015106201171875, 0.0015954971313476562, 0.0016803741455078125, 0.0017652511596679688, 0.001850128173828125, 0.0019350051879882812, 0.0020198822021484375, 0.0021047592163085938, 0.00218963623046875, 0.0022745132446289062, 0.0023593902587890625, 0.0024442672729492188, 0.002529144287109375, 0.0026140213012695312, 0.0026988983154296875, 0.0027837753295898438, 0.00286865234375, 0.0029535293579101562, 0.0030384063720703125, 0.0031232833862304688, 0.003208160400390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 14.0, 17.0, 28.0, 32.0, 34.0, 54.0, 89.0, 118.0, 160.0, 265.0, 342.0, 429.0, 605.0, 900.0, 1232.0, 1807.0, 2649.0, 4121.0, 6540.0, 10740.0, 18590.0, 33307.0, 65210.0, 126984.0, 211091.0, 230390.0, 153297.0, 80485.0, 41694.0, 22050.0, 12769.0, 7662.0, 4801.0, 3057.0, 2113.0, 1393.0, 981.0, 692.0, 515.0, 349.0, 274.0, 181.0, 124.0, 91.0, 70.0, 61.0, 35.0, 28.0, 15.0, 15.0, 13.0, 6.0, 12.0, 1.0, 5.0, 3.0, 2.0], "bins": [-3.314453125, -3.211395263671875, -3.10833740234375, -3.005279541015625, -2.9022216796875, -2.799163818359375, -2.69610595703125, -2.593048095703125, -2.489990234375, -2.386932373046875, -2.28387451171875, -2.180816650390625, -2.0777587890625, -1.974700927734375, -1.87164306640625, -1.768585205078125, -1.66552734375, -1.562469482421875, -1.45941162109375, -1.356353759765625, -1.2532958984375, -1.150238037109375, -1.04718017578125, -0.944122314453125, -0.841064453125, -0.738006591796875, -0.63494873046875, -0.531890869140625, -0.4288330078125, -0.325775146484375, -0.22271728515625, -0.119659423828125, -0.0166015625, 0.086456298828125, 0.18951416015625, 0.292572021484375, 0.3956298828125, 0.498687744140625, 0.60174560546875, 0.704803466796875, 0.807861328125, 0.910919189453125, 1.01397705078125, 1.117034912109375, 1.2200927734375, 1.323150634765625, 1.42620849609375, 1.529266357421875, 1.63232421875, 1.735382080078125, 1.83843994140625, 1.941497802734375, 2.0445556640625, 2.147613525390625, 2.25067138671875, 2.353729248046875, 2.456787109375, 2.559844970703125, 2.66290283203125, 2.765960693359375, 2.8690185546875, 2.972076416015625, 3.07513427734375, 3.178192138671875, 3.28125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 4.0, 5.0, 6.0, 9.0, 19.0, 22.0, 23.0, 32.0, 43.0, 42.0, 73.0, 79.0, 91.0, 69.0, 90.0, 63.0, 53.0, 60.0, 38.0, 38.0, 28.0, 23.0, 13.0, 10.0, 8.0, 3.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.52734375, -1.479949951171875, -1.43255615234375, -1.385162353515625, -1.3377685546875, -1.290374755859375, -1.24298095703125, -1.195587158203125, -1.148193359375, -1.100799560546875, -1.05340576171875, -1.006011962890625, -0.9586181640625, -0.911224365234375, -0.86383056640625, -0.816436767578125, -0.76904296875, -0.721649169921875, -0.67425537109375, -0.626861572265625, -0.5794677734375, -0.532073974609375, -0.48468017578125, -0.437286376953125, -0.389892578125, -0.342498779296875, -0.29510498046875, -0.247711181640625, -0.2003173828125, -0.152923583984375, -0.10552978515625, -0.058135986328125, -0.0107421875, 0.036651611328125, 0.08404541015625, 0.131439208984375, 0.1788330078125, 0.226226806640625, 0.27362060546875, 0.321014404296875, 0.368408203125, 0.415802001953125, 0.46319580078125, 0.510589599609375, 0.5579833984375, 0.605377197265625, 0.65277099609375, 0.700164794921875, 0.74755859375, 0.794952392578125, 0.84234619140625, 0.889739990234375, 0.9371337890625, 0.984527587890625, 1.03192138671875, 1.079315185546875, 1.126708984375, 1.174102783203125, 1.22149658203125, 1.268890380859375, 1.3162841796875, 1.363677978515625, 1.41107177734375, 1.458465576171875, 1.505859375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 8.0, 15.0, 17.0, 19.0, 19.0, 23.0, 27.0, 35.0, 41.0, 38.0, 42.0, 45.0, 54.0, 49.0, 50.0, 60.0, 60.0, 56.0, 42.0, 60.0, 35.0, 38.0, 31.0, 16.0, 21.0, 12.0, 11.0, 10.0, 8.0, 5.0, 14.0, 6.0, 4.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.22270965576172, -16.706270217895508, -16.189830780029297, -15.673391342163086, -15.156951904296875, -14.640512466430664, -14.124073028564453, -13.607633590698242, -13.091194152832031, -12.57475471496582, -12.05831527709961, -11.541875839233398, -11.025436401367188, -10.508996963500977, -9.992557525634766, -9.476118087768555, -8.959678649902344, -8.443239212036133, -7.926799774169922, -7.410360336303711, -6.8939208984375, -6.377481460571289, -5.861042022705078, -5.344602584838867, -4.828163146972656, -4.311723709106445, -3.7952842712402344, -3.2788448333740234, -2.7624053955078125, -2.2459659576416016, -1.7295265197753906, -1.2130870819091797, -0.6966495513916016, -0.18021011352539062, 0.3362293243408203, 0.8526687622070312, 1.3691082000732422, 1.8855476379394531, 2.401987075805664, 2.918426513671875, 3.434865951538086, 3.951305389404297, 4.467744827270508, 4.984184265136719, 5.50062370300293, 6.017063140869141, 6.533502578735352, 7.0499420166015625, 7.566381454467773, 8.082820892333984, 8.599260330200195, 9.115699768066406, 9.632139205932617, 10.148578643798828, 10.665018081665039, 11.18145751953125, 11.697896957397461, 12.214336395263672, 12.730775833129883, 13.247215270996094, 13.763654708862305, 14.280094146728516, 14.796533584594727, 15.312973022460938, 15.829412460327148]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 6.0, 12.0, 6.0, 8.0, 8.0, 12.0, 22.0, 29.0, 18.0, 22.0, 30.0, 30.0, 38.0, 32.0, 37.0, 43.0, 50.0, 23.0, 45.0, 40.0, 39.0, 38.0, 35.0, 35.0, 35.0, 33.0, 27.0, 23.0, 32.0, 16.0, 35.0, 23.0, 10.0, 17.0, 12.0, 9.0, 9.0, 6.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.771490097045898, -12.355425834655762, -11.939361572265625, -11.523297309875488, -11.107233047485352, -10.691168785095215, -10.275104522705078, -9.859040260314941, -9.442975997924805, -9.026911735534668, -8.610847473144531, -8.194783210754395, -7.778718948364258, -7.362654685974121, -6.946590423583984, -6.530526161193848, -6.114461898803711, -5.698397636413574, -5.2823333740234375, -4.866269111633301, -4.450204849243164, -4.034140586853027, -3.6180763244628906, -3.202012062072754, -2.785947799682617, -2.3698835372924805, -1.9538192749023438, -1.537755012512207, -1.1216907501220703, -0.7056264877319336, -0.2895622253417969, 0.12650203704833984, 0.5425653457641602, 0.9586296081542969, 1.3746938705444336, 1.7907581329345703, 2.206822395324707, 2.6228866577148438, 3.0389509201049805, 3.455015182495117, 3.871079444885254, 4.287143707275391, 4.703207969665527, 5.119272232055664, 5.535336494445801, 5.9514007568359375, 6.367465019226074, 6.783529281616211, 7.199593544006348, 7.615657806396484, 8.031722068786621, 8.447786331176758, 8.863850593566895, 9.279914855957031, 9.695979118347168, 10.112043380737305, 10.528107643127441, 10.944171905517578, 11.360236167907715, 11.776300430297852, 12.192364692687988, 12.608428955078125, 13.024493217468262, 13.440557479858398, 13.856621742248535]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 3.0, 8.0, 9.0, 12.0, 23.0, 38.0, 60.0, 80.0, 153.0, 228.0, 364.0, 660.0, 1044.0, 1751.0, 3089.0, 5168.0, 9233.0, 16151.0, 27865.0, 48017.0, 79250.0, 121427.0, 163342.0, 174091.0, 145343.0, 100483.0, 63089.0, 37077.0, 21446.0, 12103.0, 7078.0, 4114.0, 2308.0, 1295.0, 876.0, 472.0, 324.0, 175.0, 108.0, 72.0, 59.0, 26.0, 14.0, 17.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.484375, -12.98974609375, -12.4951171875, -12.00048828125, -11.505859375, -11.01123046875, -10.5166015625, -10.02197265625, -9.52734375, -9.03271484375, -8.5380859375, -8.04345703125, -7.548828125, -7.05419921875, -6.5595703125, -6.06494140625, -5.5703125, -5.07568359375, -4.5810546875, -4.08642578125, -3.591796875, -3.09716796875, -2.6025390625, -2.10791015625, -1.61328125, -1.11865234375, -0.6240234375, -0.12939453125, 0.365234375, 0.85986328125, 1.3544921875, 1.84912109375, 2.34375, 2.83837890625, 3.3330078125, 3.82763671875, 4.322265625, 4.81689453125, 5.3115234375, 5.80615234375, 6.30078125, 6.79541015625, 7.2900390625, 7.78466796875, 8.279296875, 8.77392578125, 9.2685546875, 9.76318359375, 10.2578125, 10.75244140625, 11.2470703125, 11.74169921875, 12.236328125, 12.73095703125, 13.2255859375, 13.72021484375, 14.21484375, 14.70947265625, 15.2041015625, 15.69873046875, 16.193359375, 16.68798828125, 17.1826171875, 17.67724609375, 18.171875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 11.0, 13.0, 4.0, 18.0, 14.0, 14.0, 19.0, 23.0, 22.0, 29.0, 25.0, 24.0, 36.0, 41.0, 28.0, 44.0, 40.0, 33.0, 43.0, 42.0, 42.0, 25.0, 33.0, 27.0, 46.0, 39.0, 28.0, 29.0, 21.0, 15.0, 22.0, 19.0, 21.0, 18.0, 18.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-12.4765625, -12.1031494140625, -11.729736328125, -11.3563232421875, -10.98291015625, -10.6094970703125, -10.236083984375, -9.8626708984375, -9.4892578125, -9.1158447265625, -8.742431640625, -8.3690185546875, -7.99560546875, -7.6221923828125, -7.248779296875, -6.8753662109375, -6.501953125, -6.1285400390625, -5.755126953125, -5.3817138671875, -5.00830078125, -4.6348876953125, -4.261474609375, -3.8880615234375, -3.5146484375, -3.1412353515625, -2.767822265625, -2.3944091796875, -2.02099609375, -1.6475830078125, -1.274169921875, -0.9007568359375, -0.52734375, -0.1539306640625, 0.219482421875, 0.5928955078125, 0.96630859375, 1.3397216796875, 1.713134765625, 2.0865478515625, 2.4599609375, 2.8333740234375, 3.206787109375, 3.5802001953125, 3.95361328125, 4.3270263671875, 4.700439453125, 5.0738525390625, 5.447265625, 5.8206787109375, 6.194091796875, 6.5675048828125, 6.94091796875, 7.3143310546875, 7.687744140625, 8.0611572265625, 8.4345703125, 8.8079833984375, 9.181396484375, 9.5548095703125, 9.92822265625, 10.3016357421875, 10.675048828125, 11.0484619140625, 11.421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 12.0, 21.0, 24.0, 29.0, 54.0, 72.0, 146.0, 223.0, 344.0, 578.0, 942.0, 1480.0, 2492.0, 4107.0, 6770.0, 11415.0, 19324.0, 32226.0, 54068.0, 85931.0, 127850.0, 162405.0, 165220.0, 134550.0, 92333.0, 58305.0, 35281.0, 20948.0, 12530.0, 7534.0, 4431.0, 2666.0, 1584.0, 1043.0, 571.0, 341.0, 240.0, 164.0, 108.0, 57.0, 38.0, 38.0, 22.0, 14.0, 6.0, 7.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.921875, -14.4708251953125, -14.019775390625, -13.5687255859375, -13.11767578125, -12.6666259765625, -12.215576171875, -11.7645263671875, -11.3134765625, -10.8624267578125, -10.411376953125, -9.9603271484375, -9.50927734375, -9.0582275390625, -8.607177734375, -8.1561279296875, -7.705078125, -7.2540283203125, -6.802978515625, -6.3519287109375, -5.90087890625, -5.4498291015625, -4.998779296875, -4.5477294921875, -4.0966796875, -3.6456298828125, -3.194580078125, -2.7435302734375, -2.29248046875, -1.8414306640625, -1.390380859375, -0.9393310546875, -0.48828125, -0.0372314453125, 0.413818359375, 0.8648681640625, 1.31591796875, 1.7669677734375, 2.218017578125, 2.6690673828125, 3.1201171875, 3.5711669921875, 4.022216796875, 4.4732666015625, 4.92431640625, 5.3753662109375, 5.826416015625, 6.2774658203125, 6.728515625, 7.1795654296875, 7.630615234375, 8.0816650390625, 8.53271484375, 8.9837646484375, 9.434814453125, 9.8858642578125, 10.3369140625, 10.7879638671875, 11.239013671875, 11.6900634765625, 12.14111328125, 12.5921630859375, 13.043212890625, 13.4942626953125, 13.9453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 14.0, 8.0, 18.0, 15.0, 14.0, 13.0, 20.0, 25.0, 29.0, 32.0, 33.0, 37.0, 52.0, 48.0, 38.0, 37.0, 56.0, 54.0, 50.0, 58.0, 37.0, 33.0, 42.0, 28.0, 43.0, 24.0, 20.0, 25.0, 14.0, 11.0, 18.0, 6.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9921875, -7.6903076171875, -7.388427734375, -7.0865478515625, -6.78466796875, -6.4827880859375, -6.180908203125, -5.8790283203125, -5.5771484375, -5.2752685546875, -4.973388671875, -4.6715087890625, -4.36962890625, -4.0677490234375, -3.765869140625, -3.4639892578125, -3.162109375, -2.8602294921875, -2.558349609375, -2.2564697265625, -1.95458984375, -1.6527099609375, -1.350830078125, -1.0489501953125, -0.7470703125, -0.4451904296875, -0.143310546875, 0.1585693359375, 0.46044921875, 0.7623291015625, 1.064208984375, 1.3660888671875, 1.66796875, 1.9698486328125, 2.271728515625, 2.5736083984375, 2.87548828125, 3.1773681640625, 3.479248046875, 3.7811279296875, 4.0830078125, 4.3848876953125, 4.686767578125, 4.9886474609375, 5.29052734375, 5.5924072265625, 5.894287109375, 6.1961669921875, 6.498046875, 6.7999267578125, 7.101806640625, 7.4036865234375, 7.70556640625, 8.0074462890625, 8.309326171875, 8.6112060546875, 8.9130859375, 9.2149658203125, 9.516845703125, 9.8187255859375, 10.12060546875, 10.4224853515625, 10.724365234375, 11.0262451171875, 11.328125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 12.0, 15.0, 17.0, 21.0, 31.0, 48.0, 60.0, 74.0, 103.0, 179.0, 269.0, 335.0, 479.0, 690.0, 1107.0, 1812.0, 2843.0, 4511.0, 7439.0, 12676.0, 21903.0, 37863.0, 67909.0, 117003.0, 178375.0, 202819.0, 158671.0, 97953.0, 55968.0, 31479.0, 18152.0, 10554.0, 6411.0, 3826.0, 2406.0, 1538.0, 967.0, 615.0, 440.0, 289.0, 201.0, 140.0, 104.0, 57.0, 55.0, 41.0, 26.0, 13.0, 16.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0], "bins": [-10.6640625, -10.3441162109375, -10.024169921875, -9.7042236328125, -9.38427734375, -9.0643310546875, -8.744384765625, -8.4244384765625, -8.1044921875, -7.7845458984375, -7.464599609375, -7.1446533203125, -6.82470703125, -6.5047607421875, -6.184814453125, -5.8648681640625, -5.544921875, -5.2249755859375, -4.905029296875, -4.5850830078125, -4.26513671875, -3.9451904296875, -3.625244140625, -3.3052978515625, -2.9853515625, -2.6654052734375, -2.345458984375, -2.0255126953125, -1.70556640625, -1.3856201171875, -1.065673828125, -0.7457275390625, -0.42578125, -0.1058349609375, 0.214111328125, 0.5340576171875, 0.85400390625, 1.1739501953125, 1.493896484375, 1.8138427734375, 2.1337890625, 2.4537353515625, 2.773681640625, 3.0936279296875, 3.41357421875, 3.7335205078125, 4.053466796875, 4.3734130859375, 4.693359375, 5.0133056640625, 5.333251953125, 5.6531982421875, 5.97314453125, 6.2930908203125, 6.613037109375, 6.9329833984375, 7.2529296875, 7.5728759765625, 7.892822265625, 8.2127685546875, 8.53271484375, 8.8526611328125, 9.172607421875, 9.4925537109375, 9.8125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 15.0, 21.0, 23.0, 30.0, 41.0, 51.0, 62.0, 66.0, 62.0, 83.0, 76.0, 74.0, 62.0, 57.0, 53.0, 48.0, 38.0, 28.0, 22.0, 10.0, 11.0, 16.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00102996826171875, -0.000993490219116211, -0.0009570121765136719, -0.0009205341339111328, -0.0008840560913085938, -0.0008475780487060547, -0.0008111000061035156, -0.0007746219635009766, -0.0007381439208984375, -0.0007016658782958984, -0.0006651878356933594, -0.0006287097930908203, -0.0005922317504882812, -0.0005557537078857422, -0.0005192756652832031, -0.00048279762268066406, -0.000446319580078125, -0.00040984153747558594, -0.0003733634948730469, -0.0003368854522705078, -0.00030040740966796875, -0.0002639293670654297, -0.00022745132446289062, -0.00019097328186035156, -0.0001544952392578125, -0.00011801719665527344, -8.153915405273438e-05, -4.506111145019531e-05, -8.58306884765625e-06, 2.7894973754882812e-05, 6.437301635742188e-05, 0.00010085105895996094, 0.0001373291015625, 0.00017380714416503906, 0.00021028518676757812, 0.0002467632293701172, 0.00028324127197265625, 0.0003197193145751953, 0.0003561973571777344, 0.00039267539978027344, 0.0004291534423828125, 0.00046563148498535156, 0.0005021095275878906, 0.0005385875701904297, 0.0005750656127929688, 0.0006115436553955078, 0.0006480216979980469, 0.0006844997406005859, 0.000720977783203125, 0.0007574558258056641, 0.0007939338684082031, 0.0008304119110107422, 0.0008668899536132812, 0.0009033679962158203, 0.0009398460388183594, 0.0009763240814208984, 0.0010128021240234375, 0.0010492801666259766, 0.0010857582092285156, 0.0011222362518310547, 0.0011587142944335938, 0.0011951923370361328, 0.0012316703796386719, 0.001268148422241211, 0.00130462646484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 12.0, 6.0, 16.0, 29.0, 32.0, 37.0, 64.0, 108.0, 153.0, 295.0, 520.0, 959.0, 1827.0, 3489.0, 7040.0, 14998.0, 33857.0, 79939.0, 183261.0, 296859.0, 231942.0, 108662.0, 45586.0, 20135.0, 9153.0, 4576.0, 2259.0, 1265.0, 618.0, 343.0, 172.0, 101.0, 78.0, 46.0, 25.0, 25.0, 18.0, 18.0, 5.0, 7.0, 10.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.4962158203125, -14.023681640625, -13.5511474609375, -13.07861328125, -12.6060791015625, -12.133544921875, -11.6610107421875, -11.1884765625, -10.7159423828125, -10.243408203125, -9.7708740234375, -9.29833984375, -8.8258056640625, -8.353271484375, -7.8807373046875, -7.408203125, -6.9356689453125, -6.463134765625, -5.9906005859375, -5.51806640625, -5.0455322265625, -4.572998046875, -4.1004638671875, -3.6279296875, -3.1553955078125, -2.682861328125, -2.2103271484375, -1.73779296875, -1.2652587890625, -0.792724609375, -0.3201904296875, 0.15234375, 0.6248779296875, 1.097412109375, 1.5699462890625, 2.04248046875, 2.5150146484375, 2.987548828125, 3.4600830078125, 3.9326171875, 4.4051513671875, 4.877685546875, 5.3502197265625, 5.82275390625, 6.2952880859375, 6.767822265625, 7.2403564453125, 7.712890625, 8.1854248046875, 8.657958984375, 9.1304931640625, 9.60302734375, 10.0755615234375, 10.548095703125, 11.0206298828125, 11.4931640625, 11.9656982421875, 12.438232421875, 12.9107666015625, 13.38330078125, 13.8558349609375, 14.328369140625, 14.8009033203125, 15.2734375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 11.0, 15.0, 14.0, 19.0, 23.0, 28.0, 41.0, 54.0, 41.0, 66.0, 73.0, 62.0, 64.0, 66.0, 64.0, 53.0, 53.0, 43.0, 47.0, 26.0, 21.0, 25.0, 13.0, 20.0, 13.0, 3.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.07818603515625, -2.9532470703125, -2.82830810546875, -2.703369140625, -2.57843017578125, -2.4534912109375, -2.32855224609375, -2.20361328125, -2.07867431640625, -1.9537353515625, -1.82879638671875, -1.703857421875, -1.57891845703125, -1.4539794921875, -1.32904052734375, -1.2041015625, -1.07916259765625, -0.9542236328125, -0.82928466796875, -0.704345703125, -0.57940673828125, -0.4544677734375, -0.32952880859375, -0.20458984375, -0.07965087890625, 0.0452880859375, 0.17022705078125, 0.295166015625, 0.42010498046875, 0.5450439453125, 0.66998291015625, 0.794921875, 0.91986083984375, 1.0447998046875, 1.16973876953125, 1.294677734375, 1.41961669921875, 1.5445556640625, 1.66949462890625, 1.79443359375, 1.91937255859375, 2.0443115234375, 2.16925048828125, 2.294189453125, 2.41912841796875, 2.5440673828125, 2.66900634765625, 2.7939453125, 2.91888427734375, 3.0438232421875, 3.16876220703125, 3.293701171875, 3.41864013671875, 3.5435791015625, 3.66851806640625, 3.79345703125, 3.91839599609375, 4.0433349609375, 4.16827392578125, 4.293212890625, 4.41815185546875, 4.5430908203125, 4.66802978515625, 4.79296875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 9.0, 13.0, 12.0, 9.0, 24.0, 22.0, 17.0, 33.0, 20.0, 40.0, 37.0, 45.0, 50.0, 53.0, 71.0, 40.0, 60.0, 54.0, 55.0, 41.0, 48.0, 52.0, 39.0, 37.0, 28.0, 9.0, 15.0, 19.0, 9.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.446269035339355, -14.960251808166504, -14.474233627319336, -13.988216400146484, -13.502198219299316, -13.016180992126465, -12.530162811279297, -12.044145584106445, -11.558127403259277, -11.072110176086426, -10.586091995239258, -10.100074768066406, -9.614056587219238, -9.128039360046387, -8.642021179199219, -8.156003952026367, -7.669986248016357, -7.183968544006348, -6.697950839996338, -6.211933135986328, -5.725915431976318, -5.239897727966309, -4.753880500793457, -4.267862319946289, -3.7818448543548584, -3.2958271503448486, -2.809809446334839, -2.323791980743408, -1.8377741575241089, -1.3517565727233887, -0.8657388687133789, -0.37972116470336914, 0.10629653930664062, 0.5923142433166504, 1.0783319473266602, 1.5643495321273804, 2.0503673553466797, 2.5363848209381104, 3.02240252494812, 3.50842022895813, 3.9944379329681396, 4.48045539855957, 4.96647310256958, 5.45249080657959, 5.9385085105896, 6.424526214599609, 6.910543918609619, 7.396561622619629, 7.882579326629639, 8.368597030639648, 8.8546142578125, 9.340632438659668, 9.82664966583252, 10.312667846679688, 10.798685073852539, 11.284703254699707, 11.770720481872559, 12.25673770904541, 12.742755889892578, 13.22877311706543, 13.714791297912598, 14.20080852508545, 14.686826705932617, 15.172843933105469, 15.658862113952637]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 6.0, 7.0, 7.0, 11.0, 5.0, 6.0, 18.0, 15.0, 17.0, 20.0, 18.0, 19.0, 17.0, 28.0, 32.0, 31.0, 42.0, 39.0, 33.0, 48.0, 34.0, 43.0, 44.0, 32.0, 33.0, 38.0, 30.0, 38.0, 27.0, 24.0, 26.0, 23.0, 33.0, 20.0, 14.0, 17.0, 15.0, 14.0, 6.0, 11.0, 11.0, 7.0, 2.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.707863807678223, -11.32986831665039, -10.951872825622559, -10.57387638092041, -10.195880889892578, -9.817885398864746, -9.439889907836914, -9.061893463134766, -8.683897972106934, -8.305902481079102, -7.927906513214111, -7.549911022186279, -7.171915054321289, -6.793919563293457, -6.415924072265625, -6.037928104400635, -5.659932613372803, -5.281937122344971, -4.9039411544799805, -4.525945663452148, -4.147949695587158, -3.769954204559326, -3.391958475112915, -3.013962745666504, -2.6359670162200928, -2.2579712867736816, -1.8799755573272705, -1.501979947090149, -1.1239842176437378, -0.7459884881973267, -0.3679928779602051, 0.010002851486206055, 0.3879985809326172, 0.7659943103790283, 1.1439900398254395, 1.521985650062561, 1.8999813795089722, 2.2779769897460938, 2.655972719192505, 3.033968448638916, 3.411964178085327, 3.7899599075317383, 4.16795539855957, 4.5459513664245605, 4.923946857452393, 5.301942825317383, 5.679938316345215, 6.057933807373047, 6.435929775238037, 6.813925266265869, 7.191921234130859, 7.569916725158691, 7.947912693023682, 8.325908660888672, 8.703904151916504, 9.081899642944336, 9.459895133972168, 9.837890625, 10.215886116027832, 10.59388256072998, 10.971878051757812, 11.349873542785645, 11.727869033813477, 12.105865478515625, 12.483860969543457]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 17.0, 23.0, 22.0, 50.0, 89.0, 144.0, 227.0, 328.0, 477.0, 816.0, 1322.0, 2095.0, 3406.0, 5900.0, 10225.0, 18393.0, 33999.0, 65996.0, 135980.0, 309491.0, 673099.0, 1046046.0, 931256.0, 508270.0, 225269.0, 104213.0, 51843.0, 27700.0, 15504.0, 8667.0, 4978.0, 3110.0, 1967.0, 1190.0, 782.0, 458.0, 299.0, 219.0, 141.0, 105.0, 47.0, 43.0, 25.0, 17.0, 9.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.5703125, -12.162353515625, -11.75439453125, -11.346435546875, -10.9384765625, -10.530517578125, -10.12255859375, -9.714599609375, -9.306640625, -8.898681640625, -8.49072265625, -8.082763671875, -7.6748046875, -7.266845703125, -6.85888671875, -6.450927734375, -6.04296875, -5.635009765625, -5.22705078125, -4.819091796875, -4.4111328125, -4.003173828125, -3.59521484375, -3.187255859375, -2.779296875, -2.371337890625, -1.96337890625, -1.555419921875, -1.1474609375, -0.739501953125, -0.33154296875, 0.076416015625, 0.484375, 0.892333984375, 1.30029296875, 1.708251953125, 2.1162109375, 2.524169921875, 2.93212890625, 3.340087890625, 3.748046875, 4.156005859375, 4.56396484375, 4.971923828125, 5.3798828125, 5.787841796875, 6.19580078125, 6.603759765625, 7.01171875, 7.419677734375, 7.82763671875, 8.235595703125, 8.6435546875, 9.051513671875, 9.45947265625, 9.867431640625, 10.275390625, 10.683349609375, 11.09130859375, 11.499267578125, 11.9072265625, 12.315185546875, 12.72314453125, 13.131103515625, 13.5390625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 5.0, 5.0, 9.0, 8.0, 10.0, 12.0, 10.0, 16.0, 18.0, 19.0, 21.0, 21.0, 32.0, 29.0, 31.0, 37.0, 39.0, 42.0, 42.0, 39.0, 44.0, 30.0, 28.0, 41.0, 30.0, 23.0, 37.0, 40.0, 26.0, 24.0, 30.0, 23.0, 17.0, 27.0, 16.0, 22.0, 16.0, 15.0, 10.0, 10.0, 3.0, 7.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-8.4921875, -8.21337890625, -7.9345703125, -7.65576171875, -7.376953125, -7.09814453125, -6.8193359375, -6.54052734375, -6.26171875, -5.98291015625, -5.7041015625, -5.42529296875, -5.146484375, -4.86767578125, -4.5888671875, -4.31005859375, -4.03125, -3.75244140625, -3.4736328125, -3.19482421875, -2.916015625, -2.63720703125, -2.3583984375, -2.07958984375, -1.80078125, -1.52197265625, -1.2431640625, -0.96435546875, -0.685546875, -0.40673828125, -0.1279296875, 0.15087890625, 0.4296875, 0.70849609375, 0.9873046875, 1.26611328125, 1.544921875, 1.82373046875, 2.1025390625, 2.38134765625, 2.66015625, 2.93896484375, 3.2177734375, 3.49658203125, 3.775390625, 4.05419921875, 4.3330078125, 4.61181640625, 4.890625, 5.16943359375, 5.4482421875, 5.72705078125, 6.005859375, 6.28466796875, 6.5634765625, 6.84228515625, 7.12109375, 7.39990234375, 7.6787109375, 7.95751953125, 8.236328125, 8.51513671875, 8.7939453125, 9.07275390625, 9.3515625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 8.0, 16.0, 25.0, 35.0, 46.0, 60.0, 112.0, 195.0, 279.0, 425.0, 677.0, 1001.0, 1456.0, 2389.0, 3671.0, 5933.0, 9570.0, 15485.0, 26075.0, 44021.0, 76330.0, 133245.0, 237138.0, 417676.0, 690572.0, 866063.0, 687391.0, 418587.0, 236072.0, 132386.0, 76249.0, 43835.0, 26125.0, 15401.0, 9476.0, 5875.0, 3709.0, 2330.0, 1562.0, 912.0, 694.0, 364.0, 282.0, 196.0, 116.0, 80.0, 52.0, 31.0, 14.0, 18.0, 10.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.984375, -10.6463623046875, -10.308349609375, -9.9703369140625, -9.63232421875, -9.2943115234375, -8.956298828125, -8.6182861328125, -8.2802734375, -7.9422607421875, -7.604248046875, -7.2662353515625, -6.92822265625, -6.5902099609375, -6.252197265625, -5.9141845703125, -5.576171875, -5.2381591796875, -4.900146484375, -4.5621337890625, -4.22412109375, -3.8861083984375, -3.548095703125, -3.2100830078125, -2.8720703125, -2.5340576171875, -2.196044921875, -1.8580322265625, -1.52001953125, -1.1820068359375, -0.843994140625, -0.5059814453125, -0.16796875, 0.1700439453125, 0.508056640625, 0.8460693359375, 1.18408203125, 1.5220947265625, 1.860107421875, 2.1981201171875, 2.5361328125, 2.8741455078125, 3.212158203125, 3.5501708984375, 3.88818359375, 4.2261962890625, 4.564208984375, 4.9022216796875, 5.240234375, 5.5782470703125, 5.916259765625, 6.2542724609375, 6.59228515625, 6.9302978515625, 7.268310546875, 7.6063232421875, 7.9443359375, 8.2823486328125, 8.620361328125, 8.9583740234375, 9.29638671875, 9.6343994140625, 9.972412109375, 10.3104248046875, 10.6484375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 11.0, 15.0, 18.0, 24.0, 24.0, 41.0, 42.0, 48.0, 59.0, 72.0, 89.0, 110.0, 147.0, 174.0, 233.0, 222.0, 253.0, 293.0, 284.0, 283.0, 258.0, 258.0, 210.0, 173.0, 133.0, 110.0, 93.0, 77.0, 69.0, 46.0, 47.0, 26.0, 29.0, 23.0, 14.0, 13.0, 9.0, 10.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.171875, -4.0390625, -3.90625, -3.7734375, -3.640625, -3.5078125, -3.375, -3.2421875, -3.109375, -2.9765625, -2.84375, -2.7109375, -2.578125, -2.4453125, -2.3125, -2.1796875, -2.046875, -1.9140625, -1.78125, -1.6484375, -1.515625, -1.3828125, -1.25, -1.1171875, -0.984375, -0.8515625, -0.71875, -0.5859375, -0.453125, -0.3203125, -0.1875, -0.0546875, 0.078125, 0.2109375, 0.34375, 0.4765625, 0.609375, 0.7421875, 0.875, 1.0078125, 1.140625, 1.2734375, 1.40625, 1.5390625, 1.671875, 1.8046875, 1.9375, 2.0703125, 2.203125, 2.3359375, 2.46875, 2.6015625, 2.734375, 2.8671875, 3.0, 3.1328125, 3.265625, 3.3984375, 3.53125, 3.6640625, 3.796875, 3.9296875, 4.0625, 4.1953125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 3.0, 6.0, 9.0, 2.0, 13.0, 16.0, 17.0, 19.0, 26.0, 31.0, 40.0, 49.0, 47.0, 50.0, 51.0, 54.0, 48.0, 53.0, 65.0, 54.0, 61.0, 44.0, 48.0, 39.0, 28.0, 20.0, 17.0, 17.0, 15.0, 16.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.015341758728027, -11.61558723449707, -11.21583366394043, -10.816080093383789, -10.416325569152832, -10.016571044921875, -9.616817474365234, -9.217063903808594, -8.817309379577637, -8.41755485534668, -8.017801284790039, -7.61804723739624, -7.218293190002441, -6.818539142608643, -6.418785095214844, -6.019031047821045, -5.619277000427246, -5.219522953033447, -4.819768905639648, -4.42001485824585, -4.020260810852051, -3.620506763458252, -3.220752716064453, -2.8209986686706543, -2.4212446212768555, -2.0214905738830566, -1.6217365264892578, -1.221982479095459, -0.8222284317016602, -0.42247438430786133, -0.0227203369140625, 0.37703371047973633, 0.7767887115478516, 1.1765427589416504, 1.5762968063354492, 1.976050853729248, 2.375804901123047, 2.7755589485168457, 3.1753129959106445, 3.5750670433044434, 3.974821090698242, 4.374575138092041, 4.77432918548584, 5.174083232879639, 5.5738372802734375, 5.973591327667236, 6.373345375061035, 6.773099422454834, 7.172853469848633, 7.572607517242432, 7.9723615646362305, 8.372116088867188, 8.771869659423828, 9.171623229980469, 9.571377754211426, 9.971132278442383, 10.370885848999023, 10.770639419555664, 11.170393943786621, 11.570148468017578, 11.969902038574219, 12.36965560913086, 12.769410133361816, 13.169164657592773, 13.568918228149414]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 9.0, 8.0, 10.0, 12.0, 9.0, 13.0, 16.0, 16.0, 17.0, 30.0, 32.0, 24.0, 23.0, 29.0, 33.0, 31.0, 34.0, 36.0, 45.0, 48.0, 42.0, 37.0, 50.0, 38.0, 34.0, 38.0, 28.0, 40.0, 27.0, 27.0, 20.0, 17.0, 11.0, 22.0, 18.0, 10.0, 8.0, 12.0, 9.0, 4.0, 6.0, 5.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.879922866821289, -9.566076278686523, -9.252229690551758, -8.938384056091309, -8.624537467956543, -8.310690879821777, -7.996844291687012, -7.682998180389404, -7.369152069091797, -7.055305480957031, -6.741459369659424, -6.427612781524658, -6.113766670227051, -5.799920082092285, -5.4860734939575195, -5.172227382659912, -4.8583807945251465, -4.544534206390381, -4.230688095092773, -3.916841506958008, -3.6029953956604004, -3.2891488075256348, -2.9753024578094482, -2.6614561080932617, -2.347609758377075, -2.0337634086608887, -1.7199170589447021, -1.406070590019226, -1.0922242403030396, -0.778377890586853, -0.46453142166137695, -0.15068507194519043, 0.1631612777709961, 0.477007657289505, 0.7908540368080139, 1.1047004461288452, 1.4185467958450317, 1.7323931455612183, 2.0462396144866943, 2.360085964202881, 2.6739323139190674, 2.987778663635254, 3.3016250133514404, 3.615471363067627, 3.9293179512023926, 4.2431640625, 4.557010650634766, 4.870857238769531, 5.184703350067139, 5.498549938201904, 5.812396049499512, 6.126242637634277, 6.440088748931885, 6.75393533706665, 7.067781448364258, 7.381628036499023, 7.695474624633789, 8.009321212768555, 8.32316780090332, 8.63701343536377, 8.950860023498535, 9.2647066116333, 9.578553199768066, 9.892398834228516, 10.206245422363281]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 8.0, 4.0, 11.0, 9.0, 17.0, 24.0, 31.0, 46.0, 81.0, 78.0, 128.0, 190.0, 265.0, 388.0, 600.0, 838.0, 1206.0, 1911.0, 2842.0, 4517.0, 7360.0, 12484.0, 22139.0, 40503.0, 75503.0, 140225.0, 216981.0, 214668.0, 137527.0, 74263.0, 39523.0, 21554.0, 12415.0, 7274.0, 4400.0, 2854.0, 1793.0, 1197.0, 843.0, 596.0, 375.0, 269.0, 185.0, 150.0, 96.0, 60.0, 45.0, 27.0, 16.0, 9.0, 14.0, 8.0, 3.0, 3.0, 5.0, 0.0, 3.0], "bins": [-8.9453125, -8.68206787109375, -8.4188232421875, -8.15557861328125, -7.892333984375, -7.62908935546875, -7.3658447265625, -7.10260009765625, -6.83935546875, -6.57611083984375, -6.3128662109375, -6.04962158203125, -5.786376953125, -5.52313232421875, -5.2598876953125, -4.99664306640625, -4.7333984375, -4.47015380859375, -4.2069091796875, -3.94366455078125, -3.680419921875, -3.41717529296875, -3.1539306640625, -2.89068603515625, -2.62744140625, -2.36419677734375, -2.1009521484375, -1.83770751953125, -1.574462890625, -1.31121826171875, -1.0479736328125, -0.78472900390625, -0.521484375, -0.25823974609375, 0.0050048828125, 0.26824951171875, 0.531494140625, 0.79473876953125, 1.0579833984375, 1.32122802734375, 1.58447265625, 1.84771728515625, 2.1109619140625, 2.37420654296875, 2.637451171875, 2.90069580078125, 3.1639404296875, 3.42718505859375, 3.6904296875, 3.95367431640625, 4.2169189453125, 4.48016357421875, 4.743408203125, 5.00665283203125, 5.2698974609375, 5.53314208984375, 5.79638671875, 6.05963134765625, 6.3228759765625, 6.58612060546875, 6.849365234375, 7.11260986328125, 7.3758544921875, 7.63909912109375, 7.90234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 6.0, 12.0, 14.0, 9.0, 20.0, 25.0, 23.0, 22.0, 38.0, 28.0, 27.0, 33.0, 34.0, 24.0, 31.0, 40.0, 47.0, 45.0, 42.0, 39.0, 38.0, 40.0, 33.0, 30.0, 30.0, 41.0, 24.0, 22.0, 20.0, 20.0, 15.0, 11.0, 15.0, 9.0, 18.0, 5.0, 12.0, 4.0, 4.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.84033203125, -8.5244140625, -8.20849609375, -7.892578125, -7.57666015625, -7.2607421875, -6.94482421875, -6.62890625, -6.31298828125, -5.9970703125, -5.68115234375, -5.365234375, -5.04931640625, -4.7333984375, -4.41748046875, -4.1015625, -3.78564453125, -3.4697265625, -3.15380859375, -2.837890625, -2.52197265625, -2.2060546875, -1.89013671875, -1.57421875, -1.25830078125, -0.9423828125, -0.62646484375, -0.310546875, 0.00537109375, 0.3212890625, 0.63720703125, 0.953125, 1.26904296875, 1.5849609375, 1.90087890625, 2.216796875, 2.53271484375, 2.8486328125, 3.16455078125, 3.48046875, 3.79638671875, 4.1123046875, 4.42822265625, 4.744140625, 5.06005859375, 5.3759765625, 5.69189453125, 6.0078125, 6.32373046875, 6.6396484375, 6.95556640625, 7.271484375, 7.58740234375, 7.9033203125, 8.21923828125, 8.53515625, 8.85107421875, 9.1669921875, 9.48291015625, 9.798828125, 10.11474609375, 10.4306640625, 10.74658203125, 11.0625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 6.0, 9.0, 22.0, 10.0, 21.0, 25.0, 31.0, 41.0, 60.0, 73.0, 103.0, 162.0, 175.0, 284.0, 431.0, 548.0, 793.0, 1197.0, 2018.0, 3035.0, 4972.0, 8559.0, 15898.0, 35763.0, 789560.0, 130880.0, 23698.0, 11969.0, 6812.0, 3943.0, 2543.0, 1575.0, 992.0, 727.0, 458.0, 293.0, 221.0, 165.0, 113.0, 100.0, 69.0, 44.0, 33.0, 29.0, 21.0, 28.0, 14.0, 8.0, 6.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.3359375, -11.9478759765625, -11.559814453125, -11.1717529296875, -10.78369140625, -10.3956298828125, -10.007568359375, -9.6195068359375, -9.2314453125, -8.8433837890625, -8.455322265625, -8.0672607421875, -7.67919921875, -7.2911376953125, -6.903076171875, -6.5150146484375, -6.126953125, -5.7388916015625, -5.350830078125, -4.9627685546875, -4.57470703125, -4.1866455078125, -3.798583984375, -3.4105224609375, -3.0224609375, -2.6343994140625, -2.246337890625, -1.8582763671875, -1.47021484375, -1.0821533203125, -0.694091796875, -0.3060302734375, 0.08203125, 0.4700927734375, 0.858154296875, 1.2462158203125, 1.63427734375, 2.0223388671875, 2.410400390625, 2.7984619140625, 3.1865234375, 3.5745849609375, 3.962646484375, 4.3507080078125, 4.73876953125, 5.1268310546875, 5.514892578125, 5.9029541015625, 6.291015625, 6.6790771484375, 7.067138671875, 7.4552001953125, 7.84326171875, 8.2313232421875, 8.619384765625, 9.0074462890625, 9.3955078125, 9.7835693359375, 10.171630859375, 10.5596923828125, 10.94775390625, 11.3358154296875, 11.723876953125, 12.1119384765625, 12.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 4.0, 11.0, 13.0, 14.0, 31.0, 21.0, 30.0, 35.0, 40.0, 34.0, 31.0, 49.0, 41.0, 42.0, 63.0, 48.0, 61.0, 44.0, 38.0, 59.0, 49.0, 31.0, 28.0, 26.0, 23.0, 21.0, 16.0, 15.0, 20.0, 8.0, 4.0, 9.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.784912109375, -8.46826171875, -8.151611328125, -7.8349609375, -7.518310546875, -7.20166015625, -6.885009765625, -6.568359375, -6.251708984375, -5.93505859375, -5.618408203125, -5.3017578125, -4.985107421875, -4.66845703125, -4.351806640625, -4.03515625, -3.718505859375, -3.40185546875, -3.085205078125, -2.7685546875, -2.451904296875, -2.13525390625, -1.818603515625, -1.501953125, -1.185302734375, -0.86865234375, -0.552001953125, -0.2353515625, 0.081298828125, 0.39794921875, 0.714599609375, 1.03125, 1.347900390625, 1.66455078125, 1.981201171875, 2.2978515625, 2.614501953125, 2.93115234375, 3.247802734375, 3.564453125, 3.881103515625, 4.19775390625, 4.514404296875, 4.8310546875, 5.147705078125, 5.46435546875, 5.781005859375, 6.09765625, 6.414306640625, 6.73095703125, 7.047607421875, 7.3642578125, 7.680908203125, 7.99755859375, 8.314208984375, 8.630859375, 8.947509765625, 9.26416015625, 9.580810546875, 9.8974609375, 10.214111328125, 10.53076171875, 10.847412109375, 11.1640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 5.0, 11.0, 12.0, 14.0, 18.0, 28.0, 28.0, 38.0, 49.0, 90.0, 138.0, 174.0, 269.0, 403.0, 668.0, 1136.0, 1858.0, 3451.0, 7436.0, 19755.0, 379287.0, 596737.0, 20604.0, 7639.0, 3704.0, 1950.0, 1083.0, 695.0, 432.0, 261.0, 165.0, 122.0, 79.0, 65.0, 36.0, 27.0, 22.0, 14.0, 11.0, 8.0, 11.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.109375, -12.699951171875, -12.29052734375, -11.881103515625, -11.4716796875, -11.062255859375, -10.65283203125, -10.243408203125, -9.833984375, -9.424560546875, -9.01513671875, -8.605712890625, -8.1962890625, -7.786865234375, -7.37744140625, -6.968017578125, -6.55859375, -6.149169921875, -5.73974609375, -5.330322265625, -4.9208984375, -4.511474609375, -4.10205078125, -3.692626953125, -3.283203125, -2.873779296875, -2.46435546875, -2.054931640625, -1.6455078125, -1.236083984375, -0.82666015625, -0.417236328125, -0.0078125, 0.401611328125, 0.81103515625, 1.220458984375, 1.6298828125, 2.039306640625, 2.44873046875, 2.858154296875, 3.267578125, 3.677001953125, 4.08642578125, 4.495849609375, 4.9052734375, 5.314697265625, 5.72412109375, 6.133544921875, 6.54296875, 6.952392578125, 7.36181640625, 7.771240234375, 8.1806640625, 8.590087890625, 8.99951171875, 9.408935546875, 9.818359375, 10.227783203125, 10.63720703125, 11.046630859375, 11.4560546875, 11.865478515625, 12.27490234375, 12.684326171875, 13.09375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 8.0, 8.0, 14.0, 11.0, 13.0, 16.0, 23.0, 47.0, 70.0, 114.0, 193.0, 159.0, 105.0, 78.0, 40.0, 35.0, 15.0, 18.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012226104736328125, -0.0011842697858810425, -0.0011459290981292725, -0.0011075884103775024, -0.0010692477226257324, -0.0010309070348739624, -0.0009925663471221924, -0.0009542256593704224, -0.0009158849716186523, -0.0008775442838668823, -0.0008392035961151123, -0.0008008629083633423, -0.0007625222206115723, -0.0007241815328598022, -0.0006858408451080322, -0.0006475001573562622, -0.0006091594696044922, -0.0005708187818527222, -0.0005324780941009521, -0.0004941374063491821, -0.0004557967185974121, -0.0004174560308456421, -0.00037911534309387207, -0.00034077465534210205, -0.00030243396759033203, -0.000264093279838562, -0.000225752592086792, -0.00018741190433502197, -0.00014907121658325195, -0.00011073052883148193, -7.238984107971191e-05, -3.4049153327941895e-05, 4.291534423828125e-06, 4.2632222175598145e-05, 8.097290992736816e-05, 0.00011931359767913818, 0.0001576542854309082, 0.00019599497318267822, 0.00023433566093444824, 0.00027267634868621826, 0.0003110170364379883, 0.0003493577241897583, 0.0003876984119415283, 0.00042603909969329834, 0.00046437978744506836, 0.0005027204751968384, 0.0005410611629486084, 0.0005794018507003784, 0.0006177425384521484, 0.0006560832262039185, 0.0006944239139556885, 0.0007327646017074585, 0.0007711052894592285, 0.0008094459772109985, 0.0008477866649627686, 0.0008861273527145386, 0.0009244680404663086, 0.0009628087282180786, 0.0010011494159698486, 0.0010394901037216187, 0.0010778307914733887, 0.0011161714792251587, 0.0011545121669769287, 0.0011928528547286987, 0.0012311935424804688]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 9.0, 7.0, 8.0, 20.0, 28.0, 36.0, 55.0, 80.0, 102.0, 153.0, 218.0, 298.0, 399.0, 555.0, 821.0, 1256.0, 1787.0, 2864.0, 4583.0, 7712.0, 13492.0, 24640.0, 48511.0, 106067.0, 233196.0, 293465.0, 159003.0, 70422.0, 34087.0, 18011.0, 10142.0, 5943.0, 3566.0, 2230.0, 1440.0, 1025.0, 675.0, 482.0, 343.0, 236.0, 170.0, 130.0, 97.0, 64.0, 40.0, 36.0, 21.0, 11.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.699737548828125, -2.60064697265625, -2.501556396484375, -2.4024658203125, -2.303375244140625, -2.20428466796875, -2.105194091796875, -2.006103515625, -1.907012939453125, -1.80792236328125, -1.708831787109375, -1.6097412109375, -1.510650634765625, -1.41156005859375, -1.312469482421875, -1.21337890625, -1.114288330078125, -1.01519775390625, -0.916107177734375, -0.8170166015625, -0.717926025390625, -0.61883544921875, -0.519744873046875, -0.420654296875, -0.321563720703125, -0.22247314453125, -0.123382568359375, -0.0242919921875, 0.074798583984375, 0.17388916015625, 0.272979736328125, 0.3720703125, 0.471160888671875, 0.57025146484375, 0.669342041015625, 0.7684326171875, 0.867523193359375, 0.96661376953125, 1.065704345703125, 1.164794921875, 1.263885498046875, 1.36297607421875, 1.462066650390625, 1.5611572265625, 1.660247802734375, 1.75933837890625, 1.858428955078125, 1.95751953125, 2.056610107421875, 2.15570068359375, 2.254791259765625, 2.3538818359375, 2.452972412109375, 2.55206298828125, 2.651153564453125, 2.750244140625, 2.849334716796875, 2.94842529296875, 3.047515869140625, 3.1466064453125, 3.245697021484375, 3.34478759765625, 3.443878173828125, 3.54296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 4.0, 4.0, 12.0, 9.0, 19.0, 13.0, 10.0, 15.0, 30.0, 38.0, 33.0, 49.0, 58.0, 63.0, 62.0, 68.0, 75.0, 82.0, 53.0, 57.0, 39.0, 29.0, 28.0, 20.0, 23.0, 14.0, 17.0, 9.0, 12.0, 8.0, 14.0, 11.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8900985717773438, -0.8549041748046875, -0.8197097778320312, -0.784515380859375, -0.7493209838867188, -0.7141265869140625, -0.6789321899414062, -0.64373779296875, -0.6085433959960938, -0.5733489990234375, -0.5381546020507812, -0.502960205078125, -0.46776580810546875, -0.4325714111328125, -0.39737701416015625, -0.3621826171875, -0.32698822021484375, -0.2917938232421875, -0.25659942626953125, -0.221405029296875, -0.18621063232421875, -0.1510162353515625, -0.11582183837890625, -0.08062744140625, -0.04543304443359375, -0.0102386474609375, 0.02495574951171875, 0.060150146484375, 0.09534454345703125, 0.1305389404296875, 0.16573333740234375, 0.200927734375, 0.23612213134765625, 0.2713165283203125, 0.30651092529296875, 0.341705322265625, 0.37689971923828125, 0.4120941162109375, 0.44728851318359375, 0.48248291015625, 0.5176773071289062, 0.5528717041015625, 0.5880661010742188, 0.623260498046875, 0.6584548950195312, 0.6936492919921875, 0.7288436889648438, 0.7640380859375, 0.7992324829101562, 0.8344268798828125, 0.8696212768554688, 0.904815673828125, 0.9400100708007812, 0.9752044677734375, 1.0103988647460938, 1.04559326171875, 1.0807876586914062, 1.1159820556640625, 1.1511764526367188, 1.186370849609375, 1.2215652465820312, 1.2567596435546875, 1.2919540405273438, 1.3271484375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 2.0, 8.0, 8.0, 11.0, 17.0, 15.0, 17.0, 26.0, 24.0, 36.0, 53.0, 51.0, 46.0, 47.0, 59.0, 60.0, 58.0, 78.0, 49.0, 46.0, 50.0, 39.0, 43.0, 26.0, 28.0, 20.0, 20.0, 12.0, 6.0, 6.0, 4.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.922833442687988, -12.509087562561035, -12.095340728759766, -11.681594848632812, -11.26784896850586, -10.85410213470459, -10.440356254577637, -10.026609420776367, -9.612863540649414, -9.199117660522461, -8.785370826721191, -8.371624946594238, -7.957878589630127, -7.544132232666016, -7.1303863525390625, -6.716639995574951, -6.30289363861084, -5.8891472816467285, -5.475400924682617, -5.061655044555664, -4.647908687591553, -4.234162330627441, -3.820416212081909, -3.406670093536377, -2.9929237365722656, -2.5791773796081543, -2.165431261062622, -1.7516850233078003, -1.3379387855529785, -0.9241924285888672, -0.510446310043335, -0.09670019149780273, 0.3170452117919922, 0.730791449546814, 1.1445376873016357, 1.5582839250564575, 1.9720301628112793, 2.3857765197753906, 2.799522638320923, 3.213268756866455, 3.6270151138305664, 4.040761470794678, 4.454507827758789, 4.868253707885742, 5.2820000648498535, 5.695746421813965, 6.109492301940918, 6.523238658905029, 6.936985015869141, 7.350731372833252, 7.764477729797363, 8.178223609924316, 8.591970443725586, 9.005716323852539, 9.419462203979492, 9.833208084106445, 10.246954917907715, 10.660700798034668, 11.074447631835938, 11.48819351196289, 11.901939392089844, 12.315686225891113, 12.729432106018066, 13.143178939819336, 13.556924819946289]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 5.0, 8.0, 13.0, 14.0, 9.0, 12.0, 20.0, 20.0, 19.0, 30.0, 32.0, 26.0, 27.0, 36.0, 30.0, 45.0, 43.0, 41.0, 38.0, 48.0, 45.0, 34.0, 35.0, 33.0, 40.0, 42.0, 29.0, 18.0, 37.0, 20.0, 20.0, 17.0, 12.0, 17.0, 10.0, 11.0, 9.0, 6.0, 6.0, 6.0, 7.0, 9.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.073317527770996, -9.760954856872559, -9.448593139648438, -9.13623046875, -8.823867797851562, -8.511505126953125, -8.199142456054688, -7.886780738830566, -7.574418067932129, -7.262055397033691, -6.949693202972412, -6.637331008911133, -6.324968338012695, -6.012605667114258, -5.7002434730529785, -5.387881278991699, -5.075518608093262, -4.763155937194824, -4.450793743133545, -4.138431549072266, -3.826068878173828, -3.5137064456939697, -3.2013440132141113, -2.888981580734253, -2.5766191482543945, -2.264256715774536, -1.9518942832946777, -1.6395318508148193, -1.327169418334961, -1.0148069858551025, -0.7024445533752441, -0.39008212089538574, -0.07771873474121094, 0.23464369773864746, 0.5470061302185059, 0.8593685626983643, 1.1717309951782227, 1.484093427658081, 1.7964558601379395, 2.108818292617798, 2.4211807250976562, 2.7335431575775146, 3.045905590057373, 3.3582680225372314, 3.67063045501709, 3.9829928874969482, 4.295355319976807, 4.607717514038086, 4.920080184936523, 5.232442855834961, 5.54480504989624, 5.8571672439575195, 6.169529914855957, 6.4818925857543945, 6.794254779815674, 7.106616973876953, 7.418979644775391, 7.731342315673828, 8.043704986572266, 8.356066703796387, 8.668429374694824, 8.980792045593262, 9.293153762817383, 9.60551643371582, 9.917879104614258]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 16.0, 19.0, 29.0, 42.0, 63.0, 84.0, 118.0, 186.0, 274.0, 388.0, 522.0, 813.0, 1199.0, 1883.0, 2841.0, 4458.0, 7076.0, 11175.0, 17817.0, 28384.0, 43826.0, 67402.0, 97318.0, 129125.0, 148063.0, 141008.0, 113324.0, 81025.0, 54312.0, 35021.0, 22294.0, 13719.0, 8761.0, 5547.0, 3554.0, 2232.0, 1471.0, 1001.0, 690.0, 468.0, 308.0, 216.0, 143.0, 96.0, 71.0, 56.0, 25.0, 24.0, 12.0, 17.0, 14.0, 9.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.8828125, -11.5084228515625, -11.134033203125, -10.7596435546875, -10.38525390625, -10.0108642578125, -9.636474609375, -9.2620849609375, -8.8876953125, -8.5133056640625, -8.138916015625, -7.7645263671875, -7.39013671875, -7.0157470703125, -6.641357421875, -6.2669677734375, -5.892578125, -5.5181884765625, -5.143798828125, -4.7694091796875, -4.39501953125, -4.0206298828125, -3.646240234375, -3.2718505859375, -2.8974609375, -2.5230712890625, -2.148681640625, -1.7742919921875, -1.39990234375, -1.0255126953125, -0.651123046875, -0.2767333984375, 0.09765625, 0.4720458984375, 0.846435546875, 1.2208251953125, 1.59521484375, 1.9696044921875, 2.343994140625, 2.7183837890625, 3.0927734375, 3.4671630859375, 3.841552734375, 4.2159423828125, 4.59033203125, 4.9647216796875, 5.339111328125, 5.7135009765625, 6.087890625, 6.4622802734375, 6.836669921875, 7.2110595703125, 7.58544921875, 7.9598388671875, 8.334228515625, 8.7086181640625, 9.0830078125, 9.4573974609375, 9.831787109375, 10.2061767578125, 10.58056640625, 10.9549560546875, 11.329345703125, 11.7037353515625, 12.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 9.0, 14.0, 13.0, 17.0, 12.0, 21.0, 25.0, 16.0, 22.0, 22.0, 30.0, 30.0, 39.0, 42.0, 42.0, 36.0, 46.0, 34.0, 43.0, 43.0, 39.0, 42.0, 39.0, 35.0, 34.0, 25.0, 34.0, 31.0, 17.0, 22.0, 16.0, 14.0, 15.0, 15.0, 8.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6627197265625, -8.372314453125, -8.0819091796875, -7.79150390625, -7.5010986328125, -7.210693359375, -6.9202880859375, -6.6298828125, -6.3394775390625, -6.049072265625, -5.7586669921875, -5.46826171875, -5.1778564453125, -4.887451171875, -4.5970458984375, -4.306640625, -4.0162353515625, -3.725830078125, -3.4354248046875, -3.14501953125, -2.8546142578125, -2.564208984375, -2.2738037109375, -1.9833984375, -1.6929931640625, -1.402587890625, -1.1121826171875, -0.82177734375, -0.5313720703125, -0.240966796875, 0.0494384765625, 0.33984375, 0.6302490234375, 0.920654296875, 1.2110595703125, 1.50146484375, 1.7918701171875, 2.082275390625, 2.3726806640625, 2.6630859375, 2.9534912109375, 3.243896484375, 3.5343017578125, 3.82470703125, 4.1151123046875, 4.405517578125, 4.6959228515625, 4.986328125, 5.2767333984375, 5.567138671875, 5.8575439453125, 6.14794921875, 6.4383544921875, 6.728759765625, 7.0191650390625, 7.3095703125, 7.5999755859375, 7.890380859375, 8.1807861328125, 8.47119140625, 8.7615966796875, 9.052001953125, 9.3424072265625, 9.6328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 10.0, 8.0, 27.0, 35.0, 43.0, 56.0, 81.0, 117.0, 203.0, 287.0, 392.0, 578.0, 874.0, 1307.0, 1937.0, 2943.0, 4534.0, 6811.0, 10360.0, 15500.0, 23868.0, 36593.0, 53518.0, 76392.0, 103056.0, 125532.0, 134798.0, 123338.0, 99649.0, 73659.0, 50844.0, 34108.0, 22958.0, 15211.0, 9856.0, 6453.0, 4233.0, 2852.0, 1805.0, 1168.0, 832.0, 517.0, 394.0, 247.0, 164.0, 145.0, 65.0, 63.0, 30.0, 40.0, 20.0, 19.0, 6.0, 11.0, 3.0, 3.0, 4.0, 1.0], "bins": [-10.125, -9.8128662109375, -9.500732421875, -9.1885986328125, -8.87646484375, -8.5643310546875, -8.252197265625, -7.9400634765625, -7.6279296875, -7.3157958984375, -7.003662109375, -6.6915283203125, -6.37939453125, -6.0672607421875, -5.755126953125, -5.4429931640625, -5.130859375, -4.8187255859375, -4.506591796875, -4.1944580078125, -3.88232421875, -3.5701904296875, -3.258056640625, -2.9459228515625, -2.6337890625, -2.3216552734375, -2.009521484375, -1.6973876953125, -1.38525390625, -1.0731201171875, -0.760986328125, -0.4488525390625, -0.13671875, 0.1754150390625, 0.487548828125, 0.7996826171875, 1.11181640625, 1.4239501953125, 1.736083984375, 2.0482177734375, 2.3603515625, 2.6724853515625, 2.984619140625, 3.2967529296875, 3.60888671875, 3.9210205078125, 4.233154296875, 4.5452880859375, 4.857421875, 5.1695556640625, 5.481689453125, 5.7938232421875, 6.10595703125, 6.4180908203125, 6.730224609375, 7.0423583984375, 7.3544921875, 7.6666259765625, 7.978759765625, 8.2908935546875, 8.60302734375, 8.9151611328125, 9.227294921875, 9.5394287109375, 9.8515625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 9.0, 5.0, 6.0, 11.0, 6.0, 11.0, 11.0, 13.0, 25.0, 16.0, 28.0, 25.0, 20.0, 35.0, 32.0, 37.0, 40.0, 42.0, 33.0, 37.0, 33.0, 36.0, 46.0, 49.0, 48.0, 41.0, 34.0, 40.0, 31.0, 33.0, 31.0, 24.0, 18.0, 15.0, 16.0, 7.0, 11.0, 11.0, 10.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.94921875, -5.7464599609375, -5.543701171875, -5.3409423828125, -5.13818359375, -4.9354248046875, -4.732666015625, -4.5299072265625, -4.3271484375, -4.1243896484375, -3.921630859375, -3.7188720703125, -3.51611328125, -3.3133544921875, -3.110595703125, -2.9078369140625, -2.705078125, -2.5023193359375, -2.299560546875, -2.0968017578125, -1.89404296875, -1.6912841796875, -1.488525390625, -1.2857666015625, -1.0830078125, -0.8802490234375, -0.677490234375, -0.4747314453125, -0.27197265625, -0.0692138671875, 0.133544921875, 0.3363037109375, 0.5390625, 0.7418212890625, 0.944580078125, 1.1473388671875, 1.35009765625, 1.5528564453125, 1.755615234375, 1.9583740234375, 2.1611328125, 2.3638916015625, 2.566650390625, 2.7694091796875, 2.97216796875, 3.1749267578125, 3.377685546875, 3.5804443359375, 3.783203125, 3.9859619140625, 4.188720703125, 4.3914794921875, 4.59423828125, 4.7969970703125, 4.999755859375, 5.2025146484375, 5.4052734375, 5.6080322265625, 5.810791015625, 6.0135498046875, 6.21630859375, 6.4190673828125, 6.621826171875, 6.8245849609375, 7.02734375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 13.0, 14.0, 17.0, 27.0, 39.0, 64.0, 83.0, 112.0, 157.0, 228.0, 337.0, 489.0, 710.0, 1139.0, 1727.0, 3163.0, 5306.0, 9638.0, 19176.0, 38903.0, 87226.0, 185641.0, 288813.0, 211396.0, 100675.0, 45126.0, 22073.0, 10981.0, 5902.0, 3413.0, 2031.0, 1277.0, 868.0, 580.0, 373.0, 269.0, 170.0, 118.0, 86.0, 58.0, 34.0, 35.0, 16.0, 9.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-12.2734375, -11.872314453125, -11.47119140625, -11.070068359375, -10.6689453125, -10.267822265625, -9.86669921875, -9.465576171875, -9.064453125, -8.663330078125, -8.26220703125, -7.861083984375, -7.4599609375, -7.058837890625, -6.65771484375, -6.256591796875, -5.85546875, -5.454345703125, -5.05322265625, -4.652099609375, -4.2509765625, -3.849853515625, -3.44873046875, -3.047607421875, -2.646484375, -2.245361328125, -1.84423828125, -1.443115234375, -1.0419921875, -0.640869140625, -0.23974609375, 0.161376953125, 0.5625, 0.963623046875, 1.36474609375, 1.765869140625, 2.1669921875, 2.568115234375, 2.96923828125, 3.370361328125, 3.771484375, 4.172607421875, 4.57373046875, 4.974853515625, 5.3759765625, 5.777099609375, 6.17822265625, 6.579345703125, 6.98046875, 7.381591796875, 7.78271484375, 8.183837890625, 8.5849609375, 8.986083984375, 9.38720703125, 9.788330078125, 10.189453125, 10.590576171875, 10.99169921875, 11.392822265625, 11.7939453125, 12.195068359375, 12.59619140625, 12.997314453125, 13.3984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 10.0, 7.0, 13.0, 17.0, 24.0, 29.0, 43.0, 53.0, 63.0, 100.0, 99.0, 107.0, 93.0, 70.0, 61.0, 74.0, 36.0, 29.0, 24.0, 18.0, 12.0, 10.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015239715576171875, -0.0014796257019042969, -0.0014352798461914062, -0.0013909339904785156, -0.001346588134765625, -0.0013022422790527344, -0.0012578964233398438, -0.0012135505676269531, -0.0011692047119140625, -0.0011248588562011719, -0.0010805130004882812, -0.0010361671447753906, -0.0009918212890625, -0.0009474754333496094, -0.0009031295776367188, -0.0008587837219238281, -0.0008144378662109375, -0.0007700920104980469, -0.0007257461547851562, -0.0006814002990722656, -0.000637054443359375, -0.0005927085876464844, -0.0005483627319335938, -0.0005040168762207031, -0.0004596710205078125, -0.0004153251647949219, -0.00037097930908203125, -0.0003266334533691406, -0.00028228759765625, -0.00023794174194335938, -0.00019359588623046875, -0.00014925003051757812, -0.0001049041748046875, -6.0558319091796875e-05, -1.621246337890625e-05, 2.8133392333984375e-05, 7.2479248046875e-05, 0.00011682510375976562, 0.00016117095947265625, 0.00020551681518554688, 0.0002498626708984375, 0.0002942085266113281, 0.00033855438232421875, 0.0003829002380371094, 0.00042724609375, 0.0004715919494628906, 0.0005159378051757812, 0.0005602836608886719, 0.0006046295166015625, 0.0006489753723144531, 0.0006933212280273438, 0.0007376670837402344, 0.000782012939453125, 0.0008263587951660156, 0.0008707046508789062, 0.0009150505065917969, 0.0009593963623046875, 0.0010037422180175781, 0.0010480880737304688, 0.0010924339294433594, 0.00113677978515625, 0.0011811256408691406, 0.0012254714965820312, 0.0012698173522949219, 0.0013141632080078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 12.0, 7.0, 13.0, 35.0, 31.0, 30.0, 68.0, 93.0, 119.0, 180.0, 251.0, 363.0, 635.0, 957.0, 1511.0, 2405.0, 3854.0, 6260.0, 10292.0, 18144.0, 30881.0, 54578.0, 95152.0, 152664.0, 197745.0, 179645.0, 122113.0, 71737.0, 40917.0, 23420.0, 13541.0, 7855.0, 4853.0, 2941.0, 1884.0, 1123.0, 762.0, 479.0, 322.0, 216.0, 138.0, 103.0, 62.0, 54.0, 36.0, 26.0, 14.0, 9.0, 8.0, 6.0, 4.0, 8.0, 4.0, 3.0], "bins": [-8.515625, -8.2705078125, -8.025390625, -7.7802734375, -7.53515625, -7.2900390625, -7.044921875, -6.7998046875, -6.5546875, -6.3095703125, -6.064453125, -5.8193359375, -5.57421875, -5.3291015625, -5.083984375, -4.8388671875, -4.59375, -4.3486328125, -4.103515625, -3.8583984375, -3.61328125, -3.3681640625, -3.123046875, -2.8779296875, -2.6328125, -2.3876953125, -2.142578125, -1.8974609375, -1.65234375, -1.4072265625, -1.162109375, -0.9169921875, -0.671875, -0.4267578125, -0.181640625, 0.0634765625, 0.30859375, 0.5537109375, 0.798828125, 1.0439453125, 1.2890625, 1.5341796875, 1.779296875, 2.0244140625, 2.26953125, 2.5146484375, 2.759765625, 3.0048828125, 3.25, 3.4951171875, 3.740234375, 3.9853515625, 4.23046875, 4.4755859375, 4.720703125, 4.9658203125, 5.2109375, 5.4560546875, 5.701171875, 5.9462890625, 6.19140625, 6.4365234375, 6.681640625, 6.9267578125, 7.171875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 6.0, 4.0, 9.0, 11.0, 7.0, 14.0, 14.0, 11.0, 17.0, 25.0, 36.0, 33.0, 49.0, 44.0, 51.0, 64.0, 70.0, 57.0, 55.0, 49.0, 59.0, 63.0, 43.0, 35.0, 35.0, 29.0, 24.0, 26.0, 10.0, 11.0, 12.0, 4.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.447265625, -3.35089111328125, -3.2545166015625, -3.15814208984375, -3.061767578125, -2.96539306640625, -2.8690185546875, -2.77264404296875, -2.67626953125, -2.57989501953125, -2.4835205078125, -2.38714599609375, -2.290771484375, -2.19439697265625, -2.0980224609375, -2.00164794921875, -1.9052734375, -1.80889892578125, -1.7125244140625, -1.61614990234375, -1.519775390625, -1.42340087890625, -1.3270263671875, -1.23065185546875, -1.13427734375, -1.03790283203125, -0.9415283203125, -0.84515380859375, -0.748779296875, -0.65240478515625, -0.5560302734375, -0.45965576171875, -0.36328125, -0.26690673828125, -0.1705322265625, -0.07415771484375, 0.022216796875, 0.11859130859375, 0.2149658203125, 0.31134033203125, 0.40771484375, 0.50408935546875, 0.6004638671875, 0.69683837890625, 0.793212890625, 0.88958740234375, 0.9859619140625, 1.08233642578125, 1.1787109375, 1.27508544921875, 1.3714599609375, 1.46783447265625, 1.564208984375, 1.66058349609375, 1.7569580078125, 1.85333251953125, 1.94970703125, 2.04608154296875, 2.1424560546875, 2.23883056640625, 2.335205078125, 2.43157958984375, 2.5279541015625, 2.62432861328125, 2.720703125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 10.0, 3.0, 16.0, 8.0, 26.0, 23.0, 45.0, 33.0, 34.0, 60.0, 53.0, 59.0, 57.0, 48.0, 72.0, 59.0, 51.0, 49.0, 45.0, 42.0, 38.0, 33.0, 25.0, 12.0, 18.0, 22.0, 9.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.666426658630371, -12.26688289642334, -11.867339134216309, -11.467795372009277, -11.068251609802246, -10.668707847595215, -10.269164085388184, -9.869620323181152, -9.470076560974121, -9.07053279876709, -8.670989036560059, -8.271445274353027, -7.871901512145996, -7.472357749938965, -7.072813987731934, -6.673270225524902, -6.273726463317871, -5.87418270111084, -5.474638938903809, -5.075095176696777, -4.675551414489746, -4.276007652282715, -3.8764638900756836, -3.4769201278686523, -3.077376365661621, -2.67783260345459, -2.2782888412475586, -1.8787450790405273, -1.479201316833496, -1.0796575546264648, -0.6801137924194336, -0.28057003021240234, 0.1189727783203125, 0.5185165405273438, 0.918060302734375, 1.3176040649414062, 1.7171478271484375, 2.1166915893554688, 2.5162353515625, 2.9157791137695312, 3.3153228759765625, 3.7148666381835938, 4.114410400390625, 4.513954162597656, 4.9134979248046875, 5.313041687011719, 5.71258544921875, 6.112129211425781, 6.5116729736328125, 6.911216735839844, 7.310760498046875, 7.710304260253906, 8.109848022460938, 8.509391784667969, 8.908935546875, 9.308479309082031, 9.708023071289062, 10.107566833496094, 10.507110595703125, 10.906654357910156, 11.306198120117188, 11.705741882324219, 12.10528564453125, 12.504829406738281, 12.904373168945312]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 11.0, 13.0, 8.0, 7.0, 15.0, 18.0, 16.0, 18.0, 18.0, 26.0, 19.0, 28.0, 37.0, 28.0, 25.0, 40.0, 26.0, 39.0, 37.0, 39.0, 33.0, 34.0, 34.0, 26.0, 24.0, 28.0, 27.0, 34.0, 28.0, 23.0, 23.0, 29.0, 26.0, 25.0, 23.0, 18.0, 12.0, 8.0, 6.0, 10.0, 10.0, 6.0, 5.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-8.129793167114258, -7.8636579513549805, -7.597522735595703, -7.331387519836426, -7.065252304077148, -6.799117088317871, -6.5329813957214355, -6.266846179962158, -6.000710964202881, -5.7345757484436035, -5.468440532684326, -5.202305316925049, -4.936169624328613, -4.670034408569336, -4.403899192810059, -4.137763977050781, -3.871628761291504, -3.6054935455322266, -3.339358329772949, -3.0732228755950928, -2.8070876598358154, -2.540952444076538, -2.2748169898986816, -2.0086817741394043, -1.742546558380127, -1.4764113426208496, -1.2102760076522827, -0.9441407322883606, -0.6780054569244385, -0.41187024116516113, -0.14573490619659424, 0.12040042877197266, 0.38653564453125, 0.6526709198951721, 0.9188061952590942, 1.1849415302276611, 1.4510767459869385, 1.7172119617462158, 1.9833472967147827, 2.2494826316833496, 2.515617847442627, 2.7817530632019043, 3.0478882789611816, 3.314023733139038, 3.5801589488983154, 3.8462941646575928, 4.112429618835449, 4.378564834594727, 4.644700050354004, 4.910835266113281, 5.176970481872559, 5.443105697631836, 5.709240913391113, 5.975376129150391, 6.241511821746826, 6.5076470375061035, 6.773782253265381, 7.039917469024658, 7.3060526847839355, 7.572187900543213, 7.838323593139648, 8.104458808898926, 8.370594024658203, 8.63672924041748, 8.902864456176758]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 9.0, 6.0, 13.0, 13.0, 23.0, 26.0, 41.0, 74.0, 122.0, 178.0, 307.0, 485.0, 749.0, 1236.0, 2027.0, 3524.0, 6059.0, 10646.0, 19279.0, 36401.0, 72187.0, 152884.0, 342262.0, 720005.0, 1047133.0, 888923.0, 477114.0, 211551.0, 96541.0, 47124.0, 24735.0, 13425.0, 7711.0, 4479.0, 2626.0, 1620.0, 1055.0, 578.0, 367.0, 265.0, 182.0, 92.0, 67.0, 43.0, 38.0, 25.0, 11.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.1015625, -8.795166015625, -8.48876953125, -8.182373046875, -7.8759765625, -7.569580078125, -7.26318359375, -6.956787109375, -6.650390625, -6.343994140625, -6.03759765625, -5.731201171875, -5.4248046875, -5.118408203125, -4.81201171875, -4.505615234375, -4.19921875, -3.892822265625, -3.58642578125, -3.280029296875, -2.9736328125, -2.667236328125, -2.36083984375, -2.054443359375, -1.748046875, -1.441650390625, -1.13525390625, -0.828857421875, -0.5224609375, -0.216064453125, 0.09033203125, 0.396728515625, 0.703125, 1.009521484375, 1.31591796875, 1.622314453125, 1.9287109375, 2.235107421875, 2.54150390625, 2.847900390625, 3.154296875, 3.460693359375, 3.76708984375, 4.073486328125, 4.3798828125, 4.686279296875, 4.99267578125, 5.299072265625, 5.60546875, 5.911865234375, 6.21826171875, 6.524658203125, 6.8310546875, 7.137451171875, 7.44384765625, 7.750244140625, 8.056640625, 8.363037109375, 8.66943359375, 8.975830078125, 9.2822265625, 9.588623046875, 9.89501953125, 10.201416015625, 10.5078125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 11.0, 5.0, 13.0, 13.0, 15.0, 19.0, 22.0, 22.0, 28.0, 25.0, 29.0, 32.0, 30.0, 29.0, 30.0, 37.0, 28.0, 28.0, 43.0, 42.0, 37.0, 45.0, 43.0, 30.0, 35.0, 31.0, 42.0, 28.0, 32.0, 25.0, 26.0, 24.0, 13.0, 16.0, 15.0, 8.0, 14.0, 7.0, 4.0, 4.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.15673828125, -5.9306640625, -5.70458984375, -5.478515625, -5.25244140625, -5.0263671875, -4.80029296875, -4.57421875, -4.34814453125, -4.1220703125, -3.89599609375, -3.669921875, -3.44384765625, -3.2177734375, -2.99169921875, -2.765625, -2.53955078125, -2.3134765625, -2.08740234375, -1.861328125, -1.63525390625, -1.4091796875, -1.18310546875, -0.95703125, -0.73095703125, -0.5048828125, -0.27880859375, -0.052734375, 0.17333984375, 0.3994140625, 0.62548828125, 0.8515625, 1.07763671875, 1.3037109375, 1.52978515625, 1.755859375, 1.98193359375, 2.2080078125, 2.43408203125, 2.66015625, 2.88623046875, 3.1123046875, 3.33837890625, 3.564453125, 3.79052734375, 4.0166015625, 4.24267578125, 4.46875, 4.69482421875, 4.9208984375, 5.14697265625, 5.373046875, 5.59912109375, 5.8251953125, 6.05126953125, 6.27734375, 6.50341796875, 6.7294921875, 6.95556640625, 7.181640625, 7.40771484375, 7.6337890625, 7.85986328125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 10.0, 8.0, 20.0, 40.0, 44.0, 67.0, 104.0, 140.0, 238.0, 373.0, 495.0, 763.0, 1272.0, 1978.0, 3110.0, 4896.0, 8124.0, 13244.0, 22538.0, 38766.0, 67856.0, 122578.0, 223743.0, 405989.0, 691440.0, 898670.0, 719482.0, 429253.0, 236888.0, 129832.0, 71834.0, 40494.0, 23530.0, 14124.0, 8276.0, 5223.0, 3136.0, 2028.0, 1229.0, 857.0, 574.0, 352.0, 239.0, 139.0, 89.0, 62.0, 46.0, 35.0, 25.0, 13.0, 12.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.6171875, -8.3524169921875, -8.087646484375, -7.8228759765625, -7.55810546875, -7.2933349609375, -7.028564453125, -6.7637939453125, -6.4990234375, -6.2342529296875, -5.969482421875, -5.7047119140625, -5.43994140625, -5.1751708984375, -4.910400390625, -4.6456298828125, -4.380859375, -4.1160888671875, -3.851318359375, -3.5865478515625, -3.32177734375, -3.0570068359375, -2.792236328125, -2.5274658203125, -2.2626953125, -1.9979248046875, -1.733154296875, -1.4683837890625, -1.20361328125, -0.9388427734375, -0.674072265625, -0.4093017578125, -0.14453125, 0.1202392578125, 0.385009765625, 0.6497802734375, 0.91455078125, 1.1793212890625, 1.444091796875, 1.7088623046875, 1.9736328125, 2.2384033203125, 2.503173828125, 2.7679443359375, 3.03271484375, 3.2974853515625, 3.562255859375, 3.8270263671875, 4.091796875, 4.3565673828125, 4.621337890625, 4.8861083984375, 5.15087890625, 5.4156494140625, 5.680419921875, 5.9451904296875, 6.2099609375, 6.4747314453125, 6.739501953125, 7.0042724609375, 7.26904296875, 7.5338134765625, 7.798583984375, 8.0633544921875, 8.328125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 4.0, 11.0, 17.0, 23.0, 33.0, 31.0, 40.0, 59.0, 58.0, 87.0, 124.0, 124.0, 190.0, 207.0, 250.0, 299.0, 331.0, 299.0, 244.0, 290.0, 252.0, 220.0, 182.0, 132.0, 127.0, 92.0, 69.0, 56.0, 53.0, 36.0, 31.0, 27.0, 17.0, 13.0, 5.0, 10.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.287109375, -3.17987060546875, -3.0726318359375, -2.96539306640625, -2.858154296875, -2.75091552734375, -2.6436767578125, -2.53643798828125, -2.42919921875, -2.32196044921875, -2.2147216796875, -2.10748291015625, -2.000244140625, -1.89300537109375, -1.7857666015625, -1.67852783203125, -1.5712890625, -1.46405029296875, -1.3568115234375, -1.24957275390625, -1.142333984375, -1.03509521484375, -0.9278564453125, -0.82061767578125, -0.71337890625, -0.60614013671875, -0.4989013671875, -0.39166259765625, -0.284423828125, -0.17718505859375, -0.0699462890625, 0.03729248046875, 0.14453125, 0.25177001953125, 0.3590087890625, 0.46624755859375, 0.573486328125, 0.68072509765625, 0.7879638671875, 0.89520263671875, 1.00244140625, 1.10968017578125, 1.2169189453125, 1.32415771484375, 1.431396484375, 1.53863525390625, 1.6458740234375, 1.75311279296875, 1.8603515625, 1.96759033203125, 2.0748291015625, 2.18206787109375, 2.289306640625, 2.39654541015625, 2.5037841796875, 2.61102294921875, 2.71826171875, 2.82550048828125, 2.9327392578125, 3.03997802734375, 3.147216796875, 3.25445556640625, 3.3616943359375, 3.46893310546875, 3.576171875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 5.0, 14.0, 13.0, 10.0, 22.0, 15.0, 21.0, 31.0, 35.0, 49.0, 44.0, 53.0, 64.0, 79.0, 65.0, 70.0, 59.0, 59.0, 42.0, 42.0, 37.0, 31.0, 21.0, 26.0, 25.0, 18.0, 9.0, 9.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.875686645507812, -10.540382385253906, -10.205078125, -9.869773864746094, -9.534468650817871, -9.199164390563965, -8.863860130310059, -8.528555870056152, -8.19325065612793, -7.857946395874023, -7.522641658782959, -7.187337398529053, -6.852032661437988, -6.516728401184082, -6.181424140930176, -5.8461198806762695, -5.510815620422363, -5.175511360168457, -4.840206623077393, -4.504902362823486, -4.169597625732422, -3.8342933654785156, -3.4989891052246094, -3.163684606552124, -2.8283801078796387, -2.4930756092071533, -2.157771110534668, -1.8224668502807617, -1.4871623516082764, -1.151857852935791, -0.8165535926818848, -0.4812490940093994, -0.14594459533691406, 0.1893598437309265, 0.5246642827987671, 0.8599686622619629, 1.1952731609344482, 1.5305776596069336, 1.8658819198608398, 2.201186418533325, 2.5364909172058105, 2.871795415878296, 3.2070999145507812, 3.5424041748046875, 3.877708673477173, 4.213013172149658, 4.5483174324035645, 4.883622169494629, 5.218926429748535, 5.554230690002441, 5.889535427093506, 6.224839687347412, 6.560144424438477, 6.895448684692383, 7.230752944946289, 7.566057205200195, 7.90136194229126, 8.236666679382324, 8.57197093963623, 8.907275199890137, 9.242579460144043, 9.577884674072266, 9.913188934326172, 10.248493194580078, 10.583797454833984]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 4.0, 6.0, 10.0, 5.0, 11.0, 13.0, 15.0, 17.0, 21.0, 16.0, 22.0, 26.0, 31.0, 29.0, 33.0, 25.0, 28.0, 27.0, 33.0, 40.0, 31.0, 27.0, 32.0, 29.0, 37.0, 35.0, 27.0, 42.0, 25.0, 28.0, 31.0, 27.0, 23.0, 21.0, 16.0, 23.0, 15.0, 12.0, 12.0, 14.0, 13.0, 7.0, 8.0, 11.0, 8.0, 11.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-6.885350704193115, -6.668995380401611, -6.452640533447266, -6.236285209655762, -6.019929885864258, -5.803574562072754, -5.58721923828125, -5.370864391326904, -5.1545090675354, -4.9381537437438965, -4.721798896789551, -4.505443572998047, -4.289088249206543, -4.072732925415039, -3.8563778400421143, -3.6400227546691895, -3.4236674308776855, -3.2073121070861816, -2.990957021713257, -2.774601936340332, -2.558246612548828, -2.341891288757324, -2.1255362033843994, -1.909180998802185, -1.6928257942199707, -1.4764705896377563, -1.260115385055542, -1.0437601804733276, -0.8274049758911133, -0.6110497713088989, -0.39469456672668457, -0.17833936214447021, 0.03801584243774414, 0.2543710470199585, 0.47072625160217285, 0.6870814561843872, 0.9034366607666016, 1.119791865348816, 1.3361470699310303, 1.5525022745132446, 1.768857479095459, 1.9852126836776733, 2.2015678882598877, 2.4179229736328125, 2.6342782974243164, 2.8506336212158203, 3.066988706588745, 3.28334379196167, 3.499699115753174, 3.7160544395446777, 3.9324095249176025, 4.148764610290527, 4.365119934082031, 4.581475257873535, 4.797830581665039, 5.014185428619385, 5.230540752410889, 5.446896076202393, 5.663250923156738, 5.879606246948242, 6.095961570739746, 6.31231689453125, 6.528672218322754, 6.7450270652771, 6.9613823890686035]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 5.0, 17.0, 13.0, 27.0, 54.0, 66.0, 100.0, 182.0, 220.0, 347.0, 555.0, 897.0, 1288.0, 1977.0, 3103.0, 4970.0, 7619.0, 12402.0, 19807.0, 31557.0, 50743.0, 80344.0, 121531.0, 160714.0, 167778.0, 134099.0, 92021.0, 58745.0, 35971.0, 22541.0, 14285.0, 8899.0, 5602.0, 3560.0, 2242.0, 1512.0, 933.0, 628.0, 408.0, 252.0, 189.0, 105.0, 64.0, 53.0, 40.0, 27.0, 18.0, 17.0, 9.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.14453125, -3.0435791015625, -2.942626953125, -2.8416748046875, -2.74072265625, -2.6397705078125, -2.538818359375, -2.4378662109375, -2.3369140625, -2.2359619140625, -2.135009765625, -2.0340576171875, -1.93310546875, -1.8321533203125, -1.731201171875, -1.6302490234375, -1.529296875, -1.4283447265625, -1.327392578125, -1.2264404296875, -1.12548828125, -1.0245361328125, -0.923583984375, -0.8226318359375, -0.7216796875, -0.6207275390625, -0.519775390625, -0.4188232421875, -0.31787109375, -0.2169189453125, -0.115966796875, -0.0150146484375, 0.0859375, 0.1868896484375, 0.287841796875, 0.3887939453125, 0.48974609375, 0.5906982421875, 0.691650390625, 0.7926025390625, 0.8935546875, 0.9945068359375, 1.095458984375, 1.1964111328125, 1.29736328125, 1.3983154296875, 1.499267578125, 1.6002197265625, 1.701171875, 1.8021240234375, 1.903076171875, 2.0040283203125, 2.10498046875, 2.2059326171875, 2.306884765625, 2.4078369140625, 2.5087890625, 2.6097412109375, 2.710693359375, 2.8116455078125, 2.91259765625, 3.0135498046875, 3.114501953125, 3.2154541015625, 3.31640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 10.0, 9.0, 12.0, 9.0, 7.0, 17.0, 14.0, 13.0, 18.0, 21.0, 23.0, 28.0, 33.0, 29.0, 27.0, 30.0, 48.0, 28.0, 46.0, 35.0, 29.0, 39.0, 37.0, 32.0, 36.0, 34.0, 32.0, 22.0, 33.0, 33.0, 24.0, 27.0, 27.0, 18.0, 13.0, 15.0, 9.0, 11.0, 14.0, 7.0, 12.0, 10.0, 5.0, 9.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-7.78515625, -7.54473876953125, -7.3043212890625, -7.06390380859375, -6.823486328125, -6.58306884765625, -6.3426513671875, -6.10223388671875, -5.86181640625, -5.62139892578125, -5.3809814453125, -5.14056396484375, -4.900146484375, -4.65972900390625, -4.4193115234375, -4.17889404296875, -3.9384765625, -3.69805908203125, -3.4576416015625, -3.21722412109375, -2.976806640625, -2.73638916015625, -2.4959716796875, -2.25555419921875, -2.01513671875, -1.77471923828125, -1.5343017578125, -1.29388427734375, -1.053466796875, -0.81304931640625, -0.5726318359375, -0.33221435546875, -0.091796875, 0.14862060546875, 0.3890380859375, 0.62945556640625, 0.869873046875, 1.11029052734375, 1.3507080078125, 1.59112548828125, 1.83154296875, 2.07196044921875, 2.3123779296875, 2.55279541015625, 2.793212890625, 3.03363037109375, 3.2740478515625, 3.51446533203125, 3.7548828125, 3.99530029296875, 4.2357177734375, 4.47613525390625, 4.716552734375, 4.95697021484375, 5.1973876953125, 5.43780517578125, 5.67822265625, 5.91864013671875, 6.1590576171875, 6.39947509765625, 6.639892578125, 6.88031005859375, 7.1207275390625, 7.36114501953125, 7.6015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 13.0, 8.0, 15.0, 11.0, 34.0, 41.0, 64.0, 86.0, 129.0, 205.0, 262.0, 413.0, 615.0, 926.0, 1446.0, 2236.0, 3660.0, 5850.0, 10403.0, 19084.0, 45662.0, 841611.0, 65222.0, 21456.0, 11314.0, 6728.0, 3864.0, 2452.0, 1605.0, 1006.0, 644.0, 465.0, 309.0, 237.0, 149.0, 93.0, 84.0, 38.0, 34.0, 28.0, 15.0, 8.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.7254638671875, -6.505615234375, -6.2857666015625, -6.06591796875, -5.8460693359375, -5.626220703125, -5.4063720703125, -5.1865234375, -4.9666748046875, -4.746826171875, -4.5269775390625, -4.30712890625, -4.0872802734375, -3.867431640625, -3.6475830078125, -3.427734375, -3.2078857421875, -2.988037109375, -2.7681884765625, -2.54833984375, -2.3284912109375, -2.108642578125, -1.8887939453125, -1.6689453125, -1.4490966796875, -1.229248046875, -1.0093994140625, -0.78955078125, -0.5697021484375, -0.349853515625, -0.1300048828125, 0.08984375, 0.3096923828125, 0.529541015625, 0.7493896484375, 0.96923828125, 1.1890869140625, 1.408935546875, 1.6287841796875, 1.8486328125, 2.0684814453125, 2.288330078125, 2.5081787109375, 2.72802734375, 2.9478759765625, 3.167724609375, 3.3875732421875, 3.607421875, 3.8272705078125, 4.047119140625, 4.2669677734375, 4.48681640625, 4.7066650390625, 4.926513671875, 5.1463623046875, 5.3662109375, 5.5860595703125, 5.805908203125, 6.0257568359375, 6.24560546875, 6.4654541015625, 6.685302734375, 6.9051513671875, 7.125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 8.0, 10.0, 14.0, 16.0, 20.0, 30.0, 36.0, 37.0, 43.0, 43.0, 45.0, 48.0, 59.0, 51.0, 54.0, 64.0, 42.0, 45.0, 47.0, 34.0, 33.0, 35.0, 29.0, 28.0, 16.0, 23.0, 15.0, 16.0, 4.0, 6.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-8.4921875, -8.26727294921875, -8.0423583984375, -7.81744384765625, -7.592529296875, -7.36761474609375, -7.1427001953125, -6.91778564453125, -6.69287109375, -6.46795654296875, -6.2430419921875, -6.01812744140625, -5.793212890625, -5.56829833984375, -5.3433837890625, -5.11846923828125, -4.8935546875, -4.66864013671875, -4.4437255859375, -4.21881103515625, -3.993896484375, -3.76898193359375, -3.5440673828125, -3.31915283203125, -3.09423828125, -2.86932373046875, -2.6444091796875, -2.41949462890625, -2.194580078125, -1.96966552734375, -1.7447509765625, -1.51983642578125, -1.294921875, -1.07000732421875, -0.8450927734375, -0.62017822265625, -0.395263671875, -0.17034912109375, 0.0545654296875, 0.27947998046875, 0.50439453125, 0.72930908203125, 0.9542236328125, 1.17913818359375, 1.404052734375, 1.62896728515625, 1.8538818359375, 2.07879638671875, 2.3037109375, 2.52862548828125, 2.7535400390625, 2.97845458984375, 3.203369140625, 3.42828369140625, 3.6531982421875, 3.87811279296875, 4.10302734375, 4.32794189453125, 4.5528564453125, 4.77777099609375, 5.002685546875, 5.22760009765625, 5.4525146484375, 5.67742919921875, 5.90234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 8.0, 11.0, 18.0, 23.0, 17.0, 37.0, 48.0, 64.0, 108.0, 128.0, 204.0, 366.0, 510.0, 904.0, 1603.0, 2908.0, 5790.0, 13116.0, 39876.0, 898381.0, 54630.0, 15423.0, 6735.0, 3176.0, 1760.0, 946.0, 571.0, 370.0, 257.0, 174.0, 104.0, 65.0, 63.0, 47.0, 25.0, 19.0, 17.0, 8.0, 5.0, 5.0, 2.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.078125, -4.92230224609375, -4.7664794921875, -4.61065673828125, -4.454833984375, -4.29901123046875, -4.1431884765625, -3.98736572265625, -3.83154296875, -3.67572021484375, -3.5198974609375, -3.36407470703125, -3.208251953125, -3.05242919921875, -2.8966064453125, -2.74078369140625, -2.5849609375, -2.42913818359375, -2.2733154296875, -2.11749267578125, -1.961669921875, -1.80584716796875, -1.6500244140625, -1.49420166015625, -1.33837890625, -1.18255615234375, -1.0267333984375, -0.87091064453125, -0.715087890625, -0.55926513671875, -0.4034423828125, -0.24761962890625, -0.091796875, 0.06402587890625, 0.2198486328125, 0.37567138671875, 0.531494140625, 0.68731689453125, 0.8431396484375, 0.99896240234375, 1.15478515625, 1.31060791015625, 1.4664306640625, 1.62225341796875, 1.778076171875, 1.93389892578125, 2.0897216796875, 2.24554443359375, 2.4013671875, 2.55718994140625, 2.7130126953125, 2.86883544921875, 3.024658203125, 3.18048095703125, 3.3363037109375, 3.49212646484375, 3.64794921875, 3.80377197265625, 3.9595947265625, 4.11541748046875, 4.271240234375, 4.42706298828125, 4.5828857421875, 4.73870849609375, 4.89453125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 12.0, 7.0, 9.0, 12.0, 11.0, 18.0, 29.0, 22.0, 35.0, 53.0, 52.0, 76.0, 102.0, 117.0, 91.0, 78.0, 53.0, 44.0, 38.0, 26.0, 26.0, 15.0, 13.0, 7.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002982616424560547, -0.0002881772816181183, -0.0002780929207801819, -0.0002680085599422455, -0.0002579241991043091, -0.0002478398382663727, -0.00023775547742843628, -0.00022767111659049988, -0.00021758675575256348, -0.00020750239491462708, -0.00019741803407669067, -0.00018733367323875427, -0.00017724931240081787, -0.00016716495156288147, -0.00015708059072494507, -0.00014699622988700867, -0.00013691186904907227, -0.00012682750821113586, -0.00011674314737319946, -0.00010665878653526306, -9.657442569732666e-05, -8.649006485939026e-05, -7.640570402145386e-05, -6.632134318351746e-05, -5.6236982345581055e-05, -4.615262150764465e-05, -3.606826066970825e-05, -2.598389983177185e-05, -1.589953899383545e-05, -5.815178155899048e-06, 4.2691826820373535e-06, 1.4353543519973755e-05, 2.4437904357910156e-05, 3.452226519584656e-05, 4.460662603378296e-05, 5.469098687171936e-05, 6.477534770965576e-05, 7.485970854759216e-05, 8.494406938552856e-05, 9.502843022346497e-05, 0.00010511279106140137, 0.00011519715189933777, 0.00012528151273727417, 0.00013536587357521057, 0.00014545023441314697, 0.00015553459525108337, 0.00016561895608901978, 0.00017570331692695618, 0.00018578767776489258, 0.00019587203860282898, 0.00020595639944076538, 0.00021604076027870178, 0.00022612512111663818, 0.00023620948195457458, 0.000246293842792511, 0.0002563782036304474, 0.0002664625644683838, 0.0002765469253063202, 0.0002866312861442566, 0.000296715646982193, 0.0003068000078201294, 0.0003168843686580658, 0.0003269687294960022, 0.0003370530903339386, 0.000347137451171875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 12.0, 15.0, 18.0, 25.0, 36.0, 69.0, 80.0, 111.0, 150.0, 219.0, 291.0, 458.0, 672.0, 992.0, 1552.0, 2283.0, 3429.0, 5552.0, 8809.0, 14020.0, 22213.0, 36365.0, 59107.0, 96846.0, 150776.0, 195063.0, 164871.0, 108704.0, 67048.0, 40671.0, 25085.0, 15329.0, 9715.0, 6252.0, 3942.0, 2500.0, 1680.0, 1120.0, 771.0, 483.0, 357.0, 253.0, 163.0, 128.0, 81.0, 74.0, 43.0, 33.0, 33.0, 18.0, 4.0, 9.0, 6.0, 5.0, 6.0, 3.0], "bins": [-1.1845703125, -1.1493377685546875, -1.114105224609375, -1.0788726806640625, -1.04364013671875, -1.0084075927734375, -0.973175048828125, -0.9379425048828125, -0.9027099609375, -0.8674774169921875, -0.832244873046875, -0.7970123291015625, -0.76177978515625, -0.7265472412109375, -0.691314697265625, -0.6560821533203125, -0.620849609375, -0.5856170654296875, -0.550384521484375, -0.5151519775390625, -0.47991943359375, -0.4446868896484375, -0.409454345703125, -0.3742218017578125, -0.3389892578125, -0.3037567138671875, -0.268524169921875, -0.2332916259765625, -0.19805908203125, -0.1628265380859375, -0.127593994140625, -0.0923614501953125, -0.05712890625, -0.0218963623046875, 0.013336181640625, 0.0485687255859375, 0.08380126953125, 0.1190338134765625, 0.154266357421875, 0.1894989013671875, 0.2247314453125, 0.2599639892578125, 0.295196533203125, 0.3304290771484375, 0.36566162109375, 0.4008941650390625, 0.436126708984375, 0.4713592529296875, 0.506591796875, 0.5418243408203125, 0.577056884765625, 0.6122894287109375, 0.64752197265625, 0.6827545166015625, 0.717987060546875, 0.7532196044921875, 0.7884521484375, 0.8236846923828125, 0.858917236328125, 0.8941497802734375, 0.92938232421875, 0.9646148681640625, 0.999847412109375, 1.0350799560546875, 1.0703125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 8.0, 11.0, 16.0, 11.0, 8.0, 20.0, 15.0, 22.0, 36.0, 32.0, 44.0, 34.0, 49.0, 46.0, 50.0, 77.0, 45.0, 51.0, 70.0, 53.0, 50.0, 42.0, 32.0, 24.0, 25.0, 15.0, 18.0, 20.0, 9.0, 7.0, 10.0, 3.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4853515625, -0.4700355529785156, -0.45471954345703125, -0.4394035339355469, -0.4240875244140625, -0.4087715148925781, -0.39345550537109375, -0.3781394958496094, -0.362823486328125, -0.3475074768066406, -0.33219146728515625, -0.3168754577636719, -0.3015594482421875, -0.2862434387207031, -0.27092742919921875, -0.2556114196777344, -0.24029541015625, -0.22497940063476562, -0.20966339111328125, -0.19434738159179688, -0.1790313720703125, -0.16371536254882812, -0.14839935302734375, -0.13308334350585938, -0.117767333984375, -0.10245132446289062, -0.08713531494140625, -0.07181930541992188, -0.0565032958984375, -0.041187286376953125, -0.02587127685546875, -0.010555267333984375, 0.0047607421875, 0.020076751708984375, 0.03539276123046875, 0.050708770751953125, 0.0660247802734375, 0.08134078979492188, 0.09665679931640625, 0.11197280883789062, 0.127288818359375, 0.14260482788085938, 0.15792083740234375, 0.17323684692382812, 0.1885528564453125, 0.20386886596679688, 0.21918487548828125, 0.23450088500976562, 0.24981689453125, 0.2651329040527344, 0.28044891357421875, 0.2957649230957031, 0.3110809326171875, 0.3263969421386719, 0.34171295166015625, 0.3570289611816406, 0.372344970703125, 0.3876609802246094, 0.40297698974609375, 0.4182929992675781, 0.4336090087890625, 0.4489250183105469, 0.46424102783203125, 0.4795570373535156, 0.494873046875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 7.0, 6.0, 14.0, 15.0, 10.0, 13.0, 28.0, 27.0, 31.0, 30.0, 61.0, 43.0, 46.0, 62.0, 65.0, 76.0, 60.0, 60.0, 63.0, 36.0, 35.0, 28.0, 30.0, 29.0, 21.0, 23.0, 17.0, 13.0, 9.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.425981521606445, -9.113774299621582, -8.801567077636719, -8.489360809326172, -8.177153587341309, -7.864946365356445, -7.55273962020874, -7.240532875061035, -6.928325653076172, -6.616118431091309, -6.3039116859436035, -5.991704940795898, -5.679497718811035, -5.367290496826172, -5.055083751678467, -4.742877006530762, -4.430669784545898, -4.118462562561035, -3.80625581741333, -3.494048833847046, -3.1818418502807617, -2.8696348667144775, -2.5574278831481934, -2.245220899581909, -1.933013916015625, -1.6208069324493408, -1.3085999488830566, -0.9963929653167725, -0.6841859817504883, -0.3719789981842041, -0.05977201461791992, 0.25243496894836426, 0.5646429061889648, 0.876849889755249, 1.1890568733215332, 1.5012638568878174, 1.8134708404541016, 2.1256778240203857, 2.43788480758667, 2.750091791152954, 3.0622987747192383, 3.3745057582855225, 3.6867127418518066, 3.998919725418091, 4.311126708984375, 4.623333930969238, 4.935540676116943, 5.247747421264648, 5.559954643249512, 5.872161865234375, 6.18436861038208, 6.496575355529785, 6.808782577514648, 7.120989799499512, 7.433196544647217, 7.745403289794922, 8.057610511779785, 8.369817733764648, 8.682024002075195, 8.994231224060059, 9.306438446044922, 9.618645668029785, 9.930852890014648, 10.243059158325195, 10.555266380310059]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 7.0, 9.0, 7.0, 5.0, 14.0, 12.0, 14.0, 13.0, 21.0, 20.0, 24.0, 23.0, 29.0, 27.0, 33.0, 25.0, 22.0, 32.0, 39.0, 28.0, 31.0, 34.0, 27.0, 30.0, 37.0, 37.0, 27.0, 33.0, 38.0, 26.0, 33.0, 26.0, 32.0, 16.0, 8.0, 27.0, 26.0, 12.0, 11.0, 10.0, 9.0, 10.0, 14.0, 4.0, 8.0, 9.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-7.102121829986572, -6.886204719543457, -6.6702880859375, -6.454370975494385, -6.2384538650512695, -6.0225372314453125, -5.806620121002197, -5.590703010559082, -5.374786376953125, -5.15886926651001, -4.942952632904053, -4.7270355224609375, -4.5111188888549805, -4.295201778411865, -4.07928466796875, -3.863367795944214, -3.6474509239196777, -3.4315340518951416, -3.2156171798706055, -2.9997000694274902, -2.783783197402954, -2.567866325378418, -2.3519492149353027, -2.1360323429107666, -1.9201154708862305, -1.7041985988616943, -1.4882816076278687, -1.272364616394043, -1.0564477443695068, -0.8405308723449707, -0.624613881111145, -0.40869688987731934, -0.192779541015625, 0.023137390613555908, 0.23905432224273682, 0.4549712538719177, 0.6708881855010986, 0.8868050575256348, 1.1027220487594604, 1.3186390399932861, 1.5345559120178223, 1.7504727840423584, 1.966389775276184, 2.1823067665100098, 2.398223638534546, 2.614140510559082, 2.8300576210021973, 3.0459744930267334, 3.2618913650512695, 3.4778082370758057, 3.693725109100342, 3.909642219543457, 4.125558853149414, 4.341475963592529, 4.5573930740356445, 4.773309707641602, 4.989226818084717, 5.205143928527832, 5.421060562133789, 5.636977672576904, 5.8528947830200195, 6.068811416625977, 6.284728527069092, 6.500645637512207, 6.716562271118164]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 9.0, 15.0, 26.0, 27.0, 37.0, 56.0, 77.0, 121.0, 204.0, 286.0, 434.0, 665.0, 1041.0, 1601.0, 2494.0, 4024.0, 6595.0, 10616.0, 17652.0, 29350.0, 48412.0, 76788.0, 114663.0, 152910.0, 165167.0, 142097.0, 102252.0, 66240.0, 40547.0, 24700.0, 14893.0, 9165.0, 5739.0, 3488.0, 2197.0, 1370.0, 889.0, 578.0, 376.0, 236.0, 179.0, 110.0, 83.0, 44.0, 37.0, 19.0, 13.0, 13.0, 12.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4921875, -8.22119140625, -7.9501953125, -7.67919921875, -7.408203125, -7.13720703125, -6.8662109375, -6.59521484375, -6.32421875, -6.05322265625, -5.7822265625, -5.51123046875, -5.240234375, -4.96923828125, -4.6982421875, -4.42724609375, -4.15625, -3.88525390625, -3.6142578125, -3.34326171875, -3.072265625, -2.80126953125, -2.5302734375, -2.25927734375, -1.98828125, -1.71728515625, -1.4462890625, -1.17529296875, -0.904296875, -0.63330078125, -0.3623046875, -0.09130859375, 0.1796875, 0.45068359375, 0.7216796875, 0.99267578125, 1.263671875, 1.53466796875, 1.8056640625, 2.07666015625, 2.34765625, 2.61865234375, 2.8896484375, 3.16064453125, 3.431640625, 3.70263671875, 3.9736328125, 4.24462890625, 4.515625, 4.78662109375, 5.0576171875, 5.32861328125, 5.599609375, 5.87060546875, 6.1416015625, 6.41259765625, 6.68359375, 6.95458984375, 7.2255859375, 7.49658203125, 7.767578125, 8.03857421875, 8.3095703125, 8.58056640625, 8.8515625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 10.0, 6.0, 9.0, 14.0, 14.0, 11.0, 16.0, 17.0, 24.0, 18.0, 35.0, 25.0, 38.0, 33.0, 28.0, 36.0, 35.0, 40.0, 24.0, 45.0, 33.0, 39.0, 40.0, 36.0, 38.0, 31.0, 39.0, 34.0, 31.0, 26.0, 25.0, 24.0, 12.0, 19.0, 7.0, 15.0, 17.0, 12.0, 5.0, 12.0, 8.0, 4.0, 2.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.5, -7.2701416015625, -7.040283203125, -6.8104248046875, -6.58056640625, -6.3507080078125, -6.120849609375, -5.8909912109375, -5.6611328125, -5.4312744140625, -5.201416015625, -4.9715576171875, -4.74169921875, -4.5118408203125, -4.281982421875, -4.0521240234375, -3.822265625, -3.5924072265625, -3.362548828125, -3.1326904296875, -2.90283203125, -2.6729736328125, -2.443115234375, -2.2132568359375, -1.9833984375, -1.7535400390625, -1.523681640625, -1.2938232421875, -1.06396484375, -0.8341064453125, -0.604248046875, -0.3743896484375, -0.14453125, 0.0853271484375, 0.315185546875, 0.5450439453125, 0.77490234375, 1.0047607421875, 1.234619140625, 1.4644775390625, 1.6943359375, 1.9241943359375, 2.154052734375, 2.3839111328125, 2.61376953125, 2.8436279296875, 3.073486328125, 3.3033447265625, 3.533203125, 3.7630615234375, 3.992919921875, 4.2227783203125, 4.45263671875, 4.6824951171875, 4.912353515625, 5.1422119140625, 5.3720703125, 5.6019287109375, 5.831787109375, 6.0616455078125, 6.29150390625, 6.5213623046875, 6.751220703125, 6.9810791015625, 7.2109375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 16.0, 29.0, 31.0, 44.0, 93.0, 131.0, 181.0, 301.0, 467.0, 733.0, 1099.0, 1767.0, 2971.0, 4505.0, 7576.0, 12355.0, 20213.0, 33135.0, 54483.0, 86751.0, 129131.0, 164995.0, 165330.0, 130653.0, 88589.0, 55592.0, 34088.0, 20416.0, 12563.0, 7534.0, 4700.0, 2861.0, 1860.0, 1201.0, 784.0, 486.0, 314.0, 199.0, 122.0, 79.0, 54.0, 36.0, 28.0, 22.0, 11.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.09912109375, -6.8544921875, -6.60986328125, -6.365234375, -6.12060546875, -5.8759765625, -5.63134765625, -5.38671875, -5.14208984375, -4.8974609375, -4.65283203125, -4.408203125, -4.16357421875, -3.9189453125, -3.67431640625, -3.4296875, -3.18505859375, -2.9404296875, -2.69580078125, -2.451171875, -2.20654296875, -1.9619140625, -1.71728515625, -1.47265625, -1.22802734375, -0.9833984375, -0.73876953125, -0.494140625, -0.24951171875, -0.0048828125, 0.23974609375, 0.484375, 0.72900390625, 0.9736328125, 1.21826171875, 1.462890625, 1.70751953125, 1.9521484375, 2.19677734375, 2.44140625, 2.68603515625, 2.9306640625, 3.17529296875, 3.419921875, 3.66455078125, 3.9091796875, 4.15380859375, 4.3984375, 4.64306640625, 4.8876953125, 5.13232421875, 5.376953125, 5.62158203125, 5.8662109375, 6.11083984375, 6.35546875, 6.60009765625, 6.8447265625, 7.08935546875, 7.333984375, 7.57861328125, 7.8232421875, 8.06787109375, 8.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 11.0, 9.0, 10.0, 18.0, 16.0, 12.0, 14.0, 22.0, 15.0, 40.0, 25.0, 30.0, 39.0, 29.0, 40.0, 40.0, 31.0, 51.0, 37.0, 46.0, 34.0, 44.0, 31.0, 38.0, 34.0, 42.0, 42.0, 27.0, 20.0, 19.0, 21.0, 14.0, 22.0, 12.0, 14.0, 12.0, 4.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.5234375, -5.364501953125, -5.20556640625, -5.046630859375, -4.8876953125, -4.728759765625, -4.56982421875, -4.410888671875, -4.251953125, -4.093017578125, -3.93408203125, -3.775146484375, -3.6162109375, -3.457275390625, -3.29833984375, -3.139404296875, -2.98046875, -2.821533203125, -2.66259765625, -2.503662109375, -2.3447265625, -2.185791015625, -2.02685546875, -1.867919921875, -1.708984375, -1.550048828125, -1.39111328125, -1.232177734375, -1.0732421875, -0.914306640625, -0.75537109375, -0.596435546875, -0.4375, -0.278564453125, -0.11962890625, 0.039306640625, 0.1982421875, 0.357177734375, 0.51611328125, 0.675048828125, 0.833984375, 0.992919921875, 1.15185546875, 1.310791015625, 1.4697265625, 1.628662109375, 1.78759765625, 1.946533203125, 2.10546875, 2.264404296875, 2.42333984375, 2.582275390625, 2.7412109375, 2.900146484375, 3.05908203125, 3.218017578125, 3.376953125, 3.535888671875, 3.69482421875, 3.853759765625, 4.0126953125, 4.171630859375, 4.33056640625, 4.489501953125, 4.6484375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 15.0, 21.0, 31.0, 51.0, 61.0, 111.0, 196.0, 340.0, 579.0, 1015.0, 1817.0, 3556.0, 7044.0, 15436.0, 36364.0, 95533.0, 252421.0, 352696.0, 171342.0, 62852.0, 25042.0, 10882.0, 5229.0, 2600.0, 1399.0, 789.0, 411.0, 273.0, 149.0, 95.0, 62.0, 34.0, 35.0, 18.0, 16.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.15625, -11.675537109375, -11.19482421875, -10.714111328125, -10.2333984375, -9.752685546875, -9.27197265625, -8.791259765625, -8.310546875, -7.829833984375, -7.34912109375, -6.868408203125, -6.3876953125, -5.906982421875, -5.42626953125, -4.945556640625, -4.46484375, -3.984130859375, -3.50341796875, -3.022705078125, -2.5419921875, -2.061279296875, -1.58056640625, -1.099853515625, -0.619140625, -0.138427734375, 0.34228515625, 0.822998046875, 1.3037109375, 1.784423828125, 2.26513671875, 2.745849609375, 3.2265625, 3.707275390625, 4.18798828125, 4.668701171875, 5.1494140625, 5.630126953125, 6.11083984375, 6.591552734375, 7.072265625, 7.552978515625, 8.03369140625, 8.514404296875, 8.9951171875, 9.475830078125, 9.95654296875, 10.437255859375, 10.91796875, 11.398681640625, 11.87939453125, 12.360107421875, 12.8408203125, 13.321533203125, 13.80224609375, 14.282958984375, 14.763671875, 15.244384765625, 15.72509765625, 16.205810546875, 16.6865234375, 17.167236328125, 17.64794921875, 18.128662109375, 18.609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 13.0, 17.0, 22.0, 25.0, 39.0, 48.0, 40.0, 61.0, 61.0, 54.0, 74.0, 76.0, 54.0, 70.0, 56.0, 49.0, 42.0, 33.0, 24.0, 24.0, 27.0, 13.0, 13.0, 9.0, 5.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009326934814453125, -0.0009019076824188232, -0.000871121883392334, -0.0008403360843658447, -0.0008095502853393555, -0.0007787644863128662, -0.000747978687286377, -0.0007171928882598877, -0.0006864070892333984, -0.0006556212902069092, -0.0006248354911804199, -0.0005940496921539307, -0.0005632638931274414, -0.0005324780941009521, -0.0005016922950744629, -0.00047090649604797363, -0.0004401206970214844, -0.0004093348979949951, -0.00037854909896850586, -0.0003477632999420166, -0.00031697750091552734, -0.0002861917018890381, -0.00025540590286254883, -0.00022462010383605957, -0.0001938343048095703, -0.00016304850578308105, -0.0001322627067565918, -0.00010147690773010254, -7.069110870361328e-05, -3.9905309677124023e-05, -9.119510650634766e-06, 2.1666288375854492e-05, 5.245208740234375e-05, 8.323788642883301e-05, 0.00011402368545532227, 0.00014480948448181152, 0.00017559528350830078, 0.00020638108253479004, 0.0002371668815612793, 0.00026795268058776855, 0.0002987384796142578, 0.00032952427864074707, 0.00036031007766723633, 0.0003910958766937256, 0.00042188167572021484, 0.0004526674747467041, 0.00048345327377319336, 0.0005142390727996826, 0.0005450248718261719, 0.0005758106708526611, 0.0006065964698791504, 0.0006373822689056396, 0.0006681680679321289, 0.0006989538669586182, 0.0007297396659851074, 0.0007605254650115967, 0.0007913112640380859, 0.0008220970630645752, 0.0008528828620910645, 0.0008836686611175537, 0.000914454460144043, 0.0009452402591705322, 0.0009760260581970215, 0.0010068118572235107, 0.00103759765625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 8.0, 11.0, 19.0, 20.0, 39.0, 39.0, 57.0, 103.0, 152.0, 204.0, 320.0, 474.0, 722.0, 1127.0, 1929.0, 3197.0, 5557.0, 10464.0, 20900.0, 47019.0, 112148.0, 240573.0, 294303.0, 171584.0, 72722.0, 31572.0, 14733.0, 7651.0, 4219.0, 2520.0, 1466.0, 923.0, 604.0, 368.0, 233.0, 175.0, 134.0, 66.0, 45.0, 45.0, 28.0, 19.0, 17.0, 15.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.203125, -10.8201904296875, -10.437255859375, -10.0543212890625, -9.67138671875, -9.2884521484375, -8.905517578125, -8.5225830078125, -8.1396484375, -7.7567138671875, -7.373779296875, -6.9908447265625, -6.60791015625, -6.2249755859375, -5.842041015625, -5.4591064453125, -5.076171875, -4.6932373046875, -4.310302734375, -3.9273681640625, -3.54443359375, -3.1614990234375, -2.778564453125, -2.3956298828125, -2.0126953125, -1.6297607421875, -1.246826171875, -0.8638916015625, -0.48095703125, -0.0980224609375, 0.284912109375, 0.6678466796875, 1.05078125, 1.4337158203125, 1.816650390625, 2.1995849609375, 2.58251953125, 2.9654541015625, 3.348388671875, 3.7313232421875, 4.1142578125, 4.4971923828125, 4.880126953125, 5.2630615234375, 5.64599609375, 6.0289306640625, 6.411865234375, 6.7947998046875, 7.177734375, 7.5606689453125, 7.943603515625, 8.3265380859375, 8.70947265625, 9.0924072265625, 9.475341796875, 9.8582763671875, 10.2412109375, 10.6241455078125, 11.007080078125, 11.3900146484375, 11.77294921875, 12.1558837890625, 12.538818359375, 12.9217529296875, 13.3046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 8.0, 8.0, 10.0, 16.0, 13.0, 18.0, 23.0, 25.0, 35.0, 48.0, 50.0, 65.0, 79.0, 70.0, 72.0, 79.0, 58.0, 53.0, 57.0, 44.0, 31.0, 27.0, 21.0, 22.0, 10.0, 4.0, 7.0, 4.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.86712646484375, -2.7576904296875, -2.64825439453125, -2.538818359375, -2.42938232421875, -2.3199462890625, -2.21051025390625, -2.10107421875, -1.99163818359375, -1.8822021484375, -1.77276611328125, -1.663330078125, -1.55389404296875, -1.4444580078125, -1.33502197265625, -1.2255859375, -1.11614990234375, -1.0067138671875, -0.89727783203125, -0.787841796875, -0.67840576171875, -0.5689697265625, -0.45953369140625, -0.35009765625, -0.24066162109375, -0.1312255859375, -0.02178955078125, 0.087646484375, 0.19708251953125, 0.3065185546875, 0.41595458984375, 0.525390625, 0.63482666015625, 0.7442626953125, 0.85369873046875, 0.963134765625, 1.07257080078125, 1.1820068359375, 1.29144287109375, 1.40087890625, 1.51031494140625, 1.6197509765625, 1.72918701171875, 1.838623046875, 1.94805908203125, 2.0574951171875, 2.16693115234375, 2.2763671875, 2.38580322265625, 2.4952392578125, 2.60467529296875, 2.714111328125, 2.82354736328125, 2.9329833984375, 3.04241943359375, 3.15185546875, 3.26129150390625, 3.3707275390625, 3.48016357421875, 3.589599609375, 3.69903564453125, 3.8084716796875, 3.91790771484375, 4.02734375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 4.0, 10.0, 16.0, 17.0, 24.0, 22.0, 35.0, 36.0, 45.0, 43.0, 57.0, 48.0, 64.0, 69.0, 74.0, 72.0, 50.0, 57.0, 46.0, 31.0, 41.0, 32.0, 22.0, 16.0, 12.0, 12.0, 9.0, 8.0, 7.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.535650253295898, -11.200141906738281, -10.86463451385498, -10.529126167297363, -10.193618774414062, -9.858110427856445, -9.522603034973145, -9.187094688415527, -8.851587295532227, -8.51607894897461, -8.180571556091309, -7.84506368637085, -7.509555816650391, -7.174047946929932, -6.838540077209473, -6.5030317306518555, -6.1675238609313965, -5.8320159912109375, -5.4965081214904785, -5.1610002517700195, -4.8254923820495605, -4.489984512329102, -4.154476165771484, -3.8189685344696045, -3.4834606647491455, -3.1479527950286865, -2.8124449253082275, -2.4769368171691895, -2.1414289474487305, -1.805921196937561, -1.4704132080078125, -1.1349053382873535, -0.7993974685668945, -0.46388956904411316, -0.1283816695213318, 0.20712625980377197, 0.542634129524231, 0.8781419992446899, 1.2136499881744385, 1.5491578578948975, 1.8846657276153564, 2.2201735973358154, 2.5556814670562744, 2.8911895751953125, 3.2266974449157715, 3.5622053146362305, 3.8977131843566895, 4.233221054077148, 4.568728923797607, 4.904236793518066, 5.239744663238525, 5.575252532958984, 5.910760402679443, 6.246268272399902, 6.5817766189575195, 6.91728401184082, 7.2527923583984375, 7.5883002281188965, 7.9238080978393555, 8.259316444396973, 8.594823837280273, 8.93033218383789, 9.265839576721191, 9.601347923278809, 9.93685531616211]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 3.0, 3.0, 8.0, 5.0, 12.0, 2.0, 14.0, 20.0, 17.0, 28.0, 21.0, 21.0, 19.0, 31.0, 23.0, 31.0, 32.0, 30.0, 40.0, 38.0, 40.0, 45.0, 39.0, 30.0, 31.0, 28.0, 44.0, 28.0, 34.0, 29.0, 22.0, 33.0, 20.0, 26.0, 23.0, 12.0, 23.0, 20.0, 15.0, 15.0, 10.0, 3.0, 4.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.768545150756836, -6.531733989715576, -6.294923305511475, -6.058112144470215, -5.821300983428955, -5.5844902992248535, -5.347679138183594, -5.110868453979492, -4.874057292938232, -4.637246131896973, -4.400435447692871, -4.163624286651611, -3.9268133640289307, -3.69000244140625, -3.4531912803649902, -3.2163803577423096, -2.97956919670105, -2.742758274078369, -2.5059471130371094, -2.2691361904144287, -2.032325267791748, -1.7955142259597778, -1.5587031841278076, -1.321892261505127, -1.0850812196731567, -0.8482702374458313, -0.6114592552185059, -0.37464821338653564, -0.1378372311592102, 0.09897375106811523, 0.33578479290008545, 0.5725957155227661, 0.8094067573547363, 1.0462177991867065, 1.2830287218093872, 1.5198397636413574, 1.756650686264038, 1.9934617280960083, 2.2302727699279785, 2.467083692550659, 2.70389461517334, 2.9407055377960205, 3.1775166988372803, 3.414327621459961, 3.6511385440826416, 3.8879494667053223, 4.124760627746582, 4.361571311950684, 4.598382949829102, 4.835194110870361, 5.072004795074463, 5.308815956115723, 5.545627117156982, 5.782437801361084, 6.019248962402344, 6.256059646606445, 6.492870807647705, 6.729681968688965, 6.966492652893066, 7.203303813934326, 7.440114974975586, 7.6769256591796875, 7.913736820220947, 8.150547981262207, 8.387358665466309]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 10.0, 25.0, 28.0, 41.0, 63.0, 125.0, 167.0, 300.0, 477.0, 740.0, 1214.0, 1975.0, 3242.0, 5438.0, 9735.0, 17281.0, 32195.0, 62905.0, 129905.0, 285515.0, 625333.0, 1025214.0, 968491.0, 543012.0, 244651.0, 112989.0, 56356.0, 28958.0, 16003.0, 8908.0, 5040.0, 3095.0, 1769.0, 1110.0, 694.0, 453.0, 290.0, 190.0, 114.0, 81.0, 56.0, 35.0, 17.0, 11.0, 9.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.287109375, -8.02734375, -7.767578125, -7.5078125, -7.248046875, -6.98828125, -6.728515625, -6.46875, -6.208984375, -5.94921875, -5.689453125, -5.4296875, -5.169921875, -4.91015625, -4.650390625, -4.390625, -4.130859375, -3.87109375, -3.611328125, -3.3515625, -3.091796875, -2.83203125, -2.572265625, -2.3125, -2.052734375, -1.79296875, -1.533203125, -1.2734375, -1.013671875, -0.75390625, -0.494140625, -0.234375, 0.025390625, 0.28515625, 0.544921875, 0.8046875, 1.064453125, 1.32421875, 1.583984375, 1.84375, 2.103515625, 2.36328125, 2.623046875, 2.8828125, 3.142578125, 3.40234375, 3.662109375, 3.921875, 4.181640625, 4.44140625, 4.701171875, 4.9609375, 5.220703125, 5.48046875, 5.740234375, 6.0, 6.259765625, 6.51953125, 6.779296875, 7.0390625, 7.298828125, 7.55859375, 7.818359375, 8.078125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 5.0, 11.0, 12.0, 12.0, 21.0, 22.0, 21.0, 23.0, 28.0, 24.0, 26.0, 34.0, 33.0, 40.0, 42.0, 43.0, 47.0, 31.0, 38.0, 45.0, 42.0, 42.0, 37.0, 36.0, 31.0, 26.0, 29.0, 31.0, 27.0, 21.0, 19.0, 14.0, 16.0, 11.0, 8.0, 6.0, 11.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.96697998046875, -4.7894287109375, -4.61187744140625, -4.434326171875, -4.25677490234375, -4.0792236328125, -3.90167236328125, -3.72412109375, -3.54656982421875, -3.3690185546875, -3.19146728515625, -3.013916015625, -2.83636474609375, -2.6588134765625, -2.48126220703125, -2.3037109375, -2.12615966796875, -1.9486083984375, -1.77105712890625, -1.593505859375, -1.41595458984375, -1.2384033203125, -1.06085205078125, -0.88330078125, -0.70574951171875, -0.5281982421875, -0.35064697265625, -0.173095703125, 0.00445556640625, 0.1820068359375, 0.35955810546875, 0.537109375, 0.71466064453125, 0.8922119140625, 1.06976318359375, 1.247314453125, 1.42486572265625, 1.6024169921875, 1.77996826171875, 1.95751953125, 2.13507080078125, 2.3126220703125, 2.49017333984375, 2.667724609375, 2.84527587890625, 3.0228271484375, 3.20037841796875, 3.3779296875, 3.55548095703125, 3.7330322265625, 3.91058349609375, 4.088134765625, 4.26568603515625, 4.4432373046875, 4.62078857421875, 4.79833984375, 4.97589111328125, 5.1534423828125, 5.33099365234375, 5.508544921875, 5.68609619140625, 5.8636474609375, 6.04119873046875, 6.21875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 13.0, 15.0, 22.0, 32.0, 36.0, 57.0, 101.0, 138.0, 214.0, 352.0, 559.0, 900.0, 1434.0, 2507.0, 4256.0, 7291.0, 13014.0, 23805.0, 43815.0, 83548.0, 162141.0, 312386.0, 571998.0, 874189.0, 869497.0, 570787.0, 309428.0, 160487.0, 83159.0, 43590.0, 23455.0, 12987.0, 7303.0, 4222.0, 2558.0, 1469.0, 881.0, 570.0, 386.0, 211.0, 160.0, 96.0, 56.0, 44.0, 44.0, 23.0, 14.0, 12.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.578125, -7.34844970703125, -7.1187744140625, -6.88909912109375, -6.659423828125, -6.42974853515625, -6.2000732421875, -5.97039794921875, -5.74072265625, -5.51104736328125, -5.2813720703125, -5.05169677734375, -4.822021484375, -4.59234619140625, -4.3626708984375, -4.13299560546875, -3.9033203125, -3.67364501953125, -3.4439697265625, -3.21429443359375, -2.984619140625, -2.75494384765625, -2.5252685546875, -2.29559326171875, -2.06591796875, -1.83624267578125, -1.6065673828125, -1.37689208984375, -1.147216796875, -0.91754150390625, -0.6878662109375, -0.45819091796875, -0.228515625, 0.00115966796875, 0.2308349609375, 0.46051025390625, 0.690185546875, 0.91986083984375, 1.1495361328125, 1.37921142578125, 1.60888671875, 1.83856201171875, 2.0682373046875, 2.29791259765625, 2.527587890625, 2.75726318359375, 2.9869384765625, 3.21661376953125, 3.4462890625, 3.67596435546875, 3.9056396484375, 4.13531494140625, 4.364990234375, 4.59466552734375, 4.8243408203125, 5.05401611328125, 5.28369140625, 5.51336669921875, 5.7430419921875, 5.97271728515625, 6.202392578125, 6.43206787109375, 6.6617431640625, 6.89141845703125, 7.12109375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 10.0, 3.0, 11.0, 11.0, 17.0, 16.0, 28.0, 40.0, 39.0, 49.0, 58.0, 77.0, 99.0, 113.0, 138.0, 176.0, 178.0, 208.0, 245.0, 251.0, 256.0, 243.0, 267.0, 237.0, 221.0, 192.0, 149.0, 146.0, 114.0, 90.0, 86.0, 67.0, 50.0, 30.0, 37.0, 27.0, 24.0, 12.0, 17.0, 9.0, 10.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.222198486328125, -2.14556884765625, -2.068939208984375, -1.9923095703125, -1.915679931640625, -1.83905029296875, -1.762420654296875, -1.685791015625, -1.609161376953125, -1.53253173828125, -1.455902099609375, -1.3792724609375, -1.302642822265625, -1.22601318359375, -1.149383544921875, -1.07275390625, -0.996124267578125, -0.91949462890625, -0.842864990234375, -0.7662353515625, -0.689605712890625, -0.61297607421875, -0.536346435546875, -0.459716796875, -0.383087158203125, -0.30645751953125, -0.229827880859375, -0.1531982421875, -0.076568603515625, 6.103515625e-05, 0.076690673828125, 0.1533203125, 0.229949951171875, 0.30657958984375, 0.383209228515625, 0.4598388671875, 0.536468505859375, 0.61309814453125, 0.689727783203125, 0.766357421875, 0.842987060546875, 0.91961669921875, 0.996246337890625, 1.0728759765625, 1.149505615234375, 1.22613525390625, 1.302764892578125, 1.37939453125, 1.456024169921875, 1.53265380859375, 1.609283447265625, 1.6859130859375, 1.762542724609375, 1.83917236328125, 1.915802001953125, 1.992431640625, 2.069061279296875, 2.14569091796875, 2.222320556640625, 2.2989501953125, 2.375579833984375, 2.45220947265625, 2.528839111328125, 2.60546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 17.0, 21.0, 29.0, 23.0, 36.0, 37.0, 44.0, 55.0, 55.0, 70.0, 62.0, 65.0, 54.0, 66.0, 61.0, 48.0, 32.0, 33.0, 35.0, 18.0, 25.0, 15.0, 23.0, 8.0, 12.0, 4.0, 5.0, 7.0, 5.0, 2.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.380881309509277, -8.1304931640625, -7.880105495452881, -7.629717826843262, -7.379330158233643, -7.128942489624023, -6.878554344177246, -6.628166675567627, -6.377779006958008, -6.127391338348389, -5.877003192901611, -5.626615524291992, -5.376227855682373, -5.125840187072754, -4.875452041625977, -4.625064373016357, -4.37467622756958, -4.124288558959961, -3.8739006519317627, -3.6235127449035645, -3.3731250762939453, -3.122737169265747, -2.872349262237549, -2.6219615936279297, -2.3715736865997314, -2.121185779571533, -1.870798110961914, -1.6204102039337158, -1.3700224161148071, -1.1196346282958984, -0.8692467212677002, -0.6188589334487915, -0.368471622467041, -0.11808380484580994, 0.13230401277542114, 0.3826918601989746, 0.6330796480178833, 0.883467435836792, 1.1338553428649902, 1.384243130683899, 1.6346309185028076, 1.8850187063217163, 2.135406494140625, 2.3857944011688232, 2.6361823081970215, 2.8865699768066406, 3.136957883834839, 3.387345790863037, 3.6377334594726562, 3.8881213665008545, 4.138509273529053, 4.388896942138672, 4.639284610748291, 4.88967227935791, 5.1400604248046875, 5.390448093414307, 5.640835762023926, 5.891223430633545, 6.141611576080322, 6.391999244689941, 6.6423869132995605, 6.89277458190918, 7.143162727355957, 7.393550395965576, 7.6439385414123535]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 8.0, 3.0, 9.0, 12.0, 7.0, 12.0, 14.0, 20.0, 24.0, 31.0, 30.0, 29.0, 25.0, 21.0, 29.0, 36.0, 41.0, 35.0, 45.0, 35.0, 25.0, 33.0, 49.0, 34.0, 31.0, 36.0, 36.0, 23.0, 23.0, 33.0, 28.0, 23.0, 32.0, 22.0, 20.0, 15.0, 15.0, 7.0, 8.0, 8.0, 8.0, 2.0, 7.0, 1.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.365355014801025, -5.178637504577637, -4.99191951751709, -4.805201530456543, -4.618484020233154, -4.431766510009766, -4.245048522949219, -4.058330535888672, -3.871613025665283, -3.6848952770233154, -3.4981775283813477, -3.31145977973938, -3.124742031097412, -2.9380242824554443, -2.7513065338134766, -2.564588785171509, -2.377871036529541, -2.1911532878875732, -2.0044355392456055, -1.8177177906036377, -1.63100004196167, -1.4442822933197021, -1.2575645446777344, -1.0708467960357666, -0.8841290473937988, -0.697411298751831, -0.5106935501098633, -0.3239758014678955, -0.13725805282592773, 0.04945969581604004, 0.2361774444580078, 0.4228951930999756, 0.6096124649047852, 0.7963302135467529, 0.9830479621887207, 1.1697657108306885, 1.3564834594726562, 1.543201208114624, 1.7299189567565918, 1.9166367053985596, 2.1033544540405273, 2.290072202682495, 2.476789951324463, 2.6635076999664307, 2.8502254486083984, 3.036943197250366, 3.223660945892334, 3.4103786945343018, 3.5970964431762695, 3.7838141918182373, 3.970531940460205, 4.157249450683594, 4.343967437744141, 4.5306854248046875, 4.717402935028076, 4.904120445251465, 5.090838432312012, 5.277556419372559, 5.464273929595947, 5.650991439819336, 5.837709426879883, 6.02442741394043, 6.211144924163818, 6.397862434387207, 6.584580421447754]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 14.0, 11.0, 19.0, 27.0, 46.0, 85.0, 110.0, 144.0, 210.0, 340.0, 503.0, 711.0, 1077.0, 1590.0, 2314.0, 3439.0, 4952.0, 7198.0, 10986.0, 15869.0, 23954.0, 35254.0, 51168.0, 73986.0, 101835.0, 129538.0, 140483.0, 125238.0, 97098.0, 69661.0, 48319.0, 33202.0, 22352.0, 14985.0, 10102.0, 6992.0, 4694.0, 3210.0, 2181.0, 1457.0, 1038.0, 689.0, 493.0, 326.0, 214.0, 141.0, 109.0, 77.0, 42.0, 33.0, 13.0, 17.0, 8.0, 3.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.544921875, -1.4972686767578125, -1.449615478515625, -1.4019622802734375, -1.35430908203125, -1.3066558837890625, -1.259002685546875, -1.2113494873046875, -1.1636962890625, -1.1160430908203125, -1.068389892578125, -1.0207366943359375, -0.97308349609375, -0.9254302978515625, -0.877777099609375, -0.8301239013671875, -0.782470703125, -0.7348175048828125, -0.687164306640625, -0.6395111083984375, -0.59185791015625, -0.5442047119140625, -0.496551513671875, -0.4488983154296875, -0.4012451171875, -0.3535919189453125, -0.305938720703125, -0.2582855224609375, -0.21063232421875, -0.1629791259765625, -0.115325927734375, -0.0676727294921875, -0.02001953125, 0.0276336669921875, 0.075286865234375, 0.1229400634765625, 0.17059326171875, 0.2182464599609375, 0.265899658203125, 0.3135528564453125, 0.3612060546875, 0.4088592529296875, 0.456512451171875, 0.5041656494140625, 0.55181884765625, 0.5994720458984375, 0.647125244140625, 0.6947784423828125, 0.742431640625, 0.7900848388671875, 0.837738037109375, 0.8853912353515625, 0.93304443359375, 0.9806976318359375, 1.028350830078125, 1.0760040283203125, 1.1236572265625, 1.1713104248046875, 1.218963623046875, 1.2666168212890625, 1.31427001953125, 1.3619232177734375, 1.409576416015625, 1.4572296142578125, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 6.0, 3.0, 5.0, 11.0, 9.0, 11.0, 15.0, 15.0, 15.0, 24.0, 18.0, 28.0, 36.0, 18.0, 25.0, 30.0, 35.0, 42.0, 42.0, 38.0, 41.0, 29.0, 42.0, 33.0, 42.0, 32.0, 40.0, 28.0, 30.0, 41.0, 19.0, 32.0, 23.0, 27.0, 25.0, 10.0, 14.0, 12.0, 6.0, 12.0, 5.0, 8.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-6.73046875, -6.53253173828125, -6.3345947265625, -6.13665771484375, -5.938720703125, -5.74078369140625, -5.5428466796875, -5.34490966796875, -5.14697265625, -4.94903564453125, -4.7510986328125, -4.55316162109375, -4.355224609375, -4.15728759765625, -3.9593505859375, -3.76141357421875, -3.5634765625, -3.36553955078125, -3.1676025390625, -2.96966552734375, -2.771728515625, -2.57379150390625, -2.3758544921875, -2.17791748046875, -1.97998046875, -1.78204345703125, -1.5841064453125, -1.38616943359375, -1.188232421875, -0.99029541015625, -0.7923583984375, -0.59442138671875, -0.396484375, -0.19854736328125, -0.0006103515625, 0.19732666015625, 0.395263671875, 0.59320068359375, 0.7911376953125, 0.98907470703125, 1.18701171875, 1.38494873046875, 1.5828857421875, 1.78082275390625, 1.978759765625, 2.17669677734375, 2.3746337890625, 2.57257080078125, 2.7705078125, 2.96844482421875, 3.1663818359375, 3.36431884765625, 3.562255859375, 3.76019287109375, 3.9581298828125, 4.15606689453125, 4.35400390625, 4.55194091796875, 4.7498779296875, 4.94781494140625, 5.145751953125, 5.34368896484375, 5.5416259765625, 5.73956298828125, 5.9375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 6.0, 9.0, 17.0, 25.0, 35.0, 48.0, 69.0, 82.0, 139.0, 191.0, 272.0, 399.0, 602.0, 861.0, 1250.0, 1932.0, 3096.0, 5013.0, 8317.0, 15687.0, 35201.0, 765872.0, 153176.0, 24897.0, 12279.0, 6869.0, 4250.0, 2637.0, 1640.0, 1126.0, 804.0, 503.0, 359.0, 243.0, 180.0, 127.0, 83.0, 67.0, 49.0, 34.0, 29.0, 21.0, 14.0, 15.0, 6.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.58203125, -4.43798828125, -4.2939453125, -4.14990234375, -4.005859375, -3.86181640625, -3.7177734375, -3.57373046875, -3.4296875, -3.28564453125, -3.1416015625, -2.99755859375, -2.853515625, -2.70947265625, -2.5654296875, -2.42138671875, -2.27734375, -2.13330078125, -1.9892578125, -1.84521484375, -1.701171875, -1.55712890625, -1.4130859375, -1.26904296875, -1.125, -0.98095703125, -0.8369140625, -0.69287109375, -0.548828125, -0.40478515625, -0.2607421875, -0.11669921875, 0.02734375, 0.17138671875, 0.3154296875, 0.45947265625, 0.603515625, 0.74755859375, 0.8916015625, 1.03564453125, 1.1796875, 1.32373046875, 1.4677734375, 1.61181640625, 1.755859375, 1.89990234375, 2.0439453125, 2.18798828125, 2.33203125, 2.47607421875, 2.6201171875, 2.76416015625, 2.908203125, 3.05224609375, 3.1962890625, 3.34033203125, 3.484375, 3.62841796875, 3.7724609375, 3.91650390625, 4.060546875, 4.20458984375, 4.3486328125, 4.49267578125, 4.63671875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 19.0, 15.0, 19.0, 20.0, 25.0, 31.0, 28.0, 26.0, 38.0, 48.0, 43.0, 59.0, 47.0, 38.0, 39.0, 51.0, 50.0, 37.0, 44.0, 41.0, 30.0, 32.0, 22.0, 26.0, 20.0, 15.0, 20.0, 19.0, 15.0, 14.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.78515625, -4.6246337890625, -4.464111328125, -4.3035888671875, -4.14306640625, -3.9825439453125, -3.822021484375, -3.6614990234375, -3.5009765625, -3.3404541015625, -3.179931640625, -3.0194091796875, -2.85888671875, -2.6983642578125, -2.537841796875, -2.3773193359375, -2.216796875, -2.0562744140625, -1.895751953125, -1.7352294921875, -1.57470703125, -1.4141845703125, -1.253662109375, -1.0931396484375, -0.9326171875, -0.7720947265625, -0.611572265625, -0.4510498046875, -0.29052734375, -0.1300048828125, 0.030517578125, 0.1910400390625, 0.3515625, 0.5120849609375, 0.672607421875, 0.8331298828125, 0.99365234375, 1.1541748046875, 1.314697265625, 1.4752197265625, 1.6357421875, 1.7962646484375, 1.956787109375, 2.1173095703125, 2.27783203125, 2.4383544921875, 2.598876953125, 2.7593994140625, 2.919921875, 3.0804443359375, 3.240966796875, 3.4014892578125, 3.56201171875, 3.7225341796875, 3.883056640625, 4.0435791015625, 4.2041015625, 4.3646240234375, 4.525146484375, 4.6856689453125, 4.84619140625, 5.0067138671875, 5.167236328125, 5.3277587890625, 5.48828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 11.0, 15.0, 8.0, 21.0, 27.0, 62.0, 76.0, 114.0, 174.0, 310.0, 588.0, 1168.0, 2704.0, 7048.0, 25005.0, 931472.0, 60389.0, 11932.0, 3936.0, 1636.0, 785.0, 406.0, 253.0, 160.0, 74.0, 62.0, 41.0, 22.0, 14.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -4.08984375, -3.9609375, -3.83203125, -3.703125, -3.57421875, -3.4453125, -3.31640625, -3.1875, -3.05859375, -2.9296875, -2.80078125, -2.671875, -2.54296875, -2.4140625, -2.28515625, -2.15625, -2.02734375, -1.8984375, -1.76953125, -1.640625, -1.51171875, -1.3828125, -1.25390625, -1.125, -0.99609375, -0.8671875, -0.73828125, -0.609375, -0.48046875, -0.3515625, -0.22265625, -0.09375, 0.03515625, 0.1640625, 0.29296875, 0.421875, 0.55078125, 0.6796875, 0.80859375, 0.9375, 1.06640625, 1.1953125, 1.32421875, 1.453125, 1.58203125, 1.7109375, 1.83984375, 1.96875, 2.09765625, 2.2265625, 2.35546875, 2.484375, 2.61328125, 2.7421875, 2.87109375, 3.0, 3.12890625, 3.2578125, 3.38671875, 3.515625, 3.64453125, 3.7734375, 3.90234375, 4.03125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 10.0, 10.0, 8.0, 9.0, 20.0, 32.0, 40.0, 74.0, 112.0, 172.0, 173.0, 138.0, 77.0, 35.0, 29.0, 22.0, 9.0, 9.0, 11.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023674964904785156, -0.00022937916219234467, -0.00022200867533683777, -0.00021463818848133087, -0.00020726770162582397, -0.00019989721477031708, -0.00019252672791481018, -0.00018515624105930328, -0.0001777857542037964, -0.0001704152673482895, -0.0001630447804927826, -0.0001556742936372757, -0.0001483038067817688, -0.0001409333199262619, -0.000133562833070755, -0.0001261923462152481, -0.00011882185935974121, -0.00011145137250423431, -0.00010408088564872742, -9.671039879322052e-05, -8.933991193771362e-05, -8.196942508220673e-05, -7.459893822669983e-05, -6.722845137119293e-05, -5.9857964515686035e-05, -5.248747766017914e-05, -4.511699080467224e-05, -3.7746503949165344e-05, -3.0376017093658447e-05, -2.300553023815155e-05, -1.5635043382644653e-05, -8.264556527137756e-06, -8.940696716308594e-07, 6.476417183876038e-06, 1.3846904039382935e-05, 2.121739089488983e-05, 2.858787775039673e-05, 3.5958364605903625e-05, 4.332885146141052e-05, 5.069933831691742e-05, 5.8069825172424316e-05, 6.544031202793121e-05, 7.281079888343811e-05, 8.018128573894501e-05, 8.75517725944519e-05, 9.49222594499588e-05, 0.0001022927463054657, 0.0001096632331609726, 0.00011703372001647949, 0.0001244042068719864, 0.00013177469372749329, 0.00013914518058300018, 0.00014651566743850708, 0.00015388615429401398, 0.00016125664114952087, 0.00016862712800502777, 0.00017599761486053467, 0.00018336810171604156, 0.00019073858857154846, 0.00019810907542705536, 0.00020547956228256226, 0.00021285004913806915, 0.00022022053599357605, 0.00022759102284908295, 0.00023496150970458984]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 12.0, 14.0, 17.0, 24.0, 30.0, 54.0, 65.0, 108.0, 133.0, 219.0, 339.0, 540.0, 829.0, 1331.0, 2208.0, 3806.0, 7065.0, 12750.0, 25351.0, 51186.0, 107401.0, 227993.0, 293119.0, 161636.0, 75274.0, 36513.0, 18158.0, 9543.0, 5120.0, 2913.0, 1724.0, 1097.0, 650.0, 427.0, 291.0, 177.0, 139.0, 80.0, 62.0, 44.0, 31.0, 17.0, 17.0, 8.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9013671875, -0.87158203125, -0.841796875, -0.81201171875, -0.7822265625, -0.75244140625, -0.72265625, -0.69287109375, -0.6630859375, -0.63330078125, -0.603515625, -0.57373046875, -0.5439453125, -0.51416015625, -0.484375, -0.45458984375, -0.4248046875, -0.39501953125, -0.365234375, -0.33544921875, -0.3056640625, -0.27587890625, -0.24609375, -0.21630859375, -0.1865234375, -0.15673828125, -0.126953125, -0.09716796875, -0.0673828125, -0.03759765625, -0.0078125, 0.02197265625, 0.0517578125, 0.08154296875, 0.111328125, 0.14111328125, 0.1708984375, 0.20068359375, 0.23046875, 0.26025390625, 0.2900390625, 0.31982421875, 0.349609375, 0.37939453125, 0.4091796875, 0.43896484375, 0.46875, 0.49853515625, 0.5283203125, 0.55810546875, 0.587890625, 0.61767578125, 0.6474609375, 0.67724609375, 0.70703125, 0.73681640625, 0.7666015625, 0.79638671875, 0.826171875, 0.85595703125, 0.8857421875, 0.91552734375, 0.9453125, 0.97509765625, 1.0048828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 3.0, 2.0, 9.0, 5.0, 12.0, 15.0, 20.0, 24.0, 14.0, 28.0, 48.0, 87.0, 122.0, 117.0, 114.0, 93.0, 69.0, 38.0, 36.0, 27.0, 24.0, 19.0, 19.0, 8.0, 4.0, 10.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.4370536804199219, -0.42342376708984375, -0.4097938537597656, -0.3961639404296875, -0.3825340270996094, -0.36890411376953125, -0.3552742004394531, -0.341644287109375, -0.3280143737792969, -0.31438446044921875, -0.3007545471191406, -0.2871246337890625, -0.2734947204589844, -0.25986480712890625, -0.24623489379882812, -0.23260498046875, -0.21897506713867188, -0.20534515380859375, -0.19171524047851562, -0.1780853271484375, -0.16445541381835938, -0.15082550048828125, -0.13719558715820312, -0.123565673828125, -0.10993576049804688, -0.09630584716796875, -0.08267593383789062, -0.0690460205078125, -0.055416107177734375, -0.04178619384765625, -0.028156280517578125, -0.0145263671875, -0.000896453857421875, 0.01273345947265625, 0.026363372802734375, 0.0399932861328125, 0.053623199462890625, 0.06725311279296875, 0.08088302612304688, 0.094512939453125, 0.10814285278320312, 0.12177276611328125, 0.13540267944335938, 0.1490325927734375, 0.16266250610351562, 0.17629241943359375, 0.18992233276367188, 0.20355224609375, 0.21718215942382812, 0.23081207275390625, 0.24444198608398438, 0.2580718994140625, 0.2717018127441406, 0.28533172607421875, 0.2989616394042969, 0.312591552734375, 0.3262214660644531, 0.33985137939453125, 0.3534812927246094, 0.3671112060546875, 0.3807411193847656, 0.39437103271484375, 0.4080009460449219, 0.421630859375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 12.0, 7.0, 16.0, 23.0, 23.0, 23.0, 37.0, 44.0, 40.0, 51.0, 69.0, 70.0, 65.0, 52.0, 73.0, 71.0, 48.0, 39.0, 50.0, 33.0, 24.0, 23.0, 25.0, 14.0, 18.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.509370803833008, -8.254297256469727, -7.9992241859436035, -7.7441511154174805, -7.489077568054199, -7.234004020690918, -6.978930950164795, -6.723857879638672, -6.468784332275391, -6.213710784912109, -5.958637714385986, -5.703564643859863, -5.448491096496582, -5.193417549133301, -4.938344478607178, -4.683271408081055, -4.428197860717773, -4.173124313354492, -3.918051242828369, -3.662977933883667, -3.407904624938965, -3.1528313159942627, -2.8977580070495605, -2.6426846981048584, -2.3876113891601562, -2.132538080215454, -1.877464771270752, -1.6223914623260498, -1.3673181533813477, -1.1122448444366455, -0.8571715354919434, -0.6020982265472412, -0.34702539443969727, -0.09195208549499512, 0.16312122344970703, 0.4181945323944092, 0.6732678413391113, 0.9283411502838135, 1.1834144592285156, 1.4384877681732178, 1.69356107711792, 1.948634386062622, 2.203707695007324, 2.4587810039520264, 2.7138543128967285, 2.9689276218414307, 3.224000930786133, 3.479074239730835, 3.734147548675537, 3.9892208576202393, 4.244294166564941, 4.499367713928223, 4.754440784454346, 5.009513854980469, 5.26458740234375, 5.519660949707031, 5.774734020233154, 6.029807090759277, 6.284880638122559, 6.53995418548584, 6.795027256011963, 7.050100326538086, 7.305173873901367, 7.560247421264648, 7.8153204917907715]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 11.0, 7.0, 12.0, 12.0, 19.0, 20.0, 19.0, 31.0, 36.0, 30.0, 22.0, 31.0, 24.0, 35.0, 45.0, 33.0, 41.0, 27.0, 34.0, 36.0, 44.0, 37.0, 33.0, 35.0, 28.0, 22.0, 32.0, 24.0, 30.0, 22.0, 33.0, 23.0, 13.0, 14.0, 13.0, 13.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4951276779174805, -5.30919075012207, -5.12325382232666, -4.937317371368408, -4.751380443572998, -4.565443515777588, -4.379507064819336, -4.193570137023926, -4.007633209228516, -3.8216962814331055, -3.6357595920562744, -3.4498229026794434, -3.263885974884033, -3.077949047088623, -2.892012357711792, -2.706075668334961, -2.520138740539551, -2.3342018127441406, -2.1482651233673096, -1.962328314781189, -1.7763915061950684, -1.5904546976089478, -1.4045178890228271, -1.2185810804367065, -1.032644271850586, -0.8467074632644653, -0.6607706546783447, -0.4748338460922241, -0.2888970375061035, -0.10296022891998291, 0.0829765796661377, 0.2689133882522583, 0.4548501968383789, 0.6407870054244995, 0.8267238140106201, 1.0126606225967407, 1.1985974311828613, 1.384534239768982, 1.5704710483551025, 1.7564078569412231, 1.9423446655273438, 2.128281593322754, 2.314218282699585, 2.500154972076416, 2.686091899871826, 2.8720288276672363, 3.0579655170440674, 3.2439022064208984, 3.4298391342163086, 3.6157760620117188, 3.80171275138855, 3.987649440765381, 4.173586368560791, 4.359523296356201, 4.545459747314453, 4.731396675109863, 4.917333602905273, 5.103270530700684, 5.289207458496094, 5.475143909454346, 5.661080837249756, 5.847017765045166, 6.032954216003418, 6.218891143798828, 6.404828071594238]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 13.0, 24.0, 44.0, 60.0, 85.0, 119.0, 188.0, 322.0, 469.0, 700.0, 1119.0, 1629.0, 2519.0, 3892.0, 6008.0, 9174.0, 14387.0, 21525.0, 33738.0, 50584.0, 73863.0, 102846.0, 128921.0, 140405.0, 129692.0, 103801.0, 75046.0, 50935.0, 33432.0, 22168.0, 14127.0, 9381.0, 6009.0, 3926.0, 2508.0, 1682.0, 1074.0, 714.0, 478.0, 329.0, 206.0, 133.0, 90.0, 56.0, 42.0, 39.0, 20.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.59765625, -5.42547607421875, -5.2532958984375, -5.08111572265625, -4.908935546875, -4.73675537109375, -4.5645751953125, -4.39239501953125, -4.22021484375, -4.04803466796875, -3.8758544921875, -3.70367431640625, -3.531494140625, -3.35931396484375, -3.1871337890625, -3.01495361328125, -2.8427734375, -2.67059326171875, -2.4984130859375, -2.32623291015625, -2.154052734375, -1.98187255859375, -1.8096923828125, -1.63751220703125, -1.46533203125, -1.29315185546875, -1.1209716796875, -0.94879150390625, -0.776611328125, -0.60443115234375, -0.4322509765625, -0.26007080078125, -0.087890625, 0.08428955078125, 0.2564697265625, 0.42864990234375, 0.600830078125, 0.77301025390625, 0.9451904296875, 1.11737060546875, 1.28955078125, 1.46173095703125, 1.6339111328125, 1.80609130859375, 1.978271484375, 2.15045166015625, 2.3226318359375, 2.49481201171875, 2.6669921875, 2.83917236328125, 3.0113525390625, 3.18353271484375, 3.355712890625, 3.52789306640625, 3.7000732421875, 3.87225341796875, 4.04443359375, 4.21661376953125, 4.3887939453125, 4.56097412109375, 4.733154296875, 4.90533447265625, 5.0775146484375, 5.24969482421875, 5.421875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 3.0, 4.0, 5.0, 3.0, 7.0, 10.0, 13.0, 15.0, 11.0, 23.0, 29.0, 30.0, 29.0, 31.0, 31.0, 42.0, 46.0, 30.0, 37.0, 34.0, 38.0, 37.0, 36.0, 44.0, 37.0, 32.0, 34.0, 40.0, 34.0, 25.0, 30.0, 23.0, 26.0, 20.0, 22.0, 13.0, 17.0, 14.0, 7.0, 8.0, 9.0, 10.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.54296875, -5.3514404296875, -5.159912109375, -4.9683837890625, -4.77685546875, -4.5853271484375, -4.393798828125, -4.2022705078125, -4.0107421875, -3.8192138671875, -3.627685546875, -3.4361572265625, -3.24462890625, -3.0531005859375, -2.861572265625, -2.6700439453125, -2.478515625, -2.2869873046875, -2.095458984375, -1.9039306640625, -1.71240234375, -1.5208740234375, -1.329345703125, -1.1378173828125, -0.9462890625, -0.7547607421875, -0.563232421875, -0.3717041015625, -0.18017578125, 0.0113525390625, 0.202880859375, 0.3944091796875, 0.5859375, 0.7774658203125, 0.968994140625, 1.1605224609375, 1.35205078125, 1.5435791015625, 1.735107421875, 1.9266357421875, 2.1181640625, 2.3096923828125, 2.501220703125, 2.6927490234375, 2.88427734375, 3.0758056640625, 3.267333984375, 3.4588623046875, 3.650390625, 3.8419189453125, 4.033447265625, 4.2249755859375, 4.41650390625, 4.6080322265625, 4.799560546875, 4.9910888671875, 5.1826171875, 5.3741455078125, 5.565673828125, 5.7572021484375, 5.94873046875, 6.1402587890625, 6.331787109375, 6.5233154296875, 6.71484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 7.0, 17.0, 25.0, 26.0, 34.0, 68.0, 105.0, 172.0, 255.0, 427.0, 624.0, 1132.0, 1788.0, 2973.0, 4975.0, 8443.0, 13931.0, 23366.0, 38992.0, 64316.0, 100796.0, 143055.0, 168044.0, 157433.0, 118563.0, 78172.0, 48370.0, 29356.0, 17351.0, 10194.0, 6058.0, 3618.0, 2238.0, 1321.0, 879.0, 521.0, 329.0, 225.0, 116.0, 84.0, 45.0, 49.0, 21.0, 11.0, 5.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.3681640625, -5.193359375, -5.0185546875, -4.84375, -4.6689453125, -4.494140625, -4.3193359375, -4.14453125, -3.9697265625, -3.794921875, -3.6201171875, -3.4453125, -3.2705078125, -3.095703125, -2.9208984375, -2.74609375, -2.5712890625, -2.396484375, -2.2216796875, -2.046875, -1.8720703125, -1.697265625, -1.5224609375, -1.34765625, -1.1728515625, -0.998046875, -0.8232421875, -0.6484375, -0.4736328125, -0.298828125, -0.1240234375, 0.05078125, 0.2255859375, 0.400390625, 0.5751953125, 0.75, 0.9248046875, 1.099609375, 1.2744140625, 1.44921875, 1.6240234375, 1.798828125, 1.9736328125, 2.1484375, 2.3232421875, 2.498046875, 2.6728515625, 2.84765625, 3.0224609375, 3.197265625, 3.3720703125, 3.546875, 3.7216796875, 3.896484375, 4.0712890625, 4.24609375, 4.4208984375, 4.595703125, 4.7705078125, 4.9453125, 5.1201171875, 5.294921875, 5.4697265625, 5.64453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 4.0, 9.0, 16.0, 19.0, 19.0, 14.0, 16.0, 28.0, 37.0, 28.0, 37.0, 37.0, 44.0, 43.0, 45.0, 39.0, 36.0, 45.0, 34.0, 40.0, 44.0, 41.0, 37.0, 39.0, 34.0, 32.0, 22.0, 25.0, 28.0, 15.0, 14.0, 14.0, 11.0, 10.0, 10.0, 8.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5794677734375, -4.440185546875, -4.3009033203125, -4.16162109375, -4.0223388671875, -3.883056640625, -3.7437744140625, -3.6044921875, -3.4652099609375, -3.325927734375, -3.1866455078125, -3.04736328125, -2.9080810546875, -2.768798828125, -2.6295166015625, -2.490234375, -2.3509521484375, -2.211669921875, -2.0723876953125, -1.93310546875, -1.7938232421875, -1.654541015625, -1.5152587890625, -1.3759765625, -1.2366943359375, -1.097412109375, -0.9581298828125, -0.81884765625, -0.6795654296875, -0.540283203125, -0.4010009765625, -0.26171875, -0.1224365234375, 0.016845703125, 0.1561279296875, 0.29541015625, 0.4346923828125, 0.573974609375, 0.7132568359375, 0.8525390625, 0.9918212890625, 1.131103515625, 1.2703857421875, 1.40966796875, 1.5489501953125, 1.688232421875, 1.8275146484375, 1.966796875, 2.1060791015625, 2.245361328125, 2.3846435546875, 2.52392578125, 2.6632080078125, 2.802490234375, 2.9417724609375, 3.0810546875, 3.2203369140625, 3.359619140625, 3.4989013671875, 3.63818359375, 3.7774658203125, 3.916748046875, 4.0560302734375, 4.1953125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 15.0, 15.0, 23.0, 41.0, 55.0, 96.0, 155.0, 226.0, 309.0, 524.0, 925.0, 1578.0, 2840.0, 5515.0, 11137.0, 24638.0, 55484.0, 129480.0, 256659.0, 279352.0, 155041.0, 67460.0, 29344.0, 13382.0, 6448.0, 3367.0, 1790.0, 1029.0, 596.0, 360.0, 234.0, 136.0, 99.0, 63.0, 47.0, 27.0, 18.0, 6.0, 7.0, 10.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.45892333984375, -5.2498779296875, -5.04083251953125, -4.831787109375, -4.62274169921875, -4.4136962890625, -4.20465087890625, -3.99560546875, -3.78656005859375, -3.5775146484375, -3.36846923828125, -3.159423828125, -2.95037841796875, -2.7413330078125, -2.53228759765625, -2.3232421875, -2.11419677734375, -1.9051513671875, -1.69610595703125, -1.487060546875, -1.27801513671875, -1.0689697265625, -0.85992431640625, -0.65087890625, -0.44183349609375, -0.2327880859375, -0.02374267578125, 0.185302734375, 0.39434814453125, 0.6033935546875, 0.81243896484375, 1.021484375, 1.23052978515625, 1.4395751953125, 1.64862060546875, 1.857666015625, 2.06671142578125, 2.2757568359375, 2.48480224609375, 2.69384765625, 2.90289306640625, 3.1119384765625, 3.32098388671875, 3.530029296875, 3.73907470703125, 3.9481201171875, 4.15716552734375, 4.3662109375, 4.57525634765625, 4.7843017578125, 4.99334716796875, 5.202392578125, 5.41143798828125, 5.6204833984375, 5.82952880859375, 6.03857421875, 6.24761962890625, 6.4566650390625, 6.66571044921875, 6.874755859375, 7.08380126953125, 7.2928466796875, 7.50189208984375, 7.7109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 5.0, 8.0, 3.0, 21.0, 14.0, 10.0, 27.0, 33.0, 33.0, 31.0, 44.0, 56.0, 64.0, 60.0, 68.0, 70.0, 66.0, 55.0, 62.0, 44.0, 44.0, 35.0, 33.0, 22.0, 17.0, 19.0, 10.0, 10.0, 8.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041675567626953125, -0.0004015490412712097, -0.0003863424062728882, -0.00037113577127456665, -0.0003559291362762451, -0.0003407225012779236, -0.00032551586627960205, -0.0003103092312812805, -0.000295102596282959, -0.00027989596128463745, -0.0002646893262863159, -0.0002494826912879944, -0.00023427605628967285, -0.00021906942129135132, -0.00020386278629302979, -0.00018865615129470825, -0.00017344951629638672, -0.00015824288129806519, -0.00014303624629974365, -0.00012782961130142212, -0.00011262297630310059, -9.741634130477905e-05, -8.220970630645752e-05, -6.700307130813599e-05, -5.179643630981445e-05, -3.658980131149292e-05, -2.1383166313171387e-05, -6.1765313148498535e-06, 9.03010368347168e-06, 2.4236738681793213e-05, 3.9443373680114746e-05, 5.465000867843628e-05, 6.985664367675781e-05, 8.506327867507935e-05, 0.00010026991367340088, 0.00011547654867172241, 0.00013068318367004395, 0.00014588981866836548, 0.000161096453666687, 0.00017630308866500854, 0.00019150972366333008, 0.0002067163586616516, 0.00022192299365997314, 0.00023712962865829468, 0.0002523362636566162, 0.00026754289865493774, 0.0002827495336532593, 0.0002979561686515808, 0.00031316280364990234, 0.0003283694386482239, 0.0003435760736465454, 0.00035878270864486694, 0.0003739893436431885, 0.00038919597864151, 0.00040440261363983154, 0.0004196092486381531, 0.0004348158836364746, 0.00045002251863479614, 0.0004652291536331177, 0.0004804357886314392, 0.0004956424236297607, 0.0005108490586280823, 0.0005260556936264038, 0.0005412623286247253, 0.0005564689636230469]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 5.0, 8.0, 5.0, 8.0, 20.0, 22.0, 28.0, 41.0, 79.0, 103.0, 149.0, 213.0, 312.0, 502.0, 708.0, 1220.0, 1899.0, 3073.0, 5131.0, 8952.0, 16131.0, 29022.0, 54822.0, 104114.0, 179691.0, 226630.0, 182494.0, 107502.0, 56600.0, 29833.0, 16107.0, 9292.0, 5182.0, 3165.0, 1922.0, 1251.0, 803.0, 500.0, 317.0, 188.0, 158.0, 132.0, 81.0, 39.0, 44.0, 13.0, 14.0, 10.0, 8.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.421875, -5.2601318359375, -5.098388671875, -4.9366455078125, -4.77490234375, -4.6131591796875, -4.451416015625, -4.2896728515625, -4.1279296875, -3.9661865234375, -3.804443359375, -3.6427001953125, -3.48095703125, -3.3192138671875, -3.157470703125, -2.9957275390625, -2.833984375, -2.6722412109375, -2.510498046875, -2.3487548828125, -2.18701171875, -2.0252685546875, -1.863525390625, -1.7017822265625, -1.5400390625, -1.3782958984375, -1.216552734375, -1.0548095703125, -0.89306640625, -0.7313232421875, -0.569580078125, -0.4078369140625, -0.24609375, -0.0843505859375, 0.077392578125, 0.2391357421875, 0.40087890625, 0.5626220703125, 0.724365234375, 0.8861083984375, 1.0478515625, 1.2095947265625, 1.371337890625, 1.5330810546875, 1.69482421875, 1.8565673828125, 2.018310546875, 2.1800537109375, 2.341796875, 2.5035400390625, 2.665283203125, 2.8270263671875, 2.98876953125, 3.1505126953125, 3.312255859375, 3.4739990234375, 3.6357421875, 3.7974853515625, 3.959228515625, 4.1209716796875, 4.28271484375, 4.4444580078125, 4.606201171875, 4.7679443359375, 4.9296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 14.0, 9.0, 15.0, 15.0, 19.0, 17.0, 28.0, 34.0, 33.0, 34.0, 64.0, 73.0, 79.0, 67.0, 63.0, 72.0, 77.0, 57.0, 41.0, 27.0, 21.0, 29.0, 16.0, 18.0, 11.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.38543701171875, -2.3021240234375, -2.21881103515625, -2.135498046875, -2.05218505859375, -1.9688720703125, -1.88555908203125, -1.80224609375, -1.71893310546875, -1.6356201171875, -1.55230712890625, -1.468994140625, -1.38568115234375, -1.3023681640625, -1.21905517578125, -1.1357421875, -1.05242919921875, -0.9691162109375, -0.88580322265625, -0.802490234375, -0.71917724609375, -0.6358642578125, -0.55255126953125, -0.46923828125, -0.38592529296875, -0.3026123046875, -0.21929931640625, -0.135986328125, -0.05267333984375, 0.0306396484375, 0.11395263671875, 0.197265625, 0.28057861328125, 0.3638916015625, 0.44720458984375, 0.530517578125, 0.61383056640625, 0.6971435546875, 0.78045654296875, 0.86376953125, 0.94708251953125, 1.0303955078125, 1.11370849609375, 1.197021484375, 1.28033447265625, 1.3636474609375, 1.44696044921875, 1.5302734375, 1.61358642578125, 1.6968994140625, 1.78021240234375, 1.863525390625, 1.94683837890625, 2.0301513671875, 2.11346435546875, 2.19677734375, 2.28009033203125, 2.3634033203125, 2.44671630859375, 2.530029296875, 2.61334228515625, 2.6966552734375, 2.77996826171875, 2.86328125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 13.0, 10.0, 6.0, 14.0, 10.0, 19.0, 17.0, 32.0, 35.0, 35.0, 48.0, 60.0, 46.0, 74.0, 56.0, 57.0, 66.0, 58.0, 58.0, 53.0, 37.0, 36.0, 32.0, 28.0, 15.0, 21.0, 10.0, 12.0, 12.0, 0.0, 6.0, 10.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.575044631958008, -7.339587211608887, -7.104129791259766, -6.8686723709106445, -6.633214950561523, -6.397757530212402, -6.162300109863281, -5.92684268951416, -5.691385269165039, -5.455927848815918, -5.220470428466797, -4.985013008117676, -4.749555587768555, -4.514098167419434, -4.2786407470703125, -4.043183326721191, -3.8077259063720703, -3.572268486022949, -3.336811065673828, -3.101353645324707, -2.865896224975586, -2.630438804626465, -2.3949813842773438, -2.1595239639282227, -1.9240665435791016, -1.6886091232299805, -1.4531517028808594, -1.2176942825317383, -0.9822368621826172, -0.7467794418334961, -0.511322021484375, -0.2758646011352539, -0.040407657623291016, 0.19504976272583008, 0.43050718307495117, 0.6659646034240723, 0.9014220237731934, 1.1368794441223145, 1.3723368644714355, 1.6077942848205566, 1.8432517051696777, 2.078709125518799, 2.31416654586792, 2.549623966217041, 2.785081386566162, 3.020538806915283, 3.2559962272644043, 3.4914536476135254, 3.7269110679626465, 3.9623684883117676, 4.197825908660889, 4.43328332901001, 4.668740749359131, 4.904198169708252, 5.139655590057373, 5.375113010406494, 5.610570430755615, 5.846027851104736, 6.081485271453857, 6.3169426918029785, 6.5524001121521, 6.787857532501221, 7.023314952850342, 7.258772373199463, 7.494229793548584]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 7.0, 11.0, 8.0, 11.0, 7.0, 15.0, 14.0, 17.0, 17.0, 18.0, 18.0, 30.0, 24.0, 31.0, 29.0, 33.0, 35.0, 38.0, 45.0, 52.0, 45.0, 38.0, 38.0, 33.0, 33.0, 46.0, 29.0, 40.0, 21.0, 42.0, 24.0, 24.0, 21.0, 16.0, 18.0, 9.0, 10.0, 14.0, 7.0, 9.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.377585411071777, -6.171494960784912, -5.965404033660889, -5.759313583374023, -5.55322265625, -5.347132205963135, -5.141041278839111, -4.934950828552246, -4.728859901428223, -4.522769451141357, -4.316678524017334, -4.110588073730469, -3.9044971466064453, -3.69840669631958, -3.4923157691955566, -3.2862253189086914, -3.080134630203247, -2.8740439414978027, -2.6679532527923584, -2.461862564086914, -2.2557718753814697, -2.0496811866760254, -1.8435906171798706, -1.6374999284744263, -1.431409239768982, -1.2253185510635376, -1.0192278623580933, -0.8131372332572937, -0.6070465445518494, -0.4009559154510498, -0.19486522674560547, 0.011225461959838867, 0.2173161506652832, 0.42340683937072754, 0.6294975280761719, 0.8355881571769714, 1.0416789054870605, 1.2477694749832153, 1.4538601636886597, 1.659950852394104, 1.8660415410995483, 2.072132110595703, 2.2782227993011475, 2.484313488006592, 2.690404176712036, 2.8964948654174805, 3.102585554122925, 3.308676242828369, 3.5147669315338135, 3.720857620239258, 3.926948308944702, 4.1330389976501465, 4.339129447937012, 4.545220375061035, 4.7513108253479, 4.957401752471924, 5.163492202758789, 5.369582653045654, 5.575673580169678, 5.781764030456543, 5.987854957580566, 6.193945407867432, 6.400036334991455, 6.60612678527832, 6.812217712402344]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 6.0, 10.0, 12.0, 23.0, 31.0, 45.0, 64.0, 99.0, 172.0, 263.0, 432.0, 763.0, 1329.0, 2203.0, 4114.0, 7551.0, 14057.0, 26835.0, 54393.0, 113600.0, 250912.0, 555324.0, 981052.0, 1027157.0, 617578.0, 282626.0, 127582.0, 60110.0, 30364.0, 15479.0, 8584.0, 4680.0, 2646.0, 1643.0, 1032.0, 568.0, 341.0, 219.0, 124.0, 95.0, 54.0, 34.0, 23.0, 15.0, 14.0, 10.0, 11.0, 6.0, 2.0, 3.0], "bins": [-7.55859375, -7.354736328125, -7.15087890625, -6.947021484375, -6.7431640625, -6.539306640625, -6.33544921875, -6.131591796875, -5.927734375, -5.723876953125, -5.52001953125, -5.316162109375, -5.1123046875, -4.908447265625, -4.70458984375, -4.500732421875, -4.296875, -4.093017578125, -3.88916015625, -3.685302734375, -3.4814453125, -3.277587890625, -3.07373046875, -2.869873046875, -2.666015625, -2.462158203125, -2.25830078125, -2.054443359375, -1.8505859375, -1.646728515625, -1.44287109375, -1.239013671875, -1.03515625, -0.831298828125, -0.62744140625, -0.423583984375, -0.2197265625, -0.015869140625, 0.18798828125, 0.391845703125, 0.595703125, 0.799560546875, 1.00341796875, 1.207275390625, 1.4111328125, 1.614990234375, 1.81884765625, 2.022705078125, 2.2265625, 2.430419921875, 2.63427734375, 2.838134765625, 3.0419921875, 3.245849609375, 3.44970703125, 3.653564453125, 3.857421875, 4.061279296875, 4.26513671875, 4.468994140625, 4.6728515625, 4.876708984375, 5.08056640625, 5.284423828125, 5.48828125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 1.0, 3.0, 8.0, 5.0, 10.0, 10.0, 14.0, 15.0, 7.0, 18.0, 16.0, 14.0, 36.0, 31.0, 29.0, 24.0, 28.0, 46.0, 31.0, 38.0, 39.0, 48.0, 57.0, 44.0, 42.0, 32.0, 45.0, 33.0, 28.0, 30.0, 32.0, 31.0, 23.0, 27.0, 19.0, 13.0, 10.0, 11.0, 10.0, 8.0, 12.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.9171142578125, -3.779541015625, -3.6419677734375, -3.50439453125, -3.3668212890625, -3.229248046875, -3.0916748046875, -2.9541015625, -2.8165283203125, -2.678955078125, -2.5413818359375, -2.40380859375, -2.2662353515625, -2.128662109375, -1.9910888671875, -1.853515625, -1.7159423828125, -1.578369140625, -1.4407958984375, -1.30322265625, -1.1656494140625, -1.028076171875, -0.8905029296875, -0.7529296875, -0.6153564453125, -0.477783203125, -0.3402099609375, -0.20263671875, -0.0650634765625, 0.072509765625, 0.2100830078125, 0.34765625, 0.4852294921875, 0.622802734375, 0.7603759765625, 0.89794921875, 1.0355224609375, 1.173095703125, 1.3106689453125, 1.4482421875, 1.5858154296875, 1.723388671875, 1.8609619140625, 1.99853515625, 2.1361083984375, 2.273681640625, 2.4112548828125, 2.548828125, 2.6864013671875, 2.823974609375, 2.9615478515625, 3.09912109375, 3.2366943359375, 3.374267578125, 3.5118408203125, 3.6494140625, 3.7869873046875, 3.924560546875, 4.0621337890625, 4.19970703125, 4.3372802734375, 4.474853515625, 4.6124267578125, 4.75]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 11.0, 12.0, 16.0, 22.0, 47.0, 65.0, 112.0, 177.0, 283.0, 481.0, 867.0, 1513.0, 2632.0, 4895.0, 9265.0, 17573.0, 35404.0, 72164.0, 152932.0, 327481.0, 666678.0, 1048434.0, 908159.0, 495086.0, 233712.0, 109110.0, 52485.0, 26009.0, 13277.0, 6901.0, 3691.0, 2037.0, 1156.0, 628.0, 394.0, 223.0, 133.0, 69.0, 57.0, 39.0, 19.0, 12.0, 9.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.91217041015625, -5.6993408203125, -5.48651123046875, -5.273681640625, -5.06085205078125, -4.8480224609375, -4.63519287109375, -4.42236328125, -4.20953369140625, -3.9967041015625, -3.78387451171875, -3.571044921875, -3.35821533203125, -3.1453857421875, -2.93255615234375, -2.7197265625, -2.50689697265625, -2.2940673828125, -2.08123779296875, -1.868408203125, -1.65557861328125, -1.4427490234375, -1.22991943359375, -1.01708984375, -0.80426025390625, -0.5914306640625, -0.37860107421875, -0.165771484375, 0.04705810546875, 0.2598876953125, 0.47271728515625, 0.685546875, 0.89837646484375, 1.1112060546875, 1.32403564453125, 1.536865234375, 1.74969482421875, 1.9625244140625, 2.17535400390625, 2.38818359375, 2.60101318359375, 2.8138427734375, 3.02667236328125, 3.239501953125, 3.45233154296875, 3.6651611328125, 3.87799072265625, 4.0908203125, 4.30364990234375, 4.5164794921875, 4.72930908203125, 4.942138671875, 5.15496826171875, 5.3677978515625, 5.58062744140625, 5.79345703125, 6.00628662109375, 6.2191162109375, 6.43194580078125, 6.644775390625, 6.85760498046875, 7.0704345703125, 7.28326416015625, 7.49609375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 8.0, 8.0, 14.0, 24.0, 19.0, 39.0, 33.0, 63.0, 63.0, 96.0, 114.0, 150.0, 167.0, 250.0, 257.0, 262.0, 290.0, 284.0, 308.0, 285.0, 257.0, 231.0, 162.0, 148.0, 135.0, 92.0, 68.0, 45.0, 46.0, 39.0, 31.0, 29.0, 15.0, 11.0, 5.0, 8.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.300048828125, -2.22705078125, -2.154052734375, -2.0810546875, -2.008056640625, -1.93505859375, -1.862060546875, -1.7890625, -1.716064453125, -1.64306640625, -1.570068359375, -1.4970703125, -1.424072265625, -1.35107421875, -1.278076171875, -1.205078125, -1.132080078125, -1.05908203125, -0.986083984375, -0.9130859375, -0.840087890625, -0.76708984375, -0.694091796875, -0.62109375, -0.548095703125, -0.47509765625, -0.402099609375, -0.3291015625, -0.256103515625, -0.18310546875, -0.110107421875, -0.037109375, 0.035888671875, 0.10888671875, 0.181884765625, 0.2548828125, 0.327880859375, 0.40087890625, 0.473876953125, 0.546875, 0.619873046875, 0.69287109375, 0.765869140625, 0.8388671875, 0.911865234375, 0.98486328125, 1.057861328125, 1.130859375, 1.203857421875, 1.27685546875, 1.349853515625, 1.4228515625, 1.495849609375, 1.56884765625, 1.641845703125, 1.71484375, 1.787841796875, 1.86083984375, 1.933837890625, 2.0068359375, 2.079833984375, 2.15283203125, 2.225830078125, 2.298828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 7.0, 7.0, 11.0, 16.0, 15.0, 21.0, 25.0, 25.0, 31.0, 42.0, 45.0, 45.0, 40.0, 50.0, 55.0, 54.0, 53.0, 49.0, 51.0, 45.0, 38.0, 38.0, 28.0, 22.0, 28.0, 20.0, 32.0, 17.0, 22.0, 15.0, 5.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.2724809646606445, -5.1135125160217285, -4.9545440673828125, -4.7955756187438965, -4.6366071701049805, -4.477639198303223, -4.318670749664307, -4.159702301025391, -4.000733852386475, -3.8417654037475586, -3.6827969551086426, -3.5238287448883057, -3.3648602962493896, -3.2058918476104736, -3.0469236373901367, -2.8879551887512207, -2.7289867401123047, -2.5700182914733887, -2.4110498428344727, -2.2520816326141357, -2.0931131839752197, -1.9341447353363037, -1.7751764059066772, -1.6162080764770508, -1.4572396278381348, -1.2982711791992188, -1.1393028497695923, -0.980334460735321, -0.8213660717010498, -0.6623976826667786, -0.5034292936325073, -0.34446096420288086, -0.18549299240112305, -0.026524603366851807, 0.13244378566741943, 0.2914121747016907, 0.4503805637359619, 0.6093489527702332, 0.7683173418045044, 0.9272856712341309, 1.0862541198730469, 1.245222568511963, 1.4041908979415894, 1.5631592273712158, 1.7221276760101318, 1.8810961246490479, 2.0400643348693848, 2.199032783508301, 2.358001232147217, 2.516969680786133, 2.675938129425049, 2.8349063396453857, 2.9938747882843018, 3.1528432369232178, 3.3118114471435547, 3.4707798957824707, 3.6297483444213867, 3.7887167930603027, 3.9476852416992188, 4.106653690338135, 4.265622138977051, 4.424590110778809, 4.583558559417725, 4.742527008056641, 4.901495456695557]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 10.0, 4.0, 7.0, 4.0, 10.0, 12.0, 15.0, 19.0, 21.0, 17.0, 17.0, 30.0, 26.0, 25.0, 29.0, 40.0, 28.0, 40.0, 38.0, 33.0, 45.0, 44.0, 45.0, 29.0, 39.0, 44.0, 45.0, 26.0, 33.0, 28.0, 34.0, 20.0, 15.0, 24.0, 21.0, 12.0, 18.0, 6.0, 7.0, 11.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.015134334564209, -4.854822158813477, -4.694509506225586, -4.5341973304748535, -4.373885154724121, -4.2135725021362305, -4.053260326385498, -3.8929481506347656, -3.732635736465454, -3.5723233222961426, -3.41201114654541, -3.2516987323760986, -3.091386318206787, -2.9310741424560547, -2.770761728286743, -2.6104493141174316, -2.450137138366699, -2.2898247241973877, -2.1295125484466553, -1.9692001342773438, -1.8088878393173218, -1.6485755443572998, -1.4882631301879883, -1.3279508352279663, -1.1676385402679443, -1.0073262453079224, -0.8470138907432556, -0.6867015361785889, -0.5263892412185669, -0.3660769462585449, -0.20576459169387817, -0.045452237129211426, 0.11486005783081055, 0.2751723825931549, 0.43548470735549927, 0.595797061920166, 0.756109356880188, 0.91642165184021, 1.0767340660095215, 1.2370463609695435, 1.3973586559295654, 1.5576709508895874, 1.7179832458496094, 1.878295660018921, 2.0386080741882324, 2.198920249938965, 2.3592326641082764, 2.519545078277588, 2.6798572540283203, 2.840169668197632, 3.0004818439483643, 3.160794258117676, 3.321106433868408, 3.4814188480377197, 3.6417312622070312, 3.8020434379577637, 3.962355852127075, 4.122668266296387, 4.282980442047119, 4.443292617797852, 4.603605270385742, 4.763917446136475, 4.924229621887207, 5.084542274475098, 5.24485445022583]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 12.0, 9.0, 12.0, 22.0, 39.0, 56.0, 76.0, 160.0, 234.0, 363.0, 563.0, 901.0, 1465.0, 2254.0, 3546.0, 5593.0, 9090.0, 14477.0, 22441.0, 36056.0, 59457.0, 97459.0, 154282.0, 196903.0, 165245.0, 106454.0, 64866.0, 39751.0, 24641.0, 15497.0, 9782.0, 6179.0, 3947.0, 2447.0, 1546.0, 1009.0, 650.0, 368.0, 264.0, 144.0, 122.0, 57.0, 42.0, 26.0, 21.0, 11.0, 8.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.505859375, -1.45965576171875, -1.4134521484375, -1.36724853515625, -1.321044921875, -1.27484130859375, -1.2286376953125, -1.18243408203125, -1.13623046875, -1.09002685546875, -1.0438232421875, -0.99761962890625, -0.951416015625, -0.90521240234375, -0.8590087890625, -0.81280517578125, -0.7666015625, -0.72039794921875, -0.6741943359375, -0.62799072265625, -0.581787109375, -0.53558349609375, -0.4893798828125, -0.44317626953125, -0.39697265625, -0.35076904296875, -0.3045654296875, -0.25836181640625, -0.212158203125, -0.16595458984375, -0.1197509765625, -0.07354736328125, -0.02734375, 0.01885986328125, 0.0650634765625, 0.11126708984375, 0.157470703125, 0.20367431640625, 0.2498779296875, 0.29608154296875, 0.34228515625, 0.38848876953125, 0.4346923828125, 0.48089599609375, 0.527099609375, 0.57330322265625, 0.6195068359375, 0.66571044921875, 0.7119140625, 0.75811767578125, 0.8043212890625, 0.85052490234375, 0.896728515625, 0.94293212890625, 0.9891357421875, 1.03533935546875, 1.08154296875, 1.12774658203125, 1.1739501953125, 1.22015380859375, 1.266357421875, 1.31256103515625, 1.3587646484375, 1.40496826171875, 1.451171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 5.0, 4.0, 4.0, 9.0, 12.0, 14.0, 16.0, 17.0, 14.0, 18.0, 19.0, 27.0, 25.0, 27.0, 36.0, 22.0, 35.0, 43.0, 30.0, 45.0, 38.0, 44.0, 40.0, 39.0, 45.0, 47.0, 50.0, 26.0, 26.0, 27.0, 27.0, 30.0, 18.0, 23.0, 18.0, 12.0, 12.0, 13.0, 8.0, 6.0, 8.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3515625, -5.181884765625, -5.01220703125, -4.842529296875, -4.6728515625, -4.503173828125, -4.33349609375, -4.163818359375, -3.994140625, -3.824462890625, -3.65478515625, -3.485107421875, -3.3154296875, -3.145751953125, -2.97607421875, -2.806396484375, -2.63671875, -2.467041015625, -2.29736328125, -2.127685546875, -1.9580078125, -1.788330078125, -1.61865234375, -1.448974609375, -1.279296875, -1.109619140625, -0.93994140625, -0.770263671875, -0.6005859375, -0.430908203125, -0.26123046875, -0.091552734375, 0.078125, 0.247802734375, 0.41748046875, 0.587158203125, 0.7568359375, 0.926513671875, 1.09619140625, 1.265869140625, 1.435546875, 1.605224609375, 1.77490234375, 1.944580078125, 2.1142578125, 2.283935546875, 2.45361328125, 2.623291015625, 2.79296875, 2.962646484375, 3.13232421875, 3.302001953125, 3.4716796875, 3.641357421875, 3.81103515625, 3.980712890625, 4.150390625, 4.320068359375, 4.48974609375, 4.659423828125, 4.8291015625, 4.998779296875, 5.16845703125, 5.338134765625, 5.5078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 13.0, 16.0, 26.0, 25.0, 23.0, 42.0, 54.0, 81.0, 127.0, 171.0, 247.0, 360.0, 479.0, 764.0, 1213.0, 1824.0, 2903.0, 4897.0, 8443.0, 16139.0, 40664.0, 779329.0, 136840.0, 24523.0, 11796.0, 6588.0, 3925.0, 2310.0, 1531.0, 979.0, 626.0, 455.0, 307.0, 219.0, 165.0, 115.0, 80.0, 56.0, 42.0, 38.0, 21.0, 23.0, 18.0, 14.0, 12.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.779296875, -2.69696044921875, -2.6146240234375, -2.53228759765625, -2.449951171875, -2.36761474609375, -2.2852783203125, -2.20294189453125, -2.12060546875, -2.03826904296875, -1.9559326171875, -1.87359619140625, -1.791259765625, -1.70892333984375, -1.6265869140625, -1.54425048828125, -1.4619140625, -1.37957763671875, -1.2972412109375, -1.21490478515625, -1.132568359375, -1.05023193359375, -0.9678955078125, -0.88555908203125, -0.80322265625, -0.72088623046875, -0.6385498046875, -0.55621337890625, -0.473876953125, -0.39154052734375, -0.3092041015625, -0.22686767578125, -0.14453125, -0.06219482421875, 0.0201416015625, 0.10247802734375, 0.184814453125, 0.26715087890625, 0.3494873046875, 0.43182373046875, 0.51416015625, 0.59649658203125, 0.6788330078125, 0.76116943359375, 0.843505859375, 0.92584228515625, 1.0081787109375, 1.09051513671875, 1.1728515625, 1.25518798828125, 1.3375244140625, 1.41986083984375, 1.502197265625, 1.58453369140625, 1.6668701171875, 1.74920654296875, 1.83154296875, 1.91387939453125, 1.9962158203125, 2.07855224609375, 2.160888671875, 2.24322509765625, 2.3255615234375, 2.40789794921875, 2.490234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 4.0, 9.0, 10.0, 16.0, 12.0, 22.0, 21.0, 30.0, 25.0, 20.0, 34.0, 24.0, 40.0, 36.0, 39.0, 37.0, 38.0, 47.0, 62.0, 51.0, 42.0, 49.0, 45.0, 32.0, 36.0, 26.0, 29.0, 33.0, 24.0, 19.0, 21.0, 11.0, 7.0, 10.0, 6.0, 4.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.2845458984375, -4.155029296875, -4.0255126953125, -3.89599609375, -3.7664794921875, -3.636962890625, -3.5074462890625, -3.3779296875, -3.2484130859375, -3.118896484375, -2.9893798828125, -2.85986328125, -2.7303466796875, -2.600830078125, -2.4713134765625, -2.341796875, -2.2122802734375, -2.082763671875, -1.9532470703125, -1.82373046875, -1.6942138671875, -1.564697265625, -1.4351806640625, -1.3056640625, -1.1761474609375, -1.046630859375, -0.9171142578125, -0.78759765625, -0.6580810546875, -0.528564453125, -0.3990478515625, -0.26953125, -0.1400146484375, -0.010498046875, 0.1190185546875, 0.24853515625, 0.3780517578125, 0.507568359375, 0.6370849609375, 0.7666015625, 0.8961181640625, 1.025634765625, 1.1551513671875, 1.28466796875, 1.4141845703125, 1.543701171875, 1.6732177734375, 1.802734375, 1.9322509765625, 2.061767578125, 2.1912841796875, 2.32080078125, 2.4503173828125, 2.579833984375, 2.7093505859375, 2.8388671875, 2.9683837890625, 3.097900390625, 3.2274169921875, 3.35693359375, 3.4864501953125, 3.615966796875, 3.7454833984375, 3.875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 11.0, 4.0, 11.0, 12.0, 21.0, 29.0, 30.0, 54.0, 89.0, 122.0, 213.0, 274.0, 459.0, 741.0, 1093.0, 1814.0, 2993.0, 5206.0, 9811.0, 20261.0, 60863.0, 871769.0, 37539.0, 15947.0, 8226.0, 4347.0, 2562.0, 1485.0, 838.0, 589.0, 400.0, 234.0, 168.0, 113.0, 60.0, 48.0, 40.0, 29.0, 12.0, 20.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.048828125, -1.0182952880859375, -0.987762451171875, -0.9572296142578125, -0.92669677734375, -0.8961639404296875, -0.865631103515625, -0.8350982666015625, -0.8045654296875, -0.7740325927734375, -0.743499755859375, -0.7129669189453125, -0.68243408203125, -0.6519012451171875, -0.621368408203125, -0.5908355712890625, -0.560302734375, -0.5297698974609375, -0.499237060546875, -0.4687042236328125, -0.43817138671875, -0.4076385498046875, -0.377105712890625, -0.3465728759765625, -0.3160400390625, -0.2855072021484375, -0.254974365234375, -0.2244415283203125, -0.19390869140625, -0.1633758544921875, -0.132843017578125, -0.1023101806640625, -0.07177734375, -0.0412445068359375, -0.010711669921875, 0.0198211669921875, 0.05035400390625, 0.0808868408203125, 0.111419677734375, 0.1419525146484375, 0.1724853515625, 0.2030181884765625, 0.233551025390625, 0.2640838623046875, 0.29461669921875, 0.3251495361328125, 0.355682373046875, 0.3862152099609375, 0.416748046875, 0.4472808837890625, 0.477813720703125, 0.5083465576171875, 0.53887939453125, 0.5694122314453125, 0.599945068359375, 0.6304779052734375, 0.6610107421875, 0.6915435791015625, 0.722076416015625, 0.7526092529296875, 0.78314208984375, 0.8136749267578125, 0.844207763671875, 0.8747406005859375, 0.9052734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 4.0, 20.0, 20.0, 23.0, 25.0, 47.0, 31.0, 42.0, 57.0, 66.0, 74.0, 97.0, 98.0, 79.0, 67.0, 44.0, 49.0, 32.0, 23.0, 26.0, 13.0, 10.0, 12.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.230043411254883e-05, -7.032230496406555e-05, -6.834417581558228e-05, -6.6366046667099e-05, -6.438791751861572e-05, -6.240978837013245e-05, -6.043165922164917e-05, -5.8453530073165894e-05, -5.647540092468262e-05, -5.449727177619934e-05, -5.2519142627716064e-05, -5.054101347923279e-05, -4.856288433074951e-05, -4.6584755182266235e-05, -4.460662603378296e-05, -4.262849688529968e-05, -4.0650367736816406e-05, -3.867223858833313e-05, -3.6694109439849854e-05, -3.471598029136658e-05, -3.27378511428833e-05, -3.0759721994400024e-05, -2.8781592845916748e-05, -2.680346369743347e-05, -2.4825334548950195e-05, -2.284720540046692e-05, -2.0869076251983643e-05, -1.8890947103500366e-05, -1.691281795501709e-05, -1.4934688806533813e-05, -1.2956559658050537e-05, -1.097843050956726e-05, -9.000301361083984e-06, -7.022172212600708e-06, -5.044043064117432e-06, -3.0659139156341553e-06, -1.087784767150879e-06, 8.903443813323975e-07, 2.868473529815674e-06, 4.84660267829895e-06, 6.8247318267822266e-06, 8.802860975265503e-06, 1.078099012374878e-05, 1.2759119272232056e-05, 1.4737248420715332e-05, 1.671537756919861e-05, 1.8693506717681885e-05, 2.067163586616516e-05, 2.2649765014648438e-05, 2.4627894163131714e-05, 2.660602331161499e-05, 2.8584152460098267e-05, 3.056228160858154e-05, 3.254041075706482e-05, 3.4518539905548096e-05, 3.649666905403137e-05, 3.847479820251465e-05, 4.0452927350997925e-05, 4.24310564994812e-05, 4.440918564796448e-05, 4.6387314796447754e-05, 4.836544394493103e-05, 5.034357309341431e-05, 5.232170224189758e-05, 5.429983139038086e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 16.0, 15.0, 17.0, 38.0, 43.0, 49.0, 97.0, 185.0, 328.0, 550.0, 960.0, 1830.0, 3415.0, 6944.0, 13551.0, 28670.0, 60807.0, 129134.0, 250156.0, 268851.0, 148465.0, 69563.0, 32799.0, 15724.0, 7827.0, 3877.0, 2055.0, 1086.0, 607.0, 342.0, 194.0, 130.0, 78.0, 50.0, 28.0, 24.0, 9.0, 10.0, 9.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4967193603515625, -0.480743408203125, -0.4647674560546875, -0.44879150390625, -0.4328155517578125, -0.416839599609375, -0.4008636474609375, -0.3848876953125, -0.3689117431640625, -0.352935791015625, -0.3369598388671875, -0.32098388671875, -0.3050079345703125, -0.289031982421875, -0.2730560302734375, -0.257080078125, -0.2411041259765625, -0.225128173828125, -0.2091522216796875, -0.19317626953125, -0.1772003173828125, -0.161224365234375, -0.1452484130859375, -0.1292724609375, -0.1132965087890625, -0.097320556640625, -0.0813446044921875, -0.06536865234375, -0.0493927001953125, -0.033416748046875, -0.0174407958984375, -0.00146484375, 0.0145111083984375, 0.030487060546875, 0.0464630126953125, 0.06243896484375, 0.0784149169921875, 0.094390869140625, 0.1103668212890625, 0.1263427734375, 0.1423187255859375, 0.158294677734375, 0.1742706298828125, 0.19024658203125, 0.2062225341796875, 0.222198486328125, 0.2381744384765625, 0.254150390625, 0.2701263427734375, 0.286102294921875, 0.3020782470703125, 0.31805419921875, 0.3340301513671875, 0.350006103515625, 0.3659820556640625, 0.3819580078125, 0.3979339599609375, 0.413909912109375, 0.4298858642578125, 0.44586181640625, 0.4618377685546875, 0.477813720703125, 0.4937896728515625, 0.509765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 8.0, 17.0, 17.0, 39.0, 34.0, 38.0, 48.0, 70.0, 68.0, 89.0, 75.0, 75.0, 87.0, 73.0, 60.0, 43.0, 22.0, 28.0, 23.0, 13.0, 6.0, 10.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.2098388671875, -0.2042560577392578, -0.19867324829101562, -0.19309043884277344, -0.18750762939453125, -0.18192481994628906, -0.17634201049804688, -0.1707592010498047, -0.1651763916015625, -0.1595935821533203, -0.15401077270507812, -0.14842796325683594, -0.14284515380859375, -0.13726234436035156, -0.13167953491210938, -0.1260967254638672, -0.120513916015625, -0.11493110656738281, -0.10934829711914062, -0.10376548767089844, -0.09818267822265625, -0.09259986877441406, -0.08701705932617188, -0.08143424987792969, -0.0758514404296875, -0.07026863098144531, -0.06468582153320312, -0.05910301208496094, -0.05352020263671875, -0.04793739318847656, -0.042354583740234375, -0.03677177429199219, -0.03118896484375, -0.025606155395507812, -0.020023345947265625, -0.014440536499023438, -0.00885772705078125, -0.0032749176025390625, 0.002307891845703125, 0.007890701293945312, 0.0134735107421875, 0.019056320190429688, 0.024639129638671875, 0.030221939086914062, 0.03580474853515625, 0.04138755798339844, 0.046970367431640625, 0.05255317687988281, 0.058135986328125, 0.06371879577636719, 0.06930160522460938, 0.07488441467285156, 0.08046722412109375, 0.08605003356933594, 0.09163284301757812, 0.09721565246582031, 0.1027984619140625, 0.10838127136230469, 0.11396408081054688, 0.11954689025878906, 0.12512969970703125, 0.13071250915527344, 0.13629531860351562, 0.1418781280517578, 0.1474609375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 8.0, 10.0, 15.0, 19.0, 18.0, 26.0, 22.0, 32.0, 40.0, 54.0, 42.0, 47.0, 48.0, 61.0, 56.0, 56.0, 56.0, 49.0, 46.0, 35.0, 36.0, 24.0, 25.0, 26.0, 24.0, 30.0, 16.0, 17.0, 10.0, 5.0, 13.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.523178577423096, -5.359871864318848, -5.1965651512146, -5.03325891494751, -4.869952201843262, -4.706645488739014, -4.543338775634766, -4.380032539367676, -4.216725826263428, -4.05341911315918, -3.8901126384735107, -3.7268059253692627, -3.5634994506835938, -3.4001927375793457, -3.2368860244750977, -3.0735795497894287, -2.9102728366851807, -2.7469661235809326, -2.5836596488952637, -2.4203529357910156, -2.2570464611053467, -2.0937397480010986, -1.9304331541061401, -1.7671265602111816, -1.6038199663162231, -1.4405133724212646, -1.2772067785263062, -1.1139001846313477, -0.9505935311317444, -0.7872869372367859, -0.6239802837371826, -0.4606736898422241, -0.2973670959472656, -0.13406048715114594, 0.029246121644973755, 0.19255274534225464, 0.35585933923721313, 0.5191659331321716, 0.6824725866317749, 0.8457791805267334, 1.009085774421692, 1.1723923683166504, 1.3356989622116089, 1.4990055561065674, 1.6623122692108154, 1.8256187438964844, 1.9889254570007324, 2.1522321701049805, 2.3155386447906494, 2.4788453578948975, 2.6421518325805664, 2.8054585456848145, 2.9687650203704834, 3.1320717334747314, 3.2953782081604004, 3.4586849212646484, 3.6219916343688965, 3.7852983474731445, 3.9486048221588135, 4.111911296844482, 4.2752180099487305, 4.4385247230529785, 4.601831436157227, 4.765137672424316, 4.9284443855285645]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 4.0, 5.0, 6.0, 10.0, 11.0, 14.0, 24.0, 19.0, 17.0, 18.0, 28.0, 27.0, 25.0, 33.0, 39.0, 32.0, 34.0, 37.0, 40.0, 40.0, 46.0, 47.0, 30.0, 38.0, 46.0, 38.0, 33.0, 36.0, 25.0, 29.0, 20.0, 16.0, 24.0, 17.0, 14.0, 17.0, 6.0, 7.0, 9.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.982836723327637, -4.823299407958984, -4.66376256942749, -4.504225254058838, -4.344688415527344, -4.185151100158691, -4.025613784790039, -3.866076946258545, -3.7065396308898926, -3.5470025539398193, -3.387465476989746, -3.2279281616210938, -3.0683910846710205, -2.9088540077209473, -2.749316930770874, -2.589779853820801, -2.4302427768707275, -2.2707056999206543, -2.111168622970581, -1.9516314268112183, -1.7920942306518555, -1.6325571537017822, -1.473020076751709, -1.3134828805923462, -1.153945803642273, -0.9944086670875549, -0.8348715305328369, -0.6753344535827637, -0.5157973170280457, -0.35626018047332764, -0.1967231035232544, -0.0371859073638916, 0.12235116958618164, 0.28188830614089966, 0.4414254128932953, 0.6009625196456909, 0.7604996562004089, 0.920036792755127, 1.0795738697052002, 1.239111065864563, 1.3986481428146362, 1.5581852197647095, 1.7177224159240723, 1.8772594928741455, 2.0367965698242188, 2.196333885192871, 2.3558707237243652, 2.5154080390930176, 2.674945116043091, 2.834482192993164, 2.9940192699432373, 3.1535563468933105, 3.313093662261963, 3.472630739212036, 3.6321678161621094, 3.7917051315307617, 3.951241970062256, 4.110779285430908, 4.270316123962402, 4.429853439331055, 4.589390277862549, 4.748927593231201, 4.908464431762695, 5.068001747131348, 5.2275390625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 9.0, 19.0, 30.0, 37.0, 69.0, 91.0, 147.0, 166.0, 293.0, 436.0, 675.0, 1011.0, 1577.0, 2447.0, 3633.0, 5691.0, 8898.0, 13709.0, 20948.0, 31653.0, 47290.0, 67888.0, 91961.0, 116406.0, 129122.0, 126939.0, 109260.0, 85095.0, 60657.0, 42179.0, 27765.0, 18248.0, 12246.0, 7693.0, 4997.0, 3171.0, 2053.0, 1373.0, 908.0, 606.0, 396.0, 271.0, 170.0, 119.0, 81.0, 46.0, 26.0, 20.0, 15.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-3.712890625, -3.599853515625, -3.48681640625, -3.373779296875, -3.2607421875, -3.147705078125, -3.03466796875, -2.921630859375, -2.80859375, -2.695556640625, -2.58251953125, -2.469482421875, -2.3564453125, -2.243408203125, -2.13037109375, -2.017333984375, -1.904296875, -1.791259765625, -1.67822265625, -1.565185546875, -1.4521484375, -1.339111328125, -1.22607421875, -1.113037109375, -1.0, -0.886962890625, -0.77392578125, -0.660888671875, -0.5478515625, -0.434814453125, -0.32177734375, -0.208740234375, -0.095703125, 0.017333984375, 0.13037109375, 0.243408203125, 0.3564453125, 0.469482421875, 0.58251953125, 0.695556640625, 0.80859375, 0.921630859375, 1.03466796875, 1.147705078125, 1.2607421875, 1.373779296875, 1.48681640625, 1.599853515625, 1.712890625, 1.825927734375, 1.93896484375, 2.052001953125, 2.1650390625, 2.278076171875, 2.39111328125, 2.504150390625, 2.6171875, 2.730224609375, 2.84326171875, 2.956298828125, 3.0693359375, 3.182373046875, 3.29541015625, 3.408447265625, 3.521484375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 10.0, 16.0, 10.0, 10.0, 22.0, 23.0, 24.0, 21.0, 32.0, 21.0, 31.0, 34.0, 31.0, 44.0, 46.0, 47.0, 32.0, 39.0, 56.0, 42.0, 36.0, 49.0, 39.0, 39.0, 31.0, 26.0, 20.0, 32.0, 21.0, 19.0, 13.0, 18.0, 5.0, 8.0, 7.0, 5.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.44921875, -5.2750244140625, -5.100830078125, -4.9266357421875, -4.75244140625, -4.5782470703125, -4.404052734375, -4.2298583984375, -4.0556640625, -3.8814697265625, -3.707275390625, -3.5330810546875, -3.35888671875, -3.1846923828125, -3.010498046875, -2.8363037109375, -2.662109375, -2.4879150390625, -2.313720703125, -2.1395263671875, -1.96533203125, -1.7911376953125, -1.616943359375, -1.4427490234375, -1.2685546875, -1.0943603515625, -0.920166015625, -0.7459716796875, -0.57177734375, -0.3975830078125, -0.223388671875, -0.0491943359375, 0.125, 0.2991943359375, 0.473388671875, 0.6475830078125, 0.82177734375, 0.9959716796875, 1.170166015625, 1.3443603515625, 1.5185546875, 1.6927490234375, 1.866943359375, 2.0411376953125, 2.21533203125, 2.3895263671875, 2.563720703125, 2.7379150390625, 2.912109375, 3.0863037109375, 3.260498046875, 3.4346923828125, 3.60888671875, 3.7830810546875, 3.957275390625, 4.1314697265625, 4.3056640625, 4.4798583984375, 4.654052734375, 4.8282470703125, 5.00244140625, 5.1766357421875, 5.350830078125, 5.5250244140625, 5.69921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 10.0, 17.0, 24.0, 44.0, 64.0, 106.0, 154.0, 255.0, 405.0, 710.0, 1125.0, 1706.0, 2876.0, 4973.0, 8157.0, 14130.0, 24347.0, 41861.0, 68958.0, 107689.0, 147099.0, 167981.0, 153484.0, 115497.0, 75710.0, 45733.0, 26998.0, 15808.0, 9112.0, 5386.0, 3146.0, 1929.0, 1125.0, 742.0, 459.0, 282.0, 142.0, 108.0, 77.0, 47.0, 29.0, 18.0, 11.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.970703125, -3.840911865234375, -3.71112060546875, -3.581329345703125, -3.4515380859375, -3.321746826171875, -3.19195556640625, -3.062164306640625, -2.932373046875, -2.802581787109375, -2.67279052734375, -2.542999267578125, -2.4132080078125, -2.283416748046875, -2.15362548828125, -2.023834228515625, -1.89404296875, -1.764251708984375, -1.63446044921875, -1.504669189453125, -1.3748779296875, -1.245086669921875, -1.11529541015625, -0.985504150390625, -0.855712890625, -0.725921630859375, -0.59613037109375, -0.466339111328125, -0.3365478515625, -0.206756591796875, -0.07696533203125, 0.052825927734375, 0.1826171875, 0.312408447265625, 0.44219970703125, 0.571990966796875, 0.7017822265625, 0.831573486328125, 0.96136474609375, 1.091156005859375, 1.220947265625, 1.350738525390625, 1.48052978515625, 1.610321044921875, 1.7401123046875, 1.869903564453125, 1.99969482421875, 2.129486083984375, 2.25927734375, 2.389068603515625, 2.51885986328125, 2.648651123046875, 2.7784423828125, 2.908233642578125, 3.03802490234375, 3.167816162109375, 3.297607421875, 3.427398681640625, 3.55718994140625, 3.686981201171875, 3.8167724609375, 3.946563720703125, 4.07635498046875, 4.206146240234375, 4.3359375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 12.0, 9.0, 15.0, 20.0, 9.0, 20.0, 22.0, 23.0, 35.0, 34.0, 41.0, 35.0, 41.0, 42.0, 47.0, 30.0, 45.0, 31.0, 46.0, 40.0, 29.0, 43.0, 33.0, 44.0, 33.0, 29.0, 41.0, 18.0, 23.0, 19.0, 13.0, 14.0, 7.0, 7.0, 5.0, 7.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.21875, -4.10357666015625, -3.9884033203125, -3.87322998046875, -3.758056640625, -3.64288330078125, -3.5277099609375, -3.41253662109375, -3.29736328125, -3.18218994140625, -3.0670166015625, -2.95184326171875, -2.836669921875, -2.72149658203125, -2.6063232421875, -2.49114990234375, -2.3759765625, -2.26080322265625, -2.1456298828125, -2.03045654296875, -1.915283203125, -1.80010986328125, -1.6849365234375, -1.56976318359375, -1.45458984375, -1.33941650390625, -1.2242431640625, -1.10906982421875, -0.993896484375, -0.87872314453125, -0.7635498046875, -0.64837646484375, -0.533203125, -0.41802978515625, -0.3028564453125, -0.18768310546875, -0.072509765625, 0.04266357421875, 0.1578369140625, 0.27301025390625, 0.38818359375, 0.50335693359375, 0.6185302734375, 0.73370361328125, 0.848876953125, 0.96405029296875, 1.0792236328125, 1.19439697265625, 1.3095703125, 1.42474365234375, 1.5399169921875, 1.65509033203125, 1.770263671875, 1.88543701171875, 2.0006103515625, 2.11578369140625, 2.23095703125, 2.34613037109375, 2.4613037109375, 2.57647705078125, 2.691650390625, 2.80682373046875, 2.9219970703125, 3.03717041015625, 3.15234375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 21.0, 11.0, 21.0, 36.0, 62.0, 90.0, 139.0, 200.0, 334.0, 559.0, 918.0, 1443.0, 2535.0, 4650.0, 8566.0, 16714.0, 33900.0, 71808.0, 147502.0, 241923.0, 237495.0, 142613.0, 69330.0, 32823.0, 16024.0, 8211.0, 4371.0, 2496.0, 1434.0, 897.0, 488.0, 295.0, 203.0, 147.0, 91.0, 64.0, 39.0, 32.0, 17.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.04779052734375, -3.9080810546875, -3.76837158203125, -3.628662109375, -3.48895263671875, -3.3492431640625, -3.20953369140625, -3.06982421875, -2.93011474609375, -2.7904052734375, -2.65069580078125, -2.510986328125, -2.37127685546875, -2.2315673828125, -2.09185791015625, -1.9521484375, -1.81243896484375, -1.6727294921875, -1.53302001953125, -1.393310546875, -1.25360107421875, -1.1138916015625, -0.97418212890625, -0.83447265625, -0.69476318359375, -0.5550537109375, -0.41534423828125, -0.275634765625, -0.13592529296875, 0.0037841796875, 0.14349365234375, 0.283203125, 0.42291259765625, 0.5626220703125, 0.70233154296875, 0.842041015625, 0.98175048828125, 1.1214599609375, 1.26116943359375, 1.40087890625, 1.54058837890625, 1.6802978515625, 1.82000732421875, 1.959716796875, 2.09942626953125, 2.2391357421875, 2.37884521484375, 2.5185546875, 2.65826416015625, 2.7979736328125, 2.93768310546875, 3.077392578125, 3.21710205078125, 3.3568115234375, 3.49652099609375, 3.63623046875, 3.77593994140625, 3.9156494140625, 4.05535888671875, 4.195068359375, 4.33477783203125, 4.4744873046875, 4.61419677734375, 4.75390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 6.0, 7.0, 8.0, 5.0, 7.0, 13.0, 14.0, 17.0, 26.0, 25.0, 33.0, 46.0, 32.0, 37.0, 32.0, 56.0, 58.0, 48.0, 56.0, 41.0, 50.0, 53.0, 45.0, 38.0, 36.0, 42.0, 25.0, 18.0, 23.0, 14.0, 13.0, 11.0, 14.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.0003337860107421875, -0.00032532960176467896, -0.0003168731927871704, -0.00030841678380966187, -0.0002999603748321533, -0.0002915039658546448, -0.00028304755687713623, -0.0002745911478996277, -0.00026613473892211914, -0.0002576783299446106, -0.00024922192096710205, -0.0002407655119895935, -0.00023230910301208496, -0.00022385269403457642, -0.00021539628505706787, -0.00020693987607955933, -0.00019848346710205078, -0.00019002705812454224, -0.0001815706491470337, -0.00017311424016952515, -0.0001646578311920166, -0.00015620142221450806, -0.0001477450132369995, -0.00013928860425949097, -0.00013083219528198242, -0.00012237578630447388, -0.00011391937732696533, -0.00010546296834945679, -9.700655937194824e-05, -8.85501503944397e-05, -8.009374141693115e-05, -7.163733243942261e-05, -6.318092346191406e-05, -5.472451448440552e-05, -4.626810550689697e-05, -3.781169652938843e-05, -2.9355287551879883e-05, -2.0898878574371338e-05, -1.2442469596862793e-05, -3.986060619354248e-06, 4.470348358154297e-06, 1.2926757335662842e-05, 2.1383166313171387e-05, 2.983957529067993e-05, 3.8295984268188477e-05, 4.675239324569702e-05, 5.5208802223205566e-05, 6.366521120071411e-05, 7.212162017822266e-05, 8.05780291557312e-05, 8.903443813323975e-05, 9.749084711074829e-05, 0.00010594725608825684, 0.00011440366506576538, 0.00012286007404327393, 0.00013131648302078247, 0.00013977289199829102, 0.00014822930097579956, 0.0001566857099533081, 0.00016514211893081665, 0.0001735985279083252, 0.00018205493688583374, 0.00019051134586334229, 0.00019896775484085083, 0.00020742416381835938]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 5.0, 4.0, 3.0, 14.0, 11.0, 24.0, 35.0, 38.0, 63.0, 101.0, 146.0, 200.0, 314.0, 418.0, 699.0, 1087.0, 1675.0, 2839.0, 5052.0, 9280.0, 19445.0, 43308.0, 101597.0, 211365.0, 282234.0, 197792.0, 92375.0, 39637.0, 18064.0, 8744.0, 4749.0, 2643.0, 1627.0, 1010.0, 679.0, 429.0, 289.0, 179.0, 122.0, 94.0, 50.0, 34.0, 30.0, 19.0, 12.0, 8.0, 6.0, 5.0, 3.0, 0.0, 4.0, 2.0], "bins": [-5.796875, -5.6378173828125, -5.478759765625, -5.3197021484375, -5.16064453125, -5.0015869140625, -4.842529296875, -4.6834716796875, -4.5244140625, -4.3653564453125, -4.206298828125, -4.0472412109375, -3.88818359375, -3.7291259765625, -3.570068359375, -3.4110107421875, -3.251953125, -3.0928955078125, -2.933837890625, -2.7747802734375, -2.61572265625, -2.4566650390625, -2.297607421875, -2.1385498046875, -1.9794921875, -1.8204345703125, -1.661376953125, -1.5023193359375, -1.34326171875, -1.1842041015625, -1.025146484375, -0.8660888671875, -0.70703125, -0.5479736328125, -0.388916015625, -0.2298583984375, -0.07080078125, 0.0882568359375, 0.247314453125, 0.4063720703125, 0.5654296875, 0.7244873046875, 0.883544921875, 1.0426025390625, 1.20166015625, 1.3607177734375, 1.519775390625, 1.6788330078125, 1.837890625, 1.9969482421875, 2.156005859375, 2.3150634765625, 2.47412109375, 2.6331787109375, 2.792236328125, 2.9512939453125, 3.1103515625, 3.2694091796875, 3.428466796875, 3.5875244140625, 3.74658203125, 3.9056396484375, 4.064697265625, 4.2237548828125, 4.3828125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 3.0, 10.0, 11.0, 6.0, 9.0, 11.0, 11.0, 15.0, 29.0, 36.0, 45.0, 35.0, 42.0, 48.0, 60.0, 62.0, 79.0, 63.0, 54.0, 62.0, 60.0, 42.0, 41.0, 28.0, 16.0, 24.0, 20.0, 20.0, 7.0, 15.0, 6.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.38671875, -1.346282958984375, -1.30584716796875, -1.265411376953125, -1.2249755859375, -1.184539794921875, -1.14410400390625, -1.103668212890625, -1.063232421875, -1.022796630859375, -0.98236083984375, -0.941925048828125, -0.9014892578125, -0.861053466796875, -0.82061767578125, -0.780181884765625, -0.73974609375, -0.699310302734375, -0.65887451171875, -0.618438720703125, -0.5780029296875, -0.537567138671875, -0.49713134765625, -0.456695556640625, -0.416259765625, -0.375823974609375, -0.33538818359375, -0.294952392578125, -0.2545166015625, -0.214080810546875, -0.17364501953125, -0.133209228515625, -0.0927734375, -0.052337646484375, -0.01190185546875, 0.028533935546875, 0.0689697265625, 0.109405517578125, 0.14984130859375, 0.190277099609375, 0.230712890625, 0.271148681640625, 0.31158447265625, 0.352020263671875, 0.3924560546875, 0.432891845703125, 0.47332763671875, 0.513763427734375, 0.55419921875, 0.594635009765625, 0.63507080078125, 0.675506591796875, 0.7159423828125, 0.756378173828125, 0.79681396484375, 0.837249755859375, 0.877685546875, 0.918121337890625, 0.95855712890625, 0.998992919921875, 1.0394287109375, 1.079864501953125, 1.12030029296875, 1.160736083984375, 1.201171875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 5.0, 1.0, 5.0, 5.0, 11.0, 9.0, 7.0, 11.0, 15.0, 17.0, 24.0, 22.0, 34.0, 42.0, 47.0, 45.0, 37.0, 62.0, 72.0, 60.0, 46.0, 55.0, 43.0, 42.0, 42.0, 36.0, 30.0, 20.0, 40.0, 22.0, 10.0, 10.0, 15.0, 16.0, 9.0, 8.0, 3.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.03448486328125, -4.875150203704834, -4.715815544128418, -4.55648136138916, -4.397146701812744, -4.237812042236328, -4.078477382659912, -3.919142723083496, -3.759808301925659, -3.600473642349243, -3.4411392211914062, -3.2818045616149902, -3.122469902038574, -2.9631354808807373, -2.8038008213043213, -2.6444664001464844, -2.4851317405700684, -2.3257970809936523, -2.1664626598358154, -2.0071280002593994, -1.847793459892273, -1.6884589195251465, -1.5291242599487305, -1.369789719581604, -1.2104551792144775, -1.051120638847351, -0.8917860388755798, -0.7324514389038086, -0.5731168985366821, -0.41378235816955566, -0.2544477581977844, -0.09511315822601318, 0.06422138214111328, 0.22355595231056213, 0.382890522480011, 0.5422251224517822, 0.7015596628189087, 0.8608942031860352, 1.0202288627624512, 1.1795634031295776, 1.338897943496704, 1.4982324838638306, 1.657567024230957, 1.816901683807373, 1.9762362241744995, 2.135570764541626, 2.294905424118042, 2.454239845275879, 2.613574504852295, 2.772909164428711, 2.932243585586548, 3.091578245162964, 3.250912666320801, 3.410247325897217, 3.569581985473633, 3.728916645050049, 3.8882510662078857, 4.047585487365723, 4.206920146942139, 4.366254806518555, 4.525589466094971, 4.684924125671387, 4.8442583084106445, 5.0035929679870605, 5.162927627563477]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 9.0, 13.0, 14.0, 16.0, 20.0, 20.0, 35.0, 33.0, 32.0, 39.0, 44.0, 31.0, 40.0, 39.0, 33.0, 47.0, 44.0, 37.0, 50.0, 49.0, 41.0, 32.0, 42.0, 40.0, 39.0, 29.0, 22.0, 17.0, 15.0, 20.0, 11.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.929340362548828, -5.738770961761475, -5.548201084136963, -5.357631683349609, -5.167062282562256, -4.976492881774902, -4.785923004150391, -4.595353603363037, -4.404784202575684, -4.21421480178833, -4.023644924163818, -3.833075523376465, -3.6425061225891113, -3.4519364833831787, -3.261366844177246, -3.0707974433898926, -2.880227565765381, -2.6896579265594482, -2.4990885257720947, -2.308518886566162, -2.1179494857788086, -1.927379846572876, -1.7368102073669434, -1.5462406873703003, -1.3556711673736572, -1.1651016473770142, -0.9745320677757263, -0.7839624881744385, -0.5933929681777954, -0.40282344818115234, -0.21225380897521973, -0.02168428897857666, 0.1688847541809082, 0.35945430397987366, 0.5500238537788391, 0.740593433380127, 0.93116295337677, 1.121732473373413, 1.3123021125793457, 1.5028716325759888, 1.6934411525726318, 1.884010672569275, 2.074580192565918, 2.2651498317718506, 2.455719470977783, 2.6462888717651367, 2.8368585109710693, 3.027428150177002, 3.2179975509643555, 3.408567190170288, 3.5991365909576416, 3.789706230163574, 3.9802756309509277, 4.170845031738281, 4.361414909362793, 4.5519843101501465, 4.7425537109375, 4.9331231117248535, 5.123692989349365, 5.314262390136719, 5.504831790924072, 5.695401191711426, 5.8859710693359375, 6.076540470123291, 6.267110347747803]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 10.0, 21.0, 24.0, 41.0, 41.0, 82.0, 116.0, 201.0, 284.0, 478.0, 789.0, 1168.0, 2006.0, 3234.0, 5904.0, 10743.0, 19451.0, 37751.0, 75361.0, 158241.0, 348517.0, 719261.0, 1051797.0, 876378.0, 463245.0, 211989.0, 100278.0, 49468.0, 25574.0, 13357.0, 7524.0, 4327.0, 2524.0, 1455.0, 944.0, 588.0, 357.0, 249.0, 151.0, 109.0, 68.0, 51.0, 32.0, 17.0, 22.0, 17.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-5.30859375, -5.14617919921875, -4.9837646484375, -4.82135009765625, -4.658935546875, -4.49652099609375, -4.3341064453125, -4.17169189453125, -4.00927734375, -3.84686279296875, -3.6844482421875, -3.52203369140625, -3.359619140625, -3.19720458984375, -3.0347900390625, -2.87237548828125, -2.7099609375, -2.54754638671875, -2.3851318359375, -2.22271728515625, -2.060302734375, -1.89788818359375, -1.7354736328125, -1.57305908203125, -1.41064453125, -1.24822998046875, -1.0858154296875, -0.92340087890625, -0.760986328125, -0.59857177734375, -0.4361572265625, -0.27374267578125, -0.111328125, 0.05108642578125, 0.2135009765625, 0.37591552734375, 0.538330078125, 0.70074462890625, 0.8631591796875, 1.02557373046875, 1.18798828125, 1.35040283203125, 1.5128173828125, 1.67523193359375, 1.837646484375, 2.00006103515625, 2.1624755859375, 2.32489013671875, 2.4873046875, 2.64971923828125, 2.8121337890625, 2.97454833984375, 3.136962890625, 3.29937744140625, 3.4617919921875, 3.62420654296875, 3.78662109375, 3.94903564453125, 4.1114501953125, 4.27386474609375, 4.436279296875, 4.59869384765625, 4.7611083984375, 4.92352294921875, 5.0859375]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 14.0, 17.0, 17.0, 18.0, 24.0, 18.0, 27.0, 39.0, 30.0, 28.0, 39.0, 25.0, 42.0, 41.0, 45.0, 40.0, 53.0, 47.0, 47.0, 43.0, 35.0, 38.0, 34.0, 30.0, 26.0, 36.0, 28.0, 27.0, 17.0, 8.0, 10.0, 9.0, 3.0, 6.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.275390625, -3.153289794921875, -3.03118896484375, -2.909088134765625, -2.7869873046875, -2.664886474609375, -2.54278564453125, -2.420684814453125, -2.298583984375, -2.176483154296875, -2.05438232421875, -1.932281494140625, -1.8101806640625, -1.688079833984375, -1.56597900390625, -1.443878173828125, -1.32177734375, -1.199676513671875, -1.07757568359375, -0.955474853515625, -0.8333740234375, -0.711273193359375, -0.58917236328125, -0.467071533203125, -0.344970703125, -0.222869873046875, -0.10076904296875, 0.021331787109375, 0.1434326171875, 0.265533447265625, 0.38763427734375, 0.509735107421875, 0.6318359375, 0.753936767578125, 0.87603759765625, 0.998138427734375, 1.1202392578125, 1.242340087890625, 1.36444091796875, 1.486541748046875, 1.608642578125, 1.730743408203125, 1.85284423828125, 1.974945068359375, 2.0970458984375, 2.219146728515625, 2.34124755859375, 2.463348388671875, 2.58544921875, 2.707550048828125, 2.82965087890625, 2.951751708984375, 3.0738525390625, 3.195953369140625, 3.31805419921875, 3.440155029296875, 3.562255859375, 3.684356689453125, 3.80645751953125, 3.928558349609375, 4.0506591796875, 4.172760009765625, 4.29486083984375, 4.416961669921875, 4.5390625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 8.0, 21.0, 30.0, 32.0, 66.0, 104.0, 138.0, 220.0, 315.0, 552.0, 947.0, 1406.0, 2253.0, 3637.0, 5947.0, 9990.0, 16953.0, 29437.0, 52027.0, 95323.0, 175390.0, 326459.0, 577620.0, 852951.0, 828420.0, 543543.0, 303535.0, 162962.0, 87997.0, 48459.0, 27739.0, 15861.0, 9379.0, 5537.0, 3382.0, 2073.0, 1287.0, 822.0, 509.0, 332.0, 220.0, 130.0, 93.0, 70.0, 36.0, 28.0, 14.0, 11.0, 2.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.35455322265625, -4.2091064453125, -4.06365966796875, -3.918212890625, -3.77276611328125, -3.6273193359375, -3.48187255859375, -3.33642578125, -3.19097900390625, -3.0455322265625, -2.90008544921875, -2.754638671875, -2.60919189453125, -2.4637451171875, -2.31829833984375, -2.1728515625, -2.02740478515625, -1.8819580078125, -1.73651123046875, -1.591064453125, -1.44561767578125, -1.3001708984375, -1.15472412109375, -1.00927734375, -0.86383056640625, -0.7183837890625, -0.57293701171875, -0.427490234375, -0.28204345703125, -0.1365966796875, 0.00885009765625, 0.154296875, 0.29974365234375, 0.4451904296875, 0.59063720703125, 0.736083984375, 0.88153076171875, 1.0269775390625, 1.17242431640625, 1.31787109375, 1.46331787109375, 1.6087646484375, 1.75421142578125, 1.899658203125, 2.04510498046875, 2.1905517578125, 2.33599853515625, 2.4814453125, 2.62689208984375, 2.7723388671875, 2.91778564453125, 3.063232421875, 3.20867919921875, 3.3541259765625, 3.49957275390625, 3.64501953125, 3.79046630859375, 3.9359130859375, 4.08135986328125, 4.226806640625, 4.37225341796875, 4.5177001953125, 4.66314697265625, 4.80859375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 16.0, 12.0, 18.0, 25.0, 28.0, 32.0, 42.0, 50.0, 59.0, 60.0, 95.0, 115.0, 135.0, 179.0, 170.0, 209.0, 220.0, 208.0, 284.0, 279.0, 213.0, 253.0, 189.0, 174.0, 163.0, 145.0, 137.0, 93.0, 84.0, 70.0, 55.0, 51.0, 42.0, 35.0, 26.0, 17.0, 18.0, 17.0, 12.0, 13.0, 3.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.630859375, -1.5804443359375, -1.530029296875, -1.4796142578125, -1.42919921875, -1.3787841796875, -1.328369140625, -1.2779541015625, -1.2275390625, -1.1771240234375, -1.126708984375, -1.0762939453125, -1.02587890625, -0.9754638671875, -0.925048828125, -0.8746337890625, -0.82421875, -0.7738037109375, -0.723388671875, -0.6729736328125, -0.62255859375, -0.5721435546875, -0.521728515625, -0.4713134765625, -0.4208984375, -0.3704833984375, -0.320068359375, -0.2696533203125, -0.21923828125, -0.1688232421875, -0.118408203125, -0.0679931640625, -0.017578125, 0.0328369140625, 0.083251953125, 0.1336669921875, 0.18408203125, 0.2344970703125, 0.284912109375, 0.3353271484375, 0.3857421875, 0.4361572265625, 0.486572265625, 0.5369873046875, 0.58740234375, 0.6378173828125, 0.688232421875, 0.7386474609375, 0.7890625, 0.8394775390625, 0.889892578125, 0.9403076171875, 0.99072265625, 1.0411376953125, 1.091552734375, 1.1419677734375, 1.1923828125, 1.2427978515625, 1.293212890625, 1.3436279296875, 1.39404296875, 1.4444580078125, 1.494873046875, 1.5452880859375, 1.595703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 22.0, 17.0, 16.0, 32.0, 29.0, 33.0, 44.0, 46.0, 43.0, 54.0, 54.0, 56.0, 56.0, 61.0, 41.0, 44.0, 48.0, 40.0, 31.0, 29.0, 27.0, 24.0, 17.0, 13.0, 13.0, 8.0, 11.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3879594802856445, -4.246031284332275, -4.104103088378906, -3.962175130844116, -3.820246934890747, -3.678318738937378, -3.536390781402588, -3.3944625854492188, -3.2525343894958496, -3.1106061935424805, -2.9686779975891113, -2.8267500400543213, -2.684821844100952, -2.542893648147583, -2.400965690612793, -2.259037494659424, -2.1171092987060547, -1.9751811027526855, -1.833253026008606, -1.6913249492645264, -1.5493967533111572, -1.407468557357788, -1.2655404806137085, -1.123612403869629, -0.9816842079162598, -0.8397560715675354, -0.697827935218811, -0.5558997988700867, -0.4139716625213623, -0.27204352617263794, -0.13011538982391357, 0.011812746524810791, 0.15374135971069336, 0.2956694960594177, 0.4375976324081421, 0.5795257687568665, 0.7214539051055908, 0.8633820414543152, 1.0053101778030396, 1.1472382545471191, 1.2891664505004883, 1.4310946464538574, 1.573022723197937, 1.7149507999420166, 1.8568789958953857, 1.9988071918487549, 2.140735149383545, 2.282663345336914, 2.424591541290283, 2.5665197372436523, 2.7084479331970215, 2.8503758907318115, 2.9923040866851807, 3.13423228263855, 3.27616024017334, 3.418088436126709, 3.560016632080078, 3.7019448280334473, 3.8438730239868164, 3.9858009815216064, 4.127729415893555, 4.269657135009766, 4.411585330963135, 4.553513526916504, 4.695441722869873]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 8.0, 3.0, 4.0, 4.0, 10.0, 7.0, 19.0, 14.0, 27.0, 17.0, 29.0, 32.0, 38.0, 32.0, 38.0, 43.0, 43.0, 39.0, 47.0, 40.0, 51.0, 47.0, 51.0, 38.0, 43.0, 35.0, 37.0, 35.0, 27.0, 25.0, 25.0, 20.0, 16.0, 13.0, 14.0, 15.0, 7.0, 2.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.613129138946533, -4.4596991539001465, -4.306269645690918, -4.152839660644531, -3.9994101524353027, -3.845980167388916, -3.6925504207611084, -3.539120674133301, -3.385690927505493, -3.2322611808776855, -3.078831434249878, -2.9254016876220703, -2.7719717025756836, -2.618542194366455, -2.4651122093200684, -2.3116824626922607, -2.158252716064453, -2.0048229694366455, -1.851393222808838, -1.6979633569717407, -1.544533610343933, -1.3911038637161255, -1.2376739978790283, -1.0842442512512207, -0.9308145046234131, -0.7773847579956055, -0.6239549517631531, -0.47052517533302307, -0.31709539890289307, -0.16366565227508545, -0.010235846042633057, 0.14319396018981934, 0.29662418365478516, 0.45005396008491516, 0.6034837365150452, 0.7569135427474976, 0.9103432893753052, 1.0637730360031128, 1.21720290184021, 1.3706326484680176, 1.5240623950958252, 1.6774921417236328, 1.8309218883514404, 1.9843517541885376, 2.1377816200256348, 2.2912111282348633, 2.44464111328125, 2.5980708599090576, 2.7515006065368652, 2.904930353164673, 3.0583600997924805, 3.211789846420288, 3.3652195930480957, 3.5186495780944824, 3.67207932472229, 3.8255090713500977, 3.9789388179779053, 4.132368564605713, 4.2857985496521, 4.439228057861328, 4.592658042907715, 4.746087551116943, 4.89951753616333, 5.052947044372559, 5.206377029418945]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 14.0, 12.0, 16.0, 30.0, 41.0, 55.0, 99.0, 144.0, 218.0, 299.0, 506.0, 823.0, 1177.0, 1984.0, 3190.0, 5086.0, 8205.0, 13608.0, 22396.0, 37473.0, 64275.0, 114339.0, 198871.0, 229550.0, 146395.0, 81896.0, 46594.0, 27638.0, 16649.0, 10221.0, 6193.0, 3832.0, 2464.0, 1560.0, 976.0, 596.0, 389.0, 237.0, 161.0, 121.0, 72.0, 53.0, 36.0, 17.0, 11.0, 13.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.97412109375, -0.9429092407226562, -0.9116973876953125, -0.8804855346679688, -0.849273681640625, -0.8180618286132812, -0.7868499755859375, -0.7556381225585938, -0.72442626953125, -0.6932144165039062, -0.6620025634765625, -0.6307907104492188, -0.599578857421875, -0.5683670043945312, -0.5371551513671875, -0.5059432983398438, -0.4747314453125, -0.44351959228515625, -0.4123077392578125, -0.38109588623046875, -0.349884033203125, -0.31867218017578125, -0.2874603271484375, -0.25624847412109375, -0.22503662109375, -0.19382476806640625, -0.1626129150390625, -0.13140106201171875, -0.100189208984375, -0.06897735595703125, -0.0377655029296875, -0.00655364990234375, 0.024658203125, 0.05587005615234375, 0.0870819091796875, 0.11829376220703125, 0.149505615234375, 0.18071746826171875, 0.2119293212890625, 0.24314117431640625, 0.27435302734375, 0.30556488037109375, 0.3367767333984375, 0.36798858642578125, 0.399200439453125, 0.43041229248046875, 0.4616241455078125, 0.49283599853515625, 0.5240478515625, 0.5552597045898438, 0.5864715576171875, 0.6176834106445312, 0.648895263671875, 0.6801071166992188, 0.7113189697265625, 0.7425308227539062, 0.77374267578125, 0.8049545288085938, 0.8361663818359375, 0.8673782348632812, 0.898590087890625, 0.9298019409179688, 0.9610137939453125, 0.9922256469726562, 1.0234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 11.0, 13.0, 14.0, 21.0, 23.0, 26.0, 32.0, 32.0, 31.0, 41.0, 43.0, 41.0, 40.0, 54.0, 45.0, 50.0, 41.0, 48.0, 35.0, 31.0, 47.0, 25.0, 32.0, 24.0, 31.0, 25.0, 27.0, 14.0, 17.0, 15.0, 8.0, 9.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.3070068359375, -4.153076171875, -3.9991455078125, -3.84521484375, -3.6912841796875, -3.537353515625, -3.3834228515625, -3.2294921875, -3.0755615234375, -2.921630859375, -2.7677001953125, -2.61376953125, -2.4598388671875, -2.305908203125, -2.1519775390625, -1.998046875, -1.8441162109375, -1.690185546875, -1.5362548828125, -1.38232421875, -1.2283935546875, -1.074462890625, -0.9205322265625, -0.7666015625, -0.6126708984375, -0.458740234375, -0.3048095703125, -0.15087890625, 0.0030517578125, 0.156982421875, 0.3109130859375, 0.46484375, 0.6187744140625, 0.772705078125, 0.9266357421875, 1.08056640625, 1.2344970703125, 1.388427734375, 1.5423583984375, 1.6962890625, 1.8502197265625, 2.004150390625, 2.1580810546875, 2.31201171875, 2.4659423828125, 2.619873046875, 2.7738037109375, 2.927734375, 3.0816650390625, 3.235595703125, 3.3895263671875, 3.54345703125, 3.6973876953125, 3.851318359375, 4.0052490234375, 4.1591796875, 4.3131103515625, 4.467041015625, 4.6209716796875, 4.77490234375, 4.9288330078125, 5.082763671875, 5.2366943359375, 5.390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 5.0, 11.0, 12.0, 20.0, 21.0, 27.0, 41.0, 57.0, 75.0, 101.0, 142.0, 199.0, 354.0, 525.0, 841.0, 1317.0, 2486.0, 4523.0, 9072.0, 21008.0, 96462.0, 834453.0, 45634.0, 15258.0, 7095.0, 3590.0, 2003.0, 1165.0, 717.0, 422.0, 286.0, 197.0, 113.0, 89.0, 60.0, 49.0, 29.0, 27.0, 26.0, 9.0, 12.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.9930419921875, -1.931396484375, -1.8697509765625, -1.80810546875, -1.7464599609375, -1.684814453125, -1.6231689453125, -1.5615234375, -1.4998779296875, -1.438232421875, -1.3765869140625, -1.31494140625, -1.2532958984375, -1.191650390625, -1.1300048828125, -1.068359375, -1.0067138671875, -0.945068359375, -0.8834228515625, -0.82177734375, -0.7601318359375, -0.698486328125, -0.6368408203125, -0.5751953125, -0.5135498046875, -0.451904296875, -0.3902587890625, -0.32861328125, -0.2669677734375, -0.205322265625, -0.1436767578125, -0.08203125, -0.0203857421875, 0.041259765625, 0.1029052734375, 0.16455078125, 0.2261962890625, 0.287841796875, 0.3494873046875, 0.4111328125, 0.4727783203125, 0.534423828125, 0.5960693359375, 0.65771484375, 0.7193603515625, 0.781005859375, 0.8426513671875, 0.904296875, 0.9659423828125, 1.027587890625, 1.0892333984375, 1.15087890625, 1.2125244140625, 1.274169921875, 1.3358154296875, 1.3974609375, 1.4591064453125, 1.520751953125, 1.5823974609375, 1.64404296875, 1.7056884765625, 1.767333984375, 1.8289794921875, 1.890625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 8.0, 9.0, 4.0, 5.0, 11.0, 15.0, 13.0, 18.0, 15.0, 21.0, 29.0, 21.0, 26.0, 28.0, 37.0, 35.0, 38.0, 30.0, 35.0, 31.0, 32.0, 36.0, 42.0, 26.0, 48.0, 29.0, 38.0, 28.0, 36.0, 26.0, 22.0, 24.0, 23.0, 21.0, 17.0, 15.0, 16.0, 16.0, 17.0, 10.0, 7.0, 2.0, 12.0, 2.0, 5.0, 6.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-2.783203125, -2.7017822265625, -2.620361328125, -2.5389404296875, -2.45751953125, -2.3760986328125, -2.294677734375, -2.2132568359375, -2.1318359375, -2.0504150390625, -1.968994140625, -1.8875732421875, -1.80615234375, -1.7247314453125, -1.643310546875, -1.5618896484375, -1.48046875, -1.3990478515625, -1.317626953125, -1.2362060546875, -1.15478515625, -1.0733642578125, -0.991943359375, -0.9105224609375, -0.8291015625, -0.7476806640625, -0.666259765625, -0.5848388671875, -0.50341796875, -0.4219970703125, -0.340576171875, -0.2591552734375, -0.177734375, -0.0963134765625, -0.014892578125, 0.0665283203125, 0.14794921875, 0.2293701171875, 0.310791015625, 0.3922119140625, 0.4736328125, 0.5550537109375, 0.636474609375, 0.7178955078125, 0.79931640625, 0.8807373046875, 0.962158203125, 1.0435791015625, 1.125, 1.2064208984375, 1.287841796875, 1.3692626953125, 1.45068359375, 1.5321044921875, 1.613525390625, 1.6949462890625, 1.7763671875, 1.8577880859375, 1.939208984375, 2.0206298828125, 2.10205078125, 2.1834716796875, 2.264892578125, 2.3463134765625, 2.427734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 14.0, 20.0, 18.0, 30.0, 50.0, 46.0, 91.0, 139.0, 166.0, 281.0, 399.0, 616.0, 930.0, 1532.0, 2360.0, 3991.0, 6751.0, 12522.0, 25831.0, 239775.0, 689487.0, 29896.0, 14107.0, 7703.0, 4362.0, 2725.0, 1654.0, 998.0, 671.0, 408.0, 292.0, 200.0, 138.0, 91.0, 66.0, 45.0, 43.0, 24.0, 9.0, 19.0, 10.0, 11.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.49609375, -0.480133056640625, -0.46417236328125, -0.448211669921875, -0.4322509765625, -0.416290283203125, -0.40032958984375, -0.384368896484375, -0.368408203125, -0.352447509765625, -0.33648681640625, -0.320526123046875, -0.3045654296875, -0.288604736328125, -0.27264404296875, -0.256683349609375, -0.24072265625, -0.224761962890625, -0.20880126953125, -0.192840576171875, -0.1768798828125, -0.160919189453125, -0.14495849609375, -0.128997802734375, -0.113037109375, -0.097076416015625, -0.08111572265625, -0.065155029296875, -0.0491943359375, -0.033233642578125, -0.01727294921875, -0.001312255859375, 0.0146484375, 0.030609130859375, 0.04656982421875, 0.062530517578125, 0.0784912109375, 0.094451904296875, 0.11041259765625, 0.126373291015625, 0.142333984375, 0.158294677734375, 0.17425537109375, 0.190216064453125, 0.2061767578125, 0.222137451171875, 0.23809814453125, 0.254058837890625, 0.27001953125, 0.285980224609375, 0.30194091796875, 0.317901611328125, 0.3338623046875, 0.349822998046875, 0.36578369140625, 0.381744384765625, 0.397705078125, 0.413665771484375, 0.42962646484375, 0.445587158203125, 0.4615478515625, 0.477508544921875, 0.49346923828125, 0.509429931640625, 0.525390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 5.0, 4.0, 16.0, 14.0, 14.0, 22.0, 20.0, 32.0, 28.0, 44.0, 40.0, 60.0, 68.0, 65.0, 62.0, 62.0, 74.0, 65.0, 56.0, 43.0, 33.0, 41.0, 25.0, 22.0, 16.0, 15.0, 9.0, 8.0, 10.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.522634506225586e-05, -3.412831574678421e-05, -3.303028643131256e-05, -3.193225711584091e-05, -3.083422780036926e-05, -2.9736198484897614e-05, -2.8638169169425964e-05, -2.7540139853954315e-05, -2.6442110538482666e-05, -2.5344081223011017e-05, -2.4246051907539368e-05, -2.314802259206772e-05, -2.204999327659607e-05, -2.095196396112442e-05, -1.985393464565277e-05, -1.8755905330181122e-05, -1.7657876014709473e-05, -1.6559846699237823e-05, -1.5461817383766174e-05, -1.4363788068294525e-05, -1.3265758752822876e-05, -1.2167729437351227e-05, -1.1069700121879578e-05, -9.971670806407928e-06, -8.87364149093628e-06, -7.77561217546463e-06, -6.677582859992981e-06, -5.579553544521332e-06, -4.481524229049683e-06, -3.3834949135780334e-06, -2.2854655981063843e-06, -1.1874362826347351e-06, -8.940696716308594e-08, 1.0086223483085632e-06, 2.1066516637802124e-06, 3.2046809792518616e-06, 4.302710294723511e-06, 5.40073961019516e-06, 6.498768925666809e-06, 7.596798241138458e-06, 8.694827556610107e-06, 9.792856872081757e-06, 1.0890886187553406e-05, 1.1988915503025055e-05, 1.3086944818496704e-05, 1.4184974133968353e-05, 1.5283003449440002e-05, 1.638103276491165e-05, 1.74790620803833e-05, 1.857709139585495e-05, 1.96751207113266e-05, 2.0773150026798248e-05, 2.1871179342269897e-05, 2.2969208657741547e-05, 2.4067237973213196e-05, 2.5165267288684845e-05, 2.6263296604156494e-05, 2.7361325919628143e-05, 2.8459355235099792e-05, 2.955738455057144e-05, 3.065541386604309e-05, 3.175344318151474e-05, 3.285147249698639e-05, 3.394950181245804e-05, 3.504753112792969e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 7.0, 12.0, 16.0, 17.0, 28.0, 50.0, 72.0, 115.0, 153.0, 265.0, 389.0, 574.0, 888.0, 1505.0, 2376.0, 3832.0, 6175.0, 10601.0, 18098.0, 33031.0, 64891.0, 132735.0, 243584.0, 247169.0, 136058.0, 65858.0, 34056.0, 18449.0, 10566.0, 6400.0, 3971.0, 2381.0, 1522.0, 948.0, 572.0, 396.0, 279.0, 187.0, 101.0, 74.0, 53.0, 34.0, 24.0, 13.0, 12.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.253173828125, -0.24573135375976562, -0.23828887939453125, -0.23084640502929688, -0.2234039306640625, -0.21596145629882812, -0.20851898193359375, -0.20107650756835938, -0.193634033203125, -0.18619155883789062, -0.17874908447265625, -0.17130661010742188, -0.1638641357421875, -0.15642166137695312, -0.14897918701171875, -0.14153671264648438, -0.13409423828125, -0.12665176391601562, -0.11920928955078125, -0.11176681518554688, -0.1043243408203125, -0.09688186645507812, -0.08943939208984375, -0.08199691772460938, -0.074554443359375, -0.06711196899414062, -0.05966949462890625, -0.052227020263671875, -0.0447845458984375, -0.037342071533203125, -0.02989959716796875, -0.022457122802734375, -0.0150146484375, -0.007572174072265625, -0.00012969970703125, 0.007312774658203125, 0.0147552490234375, 0.022197723388671875, 0.02964019775390625, 0.037082672119140625, 0.044525146484375, 0.051967620849609375, 0.05941009521484375, 0.06685256958007812, 0.0742950439453125, 0.08173751831054688, 0.08917999267578125, 0.09662246704101562, 0.10406494140625, 0.11150741577148438, 0.11894989013671875, 0.12639236450195312, 0.1338348388671875, 0.14127731323242188, 0.14871978759765625, 0.15616226196289062, 0.163604736328125, 0.17104721069335938, 0.17848968505859375, 0.18593215942382812, 0.1933746337890625, 0.20081710815429688, 0.20825958251953125, 0.21570205688476562, 0.22314453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 2.0, 5.0, 5.0, 7.0, 4.0, 10.0, 6.0, 8.0, 14.0, 14.0, 11.0, 18.0, 17.0, 34.0, 26.0, 42.0, 54.0, 35.0, 78.0, 94.0, 54.0, 65.0, 82.0, 52.0, 64.0, 34.0, 37.0, 27.0, 18.0, 12.0, 16.0, 3.0, 10.0, 5.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06451416015625, -0.06237983703613281, -0.060245513916015625, -0.05811119079589844, -0.05597686767578125, -0.05384254455566406, -0.051708221435546875, -0.04957389831542969, -0.0474395751953125, -0.04530525207519531, -0.043170928955078125, -0.04103660583496094, -0.03890228271484375, -0.03676795959472656, -0.034633636474609375, -0.03249931335449219, -0.030364990234375, -0.028230667114257812, -0.026096343994140625, -0.023962020874023438, -0.02182769775390625, -0.019693374633789062, -0.017559051513671875, -0.015424728393554688, -0.0132904052734375, -0.011156082153320312, -0.009021759033203125, -0.0068874359130859375, -0.00475311279296875, -0.0026187896728515625, -0.000484466552734375, 0.0016498565673828125, 0.0037841796875, 0.0059185028076171875, 0.008052825927734375, 0.010187149047851562, 0.01232147216796875, 0.014455795288085938, 0.016590118408203125, 0.018724441528320312, 0.0208587646484375, 0.022993087768554688, 0.025127410888671875, 0.027261734008789062, 0.02939605712890625, 0.03153038024902344, 0.033664703369140625, 0.03579902648925781, 0.037933349609375, 0.04006767272949219, 0.042201995849609375, 0.04433631896972656, 0.04647064208984375, 0.04860496520996094, 0.050739288330078125, 0.05287361145019531, 0.0550079345703125, 0.05714225769042969, 0.059276580810546875, 0.06141090393066406, 0.06354522705078125, 0.06567955017089844, 0.06781387329101562, 0.06994819641113281, 0.07208251953125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 4.0, 8.0, 6.0, 15.0, 20.0, 16.0, 17.0, 24.0, 28.0, 23.0, 42.0, 51.0, 45.0, 49.0, 56.0, 50.0, 66.0, 63.0, 50.0, 50.0, 48.0, 42.0, 33.0, 31.0, 31.0, 23.0, 16.0, 18.0, 15.0, 13.0, 9.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.650997161865234, -4.503167152404785, -4.355337142944336, -4.207507133483887, -4.0596771240234375, -3.9118471145629883, -3.764017343521118, -3.616187334060669, -3.4683573246002197, -3.3205273151397705, -3.1726973056793213, -3.024867296218872, -2.877037525177002, -2.7292075157165527, -2.5813775062561035, -2.4335474967956543, -2.285717487335205, -2.137887477874756, -1.9900574684143066, -1.842227578163147, -1.6943975687026978, -1.5465675592422485, -1.3987376689910889, -1.2509076595306396, -1.1030776500701904, -0.9552476406097412, -0.8074176907539368, -0.6595877408981323, -0.5117577314376831, -0.3639277219772339, -0.21609777212142944, -0.068267822265625, 0.07956171035766602, 0.22739169001579285, 0.3752216696739197, 0.5230516195297241, 0.6708816289901733, 0.8187116384506226, 0.966541588306427, 1.1143715381622314, 1.2622015476226807, 1.4100315570831299, 1.557861566543579, 1.7056914567947388, 1.853521466255188, 2.0013513565063477, 2.149181365966797, 2.297011375427246, 2.4448413848876953, 2.5926713943481445, 2.7405014038085938, 2.888331413269043, 3.036161422729492, 3.1839914321899414, 3.3318212032318115, 3.4796512126922607, 3.62748122215271, 3.775311231613159, 3.9231412410736084, 4.0709710121154785, 4.218801021575928, 4.366631031036377, 4.514461040496826, 4.662291049957275, 4.810121059417725]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 4.0, 3.0, 5.0, 11.0, 7.0, 17.0, 15.0, 26.0, 19.0, 25.0, 36.0, 36.0, 32.0, 43.0, 37.0, 45.0, 41.0, 47.0, 34.0, 54.0, 49.0, 50.0, 37.0, 46.0, 33.0, 34.0, 37.0, 28.0, 24.0, 25.0, 21.0, 18.0, 13.0, 13.0, 12.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5604777336120605, -4.408585071563721, -4.256692409515381, -4.104799270629883, -3.952906608581543, -3.801013946533203, -3.6491212844848633, -3.4972286224365234, -3.3453357219696045, -3.1934430599212646, -3.0415501594543457, -2.889657497406006, -2.737764835357666, -2.585871934890747, -2.4339792728424072, -2.2820863723754883, -2.1301937103271484, -1.978300929069519, -1.8264081478118896, -1.6745154857635498, -1.5226227045059204, -1.370729923248291, -1.2188372611999512, -1.0669444799423218, -0.9150516986846924, -0.763158917427063, -0.6112661957740784, -0.45937344431877136, -0.30748069286346436, -0.15558791160583496, -0.003695189952850342, 0.14819753170013428, 0.30009031295776367, 0.4519830644130707, 0.6038758158683777, 0.7557685375213623, 0.9076613187789917, 1.059554100036621, 1.211446762084961, 1.3633395433425903, 1.5152323246002197, 1.6671251058578491, 1.8190178871154785, 1.9709105491638184, 2.122803211212158, 2.274696111679077, 2.426588773727417, 2.578481674194336, 2.730374336242676, 2.8822669982910156, 3.0341598987579346, 3.1860525608062744, 3.3379454612731934, 3.489838123321533, 3.641730785369873, 3.793623447418213, 3.945516347885132, 4.097409248352051, 4.249301910400391, 4.4011945724487305, 4.55308723449707, 4.70497989654541, 4.856873035430908, 5.008765697479248, 5.160658359527588]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 7.0, 16.0, 31.0, 37.0, 61.0, 83.0, 143.0, 220.0, 350.0, 517.0, 915.0, 1425.0, 2264.0, 3506.0, 5834.0, 9748.0, 16038.0, 26385.0, 42806.0, 67352.0, 98925.0, 132972.0, 152158.0, 144648.0, 117352.0, 83135.0, 54537.0, 34108.0, 20838.0, 12308.0, 7697.0, 4670.0, 2722.0, 1746.0, 1093.0, 697.0, 419.0, 269.0, 184.0, 117.0, 78.0, 47.0, 42.0, 27.0, 13.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.157562255859375, -3.05145263671875, -2.945343017578125, -2.8392333984375, -2.733123779296875, -2.62701416015625, -2.520904541015625, -2.414794921875, -2.308685302734375, -2.20257568359375, -2.096466064453125, -1.9903564453125, -1.884246826171875, -1.77813720703125, -1.672027587890625, -1.56591796875, -1.459808349609375, -1.35369873046875, -1.247589111328125, -1.1414794921875, -1.035369873046875, -0.92926025390625, -0.823150634765625, -0.717041015625, -0.610931396484375, -0.50482177734375, -0.398712158203125, -0.2926025390625, -0.186492919921875, -0.08038330078125, 0.025726318359375, 0.1318359375, 0.237945556640625, 0.34405517578125, 0.450164794921875, 0.5562744140625, 0.662384033203125, 0.76849365234375, 0.874603271484375, 0.980712890625, 1.086822509765625, 1.19293212890625, 1.299041748046875, 1.4051513671875, 1.511260986328125, 1.61737060546875, 1.723480224609375, 1.82958984375, 1.935699462890625, 2.04180908203125, 2.147918701171875, 2.2540283203125, 2.360137939453125, 2.46624755859375, 2.572357177734375, 2.678466796875, 2.784576416015625, 2.89068603515625, 2.996795654296875, 3.1029052734375, 3.209014892578125, 3.31512451171875, 3.421234130859375, 3.52734375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 6.0, 15.0, 19.0, 21.0, 22.0, 25.0, 38.0, 32.0, 42.0, 40.0, 43.0, 48.0, 51.0, 44.0, 63.0, 59.0, 45.0, 39.0, 41.0, 36.0, 33.0, 35.0, 33.0, 35.0, 23.0, 20.0, 14.0, 12.0, 12.0, 7.0, 11.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.05987548828125, -4.8931884765625, -4.72650146484375, -4.559814453125, -4.39312744140625, -4.2264404296875, -4.05975341796875, -3.89306640625, -3.72637939453125, -3.5596923828125, -3.39300537109375, -3.226318359375, -3.05963134765625, -2.8929443359375, -2.72625732421875, -2.5595703125, -2.39288330078125, -2.2261962890625, -2.05950927734375, -1.892822265625, -1.72613525390625, -1.5594482421875, -1.39276123046875, -1.22607421875, -1.05938720703125, -0.8927001953125, -0.72601318359375, -0.559326171875, -0.39263916015625, -0.2259521484375, -0.05926513671875, 0.107421875, 0.27410888671875, 0.4407958984375, 0.60748291015625, 0.774169921875, 0.94085693359375, 1.1075439453125, 1.27423095703125, 1.44091796875, 1.60760498046875, 1.7742919921875, 1.94097900390625, 2.107666015625, 2.27435302734375, 2.4410400390625, 2.60772705078125, 2.7744140625, 2.94110107421875, 3.1077880859375, 3.27447509765625, 3.441162109375, 3.60784912109375, 3.7745361328125, 3.94122314453125, 4.10791015625, 4.27459716796875, 4.4412841796875, 4.60797119140625, 4.774658203125, 4.94134521484375, 5.1080322265625, 5.27471923828125, 5.44140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 15.0, 14.0, 24.0, 36.0, 49.0, 77.0, 143.0, 211.0, 362.0, 530.0, 956.0, 1526.0, 2468.0, 4352.0, 7592.0, 12887.0, 22606.0, 38692.0, 64015.0, 100705.0, 139782.0, 165317.0, 156828.0, 122383.0, 82795.0, 51511.0, 30274.0, 17703.0, 10173.0, 5957.0, 3477.0, 1948.0, 1209.0, 707.0, 423.0, 300.0, 188.0, 110.0, 80.0, 49.0, 22.0, 20.0, 10.0, 12.0, 9.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.552734375, -3.4443359375, -3.3359375, -3.2275390625, -3.119140625, -3.0107421875, -2.90234375, -2.7939453125, -2.685546875, -2.5771484375, -2.46875, -2.3603515625, -2.251953125, -2.1435546875, -2.03515625, -1.9267578125, -1.818359375, -1.7099609375, -1.6015625, -1.4931640625, -1.384765625, -1.2763671875, -1.16796875, -1.0595703125, -0.951171875, -0.8427734375, -0.734375, -0.6259765625, -0.517578125, -0.4091796875, -0.30078125, -0.1923828125, -0.083984375, 0.0244140625, 0.1328125, 0.2412109375, 0.349609375, 0.4580078125, 0.56640625, 0.6748046875, 0.783203125, 0.8916015625, 1.0, 1.1083984375, 1.216796875, 1.3251953125, 1.43359375, 1.5419921875, 1.650390625, 1.7587890625, 1.8671875, 1.9755859375, 2.083984375, 2.1923828125, 2.30078125, 2.4091796875, 2.517578125, 2.6259765625, 2.734375, 2.8427734375, 2.951171875, 3.0595703125, 3.16796875, 3.2763671875, 3.384765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 5.0, 5.0, 2.0, 15.0, 9.0, 10.0, 20.0, 20.0, 21.0, 23.0, 24.0, 35.0, 33.0, 34.0, 46.0, 23.0, 40.0, 29.0, 46.0, 32.0, 32.0, 33.0, 38.0, 31.0, 24.0, 30.0, 28.0, 39.0, 36.0, 35.0, 16.0, 20.0, 21.0, 20.0, 18.0, 20.0, 7.0, 11.0, 11.0, 7.0, 8.0, 2.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.33984375, -2.263916015625, -2.18798828125, -2.112060546875, -2.0361328125, -1.960205078125, -1.88427734375, -1.808349609375, -1.732421875, -1.656494140625, -1.58056640625, -1.504638671875, -1.4287109375, -1.352783203125, -1.27685546875, -1.200927734375, -1.125, -1.049072265625, -0.97314453125, -0.897216796875, -0.8212890625, -0.745361328125, -0.66943359375, -0.593505859375, -0.517578125, -0.441650390625, -0.36572265625, -0.289794921875, -0.2138671875, -0.137939453125, -0.06201171875, 0.013916015625, 0.08984375, 0.165771484375, 0.24169921875, 0.317626953125, 0.3935546875, 0.469482421875, 0.54541015625, 0.621337890625, 0.697265625, 0.773193359375, 0.84912109375, 0.925048828125, 1.0009765625, 1.076904296875, 1.15283203125, 1.228759765625, 1.3046875, 1.380615234375, 1.45654296875, 1.532470703125, 1.6083984375, 1.684326171875, 1.76025390625, 1.836181640625, 1.912109375, 1.988037109375, 2.06396484375, 2.139892578125, 2.2158203125, 2.291748046875, 2.36767578125, 2.443603515625, 2.51953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 14.0, 21.0, 28.0, 37.0, 52.0, 90.0, 129.0, 214.0, 359.0, 549.0, 869.0, 1566.0, 2329.0, 4053.0, 6729.0, 11796.0, 21134.0, 37254.0, 66320.0, 112334.0, 167187.0, 194875.0, 163849.0, 108750.0, 63877.0, 36208.0, 20008.0, 11364.0, 6648.0, 3852.0, 2305.0, 1332.0, 887.0, 553.0, 321.0, 199.0, 154.0, 95.0, 65.0, 48.0, 23.0, 19.0, 16.0, 10.0, 7.0, 8.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0], "bins": [-2.443359375, -2.36810302734375, -2.2928466796875, -2.21759033203125, -2.142333984375, -2.06707763671875, -1.9918212890625, -1.91656494140625, -1.84130859375, -1.76605224609375, -1.6907958984375, -1.61553955078125, -1.540283203125, -1.46502685546875, -1.3897705078125, -1.31451416015625, -1.2392578125, -1.16400146484375, -1.0887451171875, -1.01348876953125, -0.938232421875, -0.86297607421875, -0.7877197265625, -0.71246337890625, -0.63720703125, -0.56195068359375, -0.4866943359375, -0.41143798828125, -0.336181640625, -0.26092529296875, -0.1856689453125, -0.11041259765625, -0.03515625, 0.04010009765625, 0.1153564453125, 0.19061279296875, 0.265869140625, 0.34112548828125, 0.4163818359375, 0.49163818359375, 0.56689453125, 0.64215087890625, 0.7174072265625, 0.79266357421875, 0.867919921875, 0.94317626953125, 1.0184326171875, 1.09368896484375, 1.1689453125, 1.24420166015625, 1.3194580078125, 1.39471435546875, 1.469970703125, 1.54522705078125, 1.6204833984375, 1.69573974609375, 1.77099609375, 1.84625244140625, 1.9215087890625, 1.99676513671875, 2.072021484375, 2.14727783203125, 2.2225341796875, 2.29779052734375, 2.373046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 8.0, 9.0, 10.0, 9.0, 18.0, 28.0, 26.0, 42.0, 33.0, 55.0, 54.0, 52.0, 50.0, 62.0, 63.0, 54.0, 68.0, 43.0, 50.0, 48.0, 35.0, 23.0, 19.0, 30.0, 25.0, 13.0, 13.0, 10.0, 6.0, 12.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021529197692871094, -0.00020779669284820557, -0.0002003014087677002, -0.00019280612468719482, -0.00018531084060668945, -0.00017781555652618408, -0.0001703202724456787, -0.00016282498836517334, -0.00015532970428466797, -0.0001478344202041626, -0.00014033913612365723, -0.00013284385204315186, -0.00012534856796264648, -0.00011785328388214111, -0.00011035799980163574, -0.00010286271572113037, -9.5367431640625e-05, -8.787214756011963e-05, -8.037686347961426e-05, -7.288157939910889e-05, -6.538629531860352e-05, -5.7891011238098145e-05, -5.0395727157592773e-05, -4.29004430770874e-05, -3.540515899658203e-05, -2.790987491607666e-05, -2.041459083557129e-05, -1.2919306755065918e-05, -5.424022674560547e-06, 2.0712614059448242e-06, 9.566545486450195e-06, 1.7061829566955566e-05, 2.4557113647460938e-05, 3.205239772796631e-05, 3.954768180847168e-05, 4.704296588897705e-05, 5.453824996948242e-05, 6.203353404998779e-05, 6.952881813049316e-05, 7.702410221099854e-05, 8.45193862915039e-05, 9.201467037200928e-05, 9.950995445251465e-05, 0.00010700523853302002, 0.00011450052261352539, 0.00012199580669403076, 0.00012949109077453613, 0.0001369863748550415, 0.00014448165893554688, 0.00015197694301605225, 0.00015947222709655762, 0.000166967511177063, 0.00017446279525756836, 0.00018195807933807373, 0.0001894533634185791, 0.00019694864749908447, 0.00020444393157958984, 0.00021193921566009521, 0.00021943449974060059, 0.00022692978382110596, 0.00023442506790161133, 0.0002419203519821167, 0.00024941563606262207, 0.00025691092014312744, 0.0002644062042236328]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 17.0, 25.0, 29.0, 34.0, 74.0, 89.0, 132.0, 195.0, 261.0, 402.0, 624.0, 918.0, 1488.0, 2286.0, 3739.0, 6053.0, 9992.0, 17060.0, 29657.0, 51853.0, 87546.0, 137002.0, 180073.0, 177689.0, 134213.0, 85797.0, 49884.0, 29056.0, 16862.0, 9540.0, 5882.0, 3568.0, 2233.0, 1468.0, 930.0, 585.0, 399.0, 270.0, 178.0, 129.0, 89.0, 59.0, 46.0, 31.0, 23.0, 14.0, 13.0, 10.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.328125, -2.25531005859375, -2.1824951171875, -2.10968017578125, -2.036865234375, -1.96405029296875, -1.8912353515625, -1.81842041015625, -1.74560546875, -1.67279052734375, -1.5999755859375, -1.52716064453125, -1.454345703125, -1.38153076171875, -1.3087158203125, -1.23590087890625, -1.1630859375, -1.09027099609375, -1.0174560546875, -0.94464111328125, -0.871826171875, -0.79901123046875, -0.7261962890625, -0.65338134765625, -0.58056640625, -0.50775146484375, -0.4349365234375, -0.36212158203125, -0.289306640625, -0.21649169921875, -0.1436767578125, -0.07086181640625, 0.001953125, 0.07476806640625, 0.1475830078125, 0.22039794921875, 0.293212890625, 0.36602783203125, 0.4388427734375, 0.51165771484375, 0.58447265625, 0.65728759765625, 0.7301025390625, 0.80291748046875, 0.875732421875, 0.94854736328125, 1.0213623046875, 1.09417724609375, 1.1669921875, 1.23980712890625, 1.3126220703125, 1.38543701171875, 1.458251953125, 1.53106689453125, 1.6038818359375, 1.67669677734375, 1.74951171875, 1.82232666015625, 1.8951416015625, 1.96795654296875, 2.040771484375, 2.11358642578125, 2.1864013671875, 2.25921630859375, 2.33203125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 6.0, 6.0, 7.0, 6.0, 11.0, 14.0, 13.0, 13.0, 29.0, 19.0, 36.0, 23.0, 41.0, 48.0, 46.0, 47.0, 51.0, 50.0, 48.0, 45.0, 44.0, 60.0, 40.0, 41.0, 36.0, 33.0, 30.0, 30.0, 13.0, 18.0, 19.0, 19.0, 8.0, 7.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6279296875, -0.606201171875, -0.58447265625, -0.562744140625, -0.541015625, -0.519287109375, -0.49755859375, -0.475830078125, -0.4541015625, -0.432373046875, -0.41064453125, -0.388916015625, -0.3671875, -0.345458984375, -0.32373046875, -0.302001953125, -0.2802734375, -0.258544921875, -0.23681640625, -0.215087890625, -0.193359375, -0.171630859375, -0.14990234375, -0.128173828125, -0.1064453125, -0.084716796875, -0.06298828125, -0.041259765625, -0.01953125, 0.002197265625, 0.02392578125, 0.045654296875, 0.0673828125, 0.089111328125, 0.11083984375, 0.132568359375, 0.154296875, 0.176025390625, 0.19775390625, 0.219482421875, 0.2412109375, 0.262939453125, 0.28466796875, 0.306396484375, 0.328125, 0.349853515625, 0.37158203125, 0.393310546875, 0.4150390625, 0.436767578125, 0.45849609375, 0.480224609375, 0.501953125, 0.523681640625, 0.54541015625, 0.567138671875, 0.5888671875, 0.610595703125, 0.63232421875, 0.654052734375, 0.67578125, 0.697509765625, 0.71923828125, 0.740966796875, 0.7626953125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 8.0, 19.0, 5.0, 16.0, 24.0, 25.0, 23.0, 30.0, 28.0, 37.0, 34.0, 54.0, 49.0, 56.0, 60.0, 59.0, 52.0, 57.0, 50.0, 42.0, 46.0, 42.0, 28.0, 27.0, 17.0, 13.0, 12.0, 16.0, 12.0, 8.0, 8.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.62278413772583, -4.477611541748047, -4.3324384689331055, -4.187265872955322, -4.042093276977539, -3.8969204425811768, -3.7517476081848145, -3.6065750122070312, -3.461402177810669, -3.3162293434143066, -3.1710567474365234, -3.025883913040161, -2.880711078643799, -2.7355384826660156, -2.5903656482696533, -2.445192813873291, -2.300020217895508, -2.1548473834991455, -2.0096747875213623, -1.864501953125, -1.7193292379379272, -1.5741565227508545, -1.4289836883544922, -1.2838109731674194, -1.1386382579803467, -0.9934655427932739, -0.8482927680015564, -0.7031199932098389, -0.5579472780227661, -0.41277456283569336, -0.26760178804397583, -0.1224290132522583, 0.02274322509765625, 0.1679159700870514, 0.31308871507644653, 0.4582614600658417, 0.6034342050552368, 0.7486069202423096, 0.8937796950340271, 1.0389524698257446, 1.1841251850128174, 1.3292979001998901, 1.474470615386963, 1.6196434497833252, 1.764816164970398, 1.9099888801574707, 2.055161714553833, 2.2003345489501953, 2.3455071449279785, 2.490679979324341, 2.635852575302124, 2.7810254096984863, 2.9261980056762695, 3.071370840072632, 3.216543674468994, 3.3617162704467773, 3.5068891048431396, 3.652061939239502, 3.797234535217285, 3.9424073696136475, 4.08758020401001, 4.232752799987793, 4.377925395965576, 4.523098468780518, 4.668271064758301]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 10.0, 6.0, 5.0, 10.0, 4.0, 10.0, 8.0, 20.0, 18.0, 18.0, 17.0, 29.0, 30.0, 30.0, 28.0, 33.0, 36.0, 31.0, 52.0, 47.0, 44.0, 36.0, 38.0, 34.0, 43.0, 45.0, 49.0, 44.0, 30.0, 31.0, 26.0, 24.0, 21.0, 12.0, 23.0, 14.0, 8.0, 11.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.436288833618164, -4.295776844024658, -4.155264854431152, -4.0147528648376465, -3.8742411136627197, -3.733729124069214, -3.593217134475708, -3.452705144882202, -3.3121933937072754, -3.1716814041137695, -3.0311694145202637, -2.890657424926758, -2.750145673751831, -2.609633684158325, -2.4691216945648193, -2.3286097049713135, -2.1880977153778076, -2.0475857257843018, -1.9070738554000854, -1.7665618658065796, -1.6260499954223633, -1.4855380058288574, -1.3450260162353516, -1.2045140266418457, -1.0640021562576294, -0.9234902262687683, -0.7829782962799072, -0.6424663066864014, -0.5019543766975403, -0.3614424467086792, -0.22093045711517334, -0.08041852712631226, 0.06009340286254883, 0.2006053477525711, 0.3411172926425934, 0.48162925243377686, 0.6221411824226379, 0.762653112411499, 0.9031651020050049, 1.0436770915985107, 1.184188961982727, 1.324700951576233, 1.4652128219604492, 1.605724811553955, 1.746236801147461, 1.8867486715316772, 2.0272607803344727, 2.1677725315093994, 2.3082845211029053, 2.448796510696411, 2.589308500289917, 2.7298202514648438, 2.8703322410583496, 3.0108442306518555, 3.1513562202453613, 3.291868209838867, 3.432380199432373, 3.572892189025879, 3.7134041786193848, 3.8539161682128906, 3.9944279193878174, 4.134940147399902, 4.27545166015625, 4.415963649749756, 4.556475639343262]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 13.0, 17.0, 16.0, 23.0, 34.0, 35.0, 59.0, 97.0, 97.0, 172.0, 276.0, 362.0, 626.0, 906.0, 1376.0, 2305.0, 3566.0, 6194.0, 10581.0, 19192.0, 36073.0, 70033.0, 142788.0, 308416.0, 649365.0, 1036560.0, 935023.0, 508756.0, 231103.0, 108813.0, 54278.0, 28962.0, 15667.0, 8942.0, 5265.0, 3067.0, 1959.0, 1171.0, 749.0, 444.0, 294.0, 200.0, 122.0, 86.0, 68.0, 27.0, 33.0, 22.0, 14.0, 16.0, 4.0, 3.0, 4.0, 4.0, 3.0], "bins": [-4.91015625, -4.7691650390625, -4.628173828125, -4.4871826171875, -4.34619140625, -4.2052001953125, -4.064208984375, -3.9232177734375, -3.7822265625, -3.6412353515625, -3.500244140625, -3.3592529296875, -3.21826171875, -3.0772705078125, -2.936279296875, -2.7952880859375, -2.654296875, -2.5133056640625, -2.372314453125, -2.2313232421875, -2.09033203125, -1.9493408203125, -1.808349609375, -1.6673583984375, -1.5263671875, -1.3853759765625, -1.244384765625, -1.1033935546875, -0.96240234375, -0.8214111328125, -0.680419921875, -0.5394287109375, -0.3984375, -0.2574462890625, -0.116455078125, 0.0245361328125, 0.16552734375, 0.3065185546875, 0.447509765625, 0.5885009765625, 0.7294921875, 0.8704833984375, 1.011474609375, 1.1524658203125, 1.29345703125, 1.4344482421875, 1.575439453125, 1.7164306640625, 1.857421875, 1.9984130859375, 2.139404296875, 2.2803955078125, 2.42138671875, 2.5623779296875, 2.703369140625, 2.8443603515625, 2.9853515625, 3.1263427734375, 3.267333984375, 3.4083251953125, 3.54931640625, 3.6903076171875, 3.831298828125, 3.9722900390625, 4.11328125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 12.0, 16.0, 18.0, 14.0, 20.0, 24.0, 37.0, 21.0, 33.0, 26.0, 41.0, 29.0, 45.0, 36.0, 48.0, 43.0, 34.0, 43.0, 50.0, 37.0, 39.0, 29.0, 36.0, 32.0, 36.0, 15.0, 21.0, 23.0, 21.0, 13.0, 20.0, 12.0, 10.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.900390625, -2.80963134765625, -2.7188720703125, -2.62811279296875, -2.537353515625, -2.44659423828125, -2.3558349609375, -2.26507568359375, -2.17431640625, -2.08355712890625, -1.9927978515625, -1.90203857421875, -1.811279296875, -1.72052001953125, -1.6297607421875, -1.53900146484375, -1.4482421875, -1.35748291015625, -1.2667236328125, -1.17596435546875, -1.085205078125, -0.99444580078125, -0.9036865234375, -0.81292724609375, -0.72216796875, -0.63140869140625, -0.5406494140625, -0.44989013671875, -0.359130859375, -0.26837158203125, -0.1776123046875, -0.08685302734375, 0.00390625, 0.09466552734375, 0.1854248046875, 0.27618408203125, 0.366943359375, 0.45770263671875, 0.5484619140625, 0.63922119140625, 0.72998046875, 0.82073974609375, 0.9114990234375, 1.00225830078125, 1.093017578125, 1.18377685546875, 1.2745361328125, 1.36529541015625, 1.4560546875, 1.54681396484375, 1.6375732421875, 1.72833251953125, 1.819091796875, 1.90985107421875, 2.0006103515625, 2.09136962890625, 2.18212890625, 2.27288818359375, 2.3636474609375, 2.45440673828125, 2.545166015625, 2.63592529296875, 2.7266845703125, 2.81744384765625, 2.908203125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 13.0, 15.0, 18.0, 31.0, 38.0, 60.0, 107.0, 142.0, 216.0, 355.0, 527.0, 825.0, 1352.0, 2203.0, 3662.0, 6057.0, 10577.0, 18454.0, 32916.0, 60866.0, 116394.0, 230098.0, 449685.0, 798183.0, 983465.0, 698195.0, 375836.0, 190721.0, 97123.0, 50759.0, 27680.0, 15450.0, 8953.0, 5234.0, 3049.0, 1822.0, 1157.0, 771.0, 442.0, 308.0, 186.0, 110.0, 71.0, 58.0, 35.0, 20.0, 20.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-4.890625, -4.748291015625, -4.60595703125, -4.463623046875, -4.3212890625, -4.178955078125, -4.03662109375, -3.894287109375, -3.751953125, -3.609619140625, -3.46728515625, -3.324951171875, -3.1826171875, -3.040283203125, -2.89794921875, -2.755615234375, -2.61328125, -2.470947265625, -2.32861328125, -2.186279296875, -2.0439453125, -1.901611328125, -1.75927734375, -1.616943359375, -1.474609375, -1.332275390625, -1.18994140625, -1.047607421875, -0.9052734375, -0.762939453125, -0.62060546875, -0.478271484375, -0.3359375, -0.193603515625, -0.05126953125, 0.091064453125, 0.2333984375, 0.375732421875, 0.51806640625, 0.660400390625, 0.802734375, 0.945068359375, 1.08740234375, 1.229736328125, 1.3720703125, 1.514404296875, 1.65673828125, 1.799072265625, 1.94140625, 2.083740234375, 2.22607421875, 2.368408203125, 2.5107421875, 2.653076171875, 2.79541015625, 2.937744140625, 3.080078125, 3.222412109375, 3.36474609375, 3.507080078125, 3.6494140625, 3.791748046875, 3.93408203125, 4.076416015625, 4.21875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 15.0, 18.0, 33.0, 31.0, 38.0, 48.0, 66.0, 79.0, 85.0, 136.0, 153.0, 171.0, 189.0, 253.0, 283.0, 311.0, 311.0, 250.0, 259.0, 206.0, 207.0, 171.0, 132.0, 131.0, 102.0, 87.0, 45.0, 64.0, 47.0, 34.0, 22.0, 19.0, 20.0, 16.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7607421875, -1.711456298828125, -1.66217041015625, -1.612884521484375, -1.5635986328125, -1.514312744140625, -1.46502685546875, -1.415740966796875, -1.366455078125, -1.317169189453125, -1.26788330078125, -1.218597412109375, -1.1693115234375, -1.120025634765625, -1.07073974609375, -1.021453857421875, -0.97216796875, -0.922882080078125, -0.87359619140625, -0.824310302734375, -0.7750244140625, -0.725738525390625, -0.67645263671875, -0.627166748046875, -0.577880859375, -0.528594970703125, -0.47930908203125, -0.430023193359375, -0.3807373046875, -0.331451416015625, -0.28216552734375, -0.232879638671875, -0.18359375, -0.134307861328125, -0.08502197265625, -0.035736083984375, 0.0135498046875, 0.062835693359375, 0.11212158203125, 0.161407470703125, 0.210693359375, 0.259979248046875, 0.30926513671875, 0.358551025390625, 0.4078369140625, 0.457122802734375, 0.50640869140625, 0.555694580078125, 0.60498046875, 0.654266357421875, 0.70355224609375, 0.752838134765625, 0.8021240234375, 0.851409912109375, 0.90069580078125, 0.949981689453125, 0.999267578125, 1.048553466796875, 1.09783935546875, 1.147125244140625, 1.1964111328125, 1.245697021484375, 1.29498291015625, 1.344268798828125, 1.3935546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 9.0, 11.0, 17.0, 15.0, 17.0, 16.0, 31.0, 34.0, 46.0, 44.0, 58.0, 58.0, 73.0, 69.0, 69.0, 70.0, 65.0, 50.0, 45.0, 36.0, 41.0, 23.0, 21.0, 9.0, 12.0, 15.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6409735679626465, -4.479150772094727, -4.317328453063965, -4.155505657196045, -3.993682861328125, -3.831860303878784, -3.6700377464294434, -3.5082149505615234, -3.3463921546936035, -3.1845695972442627, -3.0227468013763428, -2.860924243927002, -2.699101448059082, -2.537278890609741, -2.3754563331604004, -2.2136335372924805, -2.0518109798431396, -1.8899883031845093, -1.728165626525879, -1.566343069076538, -1.4045202732086182, -1.2426977157592773, -1.080875039100647, -0.9190523624420166, -0.7572296857833862, -0.5954070091247559, -0.4335843622684479, -0.2717617154121399, -0.10993903875350952, 0.05188363790512085, 0.21370625495910645, 0.3755289316177368, 0.5373516082763672, 0.6991742849349976, 0.8609969615936279, 1.0228195190429688, 1.1846423149108887, 1.3464648723602295, 1.5082875490188599, 1.6701102256774902, 1.8319329023361206, 1.993755578994751, 2.155578136444092, 2.3174009323120117, 2.4792234897613525, 2.6410462856292725, 2.8028688430786133, 2.964691638946533, 3.126514196395874, 3.288336753845215, 3.4501595497131348, 3.6119821071624756, 3.7738049030303955, 3.9356274604797363, 4.097450256347656, 4.259272575378418, 4.421095371246338, 4.582918167114258, 4.7447404861450195, 4.9065632820129395, 5.068386077880859, 5.230208873748779, 5.392031192779541, 5.553853988647461, 5.715676784515381]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 5.0, 10.0, 9.0, 12.0, 27.0, 22.0, 15.0, 15.0, 32.0, 41.0, 37.0, 38.0, 40.0, 46.0, 48.0, 49.0, 48.0, 40.0, 46.0, 46.0, 48.0, 46.0, 26.0, 28.0, 37.0, 31.0, 20.0, 22.0, 25.0, 19.0, 13.0, 14.0, 5.0, 5.0, 7.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.124532222747803, -3.994530200958252, -3.864528179168701, -3.7345261573791504, -3.6045241355895996, -3.474522113800049, -3.344520330429077, -3.2145183086395264, -3.0845162868499756, -2.954514265060425, -2.824512243270874, -2.6945102214813232, -2.5645084381103516, -2.434506416320801, -2.30450439453125, -2.174502372741699, -2.0445003509521484, -1.9144983291625977, -1.7844963073730469, -1.6544944047927856, -1.5244923830032349, -1.394490361213684, -1.2644884586334229, -1.134486436843872, -1.0044844150543213, -0.8744823932647705, -0.7444804310798645, -0.6144784688949585, -0.4844764471054077, -0.35447442531585693, -0.22447246313095093, -0.09447050094604492, 0.035531044006347656, 0.16553303599357605, 0.29553502798080444, 0.42553701996803284, 0.5555390119552612, 0.685541033744812, 0.815542995929718, 0.945544958114624, 1.0755469799041748, 1.2055490016937256, 1.3355510234832764, 1.4655529260635376, 1.5955549478530884, 1.7255569696426392, 1.8555588722229004, 1.9855608940124512, 2.115562915802002, 2.2455649375915527, 2.3755669593811035, 2.5055689811706543, 2.635571002960205, 2.765573024749756, 2.8955748081207275, 3.0255768299102783, 3.155578851699829, 3.28558087348938, 3.4155828952789307, 3.5455849170684814, 3.675586700439453, 3.805588722229004, 3.9355907440185547, 4.0655927658081055, 4.195594787597656]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 11.0, 25.0, 19.0, 35.0, 51.0, 66.0, 82.0, 117.0, 183.0, 251.0, 347.0, 423.0, 688.0, 949.0, 1385.0, 1965.0, 2956.0, 4411.0, 6537.0, 10010.0, 15489.0, 25015.0, 40474.0, 66490.0, 110043.0, 171175.0, 199124.0, 148767.0, 91829.0, 55319.0, 33828.0, 20852.0, 13203.0, 8575.0, 5729.0, 3785.0, 2515.0, 1771.0, 1218.0, 806.0, 614.0, 415.0, 255.0, 211.0, 157.0, 112.0, 88.0, 52.0, 39.0, 26.0, 19.0, 11.0, 11.0, 4.0, 5.0, 4.0, 4.0, 3.0], "bins": [-0.56982421875, -0.5521926879882812, -0.5345611572265625, -0.5169296264648438, -0.499298095703125, -0.48166656494140625, -0.4640350341796875, -0.44640350341796875, -0.42877197265625, -0.41114044189453125, -0.3935089111328125, -0.37587738037109375, -0.358245849609375, -0.34061431884765625, -0.3229827880859375, -0.30535125732421875, -0.2877197265625, -0.27008819580078125, -0.2524566650390625, -0.23482513427734375, -0.217193603515625, -0.19956207275390625, -0.1819305419921875, -0.16429901123046875, -0.14666748046875, -0.12903594970703125, -0.1114044189453125, -0.09377288818359375, -0.076141357421875, -0.05850982666015625, -0.0408782958984375, -0.02324676513671875, -0.005615234375, 0.01201629638671875, 0.0296478271484375, 0.04727935791015625, 0.064910888671875, 0.08254241943359375, 0.1001739501953125, 0.11780548095703125, 0.13543701171875, 0.15306854248046875, 0.1707000732421875, 0.18833160400390625, 0.205963134765625, 0.22359466552734375, 0.2412261962890625, 0.25885772705078125, 0.2764892578125, 0.29412078857421875, 0.3117523193359375, 0.32938385009765625, 0.347015380859375, 0.36464691162109375, 0.3822784423828125, 0.39990997314453125, 0.41754150390625, 0.43517303466796875, 0.4528045654296875, 0.47043609619140625, 0.488067626953125, 0.5056991577148438, 0.5233306884765625, 0.5409622192382812, 0.55859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 11.0, 13.0, 11.0, 13.0, 20.0, 16.0, 20.0, 25.0, 29.0, 34.0, 33.0, 47.0, 43.0, 37.0, 34.0, 44.0, 53.0, 47.0, 42.0, 40.0, 50.0, 38.0, 30.0, 28.0, 28.0, 31.0, 33.0, 21.0, 22.0, 16.0, 16.0, 16.0, 4.0, 6.0, 10.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.390625, -4.26104736328125, -4.1314697265625, -4.00189208984375, -3.872314453125, -3.74273681640625, -3.6131591796875, -3.48358154296875, -3.35400390625, -3.22442626953125, -3.0948486328125, -2.96527099609375, -2.835693359375, -2.70611572265625, -2.5765380859375, -2.44696044921875, -2.3173828125, -2.18780517578125, -2.0582275390625, -1.92864990234375, -1.799072265625, -1.66949462890625, -1.5399169921875, -1.41033935546875, -1.28076171875, -1.15118408203125, -1.0216064453125, -0.89202880859375, -0.762451171875, -0.63287353515625, -0.5032958984375, -0.37371826171875, -0.244140625, -0.11456298828125, 0.0150146484375, 0.14459228515625, 0.274169921875, 0.40374755859375, 0.5333251953125, 0.66290283203125, 0.79248046875, 0.92205810546875, 1.0516357421875, 1.18121337890625, 1.310791015625, 1.44036865234375, 1.5699462890625, 1.69952392578125, 1.8291015625, 1.95867919921875, 2.0882568359375, 2.21783447265625, 2.347412109375, 2.47698974609375, 2.6065673828125, 2.73614501953125, 2.86572265625, 2.99530029296875, 3.1248779296875, 3.25445556640625, 3.384033203125, 3.51361083984375, 3.6431884765625, 3.77276611328125, 3.90234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 10.0, 12.0, 8.0, 8.0, 33.0, 38.0, 81.0, 76.0, 142.0, 171.0, 353.0, 529.0, 901.0, 1660.0, 3173.0, 6395.0, 14765.0, 47387.0, 848985.0, 87991.0, 19356.0, 7966.0, 3851.0, 1899.0, 1085.0, 639.0, 379.0, 197.0, 126.0, 108.0, 60.0, 44.0, 40.0, 20.0, 22.0, 14.0, 9.0, 8.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.556854248046875, -1.50433349609375, -1.451812744140625, -1.3992919921875, -1.346771240234375, -1.29425048828125, -1.241729736328125, -1.189208984375, -1.136688232421875, -1.08416748046875, -1.031646728515625, -0.9791259765625, -0.926605224609375, -0.87408447265625, -0.821563720703125, -0.76904296875, -0.716522216796875, -0.66400146484375, -0.611480712890625, -0.5589599609375, -0.506439208984375, -0.45391845703125, -0.401397705078125, -0.348876953125, -0.296356201171875, -0.24383544921875, -0.191314697265625, -0.1387939453125, -0.086273193359375, -0.03375244140625, 0.018768310546875, 0.0712890625, 0.123809814453125, 0.17633056640625, 0.228851318359375, 0.2813720703125, 0.333892822265625, 0.38641357421875, 0.438934326171875, 0.491455078125, 0.543975830078125, 0.59649658203125, 0.649017333984375, 0.7015380859375, 0.754058837890625, 0.80657958984375, 0.859100341796875, 0.91162109375, 0.964141845703125, 1.01666259765625, 1.069183349609375, 1.1217041015625, 1.174224853515625, 1.22674560546875, 1.279266357421875, 1.331787109375, 1.384307861328125, 1.43682861328125, 1.489349365234375, 1.5418701171875, 1.594390869140625, 1.64691162109375, 1.699432373046875, 1.751953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 9.0, 7.0, 13.0, 15.0, 18.0, 19.0, 23.0, 20.0, 22.0, 24.0, 39.0, 38.0, 34.0, 30.0, 52.0, 32.0, 35.0, 38.0, 33.0, 42.0, 33.0, 44.0, 39.0, 30.0, 32.0, 33.0, 28.0, 23.0, 22.0, 31.0, 18.0, 21.0, 18.0, 10.0, 9.0, 17.0, 8.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.136627197265625, -2.06036376953125, -1.984100341796875, -1.9078369140625, -1.831573486328125, -1.75531005859375, -1.679046630859375, -1.602783203125, -1.526519775390625, -1.45025634765625, -1.373992919921875, -1.2977294921875, -1.221466064453125, -1.14520263671875, -1.068939208984375, -0.99267578125, -0.916412353515625, -0.84014892578125, -0.763885498046875, -0.6876220703125, -0.611358642578125, -0.53509521484375, -0.458831787109375, -0.382568359375, -0.306304931640625, -0.23004150390625, -0.153778076171875, -0.0775146484375, -0.001251220703125, 0.07501220703125, 0.151275634765625, 0.2275390625, 0.303802490234375, 0.38006591796875, 0.456329345703125, 0.5325927734375, 0.608856201171875, 0.68511962890625, 0.761383056640625, 0.837646484375, 0.913909912109375, 0.99017333984375, 1.066436767578125, 1.1427001953125, 1.218963623046875, 1.29522705078125, 1.371490478515625, 1.44775390625, 1.524017333984375, 1.60028076171875, 1.676544189453125, 1.7528076171875, 1.829071044921875, 1.90533447265625, 1.981597900390625, 2.057861328125, 2.134124755859375, 2.21038818359375, 2.286651611328125, 2.3629150390625, 2.439178466796875, 2.51544189453125, 2.591705322265625, 2.66796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 9.0, 15.0, 25.0, 17.0, 33.0, 47.0, 51.0, 88.0, 110.0, 178.0, 242.0, 336.0, 542.0, 803.0, 1272.0, 1918.0, 3123.0, 5080.0, 8787.0, 15442.0, 31680.0, 767926.0, 153628.0, 24711.0, 12955.0, 7453.0, 4264.0, 2635.0, 1752.0, 1130.0, 709.0, 501.0, 309.0, 229.0, 158.0, 124.0, 70.0, 57.0, 37.0, 30.0, 18.0, 15.0, 15.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.28173828125, -0.27260589599609375, -0.2634735107421875, -0.25434112548828125, -0.245208740234375, -0.23607635498046875, -0.2269439697265625, -0.21781158447265625, -0.20867919921875, -0.19954681396484375, -0.1904144287109375, -0.18128204345703125, -0.172149658203125, -0.16301727294921875, -0.1538848876953125, -0.14475250244140625, -0.1356201171875, -0.12648773193359375, -0.1173553466796875, -0.10822296142578125, -0.099090576171875, -0.08995819091796875, -0.0808258056640625, -0.07169342041015625, -0.06256103515625, -0.05342864990234375, -0.0442962646484375, -0.03516387939453125, -0.026031494140625, -0.01689910888671875, -0.0077667236328125, 0.00136566162109375, 0.010498046875, 0.01963043212890625, 0.0287628173828125, 0.03789520263671875, 0.047027587890625, 0.05615997314453125, 0.0652923583984375, 0.07442474365234375, 0.08355712890625, 0.09268951416015625, 0.1018218994140625, 0.11095428466796875, 0.120086669921875, 0.12921905517578125, 0.1383514404296875, 0.14748382568359375, 0.1566162109375, 0.16574859619140625, 0.1748809814453125, 0.18401336669921875, 0.193145751953125, 0.20227813720703125, 0.2114105224609375, 0.22054290771484375, 0.22967529296875, 0.23880767822265625, 0.2479400634765625, 0.25707244873046875, 0.266204833984375, 0.27533721923828125, 0.2844696044921875, 0.29360198974609375, 0.302734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 7.0, 12.0, 20.0, 13.0, 22.0, 14.0, 22.0, 19.0, 26.0, 40.0, 27.0, 39.0, 52.0, 42.0, 35.0, 44.0, 51.0, 54.0, 54.0, 48.0, 42.0, 39.0, 27.0, 36.0, 34.0, 24.0, 21.0, 26.0, 19.0, 12.0, 12.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4960765838623047e-05, -1.4374032616615295e-05, -1.3787299394607544e-05, -1.3200566172599792e-05, -1.2613832950592041e-05, -1.202709972858429e-05, -1.1440366506576538e-05, -1.0853633284568787e-05, -1.0266900062561035e-05, -9.680166840553284e-06, -9.093433618545532e-06, -8.50670039653778e-06, -7.91996717453003e-06, -7.333233952522278e-06, -6.746500730514526e-06, -6.159767508506775e-06, -5.5730342864990234e-06, -4.986301064491272e-06, -4.3995678424835205e-06, -3.812834620475769e-06, -3.2261013984680176e-06, -2.639368176460266e-06, -2.0526349544525146e-06, -1.4659017324447632e-06, -8.791685104370117e-07, -2.9243528842926025e-07, 2.942979335784912e-07, 8.810311555862427e-07, 1.4677643775939941e-06, 2.0544975996017456e-06, 2.641230821609497e-06, 3.2279640436172485e-06, 3.814697265625e-06, 4.4014304876327515e-06, 4.988163709640503e-06, 5.574896931648254e-06, 6.161630153656006e-06, 6.748363375663757e-06, 7.335096597671509e-06, 7.92182981967926e-06, 8.508563041687012e-06, 9.095296263694763e-06, 9.682029485702515e-06, 1.0268762707710266e-05, 1.0855495929718018e-05, 1.1442229151725769e-05, 1.202896237373352e-05, 1.2615695595741272e-05, 1.3202428817749023e-05, 1.3789162039756775e-05, 1.4375895261764526e-05, 1.4962628483772278e-05, 1.554936170578003e-05, 1.613609492778778e-05, 1.6722828149795532e-05, 1.7309561371803284e-05, 1.7896294593811035e-05, 1.8483027815818787e-05, 1.9069761037826538e-05, 1.965649425983429e-05, 2.024322748184204e-05, 2.0829960703849792e-05, 2.1416693925857544e-05, 2.2003427147865295e-05, 2.2590160369873047e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 8.0, 12.0, 16.0, 29.0, 38.0, 45.0, 65.0, 83.0, 87.0, 171.0, 257.0, 392.0, 643.0, 998.0, 1807.0, 3264.0, 6018.0, 11587.0, 23527.0, 49211.0, 106267.0, 219268.0, 287063.0, 177467.0, 82346.0, 38489.0, 18572.0, 9217.0, 4936.0, 2659.0, 1499.0, 863.0, 519.0, 340.0, 210.0, 165.0, 134.0, 62.0, 64.0, 32.0, 24.0, 19.0, 25.0, 11.0, 6.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.15887069702148438, -0.15380096435546875, -0.14873123168945312, -0.1436614990234375, -0.13859176635742188, -0.13352203369140625, -0.12845230102539062, -0.123382568359375, -0.11831283569335938, -0.11324310302734375, -0.10817337036132812, -0.1031036376953125, -0.09803390502929688, -0.09296417236328125, -0.08789443969726562, -0.08282470703125, -0.07775497436523438, -0.07268524169921875, -0.06761550903320312, -0.0625457763671875, -0.057476043701171875, -0.05240631103515625, -0.047336578369140625, -0.042266845703125, -0.037197113037109375, -0.03212738037109375, -0.027057647705078125, -0.0219879150390625, -0.016918182373046875, -0.01184844970703125, -0.006778717041015625, -0.001708984375, 0.003360748291015625, 0.00843048095703125, 0.013500213623046875, 0.0185699462890625, 0.023639678955078125, 0.02870941162109375, 0.033779144287109375, 0.038848876953125, 0.043918609619140625, 0.04898834228515625, 0.054058074951171875, 0.0591278076171875, 0.06419754028320312, 0.06926727294921875, 0.07433700561523438, 0.07940673828125, 0.08447647094726562, 0.08954620361328125, 0.09461593627929688, 0.0996856689453125, 0.10475540161132812, 0.10982513427734375, 0.11489486694335938, 0.119964599609375, 0.12503433227539062, 0.13010406494140625, 0.13517379760742188, 0.1402435302734375, 0.14531326293945312, 0.15038299560546875, 0.15545272827148438, 0.1605224609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 14.0, 16.0, 25.0, 21.0, 35.0, 58.0, 74.0, 93.0, 103.0, 96.0, 79.0, 81.0, 70.0, 37.0, 38.0, 34.0, 26.0, 16.0, 9.0, 7.0, 9.0, 10.0, 5.0, 2.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06365966796875, -0.061743736267089844, -0.05982780456542969, -0.05791187286376953, -0.055995941162109375, -0.05408000946044922, -0.05216407775878906, -0.050248146057128906, -0.04833221435546875, -0.046416282653808594, -0.04450035095214844, -0.04258441925048828, -0.040668487548828125, -0.03875255584716797, -0.03683662414550781, -0.034920692443847656, -0.0330047607421875, -0.031088829040527344, -0.029172897338867188, -0.02725696563720703, -0.025341033935546875, -0.02342510223388672, -0.021509170532226562, -0.019593238830566406, -0.01767730712890625, -0.015761375427246094, -0.013845443725585938, -0.011929512023925781, -0.010013580322265625, -0.008097648620605469, -0.0061817169189453125, -0.004265785217285156, -0.002349853515625, -0.00043392181396484375, 0.0014820098876953125, 0.0033979415893554688, 0.005313873291015625, 0.007229804992675781, 0.009145736694335938, 0.011061668395996094, 0.01297760009765625, 0.014893531799316406, 0.016809463500976562, 0.01872539520263672, 0.020641326904296875, 0.02255725860595703, 0.024473190307617188, 0.026389122009277344, 0.0283050537109375, 0.030220985412597656, 0.03213691711425781, 0.03405284881591797, 0.035968780517578125, 0.03788471221923828, 0.03980064392089844, 0.041716575622558594, 0.04363250732421875, 0.045548439025878906, 0.04746437072753906, 0.04938030242919922, 0.051296234130859375, 0.05321216583251953, 0.05512809753417969, 0.057044029235839844, 0.0589599609375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 9.0, 5.0, 7.0, 10.0, 19.0, 15.0, 17.0, 14.0, 27.0, 31.0, 44.0, 45.0, 50.0, 61.0, 68.0, 63.0, 77.0, 61.0, 67.0, 69.0, 32.0, 41.0, 33.0, 35.0, 26.0, 11.0, 12.0, 13.0, 12.0, 9.0, 1.0, 6.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.431341171264648, -4.272763252258301, -4.114185810089111, -3.9556081295013428, -3.797030448913574, -3.6384525299072266, -3.479874849319458, -3.3212971687316895, -3.162719488143921, -3.0041418075561523, -2.845564126968384, -2.6869864463806152, -2.5284085273742676, -2.369831085205078, -2.2112531661987305, -2.052675485610962, -1.8940978050231934, -1.7355201244354248, -1.5769424438476562, -1.4183646440505981, -1.2597869634628296, -1.101209282875061, -0.9426315426826477, -0.7840538024902344, -0.6254761219024658, -0.4668984115123749, -0.30832070112228394, -0.149742990732193, 0.00883471965789795, 0.1674124002456665, 0.32599014043807983, 0.48456788063049316, 0.6431460380554199, 0.8017237186431885, 0.9603014588356018, 1.1188791990280151, 1.2774568796157837, 1.4360345602035522, 1.5946123600006104, 1.753190040588379, 1.9117677211761475, 2.070345401763916, 2.2289230823516846, 2.387500762939453, 2.546078681945801, 2.7046561241149902, 2.863234043121338, 3.0218117237091064, 3.180389404296875, 3.3389670848846436, 3.497544765472412, 3.6561224460601807, 3.814700126647949, 3.973278045654297, 4.131855487823486, 4.290433406829834, 4.449010848999023, 4.607588768005371, 4.7661662101745605, 4.924744129180908, 5.083321571350098, 5.241899490356445, 5.400476932525635, 5.559054851531982, 5.71763277053833]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 5.0, 10.0, 10.0, 12.0, 25.0, 23.0, 16.0, 14.0, 33.0, 44.0, 34.0, 44.0, 35.0, 47.0, 50.0, 47.0, 47.0, 38.0, 46.0, 47.0, 52.0, 41.0, 29.0, 32.0, 33.0, 30.0, 23.0, 18.0, 28.0, 18.0, 14.0, 10.0, 5.0, 5.0, 8.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.104467391967773, -3.9746875762939453, -3.844907760620117, -3.715127944946289, -3.585348129272461, -3.455568313598633, -3.3257882595062256, -3.1960084438323975, -3.0662286281585693, -2.936448812484741, -2.806668996810913, -2.676889181137085, -2.5471091270446777, -2.4173293113708496, -2.2875494956970215, -2.1577696800231934, -2.0279898643493652, -1.898210048675537, -1.768430233001709, -1.6386502981185913, -1.5088704824447632, -1.379090666770935, -1.2493107318878174, -1.1195309162139893, -0.9897511005401611, -0.859971284866333, -0.7301914095878601, -0.6004115343093872, -0.4706317186355591, -0.34085190296173096, -0.21107202768325806, -0.08129215240478516, 0.048487186431884766, 0.17826703190803528, 0.3080468773841858, 0.4378267228603363, 0.5676065683364868, 0.6973863840103149, 0.8271662592887878, 0.9569461345672607, 1.0867259502410889, 1.216505765914917, 1.3462855815887451, 1.4760655164718628, 1.605845332145691, 1.735625147819519, 1.8654050827026367, 1.9951848983764648, 2.124964714050293, 2.254744529724121, 2.384524345397949, 2.5143041610717773, 2.6440839767456055, 2.7738637924194336, 2.903643846511841, 3.033423662185669, 3.163203477859497, 3.292983293533325, 3.4227631092071533, 3.5525429248809814, 3.6823229789733887, 3.812102794647217, 3.941882610321045, 4.071662425994873, 4.201442241668701]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 13.0, 27.0, 39.0, 48.0, 111.0, 169.0, 321.0, 594.0, 1062.0, 2006.0, 3840.0, 7515.0, 14831.0, 29882.0, 58313.0, 106094.0, 166314.0, 203366.0, 183045.0, 124605.0, 71340.0, 36758.0, 18746.0, 9374.0, 4769.0, 2430.0, 1275.0, 703.0, 424.0, 224.0, 125.0, 59.0, 45.0, 25.0, 15.0, 9.0, 9.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.198974609375, -4.06201171875, -3.925048828125, -3.7880859375, -3.651123046875, -3.51416015625, -3.377197265625, -3.240234375, -3.103271484375, -2.96630859375, -2.829345703125, -2.6923828125, -2.555419921875, -2.41845703125, -2.281494140625, -2.14453125, -2.007568359375, -1.87060546875, -1.733642578125, -1.5966796875, -1.459716796875, -1.32275390625, -1.185791015625, -1.048828125, -0.911865234375, -0.77490234375, -0.637939453125, -0.5009765625, -0.364013671875, -0.22705078125, -0.090087890625, 0.046875, 0.183837890625, 0.32080078125, 0.457763671875, 0.5947265625, 0.731689453125, 0.86865234375, 1.005615234375, 1.142578125, 1.279541015625, 1.41650390625, 1.553466796875, 1.6904296875, 1.827392578125, 1.96435546875, 2.101318359375, 2.23828125, 2.375244140625, 2.51220703125, 2.649169921875, 2.7861328125, 2.923095703125, 3.06005859375, 3.197021484375, 3.333984375, 3.470947265625, 3.60791015625, 3.744873046875, 3.8818359375, 4.018798828125, 4.15576171875, 4.292724609375, 4.4296875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 13.0, 13.0, 14.0, 20.0, 16.0, 16.0, 29.0, 31.0, 25.0, 29.0, 44.0, 38.0, 37.0, 37.0, 40.0, 54.0, 40.0, 48.0, 45.0, 48.0, 40.0, 45.0, 39.0, 43.0, 32.0, 26.0, 15.0, 17.0, 7.0, 18.0, 11.0, 14.0, 8.0, 5.0, 4.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9765625, -3.84832763671875, -3.7200927734375, -3.59185791015625, -3.463623046875, -3.33538818359375, -3.2071533203125, -3.07891845703125, -2.95068359375, -2.82244873046875, -2.6942138671875, -2.56597900390625, -2.437744140625, -2.30950927734375, -2.1812744140625, -2.05303955078125, -1.9248046875, -1.79656982421875, -1.6683349609375, -1.54010009765625, -1.411865234375, -1.28363037109375, -1.1553955078125, -1.02716064453125, -0.89892578125, -0.77069091796875, -0.6424560546875, -0.51422119140625, -0.385986328125, -0.25775146484375, -0.1295166015625, -0.00128173828125, 0.126953125, 0.25518798828125, 0.3834228515625, 0.51165771484375, 0.639892578125, 0.76812744140625, 0.8963623046875, 1.02459716796875, 1.15283203125, 1.28106689453125, 1.4093017578125, 1.53753662109375, 1.665771484375, 1.79400634765625, 1.9222412109375, 2.05047607421875, 2.1787109375, 2.30694580078125, 2.4351806640625, 2.56341552734375, 2.691650390625, 2.81988525390625, 2.9481201171875, 3.07635498046875, 3.20458984375, 3.33282470703125, 3.4610595703125, 3.58929443359375, 3.717529296875, 3.84576416015625, 3.9739990234375, 4.10223388671875, 4.23046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 14.0, 4.0, 13.0, 15.0, 25.0, 42.0, 60.0, 89.0, 139.0, 278.0, 424.0, 735.0, 1293.0, 2369.0, 4316.0, 7919.0, 14908.0, 27964.0, 50975.0, 88945.0, 141476.0, 184797.0, 184115.0, 139950.0, 88171.0, 50343.0, 27217.0, 14465.0, 7866.0, 4239.0, 2291.0, 1294.0, 754.0, 377.0, 232.0, 162.0, 100.0, 59.0, 46.0, 32.0, 17.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.3125, -4.18560791015625, -4.0587158203125, -3.93182373046875, -3.804931640625, -3.67803955078125, -3.5511474609375, -3.42425537109375, -3.29736328125, -3.17047119140625, -3.0435791015625, -2.91668701171875, -2.789794921875, -2.66290283203125, -2.5360107421875, -2.40911865234375, -2.2822265625, -2.15533447265625, -2.0284423828125, -1.90155029296875, -1.774658203125, -1.64776611328125, -1.5208740234375, -1.39398193359375, -1.26708984375, -1.14019775390625, -1.0133056640625, -0.88641357421875, -0.759521484375, -0.63262939453125, -0.5057373046875, -0.37884521484375, -0.251953125, -0.12506103515625, 0.0018310546875, 0.12872314453125, 0.255615234375, 0.38250732421875, 0.5093994140625, 0.63629150390625, 0.76318359375, 0.89007568359375, 1.0169677734375, 1.14385986328125, 1.270751953125, 1.39764404296875, 1.5245361328125, 1.65142822265625, 1.7783203125, 1.90521240234375, 2.0321044921875, 2.15899658203125, 2.285888671875, 2.41278076171875, 2.5396728515625, 2.66656494140625, 2.79345703125, 2.92034912109375, 3.0472412109375, 3.17413330078125, 3.301025390625, 3.42791748046875, 3.5548095703125, 3.68170166015625, 3.80859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 11.0, 12.0, 16.0, 13.0, 17.0, 19.0, 29.0, 24.0, 30.0, 32.0, 33.0, 41.0, 33.0, 48.0, 55.0, 56.0, 44.0, 40.0, 43.0, 42.0, 35.0, 31.0, 28.0, 35.0, 25.0, 31.0, 27.0, 22.0, 21.0, 6.0, 21.0, 7.0, 10.0, 8.0, 4.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.1575927734375, -2.080810546875, -2.0040283203125, -1.92724609375, -1.8504638671875, -1.773681640625, -1.6968994140625, -1.6201171875, -1.5433349609375, -1.466552734375, -1.3897705078125, -1.31298828125, -1.2362060546875, -1.159423828125, -1.0826416015625, -1.005859375, -0.9290771484375, -0.852294921875, -0.7755126953125, -0.69873046875, -0.6219482421875, -0.545166015625, -0.4683837890625, -0.3916015625, -0.3148193359375, -0.238037109375, -0.1612548828125, -0.08447265625, -0.0076904296875, 0.069091796875, 0.1458740234375, 0.22265625, 0.2994384765625, 0.376220703125, 0.4530029296875, 0.52978515625, 0.6065673828125, 0.683349609375, 0.7601318359375, 0.8369140625, 0.9136962890625, 0.990478515625, 1.0672607421875, 1.14404296875, 1.2208251953125, 1.297607421875, 1.3743896484375, 1.451171875, 1.5279541015625, 1.604736328125, 1.6815185546875, 1.75830078125, 1.8350830078125, 1.911865234375, 1.9886474609375, 2.0654296875, 2.1422119140625, 2.218994140625, 2.2957763671875, 2.37255859375, 2.4493408203125, 2.526123046875, 2.6029052734375, 2.6796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 6.0, 10.0, 19.0, 18.0, 40.0, 44.0, 74.0, 109.0, 134.0, 202.0, 323.0, 469.0, 731.0, 1123.0, 1733.0, 2723.0, 4219.0, 6601.0, 10396.0, 16551.0, 26063.0, 40742.0, 62680.0, 90710.0, 121396.0, 143818.0, 141938.0, 119207.0, 88102.0, 59615.0, 39626.0, 24963.0, 16318.0, 10092.0, 6386.0, 4036.0, 2600.0, 1605.0, 1075.0, 688.0, 428.0, 300.0, 201.0, 137.0, 89.0, 64.0, 62.0, 28.0, 21.0, 8.0, 12.0, 4.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.421875, -1.37738037109375, -1.3328857421875, -1.28839111328125, -1.243896484375, -1.19940185546875, -1.1549072265625, -1.11041259765625, -1.06591796875, -1.02142333984375, -0.9769287109375, -0.93243408203125, -0.887939453125, -0.84344482421875, -0.7989501953125, -0.75445556640625, -0.7099609375, -0.66546630859375, -0.6209716796875, -0.57647705078125, -0.531982421875, -0.48748779296875, -0.4429931640625, -0.39849853515625, -0.35400390625, -0.30950927734375, -0.2650146484375, -0.22052001953125, -0.176025390625, -0.13153076171875, -0.0870361328125, -0.04254150390625, 0.001953125, 0.04644775390625, 0.0909423828125, 0.13543701171875, 0.179931640625, 0.22442626953125, 0.2689208984375, 0.31341552734375, 0.35791015625, 0.40240478515625, 0.4468994140625, 0.49139404296875, 0.535888671875, 0.58038330078125, 0.6248779296875, 0.66937255859375, 0.7138671875, 0.75836181640625, 0.8028564453125, 0.84735107421875, 0.891845703125, 0.93634033203125, 0.9808349609375, 1.02532958984375, 1.06982421875, 1.11431884765625, 1.1588134765625, 1.20330810546875, 1.247802734375, 1.29229736328125, 1.3367919921875, 1.38128662109375, 1.42578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 22.0, 20.0, 23.0, 33.0, 39.0, 47.0, 42.0, 57.0, 71.0, 52.0, 61.0, 60.0, 56.0, 60.0, 54.0, 36.0, 36.0, 25.0, 32.0, 22.0, 17.0, 16.0, 15.0, 9.0, 6.0, 2.0, 7.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001773834228515625, -0.00017171725630760193, -0.00016605108976364136, -0.00016038492321968079, -0.00015471875667572021, -0.00014905259013175964, -0.00014338642358779907, -0.0001377202570438385, -0.00013205409049987793, -0.00012638792395591736, -0.00012072175741195679, -0.00011505559086799622, -0.00010938942432403564, -0.00010372325778007507, -9.80570912361145e-05, -9.239092469215393e-05, -8.672475814819336e-05, -8.105859160423279e-05, -7.539242506027222e-05, -6.972625851631165e-05, -6.406009197235107e-05, -5.83939254283905e-05, -5.272775888442993e-05, -4.706159234046936e-05, -4.139542579650879e-05, -3.572925925254822e-05, -3.0063092708587646e-05, -2.4396926164627075e-05, -1.8730759620666504e-05, -1.3064593076705933e-05, -7.398426532745361e-06, -1.73225998878479e-06, 3.933906555175781e-06, 9.600073099136353e-06, 1.5266239643096924e-05, 2.0932406187057495e-05, 2.6598572731018066e-05, 3.226473927497864e-05, 3.793090581893921e-05, 4.359707236289978e-05, 4.926323890686035e-05, 5.492940545082092e-05, 6.0595571994781494e-05, 6.626173853874207e-05, 7.192790508270264e-05, 7.759407162666321e-05, 8.326023817062378e-05, 8.892640471458435e-05, 9.459257125854492e-05, 0.00010025873780250549, 0.00010592490434646606, 0.00011159107089042664, 0.00011725723743438721, 0.00012292340397834778, 0.00012858957052230835, 0.00013425573706626892, 0.0001399219036102295, 0.00014558807015419006, 0.00015125423669815063, 0.0001569204032421112, 0.00016258656978607178, 0.00016825273633003235, 0.00017391890287399292, 0.0001795850694179535, 0.00018525123596191406]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 23.0, 26.0, 28.0, 57.0, 82.0, 132.0, 204.0, 296.0, 497.0, 764.0, 1243.0, 1963.0, 3149.0, 5061.0, 8195.0, 13557.0, 22240.0, 36454.0, 57793.0, 88343.0, 123760.0, 150267.0, 152716.0, 128470.0, 92292.0, 61159.0, 38349.0, 23870.0, 14374.0, 8817.0, 5347.0, 3349.0, 2027.0, 1337.0, 787.0, 528.0, 325.0, 220.0, 141.0, 100.0, 64.0, 52.0, 23.0, 17.0, 14.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4877777099609375, -1.441375732421875, -1.3949737548828125, -1.34857177734375, -1.3021697998046875, -1.255767822265625, -1.2093658447265625, -1.1629638671875, -1.1165618896484375, -1.070159912109375, -1.0237579345703125, -0.97735595703125, -0.9309539794921875, -0.884552001953125, -0.8381500244140625, -0.791748046875, -0.7453460693359375, -0.698944091796875, -0.6525421142578125, -0.60614013671875, -0.5597381591796875, -0.513336181640625, -0.4669342041015625, -0.4205322265625, -0.3741302490234375, -0.327728271484375, -0.2813262939453125, -0.23492431640625, -0.1885223388671875, -0.142120361328125, -0.0957183837890625, -0.04931640625, -0.0029144287109375, 0.043487548828125, 0.0898895263671875, 0.13629150390625, 0.1826934814453125, 0.229095458984375, 0.2754974365234375, 0.3218994140625, 0.3683013916015625, 0.414703369140625, 0.4611053466796875, 0.50750732421875, 0.5539093017578125, 0.600311279296875, 0.6467132568359375, 0.693115234375, 0.7395172119140625, 0.785919189453125, 0.8323211669921875, 0.87872314453125, 0.9251251220703125, 0.971527099609375, 1.0179290771484375, 1.0643310546875, 1.1107330322265625, 1.157135009765625, 1.2035369873046875, 1.24993896484375, 1.2963409423828125, 1.342742919921875, 1.3891448974609375, 1.435546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 8.0, 4.0, 10.0, 7.0, 8.0, 21.0, 12.0, 20.0, 28.0, 29.0, 36.0, 38.0, 49.0, 50.0, 49.0, 53.0, 58.0, 49.0, 45.0, 45.0, 51.0, 52.0, 49.0, 32.0, 35.0, 21.0, 22.0, 15.0, 24.0, 6.0, 15.0, 7.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.57568359375, -0.5580520629882812, -0.5404205322265625, -0.5227890014648438, -0.505157470703125, -0.48752593994140625, -0.4698944091796875, -0.45226287841796875, -0.43463134765625, -0.41699981689453125, -0.3993682861328125, -0.38173675537109375, -0.364105224609375, -0.34647369384765625, -0.3288421630859375, -0.31121063232421875, -0.2935791015625, -0.27594757080078125, -0.2583160400390625, -0.24068450927734375, -0.223052978515625, -0.20542144775390625, -0.1877899169921875, -0.17015838623046875, -0.15252685546875, -0.13489532470703125, -0.1172637939453125, -0.09963226318359375, -0.082000732421875, -0.06436920166015625, -0.0467376708984375, -0.02910614013671875, -0.011474609375, 0.00615692138671875, 0.0237884521484375, 0.04141998291015625, 0.059051513671875, 0.07668304443359375, 0.0943145751953125, 0.11194610595703125, 0.12957763671875, 0.14720916748046875, 0.1648406982421875, 0.18247222900390625, 0.200103759765625, 0.21773529052734375, 0.2353668212890625, 0.25299835205078125, 0.2706298828125, 0.28826141357421875, 0.3058929443359375, 0.32352447509765625, 0.341156005859375, 0.35878753662109375, 0.3764190673828125, 0.39405059814453125, 0.41168212890625, 0.42931365966796875, 0.4469451904296875, 0.46457672119140625, 0.482208251953125, 0.49983978271484375, 0.5174713134765625, 0.5351028442382812, 0.552734375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 6.0, 6.0, 7.0, 17.0, 22.0, 27.0, 27.0, 43.0, 47.0, 53.0, 56.0, 63.0, 54.0, 80.0, 68.0, 74.0, 62.0, 49.0, 36.0, 44.0, 35.0, 29.0, 13.0, 13.0, 22.0, 8.0, 7.0, 3.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.682610988616943, -4.518340110778809, -4.354068756103516, -4.189797878265381, -4.025526523590088, -3.861255407333374, -3.69698429107666, -3.5327134132385254, -3.3684420585632324, -3.2041709423065186, -3.0398998260498047, -2.875628709793091, -2.711357593536377, -2.547086477279663, -2.382815361022949, -2.2185444831848145, -2.0542733669281006, -1.8900022506713867, -1.7257311344146729, -1.561460018157959, -1.3971889019012451, -1.2329177856445312, -1.068646788597107, -0.9043756723403931, -0.7401045560836792, -0.5758334398269653, -0.41156235337257385, -0.24729126691818237, -0.0830201506614685, 0.08125096559524536, 0.24552202224731445, 0.4097931385040283, 0.5740642547607422, 0.738335371017456, 0.9026064872741699, 1.0668776035308838, 1.2311487197875977, 1.3954198360443115, 1.5596908330917358, 1.7239619493484497, 1.8882330656051636, 2.052504062652588, 2.2167751789093018, 2.3810462951660156, 2.5453174114227295, 2.7095885276794434, 2.8738596439361572, 3.038130760192871, 3.202401876449585, 3.366672992706299, 3.5309441089630127, 3.6952152252197266, 3.8594863414764404, 4.023757457733154, 4.188028335571289, 4.352299690246582, 4.516570568084717, 4.680841445922852, 4.8451128005981445, 5.009383678436279, 5.173655033111572, 5.337925910949707, 5.502197265625, 5.666468143463135, 5.830739498138428]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 7.0, 10.0, 17.0, 16.0, 19.0, 25.0, 28.0, 31.0, 35.0, 37.0, 50.0, 46.0, 45.0, 55.0, 48.0, 38.0, 45.0, 58.0, 48.0, 45.0, 54.0, 37.0, 32.0, 31.0, 24.0, 28.0, 26.0, 17.0, 6.0, 7.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.908332824707031, -4.764987945556641, -4.621642589569092, -4.478297233581543, -4.334952354431152, -4.191607475280762, -4.048262119293213, -3.904917001724243, -3.7615718841552734, -3.6182267665863037, -3.474881649017334, -3.3315365314483643, -3.1881914138793945, -3.044846296310425, -2.901501178741455, -2.7581560611724854, -2.6148109436035156, -2.471465826034546, -2.328120708465576, -2.1847755908966064, -2.0414304733276367, -1.898085355758667, -1.7547402381896973, -1.6113951206207275, -1.4680500030517578, -1.324704885482788, -1.1813597679138184, -1.0380146503448486, -0.8946695327758789, -0.7513244152069092, -0.6079792976379395, -0.4646341800689697, -0.3212890625, -0.17794394493103027, -0.03459882736206055, 0.10874629020690918, 0.2520914077758789, 0.39543652534484863, 0.5387816429138184, 0.6821267604827881, 0.8254718780517578, 0.9688169956207275, 1.1121621131896973, 1.255507230758667, 1.3988523483276367, 1.5421974658966064, 1.6855425834655762, 1.828887701034546, 1.9722328186035156, 2.1155779361724854, 2.258923053741455, 2.402268171310425, 2.5456132888793945, 2.6889584064483643, 2.832303524017334, 2.9756486415863037, 3.1189937591552734, 3.262338876724243, 3.405683994293213, 3.5490291118621826, 3.6923742294311523, 3.835719347000122, 3.979064464569092, 4.122409820556641, 4.265754699707031]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 13.0, 13.0, 10.0, 23.0, 32.0, 41.0, 54.0, 84.0, 109.0, 145.0, 271.0, 376.0, 600.0, 926.0, 1446.0, 2499.0, 4088.0, 6929.0, 12124.0, 22281.0, 42288.0, 85819.0, 187338.0, 433477.0, 911232.0, 1151379.0, 726460.0, 319728.0, 140733.0, 66534.0, 34056.0, 18281.0, 10062.0, 5916.0, 3422.0, 2027.0, 1276.0, 834.0, 506.0, 298.0, 179.0, 134.0, 85.0, 57.0, 37.0, 20.0, 23.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.58984375, -4.45208740234375, -4.3143310546875, -4.17657470703125, -4.038818359375, -3.90106201171875, -3.7633056640625, -3.62554931640625, -3.48779296875, -3.35003662109375, -3.2122802734375, -3.07452392578125, -2.936767578125, -2.79901123046875, -2.6612548828125, -2.52349853515625, -2.3857421875, -2.24798583984375, -2.1102294921875, -1.97247314453125, -1.834716796875, -1.69696044921875, -1.5592041015625, -1.42144775390625, -1.28369140625, -1.14593505859375, -1.0081787109375, -0.87042236328125, -0.732666015625, -0.59490966796875, -0.4571533203125, -0.31939697265625, -0.181640625, -0.04388427734375, 0.0938720703125, 0.23162841796875, 0.369384765625, 0.50714111328125, 0.6448974609375, 0.78265380859375, 0.92041015625, 1.05816650390625, 1.1959228515625, 1.33367919921875, 1.471435546875, 1.60919189453125, 1.7469482421875, 1.88470458984375, 2.0224609375, 2.16021728515625, 2.2979736328125, 2.43572998046875, 2.573486328125, 2.71124267578125, 2.8489990234375, 2.98675537109375, 3.12451171875, 3.26226806640625, 3.4000244140625, 3.53778076171875, 3.675537109375, 3.81329345703125, 3.9510498046875, 4.08880615234375, 4.2265625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 12.0, 8.0, 8.0, 11.0, 11.0, 20.0, 22.0, 25.0, 25.0, 30.0, 32.0, 31.0, 45.0, 50.0, 48.0, 48.0, 53.0, 40.0, 53.0, 48.0, 47.0, 38.0, 36.0, 41.0, 35.0, 34.0, 29.0, 28.0, 21.0, 22.0, 16.0, 8.0, 5.0, 4.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.41796875, -3.3232421875, -3.228515625, -3.1337890625, -3.0390625, -2.9443359375, -2.849609375, -2.7548828125, -2.66015625, -2.5654296875, -2.470703125, -2.3759765625, -2.28125, -2.1865234375, -2.091796875, -1.9970703125, -1.90234375, -1.8076171875, -1.712890625, -1.6181640625, -1.5234375, -1.4287109375, -1.333984375, -1.2392578125, -1.14453125, -1.0498046875, -0.955078125, -0.8603515625, -0.765625, -0.6708984375, -0.576171875, -0.4814453125, -0.38671875, -0.2919921875, -0.197265625, -0.1025390625, -0.0078125, 0.0869140625, 0.181640625, 0.2763671875, 0.37109375, 0.4658203125, 0.560546875, 0.6552734375, 0.75, 0.8447265625, 0.939453125, 1.0341796875, 1.12890625, 1.2236328125, 1.318359375, 1.4130859375, 1.5078125, 1.6025390625, 1.697265625, 1.7919921875, 1.88671875, 1.9814453125, 2.076171875, 2.1708984375, 2.265625, 2.3603515625, 2.455078125, 2.5498046875, 2.64453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 13.0, 24.0, 41.0, 68.0, 128.0, 177.0, 226.0, 429.0, 670.0, 1192.0, 1990.0, 3261.0, 6086.0, 11142.0, 21417.0, 42274.0, 88009.0, 193106.0, 434460.0, 916579.0, 1175838.0, 703373.0, 316401.0, 142712.0, 66227.0, 32104.0, 16350.0, 8527.0, 4900.0, 2674.0, 1596.0, 871.0, 497.0, 331.0, 204.0, 141.0, 91.0, 59.0, 28.0, 29.0, 8.0, 7.0, 9.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0], "bins": [-5.6328125, -5.4732666015625, -5.313720703125, -5.1541748046875, -4.99462890625, -4.8350830078125, -4.675537109375, -4.5159912109375, -4.3564453125, -4.1968994140625, -4.037353515625, -3.8778076171875, -3.71826171875, -3.5587158203125, -3.399169921875, -3.2396240234375, -3.080078125, -2.9205322265625, -2.760986328125, -2.6014404296875, -2.44189453125, -2.2823486328125, -2.122802734375, -1.9632568359375, -1.8037109375, -1.6441650390625, -1.484619140625, -1.3250732421875, -1.16552734375, -1.0059814453125, -0.846435546875, -0.6868896484375, -0.52734375, -0.3677978515625, -0.208251953125, -0.0487060546875, 0.11083984375, 0.2703857421875, 0.429931640625, 0.5894775390625, 0.7490234375, 0.9085693359375, 1.068115234375, 1.2276611328125, 1.38720703125, 1.5467529296875, 1.706298828125, 1.8658447265625, 2.025390625, 2.1849365234375, 2.344482421875, 2.5040283203125, 2.66357421875, 2.8231201171875, 2.982666015625, 3.1422119140625, 3.3017578125, 3.4613037109375, 3.620849609375, 3.7803955078125, 3.93994140625, 4.0994873046875, 4.259033203125, 4.4185791015625, 4.578125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 18.0, 13.0, 12.0, 25.0, 24.0, 49.0, 49.0, 61.0, 72.0, 96.0, 145.0, 142.0, 165.0, 209.0, 231.0, 254.0, 261.0, 267.0, 253.0, 295.0, 230.0, 258.0, 180.0, 146.0, 111.0, 91.0, 89.0, 58.0, 67.0, 35.0, 36.0, 19.0, 31.0, 17.0, 9.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.328125, -1.2847747802734375, -1.241424560546875, -1.1980743408203125, -1.15472412109375, -1.1113739013671875, -1.068023681640625, -1.0246734619140625, -0.9813232421875, -0.9379730224609375, -0.894622802734375, -0.8512725830078125, -0.80792236328125, -0.7645721435546875, -0.721221923828125, -0.6778717041015625, -0.634521484375, -0.5911712646484375, -0.547821044921875, -0.5044708251953125, -0.46112060546875, -0.4177703857421875, -0.374420166015625, -0.3310699462890625, -0.2877197265625, -0.2443695068359375, -0.201019287109375, -0.1576690673828125, -0.11431884765625, -0.0709686279296875, -0.027618408203125, 0.0157318115234375, 0.05908203125, 0.1024322509765625, 0.145782470703125, 0.1891326904296875, 0.23248291015625, 0.2758331298828125, 0.319183349609375, 0.3625335693359375, 0.4058837890625, 0.4492340087890625, 0.492584228515625, 0.5359344482421875, 0.57928466796875, 0.6226348876953125, 0.665985107421875, 0.7093353271484375, 0.752685546875, 0.7960357666015625, 0.839385986328125, 0.8827362060546875, 0.92608642578125, 0.9694366455078125, 1.012786865234375, 1.0561370849609375, 1.0994873046875, 1.1428375244140625, 1.186187744140625, 1.2295379638671875, 1.27288818359375, 1.3162384033203125, 1.359588623046875, 1.4029388427734375, 1.4462890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 1.0, 6.0, 9.0, 5.0, 7.0, 12.0, 16.0, 20.0, 42.0, 42.0, 56.0, 43.0, 67.0, 65.0, 72.0, 78.0, 74.0, 63.0, 69.0, 41.0, 43.0, 39.0, 26.0, 27.0, 15.0, 12.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32554817199707, -4.1618146896362305, -3.9980812072753906, -3.83434796333313, -3.67061448097229, -3.50688099861145, -3.3431477546691895, -3.1794142723083496, -3.0156807899475098, -2.85194730758667, -2.68821382522583, -2.5244805812835693, -2.3607470989227295, -2.1970136165618896, -2.033280372619629, -1.869546890258789, -1.7058134078979492, -1.5420799255371094, -1.378346562385559, -1.2146131992340088, -1.050879716873169, -0.8871462941169739, -0.7234128713607788, -0.5596795082092285, -0.39594602584838867, -0.2322126030921936, -0.06847918033599854, 0.09525424242019653, 0.2589876651763916, 0.42272108793258667, 0.5864545106887817, 0.750187873840332, 0.9139208793640137, 1.0776543617248535, 1.2413877248764038, 1.405121088027954, 1.568854570388794, 1.7325880527496338, 1.896321415901184, 2.0600547790527344, 2.223788261413574, 2.387521743774414, 2.551255226135254, 2.7149884700775146, 2.8787219524383545, 3.0424554347991943, 3.206188678741455, 3.369922161102295, 3.5336556434631348, 3.6973891258239746, 3.8611226081848145, 4.024856090545654, 4.188589096069336, 4.352322578430176, 4.516056060791016, 4.6797895431518555, 4.843523025512695, 5.007256507873535, 5.170989990234375, 5.334723472595215, 5.498456954956055, 5.662189960479736, 5.825923442840576, 5.989656925201416, 6.153390407562256]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 6.0, 10.0, 10.0, 8.0, 15.0, 21.0, 12.0, 26.0, 27.0, 30.0, 25.0, 29.0, 30.0, 34.0, 40.0, 61.0, 60.0, 48.0, 51.0, 46.0, 46.0, 42.0, 50.0, 20.0, 33.0, 32.0, 34.0, 28.0, 23.0, 24.0, 18.0, 9.0, 19.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.472722291946411, -3.3598921298980713, -3.2470619678497314, -3.1342320442199707, -3.021401882171631, -2.908571720123291, -2.795741558074951, -2.6829113960266113, -2.5700814723968506, -2.4572513103485107, -2.344421148300171, -2.23159122467041, -2.1187610626220703, -2.0059309005737305, -1.8931007385253906, -1.7802706956863403, -1.6674405336380005, -1.5546103715896606, -1.4417803287506104, -1.3289501667022705, -1.2161201238632202, -1.1032899618148804, -0.9904598593711853, -0.8776297569274902, -0.7647996544837952, -0.6519695520401001, -0.539139449596405, -0.4263093173503876, -0.3134792149066925, -0.20064908266067505, -0.08781898021697998, 0.025011122226715088, 0.13784122467041016, 0.2506713271141052, 0.3635014295578003, 0.47633156180381775, 0.5891616344451904, 0.7019917964935303, 0.8148218989372253, 0.9276520013809204, 1.0404820442199707, 1.1533122062683105, 1.2661422491073608, 1.3789724111557007, 1.491802453994751, 1.6046326160430908, 1.7174627780914307, 1.830292820930481, 1.9431229829788208, 2.055953025817871, 2.168783187866211, 2.281613349914551, 2.3944435119628906, 2.5072736740112305, 2.620103597640991, 2.732933759689331, 2.845763921737671, 2.9585940837860107, 3.0714242458343506, 3.1842541694641113, 3.297084331512451, 3.409914493560791, 3.522744655609131, 3.6355748176574707, 3.7484047412872314]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 16.0, 27.0, 32.0, 58.0, 73.0, 125.0, 185.0, 303.0, 435.0, 664.0, 1051.0, 1614.0, 2629.0, 4271.0, 7306.0, 12308.0, 20714.0, 37333.0, 69182.0, 128845.0, 217259.0, 227832.0, 142693.0, 76358.0, 40850.0, 22574.0, 13255.0, 7856.0, 4757.0, 2981.0, 1767.0, 1093.0, 714.0, 503.0, 276.0, 178.0, 137.0, 104.0, 72.0, 30.0, 31.0, 12.0, 13.0, 12.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.56591796875, -0.5497856140136719, -0.5336532592773438, -0.5175209045410156, -0.5013885498046875, -0.4852561950683594, -0.46912384033203125, -0.4529914855957031, -0.436859130859375, -0.4207267761230469, -0.40459442138671875, -0.3884620666503906, -0.3723297119140625, -0.3561973571777344, -0.34006500244140625, -0.3239326477050781, -0.30780029296875, -0.2916679382324219, -0.27553558349609375, -0.2594032287597656, -0.2432708740234375, -0.22713851928710938, -0.21100616455078125, -0.19487380981445312, -0.178741455078125, -0.16260910034179688, -0.14647674560546875, -0.13034439086914062, -0.1142120361328125, -0.09807968139648438, -0.08194732666015625, -0.06581497192382812, -0.0496826171875, -0.033550262451171875, -0.01741790771484375, -0.001285552978515625, 0.0148468017578125, 0.030979156494140625, 0.04711151123046875, 0.06324386596679688, 0.079376220703125, 0.09550857543945312, 0.11164093017578125, 0.12777328491210938, 0.1439056396484375, 0.16003799438476562, 0.17617034912109375, 0.19230270385742188, 0.20843505859375, 0.22456741333007812, 0.24069976806640625, 0.2568321228027344, 0.2729644775390625, 0.2890968322753906, 0.30522918701171875, 0.3213615417480469, 0.337493896484375, 0.3536262512207031, 0.36975860595703125, 0.3858909606933594, 0.4020233154296875, 0.4181556701660156, 0.43428802490234375, 0.4504203796386719, 0.466552734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 2.0, 9.0, 11.0, 14.0, 18.0, 21.0, 26.0, 29.0, 27.0, 29.0, 40.0, 36.0, 55.0, 35.0, 48.0, 60.0, 46.0, 53.0, 39.0, 49.0, 44.0, 46.0, 24.0, 32.0, 27.0, 28.0, 22.0, 31.0, 23.0, 8.0, 14.0, 12.0, 11.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.1351318359375, -4.012451171875, -3.8897705078125, -3.76708984375, -3.6444091796875, -3.521728515625, -3.3990478515625, -3.2763671875, -3.1536865234375, -3.031005859375, -2.9083251953125, -2.78564453125, -2.6629638671875, -2.540283203125, -2.4176025390625, -2.294921875, -2.1722412109375, -2.049560546875, -1.9268798828125, -1.80419921875, -1.6815185546875, -1.558837890625, -1.4361572265625, -1.3134765625, -1.1907958984375, -1.068115234375, -0.9454345703125, -0.82275390625, -0.7000732421875, -0.577392578125, -0.4547119140625, -0.33203125, -0.2093505859375, -0.086669921875, 0.0360107421875, 0.15869140625, 0.2813720703125, 0.404052734375, 0.5267333984375, 0.6494140625, 0.7720947265625, 0.894775390625, 1.0174560546875, 1.14013671875, 1.2628173828125, 1.385498046875, 1.5081787109375, 1.630859375, 1.7535400390625, 1.876220703125, 1.9989013671875, 2.12158203125, 2.2442626953125, 2.366943359375, 2.4896240234375, 2.6123046875, 2.7349853515625, 2.857666015625, 2.9803466796875, 3.10302734375, 3.2257080078125, 3.348388671875, 3.4710693359375, 3.59375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 13.0, 10.0, 16.0, 20.0, 28.0, 31.0, 57.0, 68.0, 95.0, 133.0, 200.0, 290.0, 458.0, 743.0, 1165.0, 2081.0, 3832.0, 7469.0, 16828.0, 51456.0, 813687.0, 106768.0, 22475.0, 9614.0, 4722.0, 2413.0, 1375.0, 821.0, 558.0, 361.0, 226.0, 154.0, 112.0, 69.0, 53.0, 36.0, 27.0, 18.0, 16.0, 16.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.166015625, -1.12799072265625, -1.0899658203125, -1.05194091796875, -1.013916015625, -0.97589111328125, -0.9378662109375, -0.89984130859375, -0.86181640625, -0.82379150390625, -0.7857666015625, -0.74774169921875, -0.709716796875, -0.67169189453125, -0.6336669921875, -0.59564208984375, -0.5576171875, -0.51959228515625, -0.4815673828125, -0.44354248046875, -0.405517578125, -0.36749267578125, -0.3294677734375, -0.29144287109375, -0.25341796875, -0.21539306640625, -0.1773681640625, -0.13934326171875, -0.101318359375, -0.06329345703125, -0.0252685546875, 0.01275634765625, 0.05078125, 0.08880615234375, 0.1268310546875, 0.16485595703125, 0.202880859375, 0.24090576171875, 0.2789306640625, 0.31695556640625, 0.35498046875, 0.39300537109375, 0.4310302734375, 0.46905517578125, 0.507080078125, 0.54510498046875, 0.5831298828125, 0.62115478515625, 0.6591796875, 0.69720458984375, 0.7352294921875, 0.77325439453125, 0.811279296875, 0.84930419921875, 0.8873291015625, 0.92535400390625, 0.96337890625, 1.00140380859375, 1.0394287109375, 1.07745361328125, 1.115478515625, 1.15350341796875, 1.1915283203125, 1.22955322265625, 1.267578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 14.0, 14.0, 9.0, 9.0, 20.0, 22.0, 23.0, 29.0, 25.0, 26.0, 30.0, 39.0, 39.0, 52.0, 40.0, 39.0, 37.0, 44.0, 36.0, 34.0, 42.0, 45.0, 41.0, 28.0, 38.0, 31.0, 26.0, 22.0, 22.0, 17.0, 13.0, 11.0, 12.0, 8.0, 13.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1328125, -2.062286376953125, -1.99176025390625, -1.921234130859375, -1.8507080078125, -1.780181884765625, -1.70965576171875, -1.639129638671875, -1.568603515625, -1.498077392578125, -1.42755126953125, -1.357025146484375, -1.2864990234375, -1.215972900390625, -1.14544677734375, -1.074920654296875, -1.00439453125, -0.933868408203125, -0.86334228515625, -0.792816162109375, -0.7222900390625, -0.651763916015625, -0.58123779296875, -0.510711669921875, -0.440185546875, -0.369659423828125, -0.29913330078125, -0.228607177734375, -0.1580810546875, -0.087554931640625, -0.01702880859375, 0.053497314453125, 0.1240234375, 0.194549560546875, 0.26507568359375, 0.335601806640625, 0.4061279296875, 0.476654052734375, 0.54718017578125, 0.617706298828125, 0.688232421875, 0.758758544921875, 0.82928466796875, 0.899810791015625, 0.9703369140625, 1.040863037109375, 1.11138916015625, 1.181915283203125, 1.25244140625, 1.322967529296875, 1.39349365234375, 1.464019775390625, 1.5345458984375, 1.605072021484375, 1.67559814453125, 1.746124267578125, 1.816650390625, 1.887176513671875, 1.95770263671875, 2.028228759765625, 2.0987548828125, 2.169281005859375, 2.23980712890625, 2.310333251953125, 2.380859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 11.0, 17.0, 14.0, 31.0, 48.0, 73.0, 105.0, 190.0, 312.0, 492.0, 925.0, 1602.0, 3037.0, 5779.0, 11562.0, 26057.0, 426919.0, 520002.0, 26730.0, 11889.0, 5861.0, 3064.0, 1602.0, 922.0, 525.0, 312.0, 186.0, 119.0, 47.0, 48.0, 32.0, 9.0, 9.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303466796875, -0.292633056640625, -0.28179931640625, -0.270965576171875, -0.2601318359375, -0.249298095703125, -0.23846435546875, -0.227630615234375, -0.216796875, -0.205963134765625, -0.19512939453125, -0.184295654296875, -0.1734619140625, -0.162628173828125, -0.15179443359375, -0.140960693359375, -0.130126953125, -0.119293212890625, -0.10845947265625, -0.097625732421875, -0.0867919921875, -0.075958251953125, -0.06512451171875, -0.054290771484375, -0.04345703125, -0.032623291015625, -0.02178955078125, -0.010955810546875, -0.0001220703125, 0.010711669921875, 0.02154541015625, 0.032379150390625, 0.043212890625, 0.054046630859375, 0.06488037109375, 0.075714111328125, 0.0865478515625, 0.097381591796875, 0.10821533203125, 0.119049072265625, 0.1298828125, 0.140716552734375, 0.15155029296875, 0.162384033203125, 0.1732177734375, 0.184051513671875, 0.19488525390625, 0.205718994140625, 0.216552734375, 0.227386474609375, 0.23822021484375, 0.249053955078125, 0.2598876953125, 0.270721435546875, 0.28155517578125, 0.292388916015625, 0.30322265625, 0.314056396484375, 0.32489013671875, 0.335723876953125, 0.3465576171875, 0.357391357421875, 0.36822509765625, 0.379058837890625, 0.389892578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 7.0, 7.0, 16.0, 18.0, 21.0, 23.0, 25.0, 32.0, 32.0, 40.0, 43.0, 39.0, 48.0, 42.0, 48.0, 41.0, 54.0, 50.0, 47.0, 48.0, 43.0, 32.0, 41.0, 20.0, 28.0, 26.0, 25.0, 15.0, 17.0, 14.0, 12.0, 3.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.8034130334854126e-05, -1.7352402210235596e-05, -1.6670674085617065e-05, -1.5988945960998535e-05, -1.5307217836380005e-05, -1.4625489711761475e-05, -1.3943761587142944e-05, -1.3262033462524414e-05, -1.2580305337905884e-05, -1.1898577213287354e-05, -1.1216849088668823e-05, -1.0535120964050293e-05, -9.853392839431763e-06, -9.171664714813232e-06, -8.489936590194702e-06, -7.808208465576172e-06, -7.126480340957642e-06, -6.444752216339111e-06, -5.763024091720581e-06, -5.081295967102051e-06, -4.3995678424835205e-06, -3.7178397178649902e-06, -3.03611159324646e-06, -2.3543834686279297e-06, -1.6726553440093994e-06, -9.909272193908691e-07, -3.0919909477233887e-07, 3.725290298461914e-07, 1.0542571544647217e-06, 1.735985279083252e-06, 2.4177134037017822e-06, 3.0994415283203125e-06, 3.7811696529388428e-06, 4.462897777557373e-06, 5.144625902175903e-06, 5.826354026794434e-06, 6.508082151412964e-06, 7.189810276031494e-06, 7.871538400650024e-06, 8.553266525268555e-06, 9.234994649887085e-06, 9.916722774505615e-06, 1.0598450899124146e-05, 1.1280179023742676e-05, 1.1961907148361206e-05, 1.2643635272979736e-05, 1.3325363397598267e-05, 1.4007091522216797e-05, 1.4688819646835327e-05, 1.5370547771453857e-05, 1.6052275896072388e-05, 1.6734004020690918e-05, 1.7415732145309448e-05, 1.809746026992798e-05, 1.877918839454651e-05, 1.946091651916504e-05, 2.014264464378357e-05, 2.08243727684021e-05, 2.150610089302063e-05, 2.218782901763916e-05, 2.286955714225769e-05, 2.355128526687622e-05, 2.423301339149475e-05, 2.491474151611328e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 14.0, 13.0, 16.0, 16.0, 30.0, 46.0, 63.0, 86.0, 126.0, 187.0, 284.0, 459.0, 686.0, 1148.0, 1816.0, 3154.0, 5509.0, 9919.0, 18442.0, 35376.0, 69101.0, 136310.0, 234514.0, 238400.0, 141564.0, 71480.0, 36382.0, 19151.0, 10332.0, 5655.0, 3147.0, 1873.0, 1176.0, 693.0, 487.0, 287.0, 218.0, 120.0, 81.0, 51.0, 54.0, 19.0, 21.0, 17.0, 6.0, 9.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1175537109375, -0.11376476287841797, -0.10997581481933594, -0.1061868667602539, -0.10239791870117188, -0.09860897064208984, -0.09482002258300781, -0.09103107452392578, -0.08724212646484375, -0.08345317840576172, -0.07966423034667969, -0.07587528228759766, -0.07208633422851562, -0.0682973861694336, -0.06450843811035156, -0.06071949005126953, -0.0569305419921875, -0.05314159393310547, -0.04935264587402344, -0.045563697814941406, -0.041774749755859375, -0.037985801696777344, -0.03419685363769531, -0.03040790557861328, -0.02661895751953125, -0.02283000946044922, -0.019041061401367188, -0.015252113342285156, -0.011463165283203125, -0.007674217224121094, -0.0038852691650390625, -9.632110595703125e-05, 0.003692626953125, 0.007481575012207031, 0.011270523071289062, 0.015059471130371094, 0.018848419189453125, 0.022637367248535156, 0.026426315307617188, 0.03021526336669922, 0.03400421142578125, 0.03779315948486328, 0.04158210754394531, 0.045371055603027344, 0.049160003662109375, 0.052948951721191406, 0.05673789978027344, 0.06052684783935547, 0.0643157958984375, 0.06810474395751953, 0.07189369201660156, 0.0756826400756836, 0.07947158813476562, 0.08326053619384766, 0.08704948425292969, 0.09083843231201172, 0.09462738037109375, 0.09841632843017578, 0.10220527648925781, 0.10599422454833984, 0.10978317260742188, 0.1135721206665039, 0.11736106872558594, 0.12115001678466797, 0.12493896484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 5.0, 14.0, 5.0, 17.0, 14.0, 20.0, 22.0, 22.0, 31.0, 35.0, 42.0, 47.0, 61.0, 67.0, 77.0, 97.0, 75.0, 73.0, 68.0, 44.0, 29.0, 20.0, 23.0, 22.0, 18.0, 8.0, 7.0, 5.0, 8.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050018310546875, -0.04846668243408203, -0.04691505432128906, -0.045363426208496094, -0.043811798095703125, -0.042260169982910156, -0.04070854187011719, -0.03915691375732422, -0.03760528564453125, -0.03605365753173828, -0.03450202941894531, -0.032950401306152344, -0.031398773193359375, -0.029847145080566406, -0.028295516967773438, -0.02674388885498047, -0.0251922607421875, -0.02364063262939453, -0.022089004516601562, -0.020537376403808594, -0.018985748291015625, -0.017434120178222656, -0.015882492065429688, -0.014330863952636719, -0.01277923583984375, -0.011227607727050781, -0.009675979614257812, -0.008124351501464844, -0.006572723388671875, -0.005021095275878906, -0.0034694671630859375, -0.0019178390502929688, -0.0003662109375, 0.0011854171752929688, 0.0027370452880859375, 0.004288673400878906, 0.005840301513671875, 0.007391929626464844, 0.008943557739257812, 0.010495185852050781, 0.01204681396484375, 0.013598442077636719, 0.015150070190429688, 0.016701698303222656, 0.018253326416015625, 0.019804954528808594, 0.021356582641601562, 0.02290821075439453, 0.0244598388671875, 0.02601146697998047, 0.027563095092773438, 0.029114723205566406, 0.030666351318359375, 0.032217979431152344, 0.03376960754394531, 0.03532123565673828, 0.03687286376953125, 0.03842449188232422, 0.03997611999511719, 0.041527748107910156, 0.043079376220703125, 0.044631004333496094, 0.04618263244628906, 0.04773426055908203, 0.049285888671875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 5.0, 8.0, 12.0, 13.0, 17.0, 29.0, 44.0, 44.0, 55.0, 50.0, 69.0, 78.0, 73.0, 72.0, 73.0, 62.0, 55.0, 43.0, 39.0, 36.0, 22.0, 25.0, 9.0, 13.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.401505470275879, -4.237415313720703, -4.073324680328369, -3.9092342853546143, -3.7451438903808594, -3.5810537338256836, -3.4169633388519287, -3.252872943878174, -3.088782548904419, -2.924692153930664, -2.760601758956909, -2.5965113639831543, -2.4324212074279785, -2.2683305740356445, -2.1042404174804688, -1.9401500225067139, -1.776059627532959, -1.611969232559204, -1.4478788375854492, -1.2837885618209839, -1.119698166847229, -0.9556077718734741, -0.791517436504364, -0.6274271011352539, -0.463336706161499, -0.29924634099006653, -0.13515597581863403, 0.028934389352798462, 0.19302475452423096, 0.35711514949798584, 0.521205484867096, 0.685295820236206, 0.8493862152099609, 1.0134766101837158, 1.1775670051574707, 1.341657280921936, 1.505747675895691, 1.6698380708694458, 1.8339283466339111, 1.998018741607666, 2.162109136581421, 2.326199531555176, 2.4902899265289307, 2.6543803215026855, 2.8184704780578613, 2.9825611114501953, 3.146651268005371, 3.310741662979126, 3.474832057952881, 3.6389224529266357, 3.8030128479003906, 3.9671032428741455, 4.1311936378479, 4.295283794403076, 4.45937442779541, 4.623464584350586, 4.787554740905762, 4.9516448974609375, 5.1157355308532715, 5.279825687408447, 5.443916320800781, 5.608006477355957, 5.772097110748291, 5.936187267303467, 6.100277900695801]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 5.0, 7.0, 13.0, 7.0, 16.0, 19.0, 11.0, 23.0, 32.0, 25.0, 25.0, 26.0, 32.0, 33.0, 40.0, 57.0, 59.0, 57.0, 41.0, 52.0, 46.0, 38.0, 54.0, 24.0, 30.0, 31.0, 36.0, 26.0, 27.0, 24.0, 18.0, 11.0, 15.0, 12.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4923160076141357, -3.380154609680176, -3.2679929733276367, -3.1558315753936768, -3.0436699390411377, -2.9315085411071777, -2.8193469047546387, -2.7071855068206787, -2.5950241088867188, -2.482862710952759, -2.3707010746002197, -2.2585396766662598, -2.1463780403137207, -2.0342166423797607, -1.9220551252365112, -1.8098936080932617, -1.6977319717407227, -1.5855704545974731, -1.4734089374542236, -1.3612475395202637, -1.2490859031677246, -1.1369245052337646, -1.0247629880905151, -0.9126014709472656, -0.8004399538040161, -0.6882784366607666, -0.5761169195175171, -0.46395546197891235, -0.35179394483566284, -0.23963242769241333, -0.1274709701538086, -0.015309453010559082, 0.09685230255126953, 0.20901380479335785, 0.32117530703544617, 0.4333367943763733, 0.5454983115196228, 0.6576598286628723, 0.769821286201477, 0.8819828033447266, 0.9941443204879761, 1.1063058376312256, 1.218467354774475, 1.3306288719177246, 1.4427902698516846, 1.5549519062042236, 1.6671133041381836, 1.779274821281433, 1.8914363384246826, 2.0035977363586426, 2.1157593727111816, 2.2279207706451416, 2.3400824069976807, 2.4522438049316406, 2.5644054412841797, 2.6765668392181396, 2.7887282371520996, 2.9008896350860596, 3.0130512714385986, 3.1252126693725586, 3.2373743057250977, 3.3495357036590576, 3.4616971015930176, 3.5738587379455566, 3.6860203742980957]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 14.0, 16.0, 17.0, 28.0, 45.0, 89.0, 120.0, 159.0, 242.0, 347.0, 547.0, 885.0, 1260.0, 2108.0, 3247.0, 5512.0, 8909.0, 15112.0, 24881.0, 41613.0, 67119.0, 103554.0, 141480.0, 162716.0, 150723.0, 116190.0, 78014.0, 48608.0, 29213.0, 17672.0, 10769.0, 6561.0, 3945.0, 2371.0, 1540.0, 1009.0, 650.0, 431.0, 292.0, 175.0, 113.0, 64.0, 52.0, 38.0, 33.0, 22.0, 21.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.798828125, -2.707550048828125, -2.61627197265625, -2.524993896484375, -2.4337158203125, -2.342437744140625, -2.25115966796875, -2.159881591796875, -2.068603515625, -1.977325439453125, -1.88604736328125, -1.794769287109375, -1.7034912109375, -1.612213134765625, -1.52093505859375, -1.429656982421875, -1.33837890625, -1.247100830078125, -1.15582275390625, -1.064544677734375, -0.9732666015625, -0.881988525390625, -0.79071044921875, -0.699432373046875, -0.608154296875, -0.516876220703125, -0.42559814453125, -0.334320068359375, -0.2430419921875, -0.151763916015625, -0.06048583984375, 0.030792236328125, 0.1220703125, 0.213348388671875, 0.30462646484375, 0.395904541015625, 0.4871826171875, 0.578460693359375, 0.66973876953125, 0.761016845703125, 0.852294921875, 0.943572998046875, 1.03485107421875, 1.126129150390625, 1.2174072265625, 1.308685302734375, 1.39996337890625, 1.491241455078125, 1.58251953125, 1.673797607421875, 1.76507568359375, 1.856353759765625, 1.9476318359375, 2.038909912109375, 2.13018798828125, 2.221466064453125, 2.312744140625, 2.404022216796875, 2.49530029296875, 2.586578369140625, 2.6778564453125, 2.769134521484375, 2.86041259765625, 2.951690673828125, 3.04296875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 6.0, 9.0, 13.0, 17.0, 18.0, 22.0, 27.0, 15.0, 42.0, 35.0, 40.0, 36.0, 38.0, 50.0, 62.0, 42.0, 47.0, 60.0, 50.0, 43.0, 43.0, 37.0, 30.0, 23.0, 33.0, 30.0, 24.0, 18.0, 14.0, 19.0, 18.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.955078125, -3.828460693359375, -3.70184326171875, -3.575225830078125, -3.4486083984375, -3.321990966796875, -3.19537353515625, -3.068756103515625, -2.942138671875, -2.815521240234375, -2.68890380859375, -2.562286376953125, -2.4356689453125, -2.309051513671875, -2.18243408203125, -2.055816650390625, -1.92919921875, -1.802581787109375, -1.67596435546875, -1.549346923828125, -1.4227294921875, -1.296112060546875, -1.16949462890625, -1.042877197265625, -0.916259765625, -0.789642333984375, -0.66302490234375, -0.536407470703125, -0.4097900390625, -0.283172607421875, -0.15655517578125, -0.029937744140625, 0.0966796875, 0.223297119140625, 0.34991455078125, 0.476531982421875, 0.6031494140625, 0.729766845703125, 0.85638427734375, 0.983001708984375, 1.109619140625, 1.236236572265625, 1.36285400390625, 1.489471435546875, 1.6160888671875, 1.742706298828125, 1.86932373046875, 1.995941162109375, 2.12255859375, 2.249176025390625, 2.37579345703125, 2.502410888671875, 2.6290283203125, 2.755645751953125, 2.88226318359375, 3.008880615234375, 3.135498046875, 3.262115478515625, 3.38873291015625, 3.515350341796875, 3.6419677734375, 3.768585205078125, 3.89520263671875, 4.021820068359375, 4.1484375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 21.0, 28.0, 42.0, 51.0, 69.0, 98.0, 179.0, 267.0, 398.0, 592.0, 916.0, 1443.0, 2235.0, 3758.0, 5789.0, 9495.0, 15357.0, 25125.0, 41112.0, 65601.0, 99222.0, 135652.0, 157189.0, 149176.0, 117721.0, 81083.0, 52115.0, 32258.0, 19627.0, 11909.0, 7209.0, 4708.0, 2897.0, 1863.0, 1153.0, 732.0, 492.0, 344.0, 211.0, 123.0, 99.0, 64.0, 42.0, 30.0, 12.0, 13.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.814453125, -2.725799560546875, -2.63714599609375, -2.548492431640625, -2.4598388671875, -2.371185302734375, -2.28253173828125, -2.193878173828125, -2.105224609375, -2.016571044921875, -1.92791748046875, -1.839263916015625, -1.7506103515625, -1.661956787109375, -1.57330322265625, -1.484649658203125, -1.39599609375, -1.307342529296875, -1.21868896484375, -1.130035400390625, -1.0413818359375, -0.952728271484375, -0.86407470703125, -0.775421142578125, -0.686767578125, -0.598114013671875, -0.50946044921875, -0.420806884765625, -0.3321533203125, -0.243499755859375, -0.15484619140625, -0.066192626953125, 0.0224609375, 0.111114501953125, 0.19976806640625, 0.288421630859375, 0.3770751953125, 0.465728759765625, 0.55438232421875, 0.643035888671875, 0.731689453125, 0.820343017578125, 0.90899658203125, 0.997650146484375, 1.0863037109375, 1.174957275390625, 1.26361083984375, 1.352264404296875, 1.44091796875, 1.529571533203125, 1.61822509765625, 1.706878662109375, 1.7955322265625, 1.884185791015625, 1.97283935546875, 2.061492919921875, 2.150146484375, 2.238800048828125, 2.32745361328125, 2.416107177734375, 2.5047607421875, 2.593414306640625, 2.68206787109375, 2.770721435546875, 2.859375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 2.0, 8.0, 8.0, 7.0, 12.0, 16.0, 24.0, 19.0, 19.0, 20.0, 22.0, 26.0, 32.0, 23.0, 38.0, 38.0, 33.0, 41.0, 31.0, 45.0, 33.0, 44.0, 37.0, 29.0, 41.0, 34.0, 50.0, 31.0, 34.0, 20.0, 27.0, 15.0, 24.0, 19.0, 15.0, 17.0, 12.0, 3.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.830078125, -1.770050048828125, -1.71002197265625, -1.649993896484375, -1.5899658203125, -1.529937744140625, -1.46990966796875, -1.409881591796875, -1.349853515625, -1.289825439453125, -1.22979736328125, -1.169769287109375, -1.1097412109375, -1.049713134765625, -0.98968505859375, -0.929656982421875, -0.86962890625, -0.809600830078125, -0.74957275390625, -0.689544677734375, -0.6295166015625, -0.569488525390625, -0.50946044921875, -0.449432373046875, -0.389404296875, -0.329376220703125, -0.26934814453125, -0.209320068359375, -0.1492919921875, -0.089263916015625, -0.02923583984375, 0.030792236328125, 0.0908203125, 0.150848388671875, 0.21087646484375, 0.270904541015625, 0.3309326171875, 0.390960693359375, 0.45098876953125, 0.511016845703125, 0.571044921875, 0.631072998046875, 0.69110107421875, 0.751129150390625, 0.8111572265625, 0.871185302734375, 0.93121337890625, 0.991241455078125, 1.05126953125, 1.111297607421875, 1.17132568359375, 1.231353759765625, 1.2913818359375, 1.351409912109375, 1.41143798828125, 1.471466064453125, 1.531494140625, 1.591522216796875, 1.65155029296875, 1.711578369140625, 1.7716064453125, 1.831634521484375, 1.89166259765625, 1.951690673828125, 2.01171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 7.0, 3.0, 12.0, 11.0, 21.0, 28.0, 48.0, 66.0, 93.0, 168.0, 227.0, 350.0, 514.0, 843.0, 1307.0, 2023.0, 3198.0, 5226.0, 8751.0, 14563.0, 24495.0, 41743.0, 70061.0, 109414.0, 152868.0, 175323.0, 153386.0, 109991.0, 69810.0, 41901.0, 24688.0, 14550.0, 8752.0, 5347.0, 3128.0, 2023.0, 1270.0, 821.0, 513.0, 343.0, 209.0, 162.0, 99.0, 68.0, 41.0, 30.0, 16.0, 14.0, 11.0, 11.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.4501953125, -1.4041595458984375, -1.358123779296875, -1.3120880126953125, -1.26605224609375, -1.2200164794921875, -1.173980712890625, -1.1279449462890625, -1.0819091796875, -1.0358734130859375, -0.989837646484375, -0.9438018798828125, -0.89776611328125, -0.8517303466796875, -0.805694580078125, -0.7596588134765625, -0.713623046875, -0.6675872802734375, -0.621551513671875, -0.5755157470703125, -0.52947998046875, -0.4834442138671875, -0.437408447265625, -0.3913726806640625, -0.3453369140625, -0.2993011474609375, -0.253265380859375, -0.2072296142578125, -0.16119384765625, -0.1151580810546875, -0.069122314453125, -0.0230865478515625, 0.02294921875, 0.0689849853515625, 0.115020751953125, 0.1610565185546875, 0.20709228515625, 0.2531280517578125, 0.299163818359375, 0.3451995849609375, 0.3912353515625, 0.4372711181640625, 0.483306884765625, 0.5293426513671875, 0.57537841796875, 0.6214141845703125, 0.667449951171875, 0.7134857177734375, 0.759521484375, 0.8055572509765625, 0.851593017578125, 0.8976287841796875, 0.94366455078125, 0.9897003173828125, 1.035736083984375, 1.0817718505859375, 1.1278076171875, 1.1738433837890625, 1.219879150390625, 1.2659149169921875, 1.31195068359375, 1.3579864501953125, 1.404022216796875, 1.4500579833984375, 1.49609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 8.0, 16.0, 16.0, 19.0, 27.0, 24.0, 39.0, 39.0, 26.0, 37.0, 53.0, 61.0, 64.0, 48.0, 51.0, 53.0, 65.0, 54.0, 43.0, 34.0, 30.0, 33.0, 33.0, 21.0, 14.0, 5.0, 11.0, 7.0, 9.0, 5.0, 7.0, 8.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00013637542724609375, -0.00013181939721107483, -0.0001272633671760559, -0.000122707337141037, -0.00011815130710601807, -0.00011359527707099915, -0.00010903924703598022, -0.0001044832170009613, -9.992718696594238e-05, -9.537115693092346e-05, -9.081512689590454e-05, -8.625909686088562e-05, -8.17030668258667e-05, -7.714703679084778e-05, -7.259100675582886e-05, -6.803497672080994e-05, -6.347894668579102e-05, -5.8922916650772095e-05, -5.4366886615753174e-05, -4.981085658073425e-05, -4.525482654571533e-05, -4.069879651069641e-05, -3.614276647567749e-05, -3.158673644065857e-05, -2.703070640563965e-05, -2.2474676370620728e-05, -1.7918646335601807e-05, -1.3362616300582886e-05, -8.806586265563965e-06, -4.250556230545044e-06, 3.0547380447387695e-07, 4.861503839492798e-06, 9.417533874511719e-06, 1.397356390953064e-05, 1.852959394454956e-05, 2.308562397956848e-05, 2.7641654014587402e-05, 3.219768404960632e-05, 3.6753714084625244e-05, 4.1309744119644165e-05, 4.5865774154663086e-05, 5.042180418968201e-05, 5.497783422470093e-05, 5.953386425971985e-05, 6.408989429473877e-05, 6.864592432975769e-05, 7.320195436477661e-05, 7.775798439979553e-05, 8.231401443481445e-05, 8.687004446983337e-05, 9.14260745048523e-05, 9.598210453987122e-05, 0.00010053813457489014, 0.00010509416460990906, 0.00010965019464492798, 0.0001142062246799469, 0.00011876225471496582, 0.00012331828474998474, 0.00012787431478500366, 0.00013243034482002258, 0.0001369863748550415, 0.00014154240489006042, 0.00014609843492507935, 0.00015065446496009827, 0.0001552104949951172]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 5.0, 15.0, 27.0, 29.0, 60.0, 65.0, 98.0, 146.0, 209.0, 360.0, 534.0, 783.0, 1165.0, 1795.0, 2752.0, 4341.0, 6845.0, 11015.0, 17530.0, 27979.0, 44890.0, 69772.0, 102714.0, 137309.0, 155398.0, 143376.0, 110913.0, 75660.0, 49285.0, 30954.0, 19677.0, 11852.0, 7549.0, 4713.0, 3009.0, 1972.0, 1300.0, 805.0, 560.0, 366.0, 240.0, 169.0, 110.0, 68.0, 49.0, 41.0, 22.0, 5.0, 7.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.29296875, -1.2533111572265625, -1.213653564453125, -1.1739959716796875, -1.13433837890625, -1.0946807861328125, -1.055023193359375, -1.0153656005859375, -0.9757080078125, -0.9360504150390625, -0.896392822265625, -0.8567352294921875, -0.81707763671875, -0.7774200439453125, -0.737762451171875, -0.6981048583984375, -0.658447265625, -0.6187896728515625, -0.579132080078125, -0.5394744873046875, -0.49981689453125, -0.4601593017578125, -0.420501708984375, -0.3808441162109375, -0.3411865234375, -0.3015289306640625, -0.261871337890625, -0.2222137451171875, -0.18255615234375, -0.1428985595703125, -0.103240966796875, -0.0635833740234375, -0.02392578125, 0.0157318115234375, 0.055389404296875, 0.0950469970703125, 0.13470458984375, 0.1743621826171875, 0.214019775390625, 0.2536773681640625, 0.2933349609375, 0.3329925537109375, 0.372650146484375, 0.4123077392578125, 0.45196533203125, 0.4916229248046875, 0.531280517578125, 0.5709381103515625, 0.610595703125, 0.6502532958984375, 0.689910888671875, 0.7295684814453125, 0.76922607421875, 0.8088836669921875, 0.848541259765625, 0.8881988525390625, 0.9278564453125, 0.9675140380859375, 1.007171630859375, 1.0468292236328125, 1.08648681640625, 1.1261444091796875, 1.165802001953125, 1.2054595947265625, 1.2451171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 11.0, 6.0, 15.0, 10.0, 23.0, 14.0, 25.0, 16.0, 22.0, 24.0, 31.0, 24.0, 30.0, 39.0, 48.0, 36.0, 44.0, 48.0, 45.0, 52.0, 43.0, 42.0, 28.0, 39.0, 35.0, 43.0, 27.0, 27.0, 27.0, 14.0, 15.0, 18.0, 9.0, 13.0, 9.0, 5.0, 5.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.36574554443359375, -0.3535614013671875, -0.34137725830078125, -0.329193115234375, -0.31700897216796875, -0.3048248291015625, -0.29264068603515625, -0.28045654296875, -0.26827239990234375, -0.2560882568359375, -0.24390411376953125, -0.231719970703125, -0.21953582763671875, -0.2073516845703125, -0.19516754150390625, -0.1829833984375, -0.17079925537109375, -0.1586151123046875, -0.14643096923828125, -0.134246826171875, -0.12206268310546875, -0.1098785400390625, -0.09769439697265625, -0.08551025390625, -0.07332611083984375, -0.0611419677734375, -0.04895782470703125, -0.036773681640625, -0.02458953857421875, -0.0124053955078125, -0.00022125244140625, 0.011962890625, 0.02414703369140625, 0.0363311767578125, 0.04851531982421875, 0.060699462890625, 0.07288360595703125, 0.0850677490234375, 0.09725189208984375, 0.10943603515625, 0.12162017822265625, 0.1338043212890625, 0.14598846435546875, 0.158172607421875, 0.17035675048828125, 0.1825408935546875, 0.19472503662109375, 0.2069091796875, 0.21909332275390625, 0.2312774658203125, 0.24346160888671875, 0.255645751953125, 0.26782989501953125, 0.2800140380859375, 0.29219818115234375, 0.30438232421875, 0.31656646728515625, 0.3287506103515625, 0.34093475341796875, 0.353118896484375, 0.36530303955078125, 0.3774871826171875, 0.38967132568359375, 0.40185546875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 13.0, 9.0, 23.0, 27.0, 27.0, 38.0, 50.0, 58.0, 64.0, 84.0, 63.0, 77.0, 76.0, 57.0, 57.0, 51.0, 51.0, 39.0, 28.0, 18.0, 16.0, 16.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.052423477172852, -3.884748935699463, -3.717074394226074, -3.5493998527526855, -3.381725311279297, -3.214050769805908, -3.0463764667510986, -2.87870192527771, -2.7110273838043213, -2.5433528423309326, -2.375678300857544, -2.2080039978027344, -2.0403294563293457, -1.8726547956466675, -1.7049803733825684, -1.5373058319091797, -1.369631290435791, -1.2019567489624023, -1.0342822074890137, -0.8666077852249146, -0.6989332437515259, -0.5312587022781372, -0.3635842800140381, -0.19590973854064941, -0.028235197067260742, 0.13943931460380554, 0.3071138262748718, 0.4747883081436157, 0.6424628496170044, 0.8101373910903931, 0.9778118133544922, 1.1454863548278809, 1.3131604194641113, 1.4808349609375, 1.6485095024108887, 1.8161839246749878, 1.9838584661483765, 2.1515331268310547, 2.3192074298858643, 2.486881971359253, 2.6545565128326416, 2.8222310543060303, 2.989905595779419, 3.1575798988342285, 3.325254440307617, 3.492928981781006, 3.6606035232543945, 3.828278064727783, 3.995952606201172, 4.1636271476745605, 4.331301689147949, 4.498976230621338, 4.666650772094727, 4.834325313568115, 5.001999855041504, 5.169673919677734, 5.337348937988281, 5.50502347946167, 5.672698020935059, 5.840372562408447, 6.008047103881836, 6.175721645355225, 6.343396186828613, 6.511070251464844, 6.678744792938232]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 6.0, 9.0, 15.0, 11.0, 17.0, 17.0, 21.0, 26.0, 36.0, 20.0, 28.0, 42.0, 39.0, 48.0, 41.0, 47.0, 41.0, 53.0, 42.0, 39.0, 46.0, 38.0, 30.0, 49.0, 33.0, 33.0, 33.0, 26.0, 20.0, 17.0, 14.0, 13.0, 11.0, 4.0, 9.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.283984661102295, -3.1750056743621826, -3.066026449203491, -2.957047462463379, -2.8480682373046875, -2.739089250564575, -2.630110263824463, -2.5211310386657715, -2.412152051925659, -2.303173065185547, -2.1941938400268555, -2.085214853286743, -1.9762357473373413, -1.8672566413879395, -1.7582776546478271, -1.6492985486984253, -1.5403194427490234, -1.4313403367996216, -1.3223612308502197, -1.2133822441101074, -1.1044031381607056, -0.9954240322113037, -0.8864449858665466, -0.7774659395217896, -0.6684868335723877, -0.5595077276229858, -0.45052868127822876, -0.3415496051311493, -0.23257052898406982, -0.12359142303466797, -0.014612376689910889, 0.09436666965484619, 0.20334577560424805, 0.3123248517513275, 0.421303927898407, 0.5302829742431641, 0.6392620801925659, 0.7482411861419678, 0.8572202324867249, 0.9661992788314819, 1.0751783847808838, 1.1841574907302856, 1.2931365966796875, 1.4021155834197998, 1.5110946893692017, 1.6200737953186035, 1.7290527820587158, 1.8380318880081177, 1.9470109939575195, 2.055989980697632, 2.1649692058563232, 2.2739481925964355, 2.382927417755127, 2.4919064044952393, 2.6008853912353516, 2.709864616394043, 2.8188436031341553, 2.9278225898742676, 3.036801815032959, 3.1457808017730713, 3.2547597885131836, 3.363739013671875, 3.4727180004119873, 3.5816969871520996, 3.690676212310791]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 23.0, 35.0, 55.0, 66.0, 117.0, 156.0, 282.0, 431.0, 659.0, 1008.0, 1658.0, 2756.0, 4457.0, 7922.0, 14438.0, 26289.0, 52670.0, 109433.0, 247390.0, 581787.0, 1089495.0, 1058603.0, 547382.0, 232953.0, 104091.0, 50201.0, 25895.0, 14270.0, 7955.0, 4599.0, 2742.0, 1632.0, 1032.0, 697.0, 372.0, 263.0, 153.0, 98.0, 70.0, 44.0, 30.0, 19.0, 13.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -3.99932861328125, -3.8658447265625, -3.73236083984375, -3.598876953125, -3.46539306640625, -3.3319091796875, -3.19842529296875, -3.06494140625, -2.93145751953125, -2.7979736328125, -2.66448974609375, -2.531005859375, -2.39752197265625, -2.2640380859375, -2.13055419921875, -1.9970703125, -1.86358642578125, -1.7301025390625, -1.59661865234375, -1.463134765625, -1.32965087890625, -1.1961669921875, -1.06268310546875, -0.92919921875, -0.79571533203125, -0.6622314453125, -0.52874755859375, -0.395263671875, -0.26177978515625, -0.1282958984375, 0.00518798828125, 0.138671875, 0.27215576171875, 0.4056396484375, 0.53912353515625, 0.672607421875, 0.80609130859375, 0.9395751953125, 1.07305908203125, 1.20654296875, 1.34002685546875, 1.4735107421875, 1.60699462890625, 1.740478515625, 1.87396240234375, 2.0074462890625, 2.14093017578125, 2.2744140625, 2.40789794921875, 2.5413818359375, 2.67486572265625, 2.808349609375, 2.94183349609375, 3.0753173828125, 3.20880126953125, 3.34228515625, 3.47576904296875, 3.6092529296875, 3.74273681640625, 3.876220703125, 4.00970458984375, 4.1431884765625, 4.27667236328125, 4.41015625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 2.0, 7.0, 8.0, 8.0, 10.0, 9.0, 19.0, 34.0, 28.0, 32.0, 29.0, 34.0, 45.0, 44.0, 50.0, 50.0, 51.0, 44.0, 47.0, 49.0, 44.0, 41.0, 37.0, 50.0, 41.0, 30.0, 26.0, 21.0, 23.0, 17.0, 16.0, 15.0, 5.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.822265625, -2.735595703125, -2.64892578125, -2.562255859375, -2.4755859375, -2.388916015625, -2.30224609375, -2.215576171875, -2.12890625, -2.042236328125, -1.95556640625, -1.868896484375, -1.7822265625, -1.695556640625, -1.60888671875, -1.522216796875, -1.435546875, -1.348876953125, -1.26220703125, -1.175537109375, -1.0888671875, -1.002197265625, -0.91552734375, -0.828857421875, -0.7421875, -0.655517578125, -0.56884765625, -0.482177734375, -0.3955078125, -0.308837890625, -0.22216796875, -0.135498046875, -0.048828125, 0.037841796875, 0.12451171875, 0.211181640625, 0.2978515625, 0.384521484375, 0.47119140625, 0.557861328125, 0.64453125, 0.731201171875, 0.81787109375, 0.904541015625, 0.9912109375, 1.077880859375, 1.16455078125, 1.251220703125, 1.337890625, 1.424560546875, 1.51123046875, 1.597900390625, 1.6845703125, 1.771240234375, 1.85791015625, 1.944580078125, 2.03125, 2.117919921875, 2.20458984375, 2.291259765625, 2.3779296875, 2.464599609375, 2.55126953125, 2.637939453125, 2.724609375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 9.0, 12.0, 24.0, 29.0, 54.0, 70.0, 105.0, 170.0, 271.0, 472.0, 754.0, 1330.0, 2234.0, 3892.0, 7243.0, 13458.0, 25037.0, 49942.0, 102516.0, 215123.0, 461634.0, 908566.0, 1104904.0, 675027.0, 322403.0, 150352.0, 72403.0, 35694.0, 18600.0, 9641.0, 5211.0, 2932.0, 1683.0, 966.0, 601.0, 342.0, 212.0, 141.0, 87.0, 56.0, 32.0, 18.0, 14.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.39385986328125, -4.2486572265625, -4.10345458984375, -3.958251953125, -3.81304931640625, -3.6678466796875, -3.52264404296875, -3.37744140625, -3.23223876953125, -3.0870361328125, -2.94183349609375, -2.796630859375, -2.65142822265625, -2.5062255859375, -2.36102294921875, -2.2158203125, -2.07061767578125, -1.9254150390625, -1.78021240234375, -1.635009765625, -1.48980712890625, -1.3446044921875, -1.19940185546875, -1.05419921875, -0.90899658203125, -0.7637939453125, -0.61859130859375, -0.473388671875, -0.32818603515625, -0.1829833984375, -0.03778076171875, 0.107421875, 0.25262451171875, 0.3978271484375, 0.54302978515625, 0.688232421875, 0.83343505859375, 0.9786376953125, 1.12384033203125, 1.26904296875, 1.41424560546875, 1.5594482421875, 1.70465087890625, 1.849853515625, 1.99505615234375, 2.1402587890625, 2.28546142578125, 2.4306640625, 2.57586669921875, 2.7210693359375, 2.86627197265625, 3.011474609375, 3.15667724609375, 3.3018798828125, 3.44708251953125, 3.59228515625, 3.73748779296875, 3.8826904296875, 4.02789306640625, 4.173095703125, 4.31829833984375, 4.4635009765625, 4.60870361328125, 4.75390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 6.0, 7.0, 6.0, 13.0, 20.0, 23.0, 20.0, 32.0, 46.0, 67.0, 82.0, 111.0, 146.0, 171.0, 187.0, 197.0, 231.0, 277.0, 306.0, 289.0, 277.0, 272.0, 244.0, 231.0, 183.0, 129.0, 109.0, 103.0, 61.0, 53.0, 45.0, 38.0, 14.0, 14.0, 13.0, 14.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.341796875, -1.2975921630859375, -1.253387451171875, -1.2091827392578125, -1.16497802734375, -1.1207733154296875, -1.076568603515625, -1.0323638916015625, -0.9881591796875, -0.9439544677734375, -0.899749755859375, -0.8555450439453125, -0.81134033203125, -0.7671356201171875, -0.722930908203125, -0.6787261962890625, -0.634521484375, -0.5903167724609375, -0.546112060546875, -0.5019073486328125, -0.45770263671875, -0.4134979248046875, -0.369293212890625, -0.3250885009765625, -0.2808837890625, -0.2366790771484375, -0.192474365234375, -0.1482696533203125, -0.10406494140625, -0.0598602294921875, -0.015655517578125, 0.0285491943359375, 0.07275390625, 0.1169586181640625, 0.161163330078125, 0.2053680419921875, 0.24957275390625, 0.2937774658203125, 0.337982177734375, 0.3821868896484375, 0.4263916015625, 0.4705963134765625, 0.514801025390625, 0.5590057373046875, 0.60321044921875, 0.6474151611328125, 0.691619873046875, 0.7358245849609375, 0.780029296875, 0.8242340087890625, 0.868438720703125, 0.9126434326171875, 0.95684814453125, 1.0010528564453125, 1.045257568359375, 1.0894622802734375, 1.1336669921875, 1.1778717041015625, 1.222076416015625, 1.2662811279296875, 1.31048583984375, 1.3546905517578125, 1.398895263671875, 1.4430999755859375, 1.4873046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 13.0, 20.0, 18.0, 22.0, 26.0, 35.0, 32.0, 40.0, 56.0, 70.0, 79.0, 80.0, 87.0, 60.0, 69.0, 52.0, 43.0, 37.0, 37.0, 17.0, 18.0, 18.0, 10.0, 6.0, 2.0, 7.0, 4.0, 7.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.834712982177734, -4.677600860595703, -4.520488739013672, -4.363376617431641, -4.206264495849609, -4.049152374267578, -3.8920400142669678, -3.7349278926849365, -3.5778157711029053, -3.420703649520874, -3.2635915279388428, -3.1064794063568115, -2.949367046356201, -2.79225492477417, -2.6351428031921387, -2.4780306816101074, -2.320918560028076, -2.163806438446045, -2.0066943168640137, -1.8495820760726929, -1.6924699544906616, -1.5353578329086304, -1.3782455921173096, -1.2211334705352783, -1.064021348953247, -0.9069092273712158, -0.7497970461845398, -0.5926848649978638, -0.4355727434158325, -0.27846062183380127, -0.12134844064712524, 0.03576374053955078, 0.19287586212158203, 0.34998801350593567, 0.5071001648902893, 0.6642123460769653, 0.8213244676589966, 0.9784365892410278, 1.1355488300323486, 1.2926609516143799, 1.4497730731964111, 1.6068851947784424, 1.7639973163604736, 1.9211095571517944, 2.0782217979431152, 2.2353339195251465, 2.3924460411071777, 2.549558162689209, 2.7066702842712402, 2.8637824058532715, 3.0208945274353027, 3.178006649017334, 3.3351187705993652, 3.4922308921813965, 3.649343252182007, 3.806455373764038, 3.9635674953460693, 4.12067985534668, 4.277791976928711, 4.434904098510742, 4.592016220092773, 4.749128341674805, 4.906240463256836, 5.063352584838867, 5.220464706420898]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 10.0, 20.0, 19.0, 20.0, 20.0, 21.0, 32.0, 21.0, 44.0, 35.0, 55.0, 52.0, 51.0, 63.0, 56.0, 48.0, 53.0, 51.0, 48.0, 33.0, 29.0, 23.0, 28.0, 28.0, 22.0, 16.0, 20.0, 10.0, 14.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4806437492370605, -3.3726115226745605, -3.2645792961120605, -3.1565470695495605, -3.0485148429870605, -2.9404826164245605, -2.8324503898620605, -2.7244184017181396, -2.6163861751556396, -2.5083539485931396, -2.4003217220306396, -2.2922894954681396, -2.1842572689056396, -2.0762252807617188, -1.9681929349899292, -1.8601608276367188, -1.7521284818649292, -1.6440962553024292, -1.5360640287399292, -1.4280319213867188, -1.3199996948242188, -1.2119674682617188, -1.1039352416992188, -0.9959030747413635, -0.8878708481788635, -0.7798386216163635, -0.6718064546585083, -0.5637742280960083, -0.4557420313358307, -0.3477098345756531, -0.23967760801315308, -0.13164544105529785, -0.02361321449279785, 0.08441898971796036, 0.19245119392871857, 0.3004834055900574, 0.408515602350235, 0.5165477991104126, 0.6245800256729126, 0.7326121926307678, 0.8406444191932678, 0.9486766457557678, 1.056708812713623, 1.164741039276123, 1.272773265838623, 1.380805492401123, 1.488837718963623, 1.5968698263168335, 1.7049020528793335, 1.8129342794418335, 1.9209665060043335, 2.028998613357544, 2.137030839920044, 2.245063066482544, 2.353095293045044, 2.461127519607544, 2.569159746170044, 2.677191972732544, 2.785224199295044, 2.893256425857544, 3.001288652420044, 3.109320640563965, 3.217352867126465, 3.325385093688965, 3.433417320251465]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 8.0, 20.0, 20.0, 29.0, 28.0, 35.0, 56.0, 71.0, 95.0, 109.0, 151.0, 236.0, 359.0, 543.0, 828.0, 1390.0, 2383.0, 4530.0, 8607.0, 17937.0, 40174.0, 99170.0, 249758.0, 339483.0, 163917.0, 64011.0, 27062.0, 12709.0, 6456.0, 3210.0, 1875.0, 1087.0, 679.0, 405.0, 298.0, 202.0, 147.0, 115.0, 81.0, 47.0, 44.0, 36.0, 35.0, 31.0, 20.0, 15.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.7783203125, -0.7541961669921875, -0.730072021484375, -0.7059478759765625, -0.68182373046875, -0.6576995849609375, -0.633575439453125, -0.6094512939453125, -0.5853271484375, -0.5612030029296875, -0.537078857421875, -0.5129547119140625, -0.48883056640625, -0.4647064208984375, -0.440582275390625, -0.4164581298828125, -0.392333984375, -0.3682098388671875, -0.344085693359375, -0.3199615478515625, -0.29583740234375, -0.2717132568359375, -0.247589111328125, -0.2234649658203125, -0.1993408203125, -0.1752166748046875, -0.151092529296875, -0.1269683837890625, -0.10284423828125, -0.0787200927734375, -0.054595947265625, -0.0304718017578125, -0.00634765625, 0.0177764892578125, 0.041900634765625, 0.0660247802734375, 0.09014892578125, 0.1142730712890625, 0.138397216796875, 0.1625213623046875, 0.1866455078125, 0.2107696533203125, 0.234893798828125, 0.2590179443359375, 0.28314208984375, 0.3072662353515625, 0.331390380859375, 0.3555145263671875, 0.379638671875, 0.4037628173828125, 0.427886962890625, 0.4520111083984375, 0.47613525390625, 0.5002593994140625, 0.524383544921875, 0.5485076904296875, 0.5726318359375, 0.5967559814453125, 0.620880126953125, 0.6450042724609375, 0.66912841796875, 0.6932525634765625, 0.717376708984375, 0.7415008544921875, 0.765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 8.0, 11.0, 14.0, 17.0, 9.0, 23.0, 12.0, 24.0, 32.0, 26.0, 38.0, 33.0, 48.0, 43.0, 40.0, 52.0, 49.0, 60.0, 48.0, 42.0, 45.0, 40.0, 34.0, 29.0, 32.0, 28.0, 24.0, 23.0, 19.0, 18.0, 16.0, 10.0, 8.0, 9.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.186279296875, -3.07568359375, -2.965087890625, -2.8544921875, -2.743896484375, -2.63330078125, -2.522705078125, -2.412109375, -2.301513671875, -2.19091796875, -2.080322265625, -1.9697265625, -1.859130859375, -1.74853515625, -1.637939453125, -1.52734375, -1.416748046875, -1.30615234375, -1.195556640625, -1.0849609375, -0.974365234375, -0.86376953125, -0.753173828125, -0.642578125, -0.531982421875, -0.42138671875, -0.310791015625, -0.2001953125, -0.089599609375, 0.02099609375, 0.131591796875, 0.2421875, 0.352783203125, 0.46337890625, 0.573974609375, 0.6845703125, 0.795166015625, 0.90576171875, 1.016357421875, 1.126953125, 1.237548828125, 1.34814453125, 1.458740234375, 1.5693359375, 1.679931640625, 1.79052734375, 1.901123046875, 2.01171875, 2.122314453125, 2.23291015625, 2.343505859375, 2.4541015625, 2.564697265625, 2.67529296875, 2.785888671875, 2.896484375, 3.007080078125, 3.11767578125, 3.228271484375, 3.3388671875, 3.449462890625, 3.56005859375, 3.670654296875, 3.78125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 7.0, 7.0, 14.0, 24.0, 32.0, 32.0, 53.0, 60.0, 92.0, 159.0, 238.0, 366.0, 604.0, 1062.0, 2063.0, 4452.0, 10982.0, 36877.0, 874190.0, 88359.0, 16630.0, 6190.0, 2762.0, 1355.0, 703.0, 375.0, 280.0, 162.0, 113.0, 107.0, 52.0, 41.0, 30.0, 18.0, 18.0, 13.0, 7.0, 9.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.9404296875, -1.8845062255859375, -1.828582763671875, -1.7726593017578125, -1.71673583984375, -1.6608123779296875, -1.604888916015625, -1.5489654541015625, -1.4930419921875, -1.4371185302734375, -1.381195068359375, -1.3252716064453125, -1.26934814453125, -1.2134246826171875, -1.157501220703125, -1.1015777587890625, -1.045654296875, -0.9897308349609375, -0.933807373046875, -0.8778839111328125, -0.82196044921875, -0.7660369873046875, -0.710113525390625, -0.6541900634765625, -0.5982666015625, -0.5423431396484375, -0.486419677734375, -0.4304962158203125, -0.37457275390625, -0.3186492919921875, -0.262725830078125, -0.2068023681640625, -0.15087890625, -0.0949554443359375, -0.039031982421875, 0.0168914794921875, 0.07281494140625, 0.1287384033203125, 0.184661865234375, 0.2405853271484375, 0.2965087890625, 0.3524322509765625, 0.408355712890625, 0.4642791748046875, 0.52020263671875, 0.5761260986328125, 0.632049560546875, 0.6879730224609375, 0.743896484375, 0.7998199462890625, 0.855743408203125, 0.9116668701171875, 0.96759033203125, 1.0235137939453125, 1.079437255859375, 1.1353607177734375, 1.1912841796875, 1.2472076416015625, 1.303131103515625, 1.3590545654296875, 1.41497802734375, 1.4709014892578125, 1.526824951171875, 1.5827484130859375, 1.638671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 10.0, 16.0, 10.0, 20.0, 18.0, 21.0, 19.0, 26.0, 32.0, 30.0, 29.0, 35.0, 48.0, 29.0, 39.0, 46.0, 44.0, 40.0, 31.0, 33.0, 40.0, 39.0, 36.0, 39.0, 28.0, 30.0, 25.0, 22.0, 20.0, 23.0, 11.0, 17.0, 9.0, 10.0, 20.0, 7.0, 6.0, 10.0, 10.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.05859375, -1.994293212890625, -1.92999267578125, -1.865692138671875, -1.8013916015625, -1.737091064453125, -1.67279052734375, -1.608489990234375, -1.544189453125, -1.479888916015625, -1.41558837890625, -1.351287841796875, -1.2869873046875, -1.222686767578125, -1.15838623046875, -1.094085693359375, -1.02978515625, -0.965484619140625, -0.90118408203125, -0.836883544921875, -0.7725830078125, -0.708282470703125, -0.64398193359375, -0.579681396484375, -0.515380859375, -0.451080322265625, -0.38677978515625, -0.322479248046875, -0.2581787109375, -0.193878173828125, -0.12957763671875, -0.065277099609375, -0.0009765625, 0.063323974609375, 0.12762451171875, 0.191925048828125, 0.2562255859375, 0.320526123046875, 0.38482666015625, 0.449127197265625, 0.513427734375, 0.577728271484375, 0.64202880859375, 0.706329345703125, 0.7706298828125, 0.834930419921875, 0.89923095703125, 0.963531494140625, 1.02783203125, 1.092132568359375, 1.15643310546875, 1.220733642578125, 1.2850341796875, 1.349334716796875, 1.41363525390625, 1.477935791015625, 1.542236328125, 1.606536865234375, 1.67083740234375, 1.735137939453125, 1.7994384765625, 1.863739013671875, 1.92803955078125, 1.992340087890625, 2.056640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 12.0, 12.0, 16.0, 15.0, 20.0, 26.0, 63.0, 52.0, 95.0, 113.0, 197.0, 231.0, 385.0, 574.0, 927.0, 1670.0, 3575.0, 9192.0, 33364.0, 926675.0, 49883.0, 12026.0, 4463.0, 2028.0, 1045.0, 612.0, 362.0, 259.0, 187.0, 119.0, 92.0, 68.0, 48.0, 31.0, 32.0, 16.0, 17.0, 16.0, 9.0, 5.0, 5.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5185546875, -0.502655029296875, -0.48675537109375, -0.470855712890625, -0.4549560546875, -0.439056396484375, -0.42315673828125, -0.407257080078125, -0.391357421875, -0.375457763671875, -0.35955810546875, -0.343658447265625, -0.3277587890625, -0.311859130859375, -0.29595947265625, -0.280059814453125, -0.26416015625, -0.248260498046875, -0.23236083984375, -0.216461181640625, -0.2005615234375, -0.184661865234375, -0.16876220703125, -0.152862548828125, -0.136962890625, -0.121063232421875, -0.10516357421875, -0.089263916015625, -0.0733642578125, -0.057464599609375, -0.04156494140625, -0.025665283203125, -0.009765625, 0.006134033203125, 0.02203369140625, 0.037933349609375, 0.0538330078125, 0.069732666015625, 0.08563232421875, 0.101531982421875, 0.117431640625, 0.133331298828125, 0.14923095703125, 0.165130615234375, 0.1810302734375, 0.196929931640625, 0.21282958984375, 0.228729248046875, 0.24462890625, 0.260528564453125, 0.27642822265625, 0.292327880859375, 0.3082275390625, 0.324127197265625, 0.34002685546875, 0.355926513671875, 0.371826171875, 0.387725830078125, 0.40362548828125, 0.419525146484375, 0.4354248046875, 0.451324462890625, 0.46722412109375, 0.483123779296875, 0.4990234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 4.0, 4.0, 7.0, 8.0, 13.0, 18.0, 45.0, 51.0, 104.0, 93.0, 119.0, 122.0, 133.0, 89.0, 59.0, 39.0, 34.0, 14.0, 8.0, 4.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.121397018432617e-05, -5.9478916227817535e-05, -5.77438622713089e-05, -5.600880831480026e-05, -5.4273754358291626e-05, -5.253870040178299e-05, -5.080364644527435e-05, -4.9068592488765717e-05, -4.733353853225708e-05, -4.5598484575748444e-05, -4.386343061923981e-05, -4.212837666273117e-05, -4.0393322706222534e-05, -3.86582687497139e-05, -3.692321479320526e-05, -3.5188160836696625e-05, -3.345310688018799e-05, -3.171805292367935e-05, -2.9982998967170715e-05, -2.824794501066208e-05, -2.6512891054153442e-05, -2.4777837097644806e-05, -2.304278314113617e-05, -2.1307729184627533e-05, -1.9572675228118896e-05, -1.783762127161026e-05, -1.6102567315101624e-05, -1.4367513358592987e-05, -1.263245940208435e-05, -1.0897405445575714e-05, -9.162351489067078e-06, -7.427297532558441e-06, -5.692243576049805e-06, -3.957189619541168e-06, -2.2221356630325317e-06, -4.870817065238953e-07, 1.2479722499847412e-06, 2.9830262064933777e-06, 4.718080163002014e-06, 6.453134119510651e-06, 8.188188076019287e-06, 9.923242032527924e-06, 1.165829598903656e-05, 1.3393349945545197e-05, 1.5128403902053833e-05, 1.686345785856247e-05, 1.8598511815071106e-05, 2.0333565771579742e-05, 2.206861972808838e-05, 2.3803673684597015e-05, 2.5538727641105652e-05, 2.727378159761429e-05, 2.9008835554122925e-05, 3.074388951063156e-05, 3.24789434671402e-05, 3.4213997423648834e-05, 3.594905138015747e-05, 3.768410533666611e-05, 3.9419159293174744e-05, 4.115421324968338e-05, 4.2889267206192017e-05, 4.462432116270065e-05, 4.635937511920929e-05, 4.8094429075717926e-05, 4.982948303222656e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 13.0, 10.0, 25.0, 28.0, 34.0, 28.0, 59.0, 71.0, 130.0, 152.0, 226.0, 369.0, 496.0, 759.0, 1211.0, 1935.0, 3012.0, 5158.0, 8925.0, 18448.0, 48265.0, 150867.0, 385524.0, 274337.0, 87507.0, 29962.0, 13149.0, 6915.0, 3954.0, 2472.0, 1538.0, 970.0, 632.0, 447.0, 274.0, 165.0, 127.0, 100.0, 61.0, 50.0, 40.0, 22.0, 24.0, 14.0, 14.0, 9.0, 5.0, 3.0, 6.0, 5.0, 1.0, 4.0, 1.0], "bins": [-0.19580078125, -0.19000244140625, -0.1842041015625, -0.17840576171875, -0.172607421875, -0.16680908203125, -0.1610107421875, -0.15521240234375, -0.1494140625, -0.14361572265625, -0.1378173828125, -0.13201904296875, -0.126220703125, -0.12042236328125, -0.1146240234375, -0.10882568359375, -0.10302734375, -0.09722900390625, -0.0914306640625, -0.08563232421875, -0.079833984375, -0.07403564453125, -0.0682373046875, -0.06243896484375, -0.056640625, -0.05084228515625, -0.0450439453125, -0.03924560546875, -0.033447265625, -0.02764892578125, -0.0218505859375, -0.01605224609375, -0.01025390625, -0.00445556640625, 0.0013427734375, 0.00714111328125, 0.012939453125, 0.01873779296875, 0.0245361328125, 0.03033447265625, 0.0361328125, 0.04193115234375, 0.0477294921875, 0.05352783203125, 0.059326171875, 0.06512451171875, 0.0709228515625, 0.07672119140625, 0.08251953125, 0.08831787109375, 0.0941162109375, 0.09991455078125, 0.105712890625, 0.11151123046875, 0.1173095703125, 0.12310791015625, 0.12890625, 0.13470458984375, 0.1405029296875, 0.14630126953125, 0.152099609375, 0.15789794921875, 0.1636962890625, 0.16949462890625, 0.17529296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 2.0, 6.0, 11.0, 11.0, 12.0, 10.0, 16.0, 27.0, 36.0, 36.0, 45.0, 68.0, 59.0, 64.0, 71.0, 86.0, 78.0, 79.0, 60.0, 39.0, 22.0, 39.0, 23.0, 20.0, 14.0, 12.0, 11.0, 4.0, 2.0, 8.0, 4.0, 7.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.038665771484375, -0.037572383880615234, -0.03647899627685547, -0.0353856086730957, -0.03429222106933594, -0.03319883346557617, -0.032105445861816406, -0.03101205825805664, -0.029918670654296875, -0.02882528305053711, -0.027731895446777344, -0.026638507843017578, -0.025545120239257812, -0.024451732635498047, -0.02335834503173828, -0.022264957427978516, -0.02117156982421875, -0.020078182220458984, -0.01898479461669922, -0.017891407012939453, -0.016798019409179688, -0.015704631805419922, -0.014611244201660156, -0.01351785659790039, -0.012424468994140625, -0.01133108139038086, -0.010237693786621094, -0.009144306182861328, -0.008050918579101562, -0.006957530975341797, -0.005864143371582031, -0.004770755767822266, -0.0036773681640625, -0.0025839805603027344, -0.0014905929565429688, -0.0003972053527832031, 0.0006961822509765625, 0.0017895698547363281, 0.0028829574584960938, 0.003976345062255859, 0.005069732666015625, 0.006163120269775391, 0.007256507873535156, 0.008349895477294922, 0.009443283081054688, 0.010536670684814453, 0.011630058288574219, 0.012723445892333984, 0.01381683349609375, 0.014910221099853516, 0.01600360870361328, 0.017096996307373047, 0.018190383911132812, 0.019283771514892578, 0.020377159118652344, 0.02147054672241211, 0.022563934326171875, 0.02365732192993164, 0.024750709533691406, 0.025844097137451172, 0.026937484741210938, 0.028030872344970703, 0.02912425994873047, 0.030217647552490234, 0.03131103515625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 6.0, 11.0, 7.0, 15.0, 23.0, 15.0, 26.0, 27.0, 32.0, 41.0, 34.0, 71.0, 77.0, 74.0, 84.0, 86.0, 59.0, 63.0, 50.0, 40.0, 35.0, 30.0, 19.0, 18.0, 11.0, 7.0, 8.0, 3.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.78282356262207, -4.625185012817383, -4.467546463012695, -4.309907913208008, -4.15226936340332, -3.994630813598633, -3.836992025375366, -3.6793534755706787, -3.521714925765991, -3.3640763759613037, -3.206437826156616, -3.0487992763519287, -2.891160488128662, -2.7335219383239746, -2.575883388519287, -2.4182448387145996, -2.260606288909912, -2.1029677391052246, -1.945329189300537, -1.78769052028656, -1.6300519704818726, -1.472413420677185, -1.314774751663208, -1.1571362018585205, -0.999497652053833, -0.8418591022491455, -0.6842204928398132, -0.526581883430481, -0.36894333362579346, -0.21130478382110596, -0.05366617441177368, 0.1039724349975586, 0.2616105079650879, 0.4192490875720978, 0.5768876671791077, 0.7345262765884399, 0.8921648263931274, 1.049803376197815, 1.207442045211792, 1.3650805950164795, 1.522719144821167, 1.6803576946258545, 1.837996244430542, 1.995634913444519, 2.153273582458496, 2.3109121322631836, 2.468550682067871, 2.6261892318725586, 2.783827781677246, 2.9414663314819336, 3.099104881286621, 3.2567434310913086, 3.414381980895996, 3.5720205307006836, 3.72965931892395, 3.8872978687286377, 4.044936180114746, 4.202574729919434, 4.360213279724121, 4.517851829528809, 4.675490379333496, 4.833128929138184, 4.990767478942871, 5.148406028747559, 5.306045055389404]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 8.0, 19.0, 19.0, 20.0, 19.0, 22.0, 29.0, 23.0, 39.0, 44.0, 50.0, 48.0, 52.0, 64.0, 60.0, 44.0, 56.0, 52.0, 43.0, 36.0, 33.0, 21.0, 27.0, 28.0, 24.0, 19.0, 15.0, 14.0, 12.0, 11.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4642462730407715, -3.3566370010375977, -3.2490274906158447, -3.141418218612671, -3.033808946609497, -2.926199436187744, -2.8185901641845703, -2.7109808921813965, -2.6033713817596436, -2.4957621097564697, -2.388152599334717, -2.280543327331543, -2.172934055328369, -2.065324544906616, -1.9577152729034424, -1.850105881690979, -1.7424966096878052, -1.6348872184753418, -1.527277946472168, -1.4196685552597046, -1.3120591640472412, -1.2044498920440674, -1.096840500831604, -0.9892311096191406, -0.881621778011322, -0.7740124464035034, -0.66640305519104, -0.5587937235832214, -0.45118436217308044, -0.34357500076293945, -0.23596566915512085, -0.12835627794265747, -0.020746946334838867, 0.08686240762472153, 0.19447176158428192, 0.3020811080932617, 0.4096904695034027, 0.5172998309135437, 0.6249091625213623, 0.7325185537338257, 0.8401278853416443, 0.9477372169494629, 1.0553466081619263, 1.1629559993743896, 1.2705652713775635, 1.3781746625900269, 1.4857840538024902, 1.593393325805664, 1.7010027170181274, 1.8086121082305908, 1.9162213802337646, 2.0238308906555176, 2.1314401626586914, 2.2390494346618652, 2.346658706665039, 2.454268217086792, 2.561877489089966, 2.6694867610931396, 2.7770962715148926, 2.8847055435180664, 2.9923148155212402, 3.099924325942993, 3.207533597946167, 3.31514310836792, 3.4227523803710938]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 10.0, 14.0, 32.0, 28.0, 55.0, 96.0, 142.0, 189.0, 262.0, 446.0, 712.0, 1207.0, 1970.0, 3230.0, 5543.0, 9686.0, 17087.0, 29882.0, 52272.0, 87158.0, 133918.0, 172855.0, 174677.0, 137208.0, 91173.0, 54783.0, 31489.0, 17655.0, 10122.0, 5863.0, 3356.0, 2044.0, 1204.0, 813.0, 447.0, 313.0, 205.0, 139.0, 93.0, 49.0, 38.0, 23.0, 22.0, 18.0, 10.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.96875, -2.8760986328125, -2.783447265625, -2.6907958984375, -2.59814453125, -2.5054931640625, -2.412841796875, -2.3201904296875, -2.2275390625, -2.1348876953125, -2.042236328125, -1.9495849609375, -1.85693359375, -1.7642822265625, -1.671630859375, -1.5789794921875, -1.486328125, -1.3936767578125, -1.301025390625, -1.2083740234375, -1.11572265625, -1.0230712890625, -0.930419921875, -0.8377685546875, -0.7451171875, -0.6524658203125, -0.559814453125, -0.4671630859375, -0.37451171875, -0.2818603515625, -0.189208984375, -0.0965576171875, -0.00390625, 0.0887451171875, 0.181396484375, 0.2740478515625, 0.36669921875, 0.4593505859375, 0.552001953125, 0.6446533203125, 0.7373046875, 0.8299560546875, 0.922607421875, 1.0152587890625, 1.10791015625, 1.2005615234375, 1.293212890625, 1.3858642578125, 1.478515625, 1.5711669921875, 1.663818359375, 1.7564697265625, 1.84912109375, 1.9417724609375, 2.034423828125, 2.1270751953125, 2.2197265625, 2.3123779296875, 2.405029296875, 2.4976806640625, 2.59033203125, 2.6829833984375, 2.775634765625, 2.8682861328125, 2.9609375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 10.0, 18.0, 25.0, 14.0, 31.0, 23.0, 27.0, 37.0, 36.0, 51.0, 51.0, 52.0, 64.0, 58.0, 42.0, 74.0, 44.0, 51.0, 53.0, 46.0, 34.0, 26.0, 23.0, 18.0, 16.0, 15.0, 10.0, 13.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.859375, -4.733367919921875, -4.60736083984375, -4.481353759765625, -4.3553466796875, -4.229339599609375, -4.10333251953125, -3.977325439453125, -3.851318359375, -3.725311279296875, -3.59930419921875, -3.473297119140625, -3.3472900390625, -3.221282958984375, -3.09527587890625, -2.969268798828125, -2.84326171875, -2.717254638671875, -2.59124755859375, -2.465240478515625, -2.3392333984375, -2.213226318359375, -2.08721923828125, -1.961212158203125, -1.835205078125, -1.709197998046875, -1.58319091796875, -1.457183837890625, -1.3311767578125, -1.205169677734375, -1.07916259765625, -0.953155517578125, -0.8271484375, -0.701141357421875, -0.57513427734375, -0.449127197265625, -0.3231201171875, -0.197113037109375, -0.07110595703125, 0.054901123046875, 0.180908203125, 0.306915283203125, 0.43292236328125, 0.558929443359375, 0.6849365234375, 0.810943603515625, 0.93695068359375, 1.062957763671875, 1.18896484375, 1.314971923828125, 1.44097900390625, 1.566986083984375, 1.6929931640625, 1.819000244140625, 1.94500732421875, 2.071014404296875, 2.197021484375, 2.323028564453125, 2.44903564453125, 2.575042724609375, 2.7010498046875, 2.827056884765625, 2.95306396484375, 3.079071044921875, 3.205078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 15.0, 26.0, 26.0, 33.0, 55.0, 94.0, 129.0, 202.0, 257.0, 441.0, 692.0, 1081.0, 1572.0, 2601.0, 4231.0, 6829.0, 11153.0, 18371.0, 30550.0, 48946.0, 75975.0, 111344.0, 144012.0, 157137.0, 139014.0, 104698.0, 71480.0, 45219.0, 27808.0, 17270.0, 10420.0, 6274.0, 3876.0, 2377.0, 1568.0, 928.0, 643.0, 405.0, 275.0, 179.0, 114.0, 70.0, 47.0, 26.0, 28.0, 17.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-2.767578125, -2.687164306640625, -2.60675048828125, -2.526336669921875, -2.4459228515625, -2.365509033203125, -2.28509521484375, -2.204681396484375, -2.124267578125, -2.043853759765625, -1.96343994140625, -1.883026123046875, -1.8026123046875, -1.722198486328125, -1.64178466796875, -1.561370849609375, -1.48095703125, -1.400543212890625, -1.32012939453125, -1.239715576171875, -1.1593017578125, -1.078887939453125, -0.99847412109375, -0.918060302734375, -0.837646484375, -0.757232666015625, -0.67681884765625, -0.596405029296875, -0.5159912109375, -0.435577392578125, -0.35516357421875, -0.274749755859375, -0.1943359375, -0.113922119140625, -0.03350830078125, 0.046905517578125, 0.1273193359375, 0.207733154296875, 0.28814697265625, 0.368560791015625, 0.448974609375, 0.529388427734375, 0.60980224609375, 0.690216064453125, 0.7706298828125, 0.851043701171875, 0.93145751953125, 1.011871337890625, 1.09228515625, 1.172698974609375, 1.25311279296875, 1.333526611328125, 1.4139404296875, 1.494354248046875, 1.57476806640625, 1.655181884765625, 1.735595703125, 1.816009521484375, 1.89642333984375, 1.976837158203125, 2.0572509765625, 2.137664794921875, 2.21807861328125, 2.298492431640625, 2.37890625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 7.0, 7.0, 16.0, 7.0, 15.0, 21.0, 15.0, 22.0, 29.0, 38.0, 32.0, 40.0, 51.0, 47.0, 47.0, 43.0, 38.0, 33.0, 46.0, 39.0, 35.0, 50.0, 37.0, 35.0, 29.0, 28.0, 30.0, 25.0, 18.0, 18.0, 22.0, 10.0, 16.0, 13.0, 6.0, 8.0, 10.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.03515625, -1.97265625, -1.91015625, -1.84765625, -1.78515625, -1.72265625, -1.66015625, -1.59765625, -1.53515625, -1.47265625, -1.41015625, -1.34765625, -1.28515625, -1.22265625, -1.16015625, -1.09765625, -1.03515625, -0.97265625, -0.91015625, -0.84765625, -0.78515625, -0.72265625, -0.66015625, -0.59765625, -0.53515625, -0.47265625, -0.41015625, -0.34765625, -0.28515625, -0.22265625, -0.16015625, -0.09765625, -0.03515625, 0.02734375, 0.08984375, 0.15234375, 0.21484375, 0.27734375, 0.33984375, 0.40234375, 0.46484375, 0.52734375, 0.58984375, 0.65234375, 0.71484375, 0.77734375, 0.83984375, 0.90234375, 0.96484375, 1.02734375, 1.08984375, 1.15234375, 1.21484375, 1.27734375, 1.33984375, 1.40234375, 1.46484375, 1.52734375, 1.58984375, 1.65234375, 1.71484375, 1.77734375, 1.83984375, 1.90234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 24.0, 37.0, 51.0, 81.0, 131.0, 217.0, 366.0, 685.0, 1111.0, 2041.0, 4113.0, 8585.0, 18646.0, 42539.0, 97592.0, 200974.0, 280759.0, 207124.0, 101734.0, 44014.0, 19416.0, 9035.0, 4359.0, 2128.0, 1173.0, 633.0, 373.0, 209.0, 130.0, 78.0, 61.0, 30.0, 26.0, 14.0, 10.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.142578125, -2.0723876953125, -2.002197265625, -1.9320068359375, -1.86181640625, -1.7916259765625, -1.721435546875, -1.6512451171875, -1.5810546875, -1.5108642578125, -1.440673828125, -1.3704833984375, -1.30029296875, -1.2301025390625, -1.159912109375, -1.0897216796875, -1.01953125, -0.9493408203125, -0.879150390625, -0.8089599609375, -0.73876953125, -0.6685791015625, -0.598388671875, -0.5281982421875, -0.4580078125, -0.3878173828125, -0.317626953125, -0.2474365234375, -0.17724609375, -0.1070556640625, -0.036865234375, 0.0333251953125, 0.103515625, 0.1737060546875, 0.243896484375, 0.3140869140625, 0.38427734375, 0.4544677734375, 0.524658203125, 0.5948486328125, 0.6650390625, 0.7352294921875, 0.805419921875, 0.8756103515625, 0.94580078125, 1.0159912109375, 1.086181640625, 1.1563720703125, 1.2265625, 1.2967529296875, 1.366943359375, 1.4371337890625, 1.50732421875, 1.5775146484375, 1.647705078125, 1.7178955078125, 1.7880859375, 1.8582763671875, 1.928466796875, 1.9986572265625, 2.06884765625, 2.1390380859375, 2.209228515625, 2.2794189453125, 2.349609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 12.0, 11.0, 12.0, 18.0, 18.0, 28.0, 27.0, 46.0, 64.0, 68.0, 79.0, 88.0, 76.0, 84.0, 85.0, 66.0, 58.0, 32.0, 22.0, 19.0, 21.0, 16.0, 7.0, 5.0, 7.0, 4.0, 7.0, 2.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001800060272216797, -0.0001732073724269867, -0.0001664087176322937, -0.0001596100628376007, -0.00015281140804290771, -0.00014601275324821472, -0.00013921409845352173, -0.00013241544365882874, -0.00012561678886413574, -0.00011881813406944275, -0.00011201947927474976, -0.00010522082448005676, -9.842216968536377e-05, -9.162351489067078e-05, -8.482486009597778e-05, -7.802620530128479e-05, -7.12275505065918e-05, -6.44288957118988e-05, -5.763024091720581e-05, -5.083158612251282e-05, -4.4032931327819824e-05, -3.723427653312683e-05, -3.0435621738433838e-05, -2.3636966943740845e-05, -1.683831214904785e-05, -1.0039657354354858e-05, -3.2410025596618652e-06, 3.557652235031128e-06, 1.0356307029724121e-05, 1.7154961824417114e-05, 2.3953616619110107e-05, 3.07522714138031e-05, 3.7550926208496094e-05, 4.434958100318909e-05, 5.114823579788208e-05, 5.794689059257507e-05, 6.474554538726807e-05, 7.154420018196106e-05, 7.834285497665405e-05, 8.514150977134705e-05, 9.194016456604004e-05, 9.873881936073303e-05, 0.00010553747415542603, 0.00011233612895011902, 0.00011913478374481201, 0.000125933438539505, 0.000132732093334198, 0.000139530748128891, 0.00014632940292358398, 0.00015312805771827698, 0.00015992671251296997, 0.00016672536730766296, 0.00017352402210235596, 0.00018032267689704895, 0.00018712133169174194, 0.00019391998648643494, 0.00020071864128112793, 0.00020751729607582092, 0.00021431595087051392, 0.0002211146056652069, 0.0002279132604598999, 0.0002347119152545929, 0.0002415105700492859, 0.0002483092248439789, 0.0002551078796386719]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 20.0, 19.0, 38.0, 45.0, 75.0, 82.0, 160.0, 222.0, 353.0, 527.0, 765.0, 1255.0, 1955.0, 3157.0, 5178.0, 8687.0, 14951.0, 26557.0, 46598.0, 81086.0, 130774.0, 179551.0, 185499.0, 143306.0, 91479.0, 53192.0, 30187.0, 17263.0, 10032.0, 5924.0, 3446.0, 2191.0, 1447.0, 879.0, 545.0, 391.0, 227.0, 163.0, 94.0, 66.0, 57.0, 40.0, 24.0, 15.0, 15.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.6279296875, -1.581573486328125, -1.53521728515625, -1.488861083984375, -1.4425048828125, -1.396148681640625, -1.34979248046875, -1.303436279296875, -1.257080078125, -1.210723876953125, -1.16436767578125, -1.118011474609375, -1.0716552734375, -1.025299072265625, -0.97894287109375, -0.932586669921875, -0.88623046875, -0.839874267578125, -0.79351806640625, -0.747161865234375, -0.7008056640625, -0.654449462890625, -0.60809326171875, -0.561737060546875, -0.515380859375, -0.469024658203125, -0.42266845703125, -0.376312255859375, -0.3299560546875, -0.283599853515625, -0.23724365234375, -0.190887451171875, -0.14453125, -0.098175048828125, -0.05181884765625, -0.005462646484375, 0.0408935546875, 0.087249755859375, 0.13360595703125, 0.179962158203125, 0.226318359375, 0.272674560546875, 0.31903076171875, 0.365386962890625, 0.4117431640625, 0.458099365234375, 0.50445556640625, 0.550811767578125, 0.59716796875, 0.643524169921875, 0.68988037109375, 0.736236572265625, 0.7825927734375, 0.828948974609375, 0.87530517578125, 0.921661376953125, 0.968017578125, 1.014373779296875, 1.06072998046875, 1.107086181640625, 1.1534423828125, 1.199798583984375, 1.24615478515625, 1.292510986328125, 1.3388671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 11.0, 18.0, 14.0, 11.0, 25.0, 25.0, 34.0, 55.0, 62.0, 56.0, 69.0, 68.0, 67.0, 69.0, 64.0, 52.0, 54.0, 39.0, 36.0, 28.0, 21.0, 24.0, 20.0, 16.0, 18.0, 7.0, 3.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63037109375, -0.612213134765625, -0.59405517578125, -0.575897216796875, -0.5577392578125, -0.539581298828125, -0.52142333984375, -0.503265380859375, -0.485107421875, -0.466949462890625, -0.44879150390625, -0.430633544921875, -0.4124755859375, -0.394317626953125, -0.37615966796875, -0.358001708984375, -0.33984375, -0.321685791015625, -0.30352783203125, -0.285369873046875, -0.2672119140625, -0.249053955078125, -0.23089599609375, -0.212738037109375, -0.194580078125, -0.176422119140625, -0.15826416015625, -0.140106201171875, -0.1219482421875, -0.103790283203125, -0.08563232421875, -0.067474365234375, -0.04931640625, -0.031158447265625, -0.01300048828125, 0.005157470703125, 0.0233154296875, 0.041473388671875, 0.05963134765625, 0.077789306640625, 0.095947265625, 0.114105224609375, 0.13226318359375, 0.150421142578125, 0.1685791015625, 0.186737060546875, 0.20489501953125, 0.223052978515625, 0.2412109375, 0.259368896484375, 0.27752685546875, 0.295684814453125, 0.3138427734375, 0.332000732421875, 0.35015869140625, 0.368316650390625, 0.386474609375, 0.404632568359375, 0.42279052734375, 0.440948486328125, 0.4591064453125, 0.477264404296875, 0.49542236328125, 0.513580322265625, 0.53173828125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 15.0, 10.0, 14.0, 17.0, 27.0, 35.0, 36.0, 45.0, 45.0, 52.0, 57.0, 77.0, 61.0, 66.0, 84.0, 61.0, 42.0, 52.0, 40.0, 31.0, 33.0, 16.0, 9.0, 9.0, 6.0, 9.0, 6.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.544699192047119, -4.395304203033447, -4.245909690856934, -4.096514701843262, -3.94711971282959, -3.797724723815918, -3.648329973220825, -3.4989352226257324, -3.3495402336120605, -3.2001452445983887, -3.050750494003296, -2.901355743408203, -2.7519607543945312, -2.6025657653808594, -2.4531710147857666, -2.303776264190674, -2.154381275177002, -2.00498628616333, -1.8555915355682373, -1.706196665763855, -1.5568017959594727, -1.4074069261550903, -1.258012056350708, -1.1086171865463257, -0.9592223167419434, -0.809827446937561, -0.6604325771331787, -0.5110377073287964, -0.36164283752441406, -0.21224796772003174, -0.06285309791564941, 0.08654177188873291, 0.23593664169311523, 0.38533151149749756, 0.5347263813018799, 0.6841212511062622, 0.8335161209106445, 0.9829109907150269, 1.1323058605194092, 1.2817007303237915, 1.4310956001281738, 1.5804904699325562, 1.7298853397369385, 1.8792802095413208, 2.028675079345703, 2.178070068359375, 2.3274648189544678, 2.4768595695495605, 2.6262545585632324, 2.7756495475769043, 2.925044298171997, 3.07443904876709, 3.2238340377807617, 3.3732290267944336, 3.5226237773895264, 3.672018527984619, 3.821413516998291, 3.970808506011963, 4.120203018188477, 4.269598007202148, 4.41899299621582, 4.568387985229492, 4.717782974243164, 4.867177486419678, 5.01657247543335]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 3.0, 1.0, 0.0, 3.0, 5.0, 8.0, 10.0, 6.0, 20.0, 15.0, 13.0, 22.0, 25.0, 17.0, 31.0, 38.0, 56.0, 41.0, 52.0, 52.0, 49.0, 46.0, 57.0, 60.0, 50.0, 43.0, 37.0, 38.0, 31.0, 30.0, 27.0, 23.0, 27.0, 16.0, 18.0, 12.0, 10.0, 9.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4886584281921387, -3.3750526905059814, -3.261446952819824, -3.147841453552246, -3.034235715866089, -2.9206299781799316, -2.8070244789123535, -2.6934187412261963, -2.579813003540039, -2.466207265853882, -2.3526015281677246, -2.2389960289001465, -2.1253902912139893, -2.011784553527832, -1.8981789350509644, -1.7845733165740967, -1.6709675788879395, -1.5573618412017822, -1.4437562227249146, -1.3301506042480469, -1.2165448665618896, -1.1029391288757324, -0.9893335103988647, -0.8757278323173523, -0.7621221542358398, -0.6485164761543274, -0.5349107980728149, -0.4213051199913025, -0.30769944190979004, -0.1940937638282776, -0.08048808574676514, 0.033117592334747314, 0.14672327041625977, 0.2603289484977722, 0.37393462657928467, 0.4875403046607971, 0.6011459827423096, 0.714751660823822, 0.8283573389053345, 0.9419630169868469, 1.0555686950683594, 1.1691744327545166, 1.2827800512313843, 1.396385669708252, 1.5099914073944092, 1.6235971450805664, 1.737202763557434, 1.8508083820343018, 1.964414119720459, 2.078019857406616, 2.1916255950927734, 2.3052310943603516, 2.418836832046509, 2.532442569732666, 2.646048069000244, 2.7596538066864014, 2.8732595443725586, 2.986865282058716, 3.100471019744873, 3.214076519012451, 3.3276822566986084, 3.4412879943847656, 3.5548934936523438, 3.668499231338501, 3.782104969024658]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 11.0, 9.0, 14.0, 17.0, 25.0, 35.0, 51.0, 84.0, 121.0, 191.0, 242.0, 405.0, 620.0, 978.0, 1516.0, 2618.0, 4210.0, 7294.0, 12687.0, 22965.0, 43738.0, 87558.0, 189565.0, 440461.0, 930094.0, 1155416.0, 705022.0, 309709.0, 137022.0, 65684.0, 33196.0, 17842.0, 9998.0, 5893.0, 3405.0, 2104.0, 1258.0, 837.0, 500.0, 337.0, 198.0, 128.0, 87.0, 44.0, 35.0, 23.0, 12.0, 9.0, 4.0, 7.0, 2.0, 0.0, 3.0], "bins": [-4.62109375, -4.493743896484375, -4.36639404296875, -4.239044189453125, -4.1116943359375, -3.984344482421875, -3.85699462890625, -3.729644775390625, -3.602294921875, -3.474945068359375, -3.34759521484375, -3.220245361328125, -3.0928955078125, -2.965545654296875, -2.83819580078125, -2.710845947265625, -2.58349609375, -2.456146240234375, -2.32879638671875, -2.201446533203125, -2.0740966796875, -1.946746826171875, -1.81939697265625, -1.692047119140625, -1.564697265625, -1.437347412109375, -1.30999755859375, -1.182647705078125, -1.0552978515625, -0.927947998046875, -0.80059814453125, -0.673248291015625, -0.5458984375, -0.418548583984375, -0.29119873046875, -0.163848876953125, -0.0364990234375, 0.090850830078125, 0.21820068359375, 0.345550537109375, 0.472900390625, 0.600250244140625, 0.72760009765625, 0.854949951171875, 0.9822998046875, 1.109649658203125, 1.23699951171875, 1.364349365234375, 1.49169921875, 1.619049072265625, 1.74639892578125, 1.873748779296875, 2.0010986328125, 2.128448486328125, 2.25579833984375, 2.383148193359375, 2.510498046875, 2.637847900390625, 2.76519775390625, 2.892547607421875, 3.0198974609375, 3.147247314453125, 3.27459716796875, 3.401947021484375, 3.529296875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 12.0, 12.0, 10.0, 17.0, 20.0, 25.0, 27.0, 31.0, 33.0, 29.0, 35.0, 47.0, 44.0, 38.0, 47.0, 45.0, 45.0, 43.0, 53.0, 47.0, 42.0, 52.0, 33.0, 39.0, 30.0, 21.0, 22.0, 20.0, 16.0, 14.0, 6.0, 6.0, 10.0, 7.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158203125, -2.080718994140625, -2.00323486328125, -1.925750732421875, -1.8482666015625, -1.770782470703125, -1.69329833984375, -1.615814208984375, -1.538330078125, -1.460845947265625, -1.38336181640625, -1.305877685546875, -1.2283935546875, -1.150909423828125, -1.07342529296875, -0.995941162109375, -0.91845703125, -0.840972900390625, -0.76348876953125, -0.686004638671875, -0.6085205078125, -0.531036376953125, -0.45355224609375, -0.376068115234375, -0.298583984375, -0.221099853515625, -0.14361572265625, -0.066131591796875, 0.0113525390625, 0.088836669921875, 0.16632080078125, 0.243804931640625, 0.3212890625, 0.398773193359375, 0.47625732421875, 0.553741455078125, 0.6312255859375, 0.708709716796875, 0.78619384765625, 0.863677978515625, 0.941162109375, 1.018646240234375, 1.09613037109375, 1.173614501953125, 1.2510986328125, 1.328582763671875, 1.40606689453125, 1.483551025390625, 1.56103515625, 1.638519287109375, 1.71600341796875, 1.793487548828125, 1.8709716796875, 1.948455810546875, 2.02593994140625, 2.103424072265625, 2.180908203125, 2.258392333984375, 2.33587646484375, 2.413360595703125, 2.4908447265625, 2.568328857421875, 2.64581298828125, 2.723297119140625, 2.80078125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 27.0, 27.0, 32.0, 51.0, 70.0, 147.0, 178.0, 293.0, 450.0, 668.0, 1115.0, 1713.0, 2657.0, 4331.0, 7002.0, 11909.0, 19924.0, 34891.0, 62601.0, 117873.0, 225025.0, 436110.0, 782583.0, 985691.0, 698189.0, 375902.0, 192632.0, 101597.0, 55110.0, 30693.0, 17587.0, 10411.0, 6148.0, 3853.0, 2487.0, 1508.0, 995.0, 622.0, 404.0, 255.0, 185.0, 112.0, 80.0, 39.0, 34.0, 21.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.94140625, -3.8197021484375, -3.697998046875, -3.5762939453125, -3.45458984375, -3.3328857421875, -3.211181640625, -3.0894775390625, -2.9677734375, -2.8460693359375, -2.724365234375, -2.6026611328125, -2.48095703125, -2.3592529296875, -2.237548828125, -2.1158447265625, -1.994140625, -1.8724365234375, -1.750732421875, -1.6290283203125, -1.50732421875, -1.3856201171875, -1.263916015625, -1.1422119140625, -1.0205078125, -0.8988037109375, -0.777099609375, -0.6553955078125, -0.53369140625, -0.4119873046875, -0.290283203125, -0.1685791015625, -0.046875, 0.0748291015625, 0.196533203125, 0.3182373046875, 0.43994140625, 0.5616455078125, 0.683349609375, 0.8050537109375, 0.9267578125, 1.0484619140625, 1.170166015625, 1.2918701171875, 1.41357421875, 1.5352783203125, 1.656982421875, 1.7786865234375, 1.900390625, 2.0220947265625, 2.143798828125, 2.2655029296875, 2.38720703125, 2.5089111328125, 2.630615234375, 2.7523193359375, 2.8740234375, 2.9957275390625, 3.117431640625, 3.2391357421875, 3.36083984375, 3.4825439453125, 3.604248046875, 3.7259521484375, 3.84765625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 11.0, 7.0, 16.0, 20.0, 21.0, 33.0, 37.0, 49.0, 62.0, 82.0, 101.0, 110.0, 146.0, 172.0, 230.0, 251.0, 280.0, 266.0, 302.0, 251.0, 258.0, 215.0, 213.0, 166.0, 158.0, 123.0, 89.0, 79.0, 70.0, 51.0, 38.0, 35.0, 22.0, 31.0, 15.0, 11.0, 11.0, 11.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.1075897216796875, -1.068695068359375, -1.0298004150390625, -0.99090576171875, -0.9520111083984375, -0.913116455078125, -0.8742218017578125, -0.8353271484375, -0.7964324951171875, -0.757537841796875, -0.7186431884765625, -0.67974853515625, -0.6408538818359375, -0.601959228515625, -0.5630645751953125, -0.524169921875, -0.4852752685546875, -0.446380615234375, -0.4074859619140625, -0.36859130859375, -0.3296966552734375, -0.290802001953125, -0.2519073486328125, -0.2130126953125, -0.1741180419921875, -0.135223388671875, -0.0963287353515625, -0.05743408203125, -0.0185394287109375, 0.020355224609375, 0.0592498779296875, 0.09814453125, 0.1370391845703125, 0.175933837890625, 0.2148284912109375, 0.25372314453125, 0.2926177978515625, 0.331512451171875, 0.3704071044921875, 0.4093017578125, 0.4481964111328125, 0.487091064453125, 0.5259857177734375, 0.56488037109375, 0.6037750244140625, 0.642669677734375, 0.6815643310546875, 0.720458984375, 0.7593536376953125, 0.798248291015625, 0.8371429443359375, 0.87603759765625, 0.9149322509765625, 0.953826904296875, 0.9927215576171875, 1.0316162109375, 1.0705108642578125, 1.109405517578125, 1.1483001708984375, 1.18719482421875, 1.2260894775390625, 1.264984130859375, 1.3038787841796875, 1.3427734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 16.0, 11.0, 13.0, 18.0, 18.0, 27.0, 27.0, 37.0, 35.0, 50.0, 61.0, 57.0, 62.0, 75.0, 70.0, 63.0, 41.0, 52.0, 34.0, 36.0, 34.0, 19.0, 18.0, 17.0, 23.0, 14.0, 15.0, 4.0, 9.0, 6.0, 6.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.879155397415161, -3.7437703609466553, -3.6083853244781494, -3.4730002880096436, -3.3376152515411377, -3.202230215072632, -3.066845417022705, -2.931460380554199, -2.7960753440856934, -2.6606903076171875, -2.5253052711486816, -2.389920234680176, -2.25453519821167, -2.119150161743164, -1.9837652444839478, -1.848380208015442, -1.7129950523376465, -1.5776100158691406, -1.4422249794006348, -1.306839942932129, -1.171454906463623, -1.0360698699951172, -0.9006849527359009, -0.765299916267395, -0.6299148797988892, -0.4945298433303833, -0.35914483666419983, -0.22375982999801636, -0.0883747935295105, 0.04701024293899536, 0.18239521980285645, 0.3177802562713623, 0.45316553115844727, 0.5885505676269531, 0.723935604095459, 0.8593205809593201, 0.9947056174278259, 1.1300907135009766, 1.2654756307601929, 1.4008606672286987, 1.5362457036972046, 1.6716307401657104, 1.8070157766342163, 1.9424006938934326, 2.0777857303619385, 2.2131707668304443, 2.34855580329895, 2.483940839767456, 2.619325876235962, 2.7547109127044678, 2.8900959491729736, 3.0254809856414795, 3.1608660221099854, 3.296251058578491, 3.431635856628418, 3.567020893096924, 3.7024059295654297, 3.8377909660339355, 3.9731760025024414, 4.108561038970947, 4.243946075439453, 4.379331111907959, 4.514716148376465, 4.650101184844971, 4.785486221313477]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 3.0, 6.0, 5.0, 6.0, 10.0, 16.0, 11.0, 19.0, 20.0, 27.0, 27.0, 26.0, 27.0, 35.0, 38.0, 38.0, 35.0, 50.0, 43.0, 43.0, 39.0, 41.0, 41.0, 36.0, 36.0, 33.0, 38.0, 28.0, 32.0, 25.0, 29.0, 27.0, 22.0, 11.0, 7.0, 9.0, 9.0, 9.0, 5.0, 9.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.609907865524292, -2.525479316711426, -2.4410510063171387, -2.3566224575042725, -2.2721941471099854, -2.187765598297119, -2.103337287902832, -2.018908739089966, -1.9344803094863892, -1.8500518798828125, -1.7656234502792358, -1.6811950206756592, -1.596766471862793, -1.5123381614685059, -1.4279096126556396, -1.343481183052063, -1.2590527534484863, -1.1746243238449097, -1.090195894241333, -1.0057673454284668, -0.9213389754295349, -0.8369105458259583, -0.7524820566177368, -0.6680536270141602, -0.5836251974105835, -0.49919676780700684, -0.4147683084011078, -0.33033984899520874, -0.24591141939163208, -0.16148298978805542, -0.07705450057983398, 0.007373929023742676, 0.09180212020874023, 0.1762305647134781, 0.26065900921821594, 0.345087468624115, 0.42951589822769165, 0.5139443278312683, 0.5983728170394897, 0.6828012466430664, 0.7672296762466431, 0.8516581058502197, 0.9360865354537964, 1.020514965057373, 1.1049435138702393, 1.1893718242645264, 1.2738003730773926, 1.3582288026809692, 1.442657232284546, 1.5270856618881226, 1.6115140914916992, 1.6959426403045654, 1.7803709506988525, 1.8647994995117188, 1.9492279291152954, 2.033656358718872, 2.1180849075317383, 2.2025134563446045, 2.2869417667388916, 2.371370315551758, 2.455798625946045, 2.540227174758911, 2.6246557235717773, 2.7090840339660645, 2.7935123443603516]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 14.0, 21.0, 28.0, 51.0, 78.0, 119.0, 226.0, 343.0, 546.0, 861.0, 1567.0, 2514.0, 4346.0, 7772.0, 14075.0, 27113.0, 55223.0, 113766.0, 215393.0, 263345.0, 169441.0, 84421.0, 41009.0, 20590.0, 10972.0, 5983.0, 3470.0, 2074.0, 1240.0, 781.0, 417.0, 285.0, 184.0, 101.0, 61.0, 42.0, 29.0, 18.0, 10.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3681640625, -0.353607177734375, -0.33905029296875, -0.324493408203125, -0.3099365234375, -0.295379638671875, -0.28082275390625, -0.266265869140625, -0.251708984375, -0.237152099609375, -0.22259521484375, -0.208038330078125, -0.1934814453125, -0.178924560546875, -0.16436767578125, -0.149810791015625, -0.13525390625, -0.120697021484375, -0.10614013671875, -0.091583251953125, -0.0770263671875, -0.062469482421875, -0.04791259765625, -0.033355712890625, -0.018798828125, -0.004241943359375, 0.01031494140625, 0.024871826171875, 0.0394287109375, 0.053985595703125, 0.06854248046875, 0.083099365234375, 0.09765625, 0.112213134765625, 0.12677001953125, 0.141326904296875, 0.1558837890625, 0.170440673828125, 0.18499755859375, 0.199554443359375, 0.214111328125, 0.228668212890625, 0.24322509765625, 0.257781982421875, 0.2723388671875, 0.286895751953125, 0.30145263671875, 0.316009521484375, 0.33056640625, 0.345123291015625, 0.35968017578125, 0.374237060546875, 0.3887939453125, 0.403350830078125, 0.41790771484375, 0.432464599609375, 0.447021484375, 0.461578369140625, 0.47613525390625, 0.490692138671875, 0.5052490234375, 0.519805908203125, 0.53436279296875, 0.548919677734375, 0.5634765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 7.0, 10.0, 15.0, 21.0, 14.0, 28.0, 22.0, 34.0, 47.0, 27.0, 36.0, 54.0, 50.0, 41.0, 45.0, 33.0, 39.0, 46.0, 47.0, 40.0, 32.0, 51.0, 41.0, 27.0, 22.0, 31.0, 19.0, 16.0, 16.0, 7.0, 11.0, 11.0, 7.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.6640625, -3.56134033203125, -3.4586181640625, -3.35589599609375, -3.253173828125, -3.15045166015625, -3.0477294921875, -2.94500732421875, -2.84228515625, -2.73956298828125, -2.6368408203125, -2.53411865234375, -2.431396484375, -2.32867431640625, -2.2259521484375, -2.12322998046875, -2.0205078125, -1.91778564453125, -1.8150634765625, -1.71234130859375, -1.609619140625, -1.50689697265625, -1.4041748046875, -1.30145263671875, -1.19873046875, -1.09600830078125, -0.9932861328125, -0.89056396484375, -0.787841796875, -0.68511962890625, -0.5823974609375, -0.47967529296875, -0.376953125, -0.27423095703125, -0.1715087890625, -0.06878662109375, 0.033935546875, 0.13665771484375, 0.2393798828125, 0.34210205078125, 0.44482421875, 0.54754638671875, 0.6502685546875, 0.75299072265625, 0.855712890625, 0.95843505859375, 1.0611572265625, 1.16387939453125, 1.2666015625, 1.36932373046875, 1.4720458984375, 1.57476806640625, 1.677490234375, 1.78021240234375, 1.8829345703125, 1.98565673828125, 2.08837890625, 2.19110107421875, 2.2938232421875, 2.39654541015625, 2.499267578125, 2.60198974609375, 2.7047119140625, 2.80743408203125, 2.91015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 19.0, 19.0, 31.0, 58.0, 56.0, 110.0, 136.0, 268.0, 402.0, 690.0, 1181.0, 2317.0, 4777.0, 10930.0, 31822.0, 697579.0, 255311.0, 24822.0, 9182.0, 4147.0, 1918.0, 1151.0, 570.0, 403.0, 226.0, 129.0, 78.0, 70.0, 36.0, 26.0, 19.0, 17.0, 15.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.940155029296875, -0.90081787109375, -0.861480712890625, -0.8221435546875, -0.782806396484375, -0.74346923828125, -0.704132080078125, -0.664794921875, -0.625457763671875, -0.58612060546875, -0.546783447265625, -0.5074462890625, -0.468109130859375, -0.42877197265625, -0.389434814453125, -0.35009765625, -0.310760498046875, -0.27142333984375, -0.232086181640625, -0.1927490234375, -0.153411865234375, -0.11407470703125, -0.074737548828125, -0.035400390625, 0.003936767578125, 0.04327392578125, 0.082611083984375, 0.1219482421875, 0.161285400390625, 0.20062255859375, 0.239959716796875, 0.279296875, 0.318634033203125, 0.35797119140625, 0.397308349609375, 0.4366455078125, 0.475982666015625, 0.51531982421875, 0.554656982421875, 0.593994140625, 0.633331298828125, 0.67266845703125, 0.712005615234375, 0.7513427734375, 0.790679931640625, 0.83001708984375, 0.869354248046875, 0.90869140625, 0.948028564453125, 0.98736572265625, 1.026702880859375, 1.0660400390625, 1.105377197265625, 1.14471435546875, 1.184051513671875, 1.223388671875, 1.262725830078125, 1.30206298828125, 1.341400146484375, 1.3807373046875, 1.420074462890625, 1.45941162109375, 1.498748779296875, 1.5380859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 9.0, 4.0, 5.0, 3.0, 6.0, 9.0, 10.0, 9.0, 19.0, 15.0, 24.0, 22.0, 36.0, 44.0, 42.0, 33.0, 34.0, 50.0, 42.0, 48.0, 42.0, 48.0, 51.0, 51.0, 38.0, 37.0, 36.0, 26.0, 33.0, 42.0, 22.0, 30.0, 21.0, 11.0, 18.0, 7.0, 3.0, 4.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.927734375, -1.861724853515625, -1.79571533203125, -1.729705810546875, -1.6636962890625, -1.597686767578125, -1.53167724609375, -1.465667724609375, -1.399658203125, -1.333648681640625, -1.26763916015625, -1.201629638671875, -1.1356201171875, -1.069610595703125, -1.00360107421875, -0.937591552734375, -0.87158203125, -0.805572509765625, -0.73956298828125, -0.673553466796875, -0.6075439453125, -0.541534423828125, -0.47552490234375, -0.409515380859375, -0.343505859375, -0.277496337890625, -0.21148681640625, -0.145477294921875, -0.0794677734375, -0.013458251953125, 0.05255126953125, 0.118560791015625, 0.1845703125, 0.250579833984375, 0.31658935546875, 0.382598876953125, 0.4486083984375, 0.514617919921875, 0.58062744140625, 0.646636962890625, 0.712646484375, 0.778656005859375, 0.84466552734375, 0.910675048828125, 0.9766845703125, 1.042694091796875, 1.10870361328125, 1.174713134765625, 1.24072265625, 1.306732177734375, 1.37274169921875, 1.438751220703125, 1.5047607421875, 1.570770263671875, 1.63677978515625, 1.702789306640625, 1.768798828125, 1.834808349609375, 1.90081787109375, 1.966827392578125, 2.0328369140625, 2.098846435546875, 2.16485595703125, 2.230865478515625, 2.296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 6.0, 14.0, 20.0, 21.0, 16.0, 53.0, 69.0, 80.0, 142.0, 202.0, 288.0, 420.0, 650.0, 1043.0, 1638.0, 2750.0, 4457.0, 7778.0, 14057.0, 27967.0, 510242.0, 415809.0, 27284.0, 13734.0, 7828.0, 4559.0, 2669.0, 1657.0, 1017.0, 697.0, 447.0, 292.0, 195.0, 127.0, 94.0, 72.0, 42.0, 31.0, 20.0, 21.0, 7.0, 10.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1943359375, -0.18785476684570312, -0.18137359619140625, -0.17489242553710938, -0.1684112548828125, -0.16193008422851562, -0.15544891357421875, -0.14896774291992188, -0.142486572265625, -0.13600540161132812, -0.12952423095703125, -0.12304306030273438, -0.1165618896484375, -0.11008071899414062, -0.10359954833984375, -0.09711837768554688, -0.09063720703125, -0.08415603637695312, -0.07767486572265625, -0.07119369506835938, -0.0647125244140625, -0.058231353759765625, -0.05175018310546875, -0.045269012451171875, -0.038787841796875, -0.032306671142578125, -0.02582550048828125, -0.019344329833984375, -0.0128631591796875, -0.006381988525390625, 9.918212890625e-05, 0.006580352783203125, 0.0130615234375, 0.019542694091796875, 0.02602386474609375, 0.032505035400390625, 0.0389862060546875, 0.045467376708984375, 0.05194854736328125, 0.058429718017578125, 0.064910888671875, 0.07139205932617188, 0.07787322998046875, 0.08435440063476562, 0.0908355712890625, 0.09731674194335938, 0.10379791259765625, 0.11027908325195312, 0.11676025390625, 0.12324142456054688, 0.12972259521484375, 0.13620376586914062, 0.1426849365234375, 0.14916610717773438, 0.15564727783203125, 0.16212844848632812, 0.168609619140625, 0.17509078979492188, 0.18157196044921875, 0.18805313110351562, 0.1945343017578125, 0.20101547241210938, 0.20749664306640625, 0.21397781372070312, 0.220458984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 15.0, 14.0, 8.0, 16.0, 23.0, 25.0, 31.0, 41.0, 56.0, 39.0, 46.0, 44.0, 66.0, 70.0, 57.0, 53.0, 57.0, 48.0, 47.0, 46.0, 39.0, 31.0, 21.0, 23.0, 23.0, 8.0, 6.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187490463256836e-05, -2.1115876734256744e-05, -2.035684883594513e-05, -1.9597820937633514e-05, -1.88387930393219e-05, -1.8079765141010284e-05, -1.732073724269867e-05, -1.6561709344387054e-05, -1.580268144607544e-05, -1.5043653547763824e-05, -1.428462564945221e-05, -1.3525597751140594e-05, -1.276656985282898e-05, -1.2007541954517365e-05, -1.124851405620575e-05, -1.0489486157894135e-05, -9.73045825958252e-06, -8.971430361270905e-06, -8.21240246295929e-06, -7.4533745646476746e-06, -6.6943466663360596e-06, -5.935318768024445e-06, -5.17629086971283e-06, -4.417262971401215e-06, -3.6582350730895996e-06, -2.8992071747779846e-06, -2.1401792764663696e-06, -1.3811513781547546e-06, -6.221234798431396e-07, 1.3690441846847534e-07, 8.959323167800903e-07, 1.6549602150917053e-06, 2.4139881134033203e-06, 3.1730160117149353e-06, 3.93204391002655e-06, 4.691071808338165e-06, 5.45009970664978e-06, 6.209127604961395e-06, 6.96815550327301e-06, 7.727183401584625e-06, 8.48621129989624e-06, 9.245239198207855e-06, 1.000426709651947e-05, 1.0763294994831085e-05, 1.15223228931427e-05, 1.2281350791454315e-05, 1.304037868976593e-05, 1.3799406588077545e-05, 1.455843448638916e-05, 1.5317462384700775e-05, 1.607649028301239e-05, 1.6835518181324005e-05, 1.759454607963562e-05, 1.8353573977947235e-05, 1.911260187625885e-05, 1.9871629774570465e-05, 2.063065767288208e-05, 2.1389685571193695e-05, 2.214871346950531e-05, 2.2907741367816925e-05, 2.366676926612854e-05, 2.4425797164440155e-05, 2.518482506275177e-05, 2.5943852961063385e-05, 2.6702880859375e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 12.0, 14.0, 20.0, 31.0, 36.0, 73.0, 102.0, 165.0, 254.0, 372.0, 581.0, 970.0, 1581.0, 2579.0, 4217.0, 6983.0, 12020.0, 20659.0, 36521.0, 64584.0, 111092.0, 174734.0, 208315.0, 163437.0, 101758.0, 58601.0, 33119.0, 18557.0, 10705.0, 6385.0, 3918.0, 2332.0, 1398.0, 906.0, 537.0, 371.0, 234.0, 128.0, 99.0, 62.0, 40.0, 30.0, 8.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068115234375, -0.06571769714355469, -0.06332015991210938, -0.06092262268066406, -0.05852508544921875, -0.05612754821777344, -0.053730010986328125, -0.05133247375488281, -0.0489349365234375, -0.04653739929199219, -0.044139862060546875, -0.04174232482910156, -0.03934478759765625, -0.03694725036621094, -0.034549713134765625, -0.03215217590332031, -0.029754638671875, -0.027357101440429688, -0.024959564208984375, -0.022562026977539062, -0.02016448974609375, -0.017766952514648438, -0.015369415283203125, -0.012971878051757812, -0.0105743408203125, -0.008176803588867188, -0.005779266357421875, -0.0033817291259765625, -0.00098419189453125, 0.0014133453369140625, 0.003810882568359375, 0.0062084197998046875, 0.00860595703125, 0.011003494262695312, 0.013401031494140625, 0.015798568725585938, 0.01819610595703125, 0.020593643188476562, 0.022991180419921875, 0.025388717651367188, 0.0277862548828125, 0.030183792114257812, 0.032581329345703125, 0.03497886657714844, 0.03737640380859375, 0.03977394104003906, 0.042171478271484375, 0.04456901550292969, 0.046966552734375, 0.04936408996582031, 0.051761627197265625, 0.05415916442871094, 0.05655670166015625, 0.05895423889160156, 0.061351776123046875, 0.06374931335449219, 0.0661468505859375, 0.06854438781738281, 0.07094192504882812, 0.07333946228027344, 0.07573699951171875, 0.07813453674316406, 0.08053207397460938, 0.08292961120605469, 0.0853271484375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 3.0, 4.0, 12.0, 5.0, 14.0, 8.0, 17.0, 26.0, 29.0, 25.0, 39.0, 41.0, 45.0, 58.0, 40.0, 59.0, 52.0, 55.0, 58.0, 58.0, 56.0, 57.0, 34.0, 49.0, 29.0, 30.0, 19.0, 10.0, 14.0, 12.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207977294921875, -0.02012491226196289, -0.01945209503173828, -0.018779277801513672, -0.018106460571289062, -0.017433643341064453, -0.016760826110839844, -0.016088008880615234, -0.015415191650390625, -0.014742374420166016, -0.014069557189941406, -0.013396739959716797, -0.012723922729492188, -0.012051105499267578, -0.011378288269042969, -0.01070547103881836, -0.01003265380859375, -0.00935983657836914, -0.008687019348144531, -0.008014202117919922, -0.0073413848876953125, -0.006668567657470703, -0.005995750427246094, -0.005322933197021484, -0.004650115966796875, -0.003977298736572266, -0.0033044815063476562, -0.002631664276123047, -0.0019588470458984375, -0.0012860298156738281, -0.0006132125854492188, 5.9604644775390625e-05, 0.000732421875, 0.0014052391052246094, 0.0020780563354492188, 0.002750873565673828, 0.0034236907958984375, 0.004096508026123047, 0.004769325256347656, 0.005442142486572266, 0.006114959716796875, 0.006787776947021484, 0.007460594177246094, 0.008133411407470703, 0.008806228637695312, 0.009479045867919922, 0.010151863098144531, 0.01082468032836914, 0.01149749755859375, 0.01217031478881836, 0.012843132019042969, 0.013515949249267578, 0.014188766479492188, 0.014861583709716797, 0.015534400939941406, 0.016207218170166016, 0.016880035400390625, 0.017552852630615234, 0.018225669860839844, 0.018898487091064453, 0.019571304321289062, 0.020244121551513672, 0.02091693878173828, 0.02158975601196289, 0.0222625732421875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 13.0, 14.0, 10.0, 17.0, 18.0, 18.0, 25.0, 42.0, 38.0, 43.0, 54.0, 58.0, 49.0, 82.0, 70.0, 74.0, 41.0, 50.0, 40.0, 32.0, 38.0, 22.0, 19.0, 22.0, 16.0, 22.0, 11.0, 11.0, 4.0, 10.0, 6.0, 6.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9336400032043457, -3.7984774112701416, -3.6633148193359375, -3.5281522274017334, -3.3929896354675293, -3.257827043533325, -3.122664451599121, -2.987501621246338, -2.852339267730713, -2.717176675796509, -2.5820140838623047, -2.4468514919281006, -2.3116888999938965, -2.1765263080596924, -2.0413637161254883, -1.9062010049819946, -1.771038293838501, -1.6358757019042969, -1.5007131099700928, -1.3655505180358887, -1.2303879261016846, -1.0952253341674805, -0.9600626230239868, -0.8249000310897827, -0.6897374391555786, -0.5545748472213745, -0.419412225484848, -0.28424960374832153, -0.14908701181411743, -0.01392441987991333, 0.12123823165893555, 0.25640082359313965, 0.39156341552734375, 0.5267260074615479, 0.661888599395752, 0.7970512509346008, 0.9322138428688049, 1.0673763751983643, 1.202539086341858, 1.337701678276062, 1.4728642702102661, 1.6080268621444702, 1.7431894540786743, 1.878352165222168, 2.013514757156372, 2.148677349090576, 2.2838399410247803, 2.4190025329589844, 2.5541651248931885, 2.6893277168273926, 2.8244903087615967, 2.959652900695801, 3.094815492630005, 3.229978084564209, 3.365140914916992, 3.500303268432617, 3.6354660987854004, 3.7706286907196045, 3.9057912826538086, 4.040954113006592, 4.176116466522217, 4.311279296875, 4.446441650390625, 4.581604480743408, 4.716766834259033]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 3.0, 5.0, 6.0, 7.0, 8.0, 17.0, 10.0, 19.0, 18.0, 27.0, 29.0, 26.0, 29.0, 36.0, 35.0, 37.0, 39.0, 46.0, 43.0, 43.0, 41.0, 38.0, 46.0, 31.0, 42.0, 32.0, 39.0, 28.0, 29.0, 22.0, 36.0, 23.0, 23.0, 11.0, 6.0, 9.0, 12.0, 7.0, 4.0, 10.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6143991947174072, -2.530123472213745, -2.445847749710083, -2.361572265625, -2.277296543121338, -2.193020820617676, -2.1087450981140137, -2.0244693756103516, -1.940193772315979, -1.855918049812317, -1.7716424465179443, -1.6873667240142822, -1.6030910015106201, -1.5188153982162476, -1.4345396757125854, -1.350264072418213, -1.2659883499145508, -1.1817126274108887, -1.0974370241165161, -1.013161301612854, -0.9288856387138367, -0.8446099758148193, -0.7603342533111572, -0.6760585904121399, -0.5917829275131226, -0.5075072646141052, -0.4232315719127655, -0.3389558792114258, -0.25468021631240845, -0.1704045534133911, -0.086128830909729, -0.00185316801071167, 0.08242225646972656, 0.1666979342699051, 0.2509736120700836, 0.33524930477142334, 0.4195249676704407, 0.503800630569458, 0.5880763530731201, 0.6723520159721375, 0.7566276788711548, 0.8409033417701721, 0.9251790046691895, 1.0094547271728516, 1.0937304496765137, 1.1780060529708862, 1.2622817754745483, 1.346557378768921, 1.430833101272583, 1.5151088237762451, 1.5993844270706177, 1.6836601495742798, 1.7679357528686523, 1.8522114753723145, 1.9364871978759766, 2.0207629203796387, 2.105038642883301, 2.189314365386963, 2.273590087890625, 2.357865810394287, 2.44214129447937, 2.5264170169830322, 2.6106927394866943, 2.6949684619903564, 2.7792439460754395]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 7.0, 14.0, 10.0, 22.0, 23.0, 51.0, 78.0, 96.0, 143.0, 205.0, 356.0, 488.0, 855.0, 1416.0, 2395.0, 4256.0, 7382.0, 12992.0, 23257.0, 41503.0, 72808.0, 118052.0, 167225.0, 185886.0, 156676.0, 105623.0, 63904.0, 36025.0, 20153.0, 11201.0, 6281.0, 3564.0, 2096.0, 1243.0, 799.0, 533.0, 316.0, 209.0, 134.0, 86.0, 55.0, 51.0, 27.0, 17.0, 17.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.88671875, -2.79168701171875, -2.6966552734375, -2.60162353515625, -2.506591796875, -2.41156005859375, -2.3165283203125, -2.22149658203125, -2.12646484375, -2.03143310546875, -1.9364013671875, -1.84136962890625, -1.746337890625, -1.65130615234375, -1.5562744140625, -1.46124267578125, -1.3662109375, -1.27117919921875, -1.1761474609375, -1.08111572265625, -0.986083984375, -0.89105224609375, -0.7960205078125, -0.70098876953125, -0.60595703125, -0.51092529296875, -0.4158935546875, -0.32086181640625, -0.225830078125, -0.13079833984375, -0.0357666015625, 0.05926513671875, 0.154296875, 0.24932861328125, 0.3443603515625, 0.43939208984375, 0.534423828125, 0.62945556640625, 0.7244873046875, 0.81951904296875, 0.91455078125, 1.00958251953125, 1.1046142578125, 1.19964599609375, 1.294677734375, 1.38970947265625, 1.4847412109375, 1.57977294921875, 1.6748046875, 1.76983642578125, 1.8648681640625, 1.95989990234375, 2.054931640625, 2.14996337890625, 2.2449951171875, 2.34002685546875, 2.43505859375, 2.53009033203125, 2.6251220703125, 2.72015380859375, 2.815185546875, 2.91021728515625, 3.0052490234375, 3.10028076171875, 3.1953125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 7.0, 8.0, 7.0, 7.0, 9.0, 9.0, 14.0, 17.0, 18.0, 19.0, 20.0, 29.0, 27.0, 26.0, 26.0, 46.0, 33.0, 37.0, 32.0, 40.0, 41.0, 39.0, 54.0, 41.0, 32.0, 50.0, 37.0, 34.0, 32.0, 28.0, 29.0, 19.0, 30.0, 16.0, 11.0, 8.0, 14.0, 11.0, 7.0, 9.0, 6.0, 8.0, 3.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.931640625, -2.841094970703125, -2.75054931640625, -2.660003662109375, -2.5694580078125, -2.478912353515625, -2.38836669921875, -2.297821044921875, -2.207275390625, -2.116729736328125, -2.02618408203125, -1.935638427734375, -1.8450927734375, -1.754547119140625, -1.66400146484375, -1.573455810546875, -1.48291015625, -1.392364501953125, -1.30181884765625, -1.211273193359375, -1.1207275390625, -1.030181884765625, -0.93963623046875, -0.849090576171875, -0.758544921875, -0.667999267578125, -0.57745361328125, -0.486907958984375, -0.3963623046875, -0.305816650390625, -0.21527099609375, -0.124725341796875, -0.0341796875, 0.056365966796875, 0.14691162109375, 0.237457275390625, 0.3280029296875, 0.418548583984375, 0.50909423828125, 0.599639892578125, 0.690185546875, 0.780731201171875, 0.87127685546875, 0.961822509765625, 1.0523681640625, 1.142913818359375, 1.23345947265625, 1.324005126953125, 1.41455078125, 1.505096435546875, 1.59564208984375, 1.686187744140625, 1.7767333984375, 1.867279052734375, 1.95782470703125, 2.048370361328125, 2.138916015625, 2.229461669921875, 2.32000732421875, 2.410552978515625, 2.5010986328125, 2.591644287109375, 2.68218994140625, 2.772735595703125, 2.86328125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 16.0, 27.0, 33.0, 43.0, 70.0, 90.0, 106.0, 212.0, 315.0, 515.0, 785.0, 1254.0, 2049.0, 3387.0, 5860.0, 10531.0, 19362.0, 34523.0, 62013.0, 105086.0, 157728.0, 189088.0, 170573.0, 119537.0, 71854.0, 41196.0, 22693.0, 12306.0, 6974.0, 4001.0, 2420.0, 1460.0, 869.0, 554.0, 325.0, 251.0, 134.0, 92.0, 67.0, 41.0, 34.0, 27.0, 15.0, 13.0, 9.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.837890625, -2.738800048828125, -2.63970947265625, -2.540618896484375, -2.4415283203125, -2.342437744140625, -2.24334716796875, -2.144256591796875, -2.045166015625, -1.946075439453125, -1.84698486328125, -1.747894287109375, -1.6488037109375, -1.549713134765625, -1.45062255859375, -1.351531982421875, -1.25244140625, -1.153350830078125, -1.05426025390625, -0.955169677734375, -0.8560791015625, -0.756988525390625, -0.65789794921875, -0.558807373046875, -0.459716796875, -0.360626220703125, -0.26153564453125, -0.162445068359375, -0.0633544921875, 0.035736083984375, 0.13482666015625, 0.233917236328125, 0.3330078125, 0.432098388671875, 0.53118896484375, 0.630279541015625, 0.7293701171875, 0.828460693359375, 0.92755126953125, 1.026641845703125, 1.125732421875, 1.224822998046875, 1.32391357421875, 1.423004150390625, 1.5220947265625, 1.621185302734375, 1.72027587890625, 1.819366455078125, 1.91845703125, 2.017547607421875, 2.11663818359375, 2.215728759765625, 2.3148193359375, 2.413909912109375, 2.51300048828125, 2.612091064453125, 2.711181640625, 2.810272216796875, 2.90936279296875, 3.008453369140625, 3.1075439453125, 3.206634521484375, 3.30572509765625, 3.404815673828125, 3.50390625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 9.0, 14.0, 8.0, 14.0, 23.0, 12.0, 28.0, 19.0, 14.0, 29.0, 25.0, 24.0, 34.0, 29.0, 35.0, 45.0, 39.0, 39.0, 44.0, 48.0, 42.0, 36.0, 42.0, 34.0, 33.0, 26.0, 29.0, 22.0, 18.0, 29.0, 25.0, 22.0, 18.0, 15.0, 9.0, 9.0, 7.0, 9.0, 6.0, 4.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.712890625, -1.661163330078125, -1.60943603515625, -1.557708740234375, -1.5059814453125, -1.454254150390625, -1.40252685546875, -1.350799560546875, -1.299072265625, -1.247344970703125, -1.19561767578125, -1.143890380859375, -1.0921630859375, -1.040435791015625, -0.98870849609375, -0.936981201171875, -0.88525390625, -0.833526611328125, -0.78179931640625, -0.730072021484375, -0.6783447265625, -0.626617431640625, -0.57489013671875, -0.523162841796875, -0.471435546875, -0.419708251953125, -0.36798095703125, -0.316253662109375, -0.2645263671875, -0.212799072265625, -0.16107177734375, -0.109344482421875, -0.0576171875, -0.005889892578125, 0.04583740234375, 0.097564697265625, 0.1492919921875, 0.201019287109375, 0.25274658203125, 0.304473876953125, 0.356201171875, 0.407928466796875, 0.45965576171875, 0.511383056640625, 0.5631103515625, 0.614837646484375, 0.66656494140625, 0.718292236328125, 0.77001953125, 0.821746826171875, 0.87347412109375, 0.925201416015625, 0.9769287109375, 1.028656005859375, 1.08038330078125, 1.132110595703125, 1.183837890625, 1.235565185546875, 1.28729248046875, 1.339019775390625, 1.3907470703125, 1.442474365234375, 1.49420166015625, 1.545928955078125, 1.59765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 9.0, 6.0, 5.0, 19.0, 23.0, 30.0, 42.0, 58.0, 84.0, 138.0, 201.0, 306.0, 476.0, 809.0, 1278.0, 2073.0, 3431.0, 6171.0, 11411.0, 21687.0, 43342.0, 86810.0, 162603.0, 232870.0, 211291.0, 127716.0, 65488.0, 32208.0, 16882.0, 8865.0, 4905.0, 2823.0, 1677.0, 1039.0, 607.0, 408.0, 234.0, 167.0, 129.0, 84.0, 47.0, 36.0, 28.0, 16.0, 11.0, 5.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.944610595703125, -1.88531494140625, -1.826019287109375, -1.7667236328125, -1.707427978515625, -1.64813232421875, -1.588836669921875, -1.529541015625, -1.470245361328125, -1.41094970703125, -1.351654052734375, -1.2923583984375, -1.233062744140625, -1.17376708984375, -1.114471435546875, -1.05517578125, -0.995880126953125, -0.93658447265625, -0.877288818359375, -0.8179931640625, -0.758697509765625, -0.69940185546875, -0.640106201171875, -0.580810546875, -0.521514892578125, -0.46221923828125, -0.402923583984375, -0.3436279296875, -0.284332275390625, -0.22503662109375, -0.165740966796875, -0.1064453125, -0.047149658203125, 0.01214599609375, 0.071441650390625, 0.1307373046875, 0.190032958984375, 0.24932861328125, 0.308624267578125, 0.367919921875, 0.427215576171875, 0.48651123046875, 0.545806884765625, 0.6051025390625, 0.664398193359375, 0.72369384765625, 0.782989501953125, 0.84228515625, 0.901580810546875, 0.96087646484375, 1.020172119140625, 1.0794677734375, 1.138763427734375, 1.19805908203125, 1.257354736328125, 1.316650390625, 1.375946044921875, 1.43524169921875, 1.494537353515625, 1.5538330078125, 1.613128662109375, 1.67242431640625, 1.731719970703125, 1.791015625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 3.0, 17.0, 16.0, 23.0, 26.0, 70.0, 53.0, 72.0, 102.0, 95.0, 103.0, 94.0, 78.0, 60.0, 47.0, 30.0, 28.0, 17.0, 13.0, 12.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021827220916748047, -0.00021053291857242584, -0.00020279362797737122, -0.0001950543373823166, -0.00018731504678726196, -0.00017957575619220734, -0.0001718364655971527, -0.00016409717500209808, -0.00015635788440704346, -0.00014861859381198883, -0.0001408793032169342, -0.00013314001262187958, -0.00012540072202682495, -0.00011766143143177032, -0.0001099221408367157, -0.00010218285024166107, -9.444355964660645e-05, -8.670426905155182e-05, -7.896497845649719e-05, -7.122568786144257e-05, -6.348639726638794e-05, -5.574710667133331e-05, -4.8007816076278687e-05, -4.026852548122406e-05, -3.2529234886169434e-05, -2.4789944291114807e-05, -1.705065369606018e-05, -9.311363101005554e-06, -1.5720725059509277e-06, 6.167218089103699e-06, 1.3906508684158325e-05, 2.164579927921295e-05, 2.9385089874267578e-05, 3.7124380469322205e-05, 4.486367106437683e-05, 5.260296165943146e-05, 6.0342252254486084e-05, 6.808154284954071e-05, 7.582083344459534e-05, 8.356012403964996e-05, 9.129941463470459e-05, 9.903870522975922e-05, 0.00010677799582481384, 0.00011451728641986847, 0.0001222565770149231, 0.00012999586760997772, 0.00013773515820503235, 0.00014547444880008698, 0.0001532137393951416, 0.00016095302999019623, 0.00016869232058525085, 0.00017643161118030548, 0.0001841709017753601, 0.00019191019237041473, 0.00019964948296546936, 0.000207388773560524, 0.0002151280641555786, 0.00022286735475063324, 0.00023060664534568787, 0.0002383459359407425, 0.0002460852265357971, 0.00025382451713085175, 0.00026156380772590637, 0.000269303098320961, 0.0002770423889160156]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 8.0, 12.0, 19.0, 35.0, 48.0, 59.0, 78.0, 136.0, 206.0, 292.0, 421.0, 669.0, 966.0, 1477.0, 2327.0, 3485.0, 5617.0, 9059.0, 14739.0, 23991.0, 40081.0, 66547.0, 105844.0, 151662.0, 176482.0, 155662.0, 110555.0, 69736.0, 41990.0, 25278.0, 15387.0, 9124.0, 5896.0, 3594.0, 2368.0, 1544.0, 997.0, 702.0, 505.0, 281.0, 220.0, 137.0, 95.0, 73.0, 51.0, 37.0, 22.0, 14.0, 10.0, 11.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3261260986328125, -1.284088134765625, -1.2420501708984375, -1.20001220703125, -1.1579742431640625, -1.115936279296875, -1.0738983154296875, -1.0318603515625, -0.9898223876953125, -0.947784423828125, -0.9057464599609375, -0.86370849609375, -0.8216705322265625, -0.779632568359375, -0.7375946044921875, -0.695556640625, -0.6535186767578125, -0.611480712890625, -0.5694427490234375, -0.52740478515625, -0.4853668212890625, -0.443328857421875, -0.4012908935546875, -0.3592529296875, -0.3172149658203125, -0.275177001953125, -0.2331390380859375, -0.19110107421875, -0.1490631103515625, -0.107025146484375, -0.0649871826171875, -0.02294921875, 0.0190887451171875, 0.061126708984375, 0.1031646728515625, 0.14520263671875, 0.1872406005859375, 0.229278564453125, 0.2713165283203125, 0.3133544921875, 0.3553924560546875, 0.397430419921875, 0.4394683837890625, 0.48150634765625, 0.5235443115234375, 0.565582275390625, 0.6076202392578125, 0.649658203125, 0.6916961669921875, 0.733734130859375, 0.7757720947265625, 0.81781005859375, 0.8598480224609375, 0.901885986328125, 0.9439239501953125, 0.9859619140625, 1.0279998779296875, 1.070037841796875, 1.1120758056640625, 1.15411376953125, 1.1961517333984375, 1.238189697265625, 1.2802276611328125, 1.322265625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 4.0, 9.0, 9.0, 8.0, 10.0, 14.0, 17.0, 13.0, 25.0, 22.0, 44.0, 51.0, 37.0, 65.0, 59.0, 54.0, 71.0, 53.0, 70.0, 59.0, 43.0, 39.0, 37.0, 24.0, 34.0, 19.0, 17.0, 15.0, 11.0, 16.0, 12.0, 7.0, 5.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4609375, -0.445037841796875, -0.42913818359375, -0.413238525390625, -0.3973388671875, -0.381439208984375, -0.36553955078125, -0.349639892578125, -0.333740234375, -0.317840576171875, -0.30194091796875, -0.286041259765625, -0.2701416015625, -0.254241943359375, -0.23834228515625, -0.222442626953125, -0.20654296875, -0.190643310546875, -0.17474365234375, -0.158843994140625, -0.1429443359375, -0.127044677734375, -0.11114501953125, -0.095245361328125, -0.079345703125, -0.063446044921875, -0.04754638671875, -0.031646728515625, -0.0157470703125, 0.000152587890625, 0.01605224609375, 0.031951904296875, 0.0478515625, 0.063751220703125, 0.07965087890625, 0.095550537109375, 0.1114501953125, 0.127349853515625, 0.14324951171875, 0.159149169921875, 0.175048828125, 0.190948486328125, 0.20684814453125, 0.222747802734375, 0.2386474609375, 0.254547119140625, 0.27044677734375, 0.286346435546875, 0.30224609375, 0.318145751953125, 0.33404541015625, 0.349945068359375, 0.3658447265625, 0.381744384765625, 0.39764404296875, 0.413543701171875, 0.429443359375, 0.445343017578125, 0.46124267578125, 0.477142333984375, 0.4930419921875, 0.508941650390625, 0.52484130859375, 0.540740966796875, 0.556640625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 0.0, 8.0, 8.0, 10.0, 6.0, 8.0, 13.0, 18.0, 29.0, 27.0, 21.0, 34.0, 40.0, 46.0, 51.0, 58.0, 61.0, 53.0, 65.0, 47.0, 51.0, 56.0, 34.0, 36.0, 33.0, 28.0, 21.0, 14.0, 19.0, 21.0, 17.0, 14.0, 10.0, 6.0, 4.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5796639919281006, -3.455317974090576, -3.330972194671631, -3.2066264152526855, -3.082280397415161, -2.9579343795776367, -2.8335886001586914, -2.709242820739746, -2.5848968029022217, -2.4605507850646973, -2.336205005645752, -2.2118592262268066, -2.0875132083892822, -1.9631673097610474, -1.8388214111328125, -1.7144755125045776, -1.5901296138763428, -1.465783715248108, -1.341437816619873, -1.2170919179916382, -1.0927460193634033, -0.9684001207351685, -0.8440542221069336, -0.7197083234786987, -0.5953624248504639, -0.471016526222229, -0.34667062759399414, -0.22232472896575928, -0.09797883033752441, 0.02636706829071045, 0.1507129669189453, 0.2750588655471802, 0.39940452575683594, 0.5237504243850708, 0.6480963230133057, 0.7724422216415405, 0.8967881202697754, 1.0211340188980103, 1.1454799175262451, 1.26982581615448, 1.3941717147827148, 1.5185176134109497, 1.6428635120391846, 1.7672094106674194, 1.8915553092956543, 2.0159010887145996, 2.140247106552124, 2.2645931243896484, 2.3889389038085938, 2.513284683227539, 2.6376307010650635, 2.761976718902588, 2.886322498321533, 3.0106682777404785, 3.135014295578003, 3.2593603134155273, 3.3837060928344727, 3.508051872253418, 3.6323978900909424, 3.756743907928467, 3.881089687347412, 4.005435466766357, 4.129781723022461, 4.254127502441406, 4.378473281860352]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 0.0, 3.0, 6.0, 6.0, 6.0, 7.0, 10.0, 17.0, 14.0, 17.0, 12.0, 33.0, 26.0, 27.0, 23.0, 28.0, 30.0, 28.0, 38.0, 41.0, 30.0, 38.0, 41.0, 42.0, 49.0, 46.0, 33.0, 32.0, 34.0, 29.0, 35.0, 29.0, 27.0, 29.0, 24.0, 17.0, 21.0, 19.0, 12.0, 7.0, 8.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.772695302963257, -2.6886179447174072, -2.6045405864715576, -2.520463228225708, -2.4363858699798584, -2.352308511734009, -2.2682313919067383, -2.1841540336608887, -2.100076675415039, -2.0159993171691895, -1.9319219589233398, -1.8478446006774902, -1.7637672424316406, -1.679689884185791, -1.595612645149231, -1.5115352869033813, -1.4274578094482422, -1.3433804512023926, -1.259303092956543, -1.1752257347106934, -1.0911483764648438, -1.0070710182189941, -0.9229937791824341, -0.8389164209365845, -0.7548390626907349, -0.6707617044448853, -0.5866843461990356, -0.5026070475578308, -0.4185296893119812, -0.3344523310661316, -0.25037503242492676, -0.16629767417907715, -0.08222031593322754, 0.0018570274114608765, 0.08593437075614929, 0.1700116991996765, 0.2540890574455261, 0.33816641569137573, 0.42224371433258057, 0.5063210725784302, 0.5903984308242798, 0.6744757890701294, 0.758553147315979, 0.8426304459571838, 0.9267078042030334, 1.0107851028442383, 1.094862461090088, 1.1789398193359375, 1.263017177581787, 1.3470945358276367, 1.4311718940734863, 1.515249252319336, 1.5993266105651855, 1.6834039688110352, 1.7674812078475952, 1.8515585660934448, 1.9356359243392944, 2.0197131633758545, 2.103790521621704, 2.1878678798675537, 2.2719452381134033, 2.356022596359253, 2.4400999546051025, 2.524177312850952, 2.6082546710968018]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 13.0, 17.0, 21.0, 26.0, 43.0, 60.0, 111.0, 138.0, 206.0, 338.0, 494.0, 799.0, 1229.0, 1902.0, 3032.0, 4753.0, 7999.0, 13031.0, 22007.0, 38866.0, 69766.0, 132836.0, 263011.0, 525158.0, 895709.0, 960537.0, 609575.0, 304787.0, 151061.0, 78713.0, 43273.0, 24996.0, 15041.0, 9179.0, 5574.0, 3484.0, 2172.0, 1490.0, 990.0, 613.0, 431.0, 262.0, 180.0, 118.0, 76.0, 49.0, 43.0, 29.0, 7.0, 13.0, 12.0, 6.0, 1.0, 4.0, 3.0], "bins": [-3.72265625, -3.613525390625, -3.50439453125, -3.395263671875, -3.2861328125, -3.177001953125, -3.06787109375, -2.958740234375, -2.849609375, -2.740478515625, -2.63134765625, -2.522216796875, -2.4130859375, -2.303955078125, -2.19482421875, -2.085693359375, -1.9765625, -1.867431640625, -1.75830078125, -1.649169921875, -1.5400390625, -1.430908203125, -1.32177734375, -1.212646484375, -1.103515625, -0.994384765625, -0.88525390625, -0.776123046875, -0.6669921875, -0.557861328125, -0.44873046875, -0.339599609375, -0.23046875, -0.121337890625, -0.01220703125, 0.096923828125, 0.2060546875, 0.315185546875, 0.42431640625, 0.533447265625, 0.642578125, 0.751708984375, 0.86083984375, 0.969970703125, 1.0791015625, 1.188232421875, 1.29736328125, 1.406494140625, 1.515625, 1.624755859375, 1.73388671875, 1.843017578125, 1.9521484375, 2.061279296875, 2.17041015625, 2.279541015625, 2.388671875, 2.497802734375, 2.60693359375, 2.716064453125, 2.8251953125, 2.934326171875, 3.04345703125, 3.152587890625, 3.26171875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 1.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 10.0, 11.0, 12.0, 21.0, 22.0, 29.0, 19.0, 20.0, 34.0, 27.0, 37.0, 36.0, 47.0, 31.0, 33.0, 40.0, 34.0, 47.0, 34.0, 45.0, 41.0, 26.0, 31.0, 32.0, 33.0, 37.0, 24.0, 28.0, 16.0, 22.0, 15.0, 9.0, 13.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9384765625, -1.8764801025390625, -1.814483642578125, -1.7524871826171875, -1.69049072265625, -1.6284942626953125, -1.566497802734375, -1.5045013427734375, -1.4425048828125, -1.3805084228515625, -1.318511962890625, -1.2565155029296875, -1.19451904296875, -1.1325225830078125, -1.070526123046875, -1.0085296630859375, -0.946533203125, -0.8845367431640625, -0.822540283203125, -0.7605438232421875, -0.69854736328125, -0.6365509033203125, -0.574554443359375, -0.5125579833984375, -0.4505615234375, -0.3885650634765625, -0.326568603515625, -0.2645721435546875, -0.20257568359375, -0.1405792236328125, -0.078582763671875, -0.0165863037109375, 0.04541015625, 0.1074066162109375, 0.169403076171875, 0.2313995361328125, 0.29339599609375, 0.3553924560546875, 0.417388916015625, 0.4793853759765625, 0.5413818359375, 0.6033782958984375, 0.665374755859375, 0.7273712158203125, 0.78936767578125, 0.8513641357421875, 0.913360595703125, 0.9753570556640625, 1.037353515625, 1.0993499755859375, 1.161346435546875, 1.2233428955078125, 1.28533935546875, 1.3473358154296875, 1.409332275390625, 1.4713287353515625, 1.5333251953125, 1.5953216552734375, 1.657318115234375, 1.7193145751953125, 1.78131103515625, 1.8433074951171875, 1.905303955078125, 1.9673004150390625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 7.0, 5.0, 7.0, 14.0, 20.0, 23.0, 36.0, 61.0, 70.0, 122.0, 179.0, 234.0, 345.0, 479.0, 770.0, 1258.0, 1799.0, 2800.0, 4225.0, 7085.0, 11143.0, 18753.0, 31769.0, 55263.0, 98765.0, 180792.0, 334167.0, 602512.0, 892245.0, 821963.0, 506113.0, 275508.0, 148540.0, 82486.0, 45859.0, 26553.0, 16116.0, 9600.0, 5842.0, 3632.0, 2430.0, 1505.0, 1019.0, 693.0, 487.0, 295.0, 211.0, 150.0, 108.0, 68.0, 52.0, 34.0, 28.0, 15.0, 13.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.5625, -3.446990966796875, -3.33148193359375, -3.215972900390625, -3.1004638671875, -2.984954833984375, -2.86944580078125, -2.753936767578125, -2.638427734375, -2.522918701171875, -2.40740966796875, -2.291900634765625, -2.1763916015625, -2.060882568359375, -1.94537353515625, -1.829864501953125, -1.71435546875, -1.598846435546875, -1.48333740234375, -1.367828369140625, -1.2523193359375, -1.136810302734375, -1.02130126953125, -0.905792236328125, -0.790283203125, -0.674774169921875, -0.55926513671875, -0.443756103515625, -0.3282470703125, -0.212738037109375, -0.09722900390625, 0.018280029296875, 0.1337890625, 0.249298095703125, 0.36480712890625, 0.480316162109375, 0.5958251953125, 0.711334228515625, 0.82684326171875, 0.942352294921875, 1.057861328125, 1.173370361328125, 1.28887939453125, 1.404388427734375, 1.5198974609375, 1.635406494140625, 1.75091552734375, 1.866424560546875, 1.98193359375, 2.097442626953125, 2.21295166015625, 2.328460693359375, 2.4439697265625, 2.559478759765625, 2.67498779296875, 2.790496826171875, 2.906005859375, 3.021514892578125, 3.13702392578125, 3.252532958984375, 3.3680419921875, 3.483551025390625, 3.59906005859375, 3.714569091796875, 3.830078125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 15.0, 16.0, 25.0, 35.0, 31.0, 41.0, 55.0, 61.0, 84.0, 113.0, 113.0, 149.0, 153.0, 186.0, 210.0, 250.0, 243.0, 280.0, 246.0, 279.0, 210.0, 198.0, 189.0, 135.0, 135.0, 125.0, 91.0, 80.0, 53.0, 43.0, 41.0, 31.0, 30.0, 18.0, 23.0, 23.0, 6.0, 9.0, 5.0, 2.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.2822265625, -1.24560546875, -1.208984375, -1.17236328125, -1.1357421875, -1.09912109375, -1.0625, -1.02587890625, -0.9892578125, -0.95263671875, -0.916015625, -0.87939453125, -0.8427734375, -0.80615234375, -0.76953125, -0.73291015625, -0.6962890625, -0.65966796875, -0.623046875, -0.58642578125, -0.5498046875, -0.51318359375, -0.4765625, -0.43994140625, -0.4033203125, -0.36669921875, -0.330078125, -0.29345703125, -0.2568359375, -0.22021484375, -0.18359375, -0.14697265625, -0.1103515625, -0.07373046875, -0.037109375, -0.00048828125, 0.0361328125, 0.07275390625, 0.109375, 0.14599609375, 0.1826171875, 0.21923828125, 0.255859375, 0.29248046875, 0.3291015625, 0.36572265625, 0.40234375, 0.43896484375, 0.4755859375, 0.51220703125, 0.548828125, 0.58544921875, 0.6220703125, 0.65869140625, 0.6953125, 0.73193359375, 0.7685546875, 0.80517578125, 0.841796875, 0.87841796875, 0.9150390625, 0.95166015625, 0.98828125, 1.02490234375, 1.0615234375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 9.0, 15.0, 14.0, 19.0, 25.0, 24.0, 38.0, 40.0, 47.0, 51.0, 54.0, 71.0, 49.0, 61.0, 57.0, 56.0, 47.0, 48.0, 37.0, 30.0, 27.0, 27.0, 21.0, 17.0, 14.0, 9.0, 10.0, 9.0, 8.0, 5.0, 2.0, 10.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.496438026428223, -4.368464469909668, -4.2404913902282715, -4.112517833709717, -3.984544515609741, -3.8565711975097656, -3.72859787940979, -3.6006245613098145, -3.4726510047912598, -3.344677686691284, -3.2167043685913086, -3.088730812072754, -2.9607574939727783, -2.8327841758728027, -2.704810857772827, -2.5768375396728516, -2.448864221572876, -2.3208909034729004, -2.192917585372925, -2.064944267272949, -1.9369707107543945, -1.808997392654419, -1.6810240745544434, -1.5530507564544678, -1.4250773191452026, -1.297104001045227, -1.169130563735962, -1.0411572456359863, -0.913183867931366, -0.7852104902267456, -0.65723717212677, -0.5292637944221497, -0.4012901782989502, -0.27331680059432983, -0.14534345269203186, -0.017370104789733887, 0.11060327291488647, 0.23857665061950684, 0.3665499687194824, 0.4945233464241028, 0.6224967241287231, 0.7504701018333435, 0.8784434795379639, 1.0064167976379395, 1.134390115737915, 1.2623635530471802, 1.3903368711471558, 1.518310308456421, 1.6462836265563965, 1.774256944656372, 1.9022303819656372, 2.0302038192749023, 2.158177137374878, 2.2861504554748535, 2.414123773574829, 2.5420970916748047, 2.6700706481933594, 2.798043966293335, 2.9260172843933105, 3.0539908409118652, 3.181964159011841, 3.3099374771118164, 3.437910795211792, 3.5658841133117676, 3.693857431411743]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 3.0, 7.0, 10.0, 10.0, 13.0, 13.0, 11.0, 16.0, 14.0, 13.0, 24.0, 26.0, 24.0, 40.0, 36.0, 33.0, 43.0, 35.0, 44.0, 42.0, 50.0, 42.0, 42.0, 40.0, 39.0, 51.0, 40.0, 37.0, 38.0, 30.0, 20.0, 21.0, 15.0, 12.0, 15.0, 11.0, 10.0, 1.0, 6.0, 3.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6131093502044678, -2.5276355743408203, -2.442161798477173, -2.3566880226135254, -2.271214246749878, -2.1857404708862305, -2.100266695022583, -2.0147929191589355, -1.929319143295288, -1.8438453674316406, -1.7583715915679932, -1.6728978157043457, -1.5874240398406982, -1.5019502639770508, -1.4164764881134033, -1.3310027122497559, -1.2455288171768188, -1.1600550413131714, -1.074581265449524, -0.9891074895858765, -0.903633713722229, -0.8181599378585815, -0.7326861023902893, -0.6472123265266418, -0.5617385506629944, -0.4762647747993469, -0.39079099893569946, -0.3053171932697296, -0.21984341740608215, -0.1343696415424347, -0.048895835876464844, 0.03657793998718262, 0.12205171585083008, 0.20752549171447754, 0.292999267578125, 0.37847307324409485, 0.4639468491077423, 0.5494205951690674, 0.6348944306373596, 0.7203682065010071, 0.8058419823646545, 0.891315758228302, 0.9767895340919495, 1.0622633695602417, 1.1477371454238892, 1.2332109212875366, 1.318684697151184, 1.4041584730148315, 1.489632248878479, 1.5751060247421265, 1.660579800605774, 1.7460535764694214, 1.8315273523330688, 1.9170011281967163, 2.0024750232696533, 2.087948799133301, 2.1734225749969482, 2.2588963508605957, 2.344370126724243, 2.4298439025878906, 2.515317678451538, 2.6007914543151855, 2.686265230178833, 2.7717390060424805, 2.857212781906128]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 16.0, 21.0, 31.0, 45.0, 74.0, 96.0, 113.0, 168.0, 306.0, 396.0, 681.0, 1029.0, 1532.0, 2516.0, 4023.0, 6822.0, 11860.0, 21531.0, 40597.0, 79134.0, 152402.0, 242129.0, 218644.0, 124461.0, 63906.0, 33248.0, 17540.0, 9842.0, 5729.0, 3483.0, 2186.0, 1364.0, 867.0, 591.0, 392.0, 249.0, 172.0, 118.0, 64.0, 53.0, 30.0, 31.0, 23.0, 11.0, 9.0, 11.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.367431640625, -0.3558921813964844, -0.34435272216796875, -0.3328132629394531, -0.3212738037109375, -0.3097343444824219, -0.29819488525390625, -0.2866554260253906, -0.275115966796875, -0.2635765075683594, -0.25203704833984375, -0.24049758911132812, -0.2289581298828125, -0.21741867065429688, -0.20587921142578125, -0.19433975219726562, -0.18280029296875, -0.17126083374023438, -0.15972137451171875, -0.14818191528320312, -0.1366424560546875, -0.12510299682617188, -0.11356353759765625, -0.10202407836914062, -0.090484619140625, -0.07894515991210938, -0.06740570068359375, -0.055866241455078125, -0.0443267822265625, -0.032787322998046875, -0.02124786376953125, -0.009708404541015625, 0.0018310546875, 0.013370513916015625, 0.02490997314453125, 0.036449432373046875, 0.0479888916015625, 0.059528350830078125, 0.07106781005859375, 0.08260726928710938, 0.094146728515625, 0.10568618774414062, 0.11722564697265625, 0.12876510620117188, 0.1403045654296875, 0.15184402465820312, 0.16338348388671875, 0.17492294311523438, 0.18646240234375, 0.19800186157226562, 0.20954132080078125, 0.22108078002929688, 0.2326202392578125, 0.24415969848632812, 0.25569915771484375, 0.2672386169433594, 0.278778076171875, 0.2903175354003906, 0.30185699462890625, 0.3133964538574219, 0.3249359130859375, 0.3364753723144531, 0.34801483154296875, 0.3595542907714844, 0.37109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 8.0, 7.0, 6.0, 15.0, 16.0, 17.0, 15.0, 25.0, 27.0, 29.0, 35.0, 39.0, 47.0, 50.0, 65.0, 52.0, 42.0, 71.0, 51.0, 56.0, 34.0, 43.0, 46.0, 32.0, 33.0, 18.0, 24.0, 20.0, 18.0, 14.0, 7.0, 3.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337890625, -3.22503662109375, -3.1121826171875, -2.99932861328125, -2.886474609375, -2.77362060546875, -2.6607666015625, -2.54791259765625, -2.43505859375, -2.32220458984375, -2.2093505859375, -2.09649658203125, -1.983642578125, -1.87078857421875, -1.7579345703125, -1.64508056640625, -1.5322265625, -1.41937255859375, -1.3065185546875, -1.19366455078125, -1.080810546875, -0.96795654296875, -0.8551025390625, -0.74224853515625, -0.62939453125, -0.51654052734375, -0.4036865234375, -0.29083251953125, -0.177978515625, -0.06512451171875, 0.0477294921875, 0.16058349609375, 0.2734375, 0.38629150390625, 0.4991455078125, 0.61199951171875, 0.724853515625, 0.83770751953125, 0.9505615234375, 1.06341552734375, 1.17626953125, 1.28912353515625, 1.4019775390625, 1.51483154296875, 1.627685546875, 1.74053955078125, 1.8533935546875, 1.96624755859375, 2.0791015625, 2.19195556640625, 2.3048095703125, 2.41766357421875, 2.530517578125, 2.64337158203125, 2.7562255859375, 2.86907958984375, 2.98193359375, 3.09478759765625, 3.2076416015625, 3.32049560546875, 3.433349609375, 3.54620361328125, 3.6590576171875, 3.77191162109375, 3.884765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 5.0, 7.0, 10.0, 6.0, 16.0, 22.0, 32.0, 43.0, 49.0, 62.0, 86.0, 110.0, 191.0, 288.0, 393.0, 593.0, 897.0, 1366.0, 2463.0, 4203.0, 8344.0, 18001.0, 62307.0, 821098.0, 86651.0, 20708.0, 9069.0, 4653.0, 2621.0, 1514.0, 875.0, 580.0, 372.0, 277.0, 173.0, 140.0, 90.0, 68.0, 40.0, 37.0, 21.0, 20.0, 14.0, 7.0, 10.0, 6.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.875, -0.8454132080078125, -0.815826416015625, -0.7862396240234375, -0.75665283203125, -0.7270660400390625, -0.697479248046875, -0.6678924560546875, -0.6383056640625, -0.6087188720703125, -0.579132080078125, -0.5495452880859375, -0.51995849609375, -0.4903717041015625, -0.460784912109375, -0.4311981201171875, -0.401611328125, -0.3720245361328125, -0.342437744140625, -0.3128509521484375, -0.28326416015625, -0.2536773681640625, -0.224090576171875, -0.1945037841796875, -0.1649169921875, -0.1353302001953125, -0.105743408203125, -0.0761566162109375, -0.04656982421875, -0.0169830322265625, 0.012603759765625, 0.0421905517578125, 0.07177734375, 0.1013641357421875, 0.130950927734375, 0.1605377197265625, 0.19012451171875, 0.2197113037109375, 0.249298095703125, 0.2788848876953125, 0.3084716796875, 0.3380584716796875, 0.367645263671875, 0.3972320556640625, 0.42681884765625, 0.4564056396484375, 0.485992431640625, 0.5155792236328125, 0.545166015625, 0.5747528076171875, 0.604339599609375, 0.6339263916015625, 0.66351318359375, 0.6930999755859375, 0.722686767578125, 0.7522735595703125, 0.7818603515625, 0.8114471435546875, 0.841033935546875, 0.8706207275390625, 0.90020751953125, 0.9297943115234375, 0.959381103515625, 0.9889678955078125, 1.0185546875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 7.0, 7.0, 7.0, 5.0, 6.0, 6.0, 9.0, 11.0, 25.0, 17.0, 23.0, 20.0, 22.0, 24.0, 32.0, 28.0, 25.0, 28.0, 41.0, 25.0, 43.0, 39.0, 47.0, 30.0, 45.0, 46.0, 43.0, 42.0, 32.0, 28.0, 29.0, 22.0, 24.0, 27.0, 12.0, 18.0, 21.0, 10.0, 19.0, 20.0, 9.0, 6.0, 6.0, 5.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66796875, -1.612030029296875, -1.55609130859375, -1.500152587890625, -1.4442138671875, -1.388275146484375, -1.33233642578125, -1.276397705078125, -1.220458984375, -1.164520263671875, -1.10858154296875, -1.052642822265625, -0.9967041015625, -0.940765380859375, -0.88482666015625, -0.828887939453125, -0.77294921875, -0.717010498046875, -0.66107177734375, -0.605133056640625, -0.5491943359375, -0.493255615234375, -0.43731689453125, -0.381378173828125, -0.325439453125, -0.269500732421875, -0.21356201171875, -0.157623291015625, -0.1016845703125, -0.045745849609375, 0.01019287109375, 0.066131591796875, 0.1220703125, 0.178009033203125, 0.23394775390625, 0.289886474609375, 0.3458251953125, 0.401763916015625, 0.45770263671875, 0.513641357421875, 0.569580078125, 0.625518798828125, 0.68145751953125, 0.737396240234375, 0.7933349609375, 0.849273681640625, 0.90521240234375, 0.961151123046875, 1.01708984375, 1.073028564453125, 1.12896728515625, 1.184906005859375, 1.2408447265625, 1.296783447265625, 1.35272216796875, 1.408660888671875, 1.464599609375, 1.520538330078125, 1.57647705078125, 1.632415771484375, 1.6883544921875, 1.744293212890625, 1.80023193359375, 1.856170654296875, 1.912109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 14.0, 25.0, 25.0, 38.0, 52.0, 79.0, 128.0, 175.0, 278.0, 371.0, 571.0, 845.0, 1380.0, 2124.0, 3315.0, 5229.0, 8823.0, 14982.0, 28882.0, 520861.0, 395118.0, 27700.0, 14742.0, 8471.0, 5116.0, 3170.0, 2091.0, 1330.0, 902.0, 531.0, 352.0, 245.0, 181.0, 118.0, 83.0, 59.0, 44.0, 22.0, 22.0, 11.0, 15.0, 7.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1239013671875, -0.11947250366210938, -0.11504364013671875, -0.11061477661132812, -0.1061859130859375, -0.10175704956054688, -0.09732818603515625, -0.09289932250976562, -0.088470458984375, -0.08404159545898438, -0.07961273193359375, -0.07518386840820312, -0.0707550048828125, -0.06632614135742188, -0.06189727783203125, -0.057468414306640625, -0.05303955078125, -0.048610687255859375, -0.04418182373046875, -0.039752960205078125, -0.0353240966796875, -0.030895233154296875, -0.02646636962890625, -0.022037506103515625, -0.017608642578125, -0.013179779052734375, -0.00875091552734375, -0.004322052001953125, 0.0001068115234375, 0.004535675048828125, 0.00896453857421875, 0.013393402099609375, 0.017822265625, 0.022251129150390625, 0.02667999267578125, 0.031108856201171875, 0.0355377197265625, 0.039966583251953125, 0.04439544677734375, 0.048824310302734375, 0.053253173828125, 0.057682037353515625, 0.06211090087890625, 0.06653976440429688, 0.0709686279296875, 0.07539749145507812, 0.07982635498046875, 0.08425521850585938, 0.08868408203125, 0.09311294555664062, 0.09754180908203125, 0.10197067260742188, 0.1063995361328125, 0.11082839965820312, 0.11525726318359375, 0.11968612670898438, 0.124114990234375, 0.12854385375976562, 0.13297271728515625, 0.13740158081054688, 0.1418304443359375, 0.14625930786132812, 0.15068817138671875, 0.15511703491210938, 0.1595458984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 8.0, 5.0, 8.0, 14.0, 12.0, 14.0, 15.0, 14.0, 20.0, 19.0, 25.0, 21.0, 41.0, 33.0, 40.0, 36.0, 36.0, 37.0, 39.0, 33.0, 42.0, 46.0, 38.0, 42.0, 47.0, 44.0, 40.0, 29.0, 34.0, 29.0, 10.0, 17.0, 18.0, 17.0, 16.0, 14.0, 9.0, 10.0, 8.0, 8.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-05, -1.322571188211441e-05, -1.2742355465888977e-05, -1.2258999049663544e-05, -1.177564263343811e-05, -1.1292286217212677e-05, -1.0808929800987244e-05, -1.032557338476181e-05, -9.842216968536377e-06, -9.358860552310944e-06, -8.87550413608551e-06, -8.392147719860077e-06, -7.908791303634644e-06, -7.42543488740921e-06, -6.942078471183777e-06, -6.4587220549583435e-06, -5.97536563873291e-06, -5.492009222507477e-06, -5.0086528062820435e-06, -4.52529639005661e-06, -4.041939973831177e-06, -3.5585835576057434e-06, -3.07522714138031e-06, -2.5918707251548767e-06, -2.1085143089294434e-06, -1.62515789270401e-06, -1.1418014764785767e-06, -6.584450602531433e-07, -1.7508864402770996e-07, 3.082677721977234e-07, 7.916241884231567e-07, 1.27498060464859e-06, 1.7583370208740234e-06, 2.2416934370994568e-06, 2.72504985332489e-06, 3.2084062695503235e-06, 3.691762685775757e-06, 4.17511910200119e-06, 4.6584755182266235e-06, 5.141831934452057e-06, 5.62518835067749e-06, 6.108544766902924e-06, 6.591901183128357e-06, 7.07525759935379e-06, 7.558614015579224e-06, 8.041970431804657e-06, 8.52532684803009e-06, 9.008683264255524e-06, 9.492039680480957e-06, 9.97539609670639e-06, 1.0458752512931824e-05, 1.0942108929157257e-05, 1.142546534538269e-05, 1.1908821761608124e-05, 1.2392178177833557e-05, 1.287553459405899e-05, 1.3358891010284424e-05, 1.3842247426509857e-05, 1.432560384273529e-05, 1.4808960258960724e-05, 1.5292316675186157e-05, 1.577567309141159e-05, 1.6259029507637024e-05, 1.6742385923862457e-05, 1.722574234008789e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 12.0, 8.0, 10.0, 28.0, 28.0, 48.0, 77.0, 109.0, 179.0, 271.0, 466.0, 616.0, 1077.0, 1704.0, 2758.0, 4774.0, 7850.0, 13115.0, 22629.0, 38990.0, 66707.0, 110457.0, 164014.0, 191656.0, 159762.0, 106611.0, 64029.0, 37358.0, 21464.0, 12611.0, 7439.0, 4481.0, 2680.0, 1716.0, 967.0, 648.0, 416.0, 233.0, 211.0, 102.0, 85.0, 46.0, 33.0, 26.0, 17.0, 9.0, 13.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0582275390625, -0.056433677673339844, -0.05463981628417969, -0.05284595489501953, -0.051052093505859375, -0.04925823211669922, -0.04746437072753906, -0.045670509338378906, -0.04387664794921875, -0.042082786560058594, -0.04028892517089844, -0.03849506378173828, -0.036701202392578125, -0.03490734100341797, -0.03311347961425781, -0.031319618225097656, -0.0295257568359375, -0.027731895446777344, -0.025938034057617188, -0.02414417266845703, -0.022350311279296875, -0.02055644989013672, -0.018762588500976562, -0.016968727111816406, -0.01517486572265625, -0.013381004333496094, -0.011587142944335938, -0.009793281555175781, -0.007999420166015625, -0.006205558776855469, -0.0044116973876953125, -0.0026178359985351562, -0.000823974609375, 0.0009698867797851562, 0.0027637481689453125, 0.004557609558105469, 0.006351470947265625, 0.008145332336425781, 0.009939193725585938, 0.011733055114746094, 0.01352691650390625, 0.015320777893066406, 0.017114639282226562, 0.01890850067138672, 0.020702362060546875, 0.02249622344970703, 0.024290084838867188, 0.026083946228027344, 0.0278778076171875, 0.029671669006347656, 0.03146553039550781, 0.03325939178466797, 0.035053253173828125, 0.03684711456298828, 0.03864097595214844, 0.040434837341308594, 0.04222869873046875, 0.044022560119628906, 0.04581642150878906, 0.04761028289794922, 0.049404144287109375, 0.05119800567626953, 0.05299186706542969, 0.054785728454589844, 0.05657958984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 14.0, 23.0, 21.0, 37.0, 48.0, 54.0, 67.0, 93.0, 82.0, 79.0, 90.0, 72.0, 81.0, 49.0, 40.0, 28.0, 27.0, 19.0, 13.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02734375, -0.026546716690063477, -0.025749683380126953, -0.02495265007019043, -0.024155616760253906, -0.023358583450317383, -0.02256155014038086, -0.021764516830444336, -0.020967483520507812, -0.02017045021057129, -0.019373416900634766, -0.018576383590698242, -0.01777935028076172, -0.016982316970825195, -0.016185283660888672, -0.015388250350952148, -0.014591217041015625, -0.013794183731079102, -0.012997150421142578, -0.012200117111206055, -0.011403083801269531, -0.010606050491333008, -0.009809017181396484, -0.009011983871459961, -0.008214950561523438, -0.007417917251586914, -0.006620883941650391, -0.005823850631713867, -0.005026817321777344, -0.00422978401184082, -0.003432750701904297, -0.0026357173919677734, -0.00183868408203125, -0.0010416507720947266, -0.0002446174621582031, 0.0005524158477783203, 0.0013494491577148438, 0.002146482467651367, 0.0029435157775878906, 0.003740549087524414, 0.0045375823974609375, 0.005334615707397461, 0.006131649017333984, 0.006928682327270508, 0.007725715637207031, 0.008522748947143555, 0.009319782257080078, 0.010116815567016602, 0.010913848876953125, 0.011710882186889648, 0.012507915496826172, 0.013304948806762695, 0.014101982116699219, 0.014899015426635742, 0.015696048736572266, 0.01649308204650879, 0.017290115356445312, 0.018087148666381836, 0.01888418197631836, 0.019681215286254883, 0.020478248596191406, 0.02127528190612793, 0.022072315216064453, 0.022869348526000977, 0.0236663818359375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 6.0, 8.0, 12.0, 16.0, 11.0, 19.0, 19.0, 27.0, 26.0, 46.0, 41.0, 51.0, 53.0, 56.0, 64.0, 63.0, 57.0, 57.0, 48.0, 54.0, 41.0, 34.0, 22.0, 30.0, 24.0, 20.0, 13.0, 11.0, 10.0, 10.0, 9.0, 3.0, 4.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.615414142608643, -4.485564231872559, -4.355713844299316, -4.225863933563232, -4.096014022827148, -3.9661636352539062, -3.8363137245178223, -3.706463575363159, -3.576613426208496, -3.446763277053833, -3.316913366317749, -3.187063217163086, -3.057213068008423, -2.9273629188537598, -2.797513008117676, -2.6676628589630127, -2.5378129482269287, -2.4079627990722656, -2.2781128883361816, -2.1482627391815186, -2.0184125900268555, -1.888562560081482, -1.7587125301361084, -1.6288623809814453, -1.4990123510360718, -1.3691623210906982, -1.2393121719360352, -1.1094621419906616, -0.9796120524406433, -0.849761962890625, -0.7199119329452515, -0.5900618433952332, -0.46021151542663574, -0.33036142587661743, -0.2005113661289215, -0.07066130638122559, 0.059188783168792725, 0.18903887271881104, 0.31888890266418457, 0.4487389922142029, 0.5785890817642212, 0.7084391713142395, 0.8382892608642578, 0.9681392908096313, 1.0979893207550049, 1.227839469909668, 1.3576894998550415, 1.487539529800415, 1.6173896789550781, 1.7472397089004517, 1.8770898580551147, 2.0069398880004883, 2.1367900371551514, 2.2666401863098145, 2.3964900970458984, 2.5263402462005615, 2.6561903953552246, 2.7860405445098877, 2.9158904552459717, 3.0457406044006348, 3.175590753555298, 3.305440902709961, 3.435290813446045, 3.565140962600708, 3.694990873336792]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 12.0, 8.0, 16.0, 12.0, 11.0, 18.0, 10.0, 13.0, 27.0, 26.0, 27.0, 34.0, 41.0, 30.0, 44.0, 36.0, 43.0, 46.0, 47.0, 42.0, 45.0, 37.0, 40.0, 48.0, 39.0, 37.0, 40.0, 30.0, 18.0, 23.0, 12.0, 13.0, 14.0, 12.0, 9.0, 1.0, 6.0, 4.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.592935085296631, -2.507789134979248, -2.4226431846618652, -2.3374974727630615, -2.2523515224456787, -2.167205572128296, -2.082059621810913, -1.9969137907028198, -1.9117679595947266, -1.8266220092773438, -1.7414761781692505, -1.6563302278518677, -1.5711843967437744, -1.4860384464263916, -1.4008924961090088, -1.3157466650009155, -1.2306007146835327, -1.14545476436615, -1.0603089332580566, -0.9751629829406738, -0.8900171518325806, -0.8048712015151978, -0.7197253108024597, -0.6345794200897217, -0.5494335293769836, -0.4642876386642456, -0.37914174795150757, -0.29399582743644714, -0.2088499367237091, -0.12370404601097107, -0.038558125495910645, 0.04658776521682739, 0.13173365592956543, 0.21687954664230347, 0.3020254373550415, 0.38717135787010193, 0.47231724858283997, 0.5574631690979004, 0.6426090598106384, 0.7277549505233765, 0.8129008412361145, 0.8980467319488525, 0.9831926226615906, 1.0683385133743286, 1.1534844636917114, 1.2386302947998047, 1.3237762451171875, 1.4089221954345703, 1.4940680265426636, 1.5792139768600464, 1.6643598079681396, 1.7495057582855225, 1.8346515893936157, 1.9197975397109985, 2.004943370819092, 2.0900893211364746, 2.1752352714538574, 2.2603812217712402, 2.345527172088623, 2.4306728839874268, 2.5158188343048096, 2.6009647846221924, 2.686110734939575, 2.771256446838379, 2.8564023971557617]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 12.0, 8.0, 20.0, 22.0, 49.0, 52.0, 98.0, 150.0, 213.0, 337.0, 549.0, 877.0, 1357.0, 2396.0, 4162.0, 7593.0, 14313.0, 27009.0, 51777.0, 95480.0, 156596.0, 204335.0, 189142.0, 130639.0, 74832.0, 40063.0, 20976.0, 10979.0, 6037.0, 3355.0, 1978.0, 1206.0, 675.0, 454.0, 296.0, 164.0, 102.0, 92.0, 48.0, 41.0, 17.0, 18.0, 11.0, 6.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.384765625, -3.2783203125, -3.171875, -3.0654296875, -2.958984375, -2.8525390625, -2.74609375, -2.6396484375, -2.533203125, -2.4267578125, -2.3203125, -2.2138671875, -2.107421875, -2.0009765625, -1.89453125, -1.7880859375, -1.681640625, -1.5751953125, -1.46875, -1.3623046875, -1.255859375, -1.1494140625, -1.04296875, -0.9365234375, -0.830078125, -0.7236328125, -0.6171875, -0.5107421875, -0.404296875, -0.2978515625, -0.19140625, -0.0849609375, 0.021484375, 0.1279296875, 0.234375, 0.3408203125, 0.447265625, 0.5537109375, 0.66015625, 0.7666015625, 0.873046875, 0.9794921875, 1.0859375, 1.1923828125, 1.298828125, 1.4052734375, 1.51171875, 1.6181640625, 1.724609375, 1.8310546875, 1.9375, 2.0439453125, 2.150390625, 2.2568359375, 2.36328125, 2.4697265625, 2.576171875, 2.6826171875, 2.7890625, 2.8955078125, 3.001953125, 3.1083984375, 3.21484375, 3.3212890625, 3.427734375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 8.0, 12.0, 5.0, 13.0, 15.0, 10.0, 21.0, 21.0, 16.0, 26.0, 36.0, 25.0, 30.0, 26.0, 47.0, 33.0, 43.0, 30.0, 46.0, 42.0, 34.0, 43.0, 50.0, 39.0, 53.0, 21.0, 27.0, 30.0, 26.0, 24.0, 17.0, 21.0, 10.0, 13.0, 12.0, 9.0, 8.0, 5.0, 4.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.796875, -2.7100830078125, -2.623291015625, -2.5364990234375, -2.44970703125, -2.3629150390625, -2.276123046875, -2.1893310546875, -2.1025390625, -2.0157470703125, -1.928955078125, -1.8421630859375, -1.75537109375, -1.6685791015625, -1.581787109375, -1.4949951171875, -1.408203125, -1.3214111328125, -1.234619140625, -1.1478271484375, -1.06103515625, -0.9742431640625, -0.887451171875, -0.8006591796875, -0.7138671875, -0.6270751953125, -0.540283203125, -0.4534912109375, -0.36669921875, -0.2799072265625, -0.193115234375, -0.1063232421875, -0.01953125, 0.0672607421875, 0.154052734375, 0.2408447265625, 0.32763671875, 0.4144287109375, 0.501220703125, 0.5880126953125, 0.6748046875, 0.7615966796875, 0.848388671875, 0.9351806640625, 1.02197265625, 1.1087646484375, 1.195556640625, 1.2823486328125, 1.369140625, 1.4559326171875, 1.542724609375, 1.6295166015625, 1.71630859375, 1.8031005859375, 1.889892578125, 1.9766845703125, 2.0634765625, 2.1502685546875, 2.237060546875, 2.3238525390625, 2.41064453125, 2.4974365234375, 2.584228515625, 2.6710205078125, 2.7578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 8.0, 12.0, 20.0, 28.0, 61.0, 88.0, 179.0, 270.0, 496.0, 954.0, 1703.0, 3367.0, 6769.0, 13599.0, 27218.0, 54835.0, 105702.0, 177670.0, 223102.0, 189862.0, 118262.0, 62079.0, 31096.0, 15294.0, 7641.0, 3918.0, 2015.0, 1045.0, 521.0, 315.0, 169.0, 90.0, 58.0, 32.0, 23.0, 18.0, 11.0, 12.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.48760986328125, -3.3697509765625, -3.25189208984375, -3.134033203125, -3.01617431640625, -2.8983154296875, -2.78045654296875, -2.66259765625, -2.54473876953125, -2.4268798828125, -2.30902099609375, -2.191162109375, -2.07330322265625, -1.9554443359375, -1.83758544921875, -1.7197265625, -1.60186767578125, -1.4840087890625, -1.36614990234375, -1.248291015625, -1.13043212890625, -1.0125732421875, -0.89471435546875, -0.77685546875, -0.65899658203125, -0.5411376953125, -0.42327880859375, -0.305419921875, -0.18756103515625, -0.0697021484375, 0.04815673828125, 0.166015625, 0.28387451171875, 0.4017333984375, 0.51959228515625, 0.637451171875, 0.75531005859375, 0.8731689453125, 0.99102783203125, 1.10888671875, 1.22674560546875, 1.3446044921875, 1.46246337890625, 1.580322265625, 1.69818115234375, 1.8160400390625, 1.93389892578125, 2.0517578125, 2.16961669921875, 2.2874755859375, 2.40533447265625, 2.523193359375, 2.64105224609375, 2.7589111328125, 2.87677001953125, 2.99462890625, 3.11248779296875, 3.2303466796875, 3.34820556640625, 3.466064453125, 3.58392333984375, 3.7017822265625, 3.81964111328125, 3.9375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 1.0, 6.0, 4.0, 3.0, 4.0, 11.0, 9.0, 14.0, 6.0, 10.0, 14.0, 10.0, 25.0, 20.0, 17.0, 17.0, 34.0, 24.0, 39.0, 32.0, 26.0, 34.0, 39.0, 45.0, 40.0, 26.0, 48.0, 42.0, 31.0, 31.0, 35.0, 36.0, 33.0, 26.0, 25.0, 23.0, 38.0, 19.0, 11.0, 17.0, 20.0, 10.0, 7.0, 8.0, 12.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.6494140625, -1.599700927734375, -1.54998779296875, -1.500274658203125, -1.4505615234375, -1.400848388671875, -1.35113525390625, -1.301422119140625, -1.251708984375, -1.201995849609375, -1.15228271484375, -1.102569580078125, -1.0528564453125, -1.003143310546875, -0.95343017578125, -0.903717041015625, -0.85400390625, -0.804290771484375, -0.75457763671875, -0.704864501953125, -0.6551513671875, -0.605438232421875, -0.55572509765625, -0.506011962890625, -0.456298828125, -0.406585693359375, -0.35687255859375, -0.307159423828125, -0.2574462890625, -0.207733154296875, -0.15802001953125, -0.108306884765625, -0.05859375, -0.008880615234375, 0.04083251953125, 0.090545654296875, 0.1402587890625, 0.189971923828125, 0.23968505859375, 0.289398193359375, 0.339111328125, 0.388824462890625, 0.43853759765625, 0.488250732421875, 0.5379638671875, 0.587677001953125, 0.63739013671875, 0.687103271484375, 0.73681640625, 0.786529541015625, 0.83624267578125, 0.885955810546875, 0.9356689453125, 0.985382080078125, 1.03509521484375, 1.084808349609375, 1.134521484375, 1.184234619140625, 1.23394775390625, 1.283660888671875, 1.3333740234375, 1.383087158203125, 1.43280029296875, 1.482513427734375, 1.5322265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 7.0, 9.0, 20.0, 21.0, 26.0, 32.0, 52.0, 56.0, 107.0, 159.0, 198.0, 278.0, 406.0, 774.0, 1257.0, 2260.0, 4837.0, 13036.0, 47725.0, 205549.0, 457208.0, 232842.0, 55723.0, 14656.0, 5211.0, 2447.0, 1304.0, 763.0, 506.0, 348.0, 205.0, 159.0, 117.0, 71.0, 50.0, 37.0, 34.0, 18.0, 9.0, 7.0, 10.0, 7.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.42578125, -3.31719970703125, -3.2086181640625, -3.10003662109375, -2.991455078125, -2.88287353515625, -2.7742919921875, -2.66571044921875, -2.55712890625, -2.44854736328125, -2.3399658203125, -2.23138427734375, -2.122802734375, -2.01422119140625, -1.9056396484375, -1.79705810546875, -1.6884765625, -1.57989501953125, -1.4713134765625, -1.36273193359375, -1.254150390625, -1.14556884765625, -1.0369873046875, -0.92840576171875, -0.81982421875, -0.71124267578125, -0.6026611328125, -0.49407958984375, -0.385498046875, -0.27691650390625, -0.1683349609375, -0.05975341796875, 0.048828125, 0.15740966796875, 0.2659912109375, 0.37457275390625, 0.483154296875, 0.59173583984375, 0.7003173828125, 0.80889892578125, 0.91748046875, 1.02606201171875, 1.1346435546875, 1.24322509765625, 1.351806640625, 1.46038818359375, 1.5689697265625, 1.67755126953125, 1.7861328125, 1.89471435546875, 2.0032958984375, 2.11187744140625, 2.220458984375, 2.32904052734375, 2.4376220703125, 2.54620361328125, 2.65478515625, 2.76336669921875, 2.8719482421875, 2.98052978515625, 3.089111328125, 3.19769287109375, 3.3062744140625, 3.41485595703125, 3.5234375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 10.0, 3.0, 14.0, 28.0, 41.0, 60.0, 85.0, 89.0, 128.0, 127.0, 95.0, 101.0, 64.0, 55.0, 34.0, 24.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023293495178222656, -0.00022500008344650269, -0.0002170652151107788, -0.00020913034677505493, -0.00020119547843933105, -0.00019326061010360718, -0.0001853257417678833, -0.00017739087343215942, -0.00016945600509643555, -0.00016152113676071167, -0.0001535862684249878, -0.00014565140008926392, -0.00013771653175354004, -0.00012978166341781616, -0.00012184679508209229, -0.00011391192674636841, -0.00010597705841064453, -9.804219007492065e-05, -9.010732173919678e-05, -8.21724534034729e-05, -7.423758506774902e-05, -6.630271673202515e-05, -5.836784839630127e-05, -5.043298006057739e-05, -4.2498111724853516e-05, -3.456324338912964e-05, -2.6628375053405762e-05, -1.8693506717681885e-05, -1.0758638381958008e-05, -2.823770046234131e-06, 5.111098289489746e-06, 1.3045966625213623e-05, 2.09808349609375e-05, 2.8915703296661377e-05, 3.6850571632385254e-05, 4.478543996810913e-05, 5.272030830383301e-05, 6.0655176639556885e-05, 6.859004497528076e-05, 7.652491331100464e-05, 8.445978164672852e-05, 9.239464998245239e-05, 0.00010032951831817627, 0.00010826438665390015, 0.00011619925498962402, 0.0001241341233253479, 0.00013206899166107178, 0.00014000385999679565, 0.00014793872833251953, 0.0001558735966682434, 0.00016380846500396729, 0.00017174333333969116, 0.00017967820167541504, 0.00018761307001113892, 0.0001955479383468628, 0.00020348280668258667, 0.00021141767501831055, 0.00021935254335403442, 0.0002272874116897583, 0.00023522228002548218, 0.00024315714836120605, 0.00025109201669692993, 0.0002590268850326538, 0.0002669617533683777, 0.00027489662170410156]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 9.0, 12.0, 20.0, 25.0, 21.0, 43.0, 71.0, 122.0, 163.0, 272.0, 414.0, 642.0, 1109.0, 1950.0, 3893.0, 8349.0, 20409.0, 56984.0, 158527.0, 316922.0, 282127.0, 123262.0, 42970.0, 15870.0, 6770.0, 3226.0, 1738.0, 982.0, 563.0, 336.0, 239.0, 161.0, 116.0, 68.0, 60.0, 34.0, 20.0, 13.0, 6.0, 11.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.4765625, -2.4034423828125, -2.330322265625, -2.2572021484375, -2.18408203125, -2.1109619140625, -2.037841796875, -1.9647216796875, -1.8916015625, -1.8184814453125, -1.745361328125, -1.6722412109375, -1.59912109375, -1.5260009765625, -1.452880859375, -1.3797607421875, -1.306640625, -1.2335205078125, -1.160400390625, -1.0872802734375, -1.01416015625, -0.9410400390625, -0.867919921875, -0.7947998046875, -0.7216796875, -0.6485595703125, -0.575439453125, -0.5023193359375, -0.42919921875, -0.3560791015625, -0.282958984375, -0.2098388671875, -0.13671875, -0.0635986328125, 0.009521484375, 0.0826416015625, 0.15576171875, 0.2288818359375, 0.302001953125, 0.3751220703125, 0.4482421875, 0.5213623046875, 0.594482421875, 0.6676025390625, 0.74072265625, 0.8138427734375, 0.886962890625, 0.9600830078125, 1.033203125, 1.1063232421875, 1.179443359375, 1.2525634765625, 1.32568359375, 1.3988037109375, 1.471923828125, 1.5450439453125, 1.6181640625, 1.6912841796875, 1.764404296875, 1.8375244140625, 1.91064453125, 1.9837646484375, 2.056884765625, 2.1300048828125, 2.203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 9.0, 13.0, 17.0, 21.0, 32.0, 24.0, 34.0, 41.0, 60.0, 50.0, 63.0, 58.0, 69.0, 64.0, 50.0, 58.0, 46.0, 34.0, 29.0, 22.0, 37.0, 29.0, 24.0, 11.0, 11.0, 14.0, 9.0, 6.0, 10.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.373046875, -0.3606109619140625, -0.348175048828125, -0.3357391357421875, -0.32330322265625, -0.3108673095703125, -0.298431396484375, -0.2859954833984375, -0.2735595703125, -0.2611236572265625, -0.248687744140625, -0.2362518310546875, -0.22381591796875, -0.2113800048828125, -0.198944091796875, -0.1865081787109375, -0.174072265625, -0.1616363525390625, -0.149200439453125, -0.1367645263671875, -0.12432861328125, -0.1118927001953125, -0.099456787109375, -0.0870208740234375, -0.0745849609375, -0.0621490478515625, -0.049713134765625, -0.0372772216796875, -0.02484130859375, -0.0124053955078125, 3.0517578125e-05, 0.0124664306640625, 0.02490234375, 0.0373382568359375, 0.049774169921875, 0.0622100830078125, 0.07464599609375, 0.0870819091796875, 0.099517822265625, 0.1119537353515625, 0.1243896484375, 0.1368255615234375, 0.149261474609375, 0.1616973876953125, 0.17413330078125, 0.1865692138671875, 0.199005126953125, 0.2114410400390625, 0.223876953125, 0.2363128662109375, 0.248748779296875, 0.2611846923828125, 0.27362060546875, 0.2860565185546875, 0.298492431640625, 0.3109283447265625, 0.3233642578125, 0.3358001708984375, 0.348236083984375, 0.3606719970703125, 0.37310791015625, 0.3855438232421875, 0.397979736328125, 0.4104156494140625, 0.4228515625]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 10.0, 16.0, 21.0, 22.0, 36.0, 37.0, 51.0, 45.0, 52.0, 51.0, 72.0, 75.0, 66.0, 61.0, 55.0, 47.0, 49.0, 31.0, 38.0, 29.0, 17.0, 11.0, 13.0, 14.0, 13.0, 5.0, 3.0, 11.0, 0.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.992527484893799, -4.848790168762207, -4.705052852630615, -4.561315536499023, -4.417578220367432, -4.27384090423584, -4.130103588104248, -3.9863665103912354, -3.8426291942596436, -3.6988918781280518, -3.55515456199646, -3.411417245864868, -3.2676801681518555, -3.1239428520202637, -2.980205535888672, -2.83646821975708, -2.6927309036254883, -2.5489935874938965, -2.4052562713623047, -2.261518955230713, -2.117781639099121, -1.9740444421768188, -1.8303072452545166, -1.6865699291229248, -1.542832612991333, -1.3990952968597412, -1.2553579807281494, -1.1116207838058472, -0.9678834676742554, -0.8241461515426636, -0.6804088950157166, -0.5366716384887695, -0.39293432235717773, -0.24919703602790833, -0.10545974969863892, 0.03827753663063049, 0.1820148229598999, 0.3257521390914917, 0.4694893956184387, 0.6132266521453857, 0.7569639682769775, 0.9007012844085693, 1.0444386005401611, 1.1881757974624634, 1.3319131135940552, 1.475650429725647, 1.6193876266479492, 1.763124942779541, 1.9068622589111328, 2.0505995750427246, 2.1943368911743164, 2.338074207305908, 2.4818115234375, 2.625548839569092, 2.7692859172821045, 2.9130232334136963, 3.056760549545288, 3.20049786567688, 3.3442351818084717, 3.4879724979400635, 3.631709575653076, 3.775446891784668, 3.9191842079162598, 4.062921524047852, 4.206658840179443]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 10.0, 3.0, 7.0, 6.0, 10.0, 14.0, 12.0, 12.0, 17.0, 20.0, 22.0, 21.0, 24.0, 24.0, 27.0, 27.0, 30.0, 38.0, 42.0, 42.0, 44.0, 35.0, 34.0, 38.0, 44.0, 35.0, 45.0, 41.0, 33.0, 31.0, 25.0, 30.0, 24.0, 26.0, 22.0, 15.0, 12.0, 15.0, 9.0, 5.0, 5.0, 6.0, 6.0, 8.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.913811206817627, -2.8311164379119873, -2.7484216690063477, -2.665726900100708, -2.5830321311950684, -2.5003373622894287, -2.417642593383789, -2.3349475860595703, -2.2522530555725098, -2.16955828666687, -2.0868635177612305, -2.004168748855591, -1.9214739799499512, -1.8387792110443115, -1.7560843229293823, -1.6733895540237427, -1.5906946659088135, -1.5079998970031738, -1.4253051280975342, -1.3426103591918945, -1.2599155902862549, -1.1772208213806152, -1.094525933265686, -1.0118311643600464, -0.9291363954544067, -0.8464416265487671, -0.7637468576431274, -0.681052029132843, -0.5983572602272034, -0.5156624913215637, -0.4329676926136017, -0.35027289390563965, -0.2675778865814209, -0.18488310277462006, -0.10218831896781921, -0.01949353516101837, 0.06320124864578247, 0.14589601755142212, 0.22859081625938416, 0.3112856149673462, 0.39398038387298584, 0.4766751527786255, 0.5593699216842651, 0.6420647501945496, 0.7247595191001892, 0.8074542880058289, 0.8901491165161133, 0.9728438854217529, 1.0555386543273926, 1.1382334232330322, 1.2209281921386719, 1.3036229610443115, 1.3863177299499512, 1.4690124988555908, 1.55170738697052, 1.6344021558761597, 1.7170969247817993, 1.799791693687439, 1.8824864625930786, 1.9651812314987183, 2.0478761196136475, 2.130570888519287, 2.2132656574249268, 2.2959604263305664, 2.378655195236206]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 1.0, 2.0, 5.0, 7.0, 5.0, 23.0, 12.0, 34.0, 39.0, 62.0, 80.0, 133.0, 200.0, 305.0, 466.0, 748.0, 1133.0, 1989.0, 3382.0, 5994.0, 10817.0, 20320.0, 40412.0, 84921.0, 195216.0, 496890.0, 1133539.0, 1220581.0, 571054.0, 220362.0, 94121.0, 44198.0, 21728.0, 11151.0, 6090.0, 3384.0, 1907.0, 1144.0, 702.0, 416.0, 249.0, 156.0, 95.0, 70.0, 45.0, 30.0, 19.0, 21.0, 11.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.13671875, -4.990234375, -4.84375, -4.697265625, -4.55078125, -4.404296875, -4.2578125, -4.111328125, -3.96484375, -3.818359375, -3.671875, -3.525390625, -3.37890625, -3.232421875, -3.0859375, -2.939453125, -2.79296875, -2.646484375, -2.5, -2.353515625, -2.20703125, -2.060546875, -1.9140625, -1.767578125, -1.62109375, -1.474609375, -1.328125, -1.181640625, -1.03515625, -0.888671875, -0.7421875, -0.595703125, -0.44921875, -0.302734375, -0.15625, -0.009765625, 0.13671875, 0.283203125, 0.4296875, 0.576171875, 0.72265625, 0.869140625, 1.015625, 1.162109375, 1.30859375, 1.455078125, 1.6015625, 1.748046875, 1.89453125, 2.041015625, 2.1875, 2.333984375, 2.48046875, 2.626953125, 2.7734375, 2.919921875, 3.06640625, 3.212890625, 3.359375, 3.505859375, 3.65234375, 3.798828125, 3.9453125, 4.091796875, 4.23828125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 5.0, 10.0, 10.0, 8.0, 18.0, 10.0, 9.0, 15.0, 15.0, 23.0, 17.0, 26.0, 35.0, 45.0, 33.0, 39.0, 33.0, 43.0, 50.0, 46.0, 44.0, 49.0, 47.0, 30.0, 27.0, 32.0, 35.0, 43.0, 25.0, 29.0, 25.0, 29.0, 18.0, 19.0, 8.0, 9.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.30078125, -2.231292724609375, -2.16180419921875, -2.092315673828125, -2.0228271484375, -1.953338623046875, -1.88385009765625, -1.814361572265625, -1.744873046875, -1.675384521484375, -1.60589599609375, -1.536407470703125, -1.4669189453125, -1.397430419921875, -1.32794189453125, -1.258453369140625, -1.18896484375, -1.119476318359375, -1.04998779296875, -0.980499267578125, -0.9110107421875, -0.841522216796875, -0.77203369140625, -0.702545166015625, -0.633056640625, -0.563568115234375, -0.49407958984375, -0.424591064453125, -0.3551025390625, -0.285614013671875, -0.21612548828125, -0.146636962890625, -0.0771484375, -0.007659912109375, 0.06182861328125, 0.131317138671875, 0.2008056640625, 0.270294189453125, 0.33978271484375, 0.409271240234375, 0.478759765625, 0.548248291015625, 0.61773681640625, 0.687225341796875, 0.7567138671875, 0.826202392578125, 0.89569091796875, 0.965179443359375, 1.03466796875, 1.104156494140625, 1.17364501953125, 1.243133544921875, 1.3126220703125, 1.382110595703125, 1.45159912109375, 1.521087646484375, 1.590576171875, 1.660064697265625, 1.72955322265625, 1.799041748046875, 1.8685302734375, 1.938018798828125, 2.00750732421875, 2.076995849609375, 2.146484375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 11.0, 14.0, 15.0, 33.0, 47.0, 83.0, 113.0, 150.0, 203.0, 338.0, 511.0, 797.0, 1266.0, 2037.0, 3327.0, 5225.0, 8822.0, 14665.0, 25899.0, 45744.0, 83516.0, 158130.0, 308328.0, 597766.0, 968742.0, 893252.0, 511557.0, 261149.0, 134853.0, 71926.0, 39815.0, 22429.0, 12958.0, 7747.0, 4658.0, 2962.0, 1818.0, 1185.0, 753.0, 499.0, 341.0, 206.0, 144.0, 90.0, 52.0, 35.0, 30.0, 18.0, 14.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.9501953125, -3.822265625, -3.6943359375, -3.56640625, -3.4384765625, -3.310546875, -3.1826171875, -3.0546875, -2.9267578125, -2.798828125, -2.6708984375, -2.54296875, -2.4150390625, -2.287109375, -2.1591796875, -2.03125, -1.9033203125, -1.775390625, -1.6474609375, -1.51953125, -1.3916015625, -1.263671875, -1.1357421875, -1.0078125, -0.8798828125, -0.751953125, -0.6240234375, -0.49609375, -0.3681640625, -0.240234375, -0.1123046875, 0.015625, 0.1435546875, 0.271484375, 0.3994140625, 0.52734375, 0.6552734375, 0.783203125, 0.9111328125, 1.0390625, 1.1669921875, 1.294921875, 1.4228515625, 1.55078125, 1.6787109375, 1.806640625, 1.9345703125, 2.0625, 2.1904296875, 2.318359375, 2.4462890625, 2.57421875, 2.7021484375, 2.830078125, 2.9580078125, 3.0859375, 3.2138671875, 3.341796875, 3.4697265625, 3.59765625, 3.7255859375, 3.853515625, 3.9814453125, 4.109375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 15.0, 13.0, 15.0, 26.0, 33.0, 45.0, 49.0, 67.0, 66.0, 102.0, 122.0, 130.0, 170.0, 189.0, 242.0, 295.0, 302.0, 300.0, 267.0, 243.0, 233.0, 210.0, 176.0, 161.0, 119.0, 93.0, 66.0, 75.0, 50.0, 52.0, 35.0, 21.0, 15.0, 22.0, 9.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3837890625, -1.3425445556640625, -1.301300048828125, -1.2600555419921875, -1.21881103515625, -1.1775665283203125, -1.136322021484375, -1.0950775146484375, -1.0538330078125, -1.0125885009765625, -0.971343994140625, -0.9300994873046875, -0.88885498046875, -0.8476104736328125, -0.806365966796875, -0.7651214599609375, -0.723876953125, -0.6826324462890625, -0.641387939453125, -0.6001434326171875, -0.55889892578125, -0.5176544189453125, -0.476409912109375, -0.4351654052734375, -0.3939208984375, -0.3526763916015625, -0.311431884765625, -0.2701873779296875, -0.22894287109375, -0.1876983642578125, -0.146453857421875, -0.1052093505859375, -0.06396484375, -0.0227203369140625, 0.018524169921875, 0.0597686767578125, 0.10101318359375, 0.1422576904296875, 0.183502197265625, 0.2247467041015625, 0.2659912109375, 0.3072357177734375, 0.348480224609375, 0.3897247314453125, 0.43096923828125, 0.4722137451171875, 0.513458251953125, 0.5547027587890625, 0.595947265625, 0.6371917724609375, 0.678436279296875, 0.7196807861328125, 0.76092529296875, 0.8021697998046875, 0.843414306640625, 0.8846588134765625, 0.9259033203125, 0.9671478271484375, 1.008392333984375, 1.0496368408203125, 1.09088134765625, 1.1321258544921875, 1.173370361328125, 1.2146148681640625, 1.255859375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 2.0, 6.0, 12.0, 12.0, 13.0, 35.0, 25.0, 36.0, 47.0, 69.0, 58.0, 73.0, 60.0, 85.0, 68.0, 51.0, 63.0, 50.0, 36.0, 30.0, 29.0, 23.0, 20.0, 13.0, 14.0, 11.0, 8.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.848748683929443, -5.6829633712768555, -5.517178058624268, -5.35139274597168, -5.185607433319092, -5.019822120666504, -4.854036808013916, -4.688251495361328, -4.522466659545898, -4.3566813468933105, -4.190896034240723, -4.025110721588135, -3.859325408935547, -3.693540096282959, -3.52775502204895, -3.3619697093963623, -3.1961841583251953, -3.0303988456726074, -2.8646135330200195, -2.6988282203674316, -2.5330429077148438, -2.367257595062256, -2.201472520828247, -2.035687208175659, -1.8699018955230713, -1.7041165828704834, -1.5383312702178955, -1.3725460767745972, -1.2067607641220093, -1.0409754514694214, -0.8751901984214783, -0.7094049453735352, -0.5436191558837891, -0.37783387303352356, -0.21204859018325806, -0.046263307332992554, 0.11952197551727295, 0.28530728816986084, 0.45109254121780396, 0.6168777942657471, 0.782663106918335, 0.9484484195709229, 1.1142337322235107, 1.280018925666809, 1.445804238319397, 1.6115895509719849, 1.7773747444152832, 1.943160057067871, 2.108945369720459, 2.274730682373047, 2.4405159950256348, 2.6063013076782227, 2.7720866203308105, 2.9378719329833984, 3.1036570072174072, 3.269442319869995, 3.435227632522583, 3.601012945175171, 3.766798257827759, 3.9325835704803467, 4.0983686447143555, 4.264153957366943, 4.429939270019531, 4.595724582672119, 4.761509895324707]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 6.0, 8.0, 12.0, 16.0, 10.0, 6.0, 26.0, 20.0, 16.0, 24.0, 32.0, 36.0, 34.0, 34.0, 46.0, 39.0, 42.0, 47.0, 37.0, 39.0, 50.0, 39.0, 33.0, 43.0, 33.0, 40.0, 28.0, 27.0, 24.0, 28.0, 25.0, 16.0, 11.0, 13.0, 11.0, 11.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.831474542617798, -2.7447054386138916, -2.6579365730285645, -2.571167469024658, -2.484398365020752, -2.3976292610168457, -2.3108603954315186, -2.2240912914276123, -2.137322425842285, -2.050553321838379, -1.9637843370437622, -1.8770153522491455, -1.7902462482452393, -1.7034772634506226, -1.6167082786560059, -1.5299391746520996, -1.4431700706481934, -1.3564010858535767, -1.2696319818496704, -1.1828629970550537, -1.0960938930511475, -1.0093249082565308, -0.9225559234619141, -0.8357868790626526, -0.7490178346633911, -0.6622487902641296, -0.5754797458648682, -0.48871076107025146, -0.40194171667099, -0.3151726722717285, -0.22840368747711182, -0.14163464307785034, -0.05486559867858887, 0.031903430819511414, 0.1186724603176117, 0.20544147491455078, 0.29221051931381226, 0.37897956371307373, 0.46574854850769043, 0.5525175929069519, 0.6392866373062134, 0.7260556817054749, 0.8128247261047363, 0.899593710899353, 0.9863627552986145, 1.073131799697876, 1.1599007844924927, 1.2466697692871094, 1.3334388732910156, 1.4202078580856323, 1.5069769620895386, 1.5937459468841553, 1.6805150508880615, 1.7672840356826782, 1.854053020477295, 1.9408221244812012, 2.0275912284851074, 2.1143603324890137, 2.201129198074341, 2.287898302078247, 2.3746674060821533, 2.4614362716674805, 2.5482053756713867, 2.634974479675293, 2.72174334526062]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 12.0, 14.0, 19.0, 31.0, 50.0, 79.0, 122.0, 182.0, 270.0, 428.0, 714.0, 1053.0, 1669.0, 2665.0, 4493.0, 7487.0, 12709.0, 22244.0, 40753.0, 76440.0, 141034.0, 223254.0, 216572.0, 133689.0, 71984.0, 38784.0, 21223.0, 12218.0, 7186.0, 4271.0, 2489.0, 1582.0, 1039.0, 659.0, 391.0, 267.0, 157.0, 103.0, 79.0, 51.0, 21.0, 22.0, 16.0, 6.0, 11.0, 5.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.428466796875, -0.4165496826171875, -0.404632568359375, -0.3927154541015625, -0.38079833984375, -0.3688812255859375, -0.356964111328125, -0.3450469970703125, -0.3331298828125, -0.3212127685546875, -0.309295654296875, -0.2973785400390625, -0.28546142578125, -0.2735443115234375, -0.261627197265625, -0.2497100830078125, -0.23779296875, -0.2258758544921875, -0.213958740234375, -0.2020416259765625, -0.19012451171875, -0.1782073974609375, -0.166290283203125, -0.1543731689453125, -0.1424560546875, -0.1305389404296875, -0.118621826171875, -0.1067047119140625, -0.09478759765625, -0.0828704833984375, -0.070953369140625, -0.0590362548828125, -0.047119140625, -0.0352020263671875, -0.023284912109375, -0.0113677978515625, 0.00054931640625, 0.0124664306640625, 0.024383544921875, 0.0363006591796875, 0.0482177734375, 0.0601348876953125, 0.072052001953125, 0.0839691162109375, 0.09588623046875, 0.1078033447265625, 0.119720458984375, 0.1316375732421875, 0.1435546875, 0.1554718017578125, 0.167388916015625, 0.1793060302734375, 0.19122314453125, 0.2031402587890625, 0.215057373046875, 0.2269744873046875, 0.2388916015625, 0.2508087158203125, 0.262725830078125, 0.2746429443359375, 0.28656005859375, 0.2984771728515625, 0.310394287109375, 0.3223114013671875, 0.334228515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 12.0, 13.0, 19.0, 14.0, 18.0, 22.0, 32.0, 32.0, 35.0, 40.0, 49.0, 42.0, 53.0, 54.0, 48.0, 58.0, 46.0, 47.0, 36.0, 45.0, 39.0, 35.0, 39.0, 31.0, 29.0, 21.0, 17.0, 12.0, 13.0, 14.0, 5.0, 3.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.002471923828125, -2.89166259765625, -2.780853271484375, -2.6700439453125, -2.559234619140625, -2.44842529296875, -2.337615966796875, -2.226806640625, -2.115997314453125, -2.00518798828125, -1.894378662109375, -1.7835693359375, -1.672760009765625, -1.56195068359375, -1.451141357421875, -1.34033203125, -1.229522705078125, -1.11871337890625, -1.007904052734375, -0.8970947265625, -0.786285400390625, -0.67547607421875, -0.564666748046875, -0.453857421875, -0.343048095703125, -0.23223876953125, -0.121429443359375, -0.0106201171875, 0.100189208984375, 0.21099853515625, 0.321807861328125, 0.4326171875, 0.543426513671875, 0.65423583984375, 0.765045166015625, 0.8758544921875, 0.986663818359375, 1.09747314453125, 1.208282470703125, 1.319091796875, 1.429901123046875, 1.54071044921875, 1.651519775390625, 1.7623291015625, 1.873138427734375, 1.98394775390625, 2.094757080078125, 2.20556640625, 2.316375732421875, 2.42718505859375, 2.537994384765625, 2.6488037109375, 2.759613037109375, 2.87042236328125, 2.981231689453125, 3.092041015625, 3.202850341796875, 3.31365966796875, 3.424468994140625, 3.5352783203125, 3.646087646484375, 3.75689697265625, 3.867706298828125, 3.978515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 4.0, 10.0, 28.0, 27.0, 41.0, 54.0, 81.0, 108.0, 190.0, 267.0, 412.0, 738.0, 1230.0, 2166.0, 4242.0, 9431.0, 23597.0, 180019.0, 766428.0, 35348.0, 12237.0, 5434.0, 2809.0, 1433.0, 823.0, 490.0, 318.0, 191.0, 123.0, 71.0, 51.0, 44.0, 32.0, 26.0, 13.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 4.0, 4.0], "bins": [-1.4501953125, -1.4111785888671875, -1.372161865234375, -1.3331451416015625, -1.29412841796875, -1.2551116943359375, -1.216094970703125, -1.1770782470703125, -1.1380615234375, -1.0990447998046875, -1.060028076171875, -1.0210113525390625, -0.98199462890625, -0.9429779052734375, -0.903961181640625, -0.8649444580078125, -0.825927734375, -0.7869110107421875, -0.747894287109375, -0.7088775634765625, -0.66986083984375, -0.6308441162109375, -0.591827392578125, -0.5528106689453125, -0.5137939453125, -0.4747772216796875, -0.435760498046875, -0.3967437744140625, -0.35772705078125, -0.3187103271484375, -0.279693603515625, -0.2406768798828125, -0.20166015625, -0.1626434326171875, -0.123626708984375, -0.0846099853515625, -0.04559326171875, -0.0065765380859375, 0.032440185546875, 0.0714569091796875, 0.1104736328125, 0.1494903564453125, 0.188507080078125, 0.2275238037109375, 0.26654052734375, 0.3055572509765625, 0.344573974609375, 0.3835906982421875, 0.422607421875, 0.4616241455078125, 0.500640869140625, 0.5396575927734375, 0.57867431640625, 0.6176910400390625, 0.656707763671875, 0.6957244873046875, 0.7347412109375, 0.7737579345703125, 0.812774658203125, 0.8517913818359375, 0.89080810546875, 0.9298248291015625, 0.968841552734375, 1.0078582763671875, 1.046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 13.0, 8.0, 10.0, 21.0, 19.0, 12.0, 23.0, 29.0, 28.0, 27.0, 34.0, 34.0, 37.0, 32.0, 43.0, 41.0, 52.0, 45.0, 50.0, 43.0, 42.0, 31.0, 36.0, 28.0, 33.0, 28.0, 29.0, 24.0, 20.0, 14.0, 19.0, 13.0, 13.0, 17.0, 9.0, 11.0, 1.0, 11.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.8038787841796875, -1.741546630859375, -1.6792144775390625, -1.61688232421875, -1.5545501708984375, -1.492218017578125, -1.4298858642578125, -1.3675537109375, -1.3052215576171875, -1.242889404296875, -1.1805572509765625, -1.11822509765625, -1.0558929443359375, -0.993560791015625, -0.9312286376953125, -0.868896484375, -0.8065643310546875, -0.744232177734375, -0.6819000244140625, -0.61956787109375, -0.5572357177734375, -0.494903564453125, -0.4325714111328125, -0.3702392578125, -0.3079071044921875, -0.245574951171875, -0.1832427978515625, -0.12091064453125, -0.0585784912109375, 0.003753662109375, 0.0660858154296875, 0.12841796875, 0.1907501220703125, 0.253082275390625, 0.3154144287109375, 0.37774658203125, 0.4400787353515625, 0.502410888671875, 0.5647430419921875, 0.6270751953125, 0.6894073486328125, 0.751739501953125, 0.8140716552734375, 0.87640380859375, 0.9387359619140625, 1.001068115234375, 1.0634002685546875, 1.125732421875, 1.1880645751953125, 1.250396728515625, 1.3127288818359375, 1.37506103515625, 1.4373931884765625, 1.499725341796875, 1.5620574951171875, 1.6243896484375, 1.6867218017578125, 1.749053955078125, 1.8113861083984375, 1.87371826171875, 1.9360504150390625, 1.998382568359375, 2.0607147216796875, 2.123046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 6.0, 12.0, 8.0, 19.0, 25.0, 31.0, 52.0, 67.0, 78.0, 126.0, 210.0, 285.0, 482.0, 809.0, 1361.0, 2438.0, 4408.0, 9121.0, 20849.0, 81348.0, 867326.0, 32499.0, 12970.0, 6330.0, 3268.0, 1781.0, 962.0, 568.0, 372.0, 241.0, 143.0, 93.0, 73.0, 53.0, 43.0, 19.0, 22.0, 14.0, 8.0, 8.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2481689453125, -0.24047088623046875, -0.2327728271484375, -0.22507476806640625, -0.217376708984375, -0.20967864990234375, -0.2019805908203125, -0.19428253173828125, -0.18658447265625, -0.17888641357421875, -0.1711883544921875, -0.16349029541015625, -0.155792236328125, -0.14809417724609375, -0.1403961181640625, -0.13269805908203125, -0.125, -0.11730194091796875, -0.1096038818359375, -0.10190582275390625, -0.094207763671875, -0.08650970458984375, -0.0788116455078125, -0.07111358642578125, -0.06341552734375, -0.05571746826171875, -0.0480194091796875, -0.04032135009765625, -0.032623291015625, -0.02492523193359375, -0.0172271728515625, -0.00952911376953125, -0.0018310546875, 0.00586700439453125, 0.0135650634765625, 0.02126312255859375, 0.028961181640625, 0.03665924072265625, 0.0443572998046875, 0.05205535888671875, 0.05975341796875, 0.06745147705078125, 0.0751495361328125, 0.08284759521484375, 0.090545654296875, 0.09824371337890625, 0.1059417724609375, 0.11363983154296875, 0.121337890625, 0.12903594970703125, 0.1367340087890625, 0.14443206787109375, 0.152130126953125, 0.15982818603515625, 0.1675262451171875, 0.17522430419921875, 0.18292236328125, 0.19062042236328125, 0.1983184814453125, 0.20601654052734375, 0.213714599609375, 0.22141265869140625, 0.2291107177734375, 0.23680877685546875, 0.2445068359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 6.0, 14.0, 15.0, 16.0, 17.0, 21.0, 30.0, 34.0, 32.0, 37.0, 53.0, 58.0, 46.0, 56.0, 60.0, 49.0, 71.0, 53.0, 49.0, 32.0, 36.0, 31.0, 23.0, 31.0, 21.0, 21.0, 19.0, 9.0, 6.0, 10.0, 4.0, 8.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3424625396728516e-05, -2.272985875606537e-05, -2.203509211540222e-05, -2.1340325474739075e-05, -2.0645558834075928e-05, -1.995079219341278e-05, -1.9256025552749634e-05, -1.8561258912086487e-05, -1.786649227142334e-05, -1.7171725630760193e-05, -1.6476958990097046e-05, -1.57821923494339e-05, -1.5087425708770752e-05, -1.4392659068107605e-05, -1.3697892427444458e-05, -1.3003125786781311e-05, -1.2308359146118164e-05, -1.1613592505455017e-05, -1.091882586479187e-05, -1.0224059224128723e-05, -9.529292583465576e-06, -8.83452594280243e-06, -8.139759302139282e-06, -7.444992661476135e-06, -6.750226020812988e-06, -6.055459380149841e-06, -5.360692739486694e-06, -4.665926098823547e-06, -3.9711594581604e-06, -3.2763928174972534e-06, -2.5816261768341064e-06, -1.8868595361709595e-06, -1.1920928955078125e-06, -4.973262548446655e-07, 1.9744038581848145e-07, 8.922070264816284e-07, 1.5869736671447754e-06, 2.2817403078079224e-06, 2.9765069484710693e-06, 3.6712735891342163e-06, 4.366040229797363e-06, 5.06080687046051e-06, 5.755573511123657e-06, 6.450340151786804e-06, 7.145106792449951e-06, 7.839873433113098e-06, 8.534640073776245e-06, 9.229406714439392e-06, 9.924173355102539e-06, 1.0618939995765686e-05, 1.1313706636428833e-05, 1.200847327709198e-05, 1.2703239917755127e-05, 1.3398006558418274e-05, 1.4092773199081421e-05, 1.4787539839744568e-05, 1.5482306480407715e-05, 1.6177073121070862e-05, 1.687183976173401e-05, 1.7566606402397156e-05, 1.8261373043060303e-05, 1.895613968372345e-05, 1.9650906324386597e-05, 2.0345672965049744e-05, 2.104043960571289e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 12.0, 19.0, 21.0, 37.0, 40.0, 42.0, 88.0, 100.0, 166.0, 220.0, 310.0, 450.0, 605.0, 898.0, 1344.0, 2061.0, 3187.0, 5163.0, 8423.0, 14741.0, 26667.0, 48780.0, 90379.0, 157148.0, 220346.0, 195072.0, 120715.0, 66278.0, 35924.0, 19706.0, 11089.0, 6553.0, 4179.0, 2548.0, 1654.0, 1135.0, 712.0, 500.0, 384.0, 253.0, 188.0, 125.0, 105.0, 40.0, 55.0, 27.0, 20.0, 13.0, 11.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.07470703125, -0.07242584228515625, -0.0701446533203125, -0.06786346435546875, -0.065582275390625, -0.06330108642578125, -0.0610198974609375, -0.05873870849609375, -0.05645751953125, -0.05417633056640625, -0.0518951416015625, -0.04961395263671875, -0.047332763671875, -0.04505157470703125, -0.0427703857421875, -0.04048919677734375, -0.0382080078125, -0.03592681884765625, -0.0336456298828125, -0.03136444091796875, -0.029083251953125, -0.02680206298828125, -0.0245208740234375, -0.02223968505859375, -0.01995849609375, -0.01767730712890625, -0.0153961181640625, -0.01311492919921875, -0.010833740234375, -0.00855255126953125, -0.0062713623046875, -0.00399017333984375, -0.001708984375, 0.00057220458984375, 0.0028533935546875, 0.00513458251953125, 0.007415771484375, 0.00969696044921875, 0.0119781494140625, 0.01425933837890625, 0.01654052734375, 0.01882171630859375, 0.0211029052734375, 0.02338409423828125, 0.025665283203125, 0.02794647216796875, 0.0302276611328125, 0.03250885009765625, 0.0347900390625, 0.03707122802734375, 0.0393524169921875, 0.04163360595703125, 0.043914794921875, 0.04619598388671875, 0.0484771728515625, 0.05075836181640625, 0.05303955078125, 0.05532073974609375, 0.0576019287109375, 0.05988311767578125, 0.062164306640625, 0.06444549560546875, 0.0667266845703125, 0.06900787353515625, 0.0712890625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 11.0, 9.0, 8.0, 12.0, 17.0, 29.0, 32.0, 42.0, 40.0, 50.0, 65.0, 73.0, 68.0, 77.0, 64.0, 63.0, 60.0, 44.0, 47.0, 33.0, 26.0, 23.0, 18.0, 14.0, 11.0, 8.0, 9.0, 7.0, 3.0, 1.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0217742919921875, -0.021143674850463867, -0.020513057708740234, -0.0198824405670166, -0.01925182342529297, -0.018621206283569336, -0.017990589141845703, -0.01735997200012207, -0.016729354858398438, -0.016098737716674805, -0.015468120574951172, -0.014837503433227539, -0.014206886291503906, -0.013576269149780273, -0.01294565200805664, -0.012315034866333008, -0.011684417724609375, -0.011053800582885742, -0.01042318344116211, -0.009792566299438477, -0.009161949157714844, -0.008531332015991211, -0.007900714874267578, -0.007270097732543945, -0.0066394805908203125, -0.00600886344909668, -0.005378246307373047, -0.004747629165649414, -0.004117012023925781, -0.0034863948822021484, -0.0028557777404785156, -0.002225160598754883, -0.00159454345703125, -0.0009639263153076172, -0.0003333091735839844, 0.00029730796813964844, 0.0009279251098632812, 0.001558542251586914, 0.002189159393310547, 0.0028197765350341797, 0.0034503936767578125, 0.004081010818481445, 0.004711627960205078, 0.005342245101928711, 0.005972862243652344, 0.0066034793853759766, 0.007234096527099609, 0.007864713668823242, 0.008495330810546875, 0.009125947952270508, 0.00975656509399414, 0.010387182235717773, 0.011017799377441406, 0.011648416519165039, 0.012279033660888672, 0.012909650802612305, 0.013540267944335938, 0.01417088508605957, 0.014801502227783203, 0.015432119369506836, 0.01606273651123047, 0.0166933536529541, 0.017323970794677734, 0.017954587936401367, 0.018585205078125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 10.0, 3.0, 6.0, 10.0, 17.0, 13.0, 32.0, 23.0, 40.0, 49.0, 68.0, 57.0, 69.0, 67.0, 83.0, 65.0, 59.0, 59.0, 48.0, 37.0, 28.0, 32.0, 20.0, 19.0, 16.0, 12.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.861233711242676, -5.695018291473389, -5.528802871704102, -5.362587928771973, -5.1963725090026855, -5.030157089233398, -4.863941669464111, -4.697726249694824, -4.531511306762695, -4.365295886993408, -4.199080467224121, -4.032865524291992, -3.866650104522705, -3.700434684753418, -3.534219264984131, -3.3680038452148438, -3.2017884254455566, -3.0355730056762695, -2.8693578243255615, -2.7031424045562744, -2.5369272232055664, -2.3707118034362793, -2.204496383666992, -2.038280963897705, -1.872065782546997, -1.7058504819869995, -1.539635181427002, -1.3734197616577148, -1.2072044610977173, -1.0409891605377197, -0.8747738003730774, -0.7085584402084351, -0.5423436164855957, -0.37612828612327576, -0.2099129557609558, -0.043697625398635864, 0.12251770496368408, 0.28873300552368164, 0.454948365688324, 0.6211637258529663, 0.7873790264129639, 0.9535943269729614, 1.119809627532959, 1.286025047302246, 1.4522403478622437, 1.6184556484222412, 1.7846710681915283, 1.9508863687515259, 2.1171016693115234, 2.2833170890808105, 2.4495322704315186, 2.6157476902008057, 2.7819628715515137, 2.948178291320801, 3.114393711090088, 3.280609130859375, 3.446824312210083, 3.61303973197937, 3.779254913330078, 3.9454703330993652, 4.111685752868652, 4.277900695800781, 4.444116115570068, 4.6103315353393555, 4.776546955108643]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 4.0, 10.0, 11.0, 15.0, 10.0, 6.0, 27.0, 22.0, 15.0, 24.0, 32.0, 35.0, 38.0, 38.0, 39.0, 43.0, 41.0, 47.0, 37.0, 40.0, 49.0, 39.0, 31.0, 45.0, 34.0, 38.0, 28.0, 26.0, 28.0, 26.0, 21.0, 16.0, 13.0, 11.0, 11.0, 10.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.807745933532715, -2.7214558124542236, -2.6351656913757324, -2.548875570297241, -2.46258544921875, -2.376295328140259, -2.2900052070617676, -2.2037150859832764, -2.117424964904785, -2.031134843826294, -1.9448447227478027, -1.8585546016693115, -1.7722644805908203, -1.685974359512329, -1.599684238433838, -1.5133941173553467, -1.4271039962768555, -1.3408138751983643, -1.254523754119873, -1.1682336330413818, -1.0819435119628906, -0.9956533908843994, -0.9093632698059082, -0.823073148727417, -0.7367830276489258, -0.6504929065704346, -0.5642027854919434, -0.47791266441345215, -0.39162254333496094, -0.3053324222564697, -0.21904230117797852, -0.1327521800994873, -0.04646182060241699, 0.03982830047607422, 0.12611842155456543, 0.21240854263305664, 0.29869866371154785, 0.38498878479003906, 0.4712789058685303, 0.5575690269470215, 0.6438591480255127, 0.7301492691040039, 0.8164393901824951, 0.9027295112609863, 0.9890196323394775, 1.0753097534179688, 1.16159987449646, 1.2478899955749512, 1.3341801166534424, 1.4204702377319336, 1.5067603588104248, 1.593050479888916, 1.6793406009674072, 1.7656307220458984, 1.8519208431243896, 1.9382109642028809, 2.024501085281372, 2.1107912063598633, 2.1970813274383545, 2.2833714485168457, 2.369661569595337, 2.455951690673828, 2.5422418117523193, 2.6285319328308105, 2.7148220539093018]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 4.0, 7.0, 15.0, 26.0, 37.0, 41.0, 81.0, 134.0, 155.0, 269.0, 422.0, 681.0, 1089.0, 1798.0, 3045.0, 5246.0, 9280.0, 17090.0, 31339.0, 57234.0, 100977.0, 159705.0, 200052.0, 178969.0, 122085.0, 70944.0, 39223.0, 20958.0, 11620.0, 6543.0, 3742.0, 2193.0, 1362.0, 748.0, 509.0, 320.0, 179.0, 162.0, 93.0, 65.0, 33.0, 30.0, 12.0, 20.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.501953125, -3.394805908203125, -3.28765869140625, -3.180511474609375, -3.0733642578125, -2.966217041015625, -2.85906982421875, -2.751922607421875, -2.644775390625, -2.537628173828125, -2.43048095703125, -2.323333740234375, -2.2161865234375, -2.109039306640625, -2.00189208984375, -1.894744873046875, -1.78759765625, -1.680450439453125, -1.57330322265625, -1.466156005859375, -1.3590087890625, -1.251861572265625, -1.14471435546875, -1.037567138671875, -0.930419921875, -0.823272705078125, -0.71612548828125, -0.608978271484375, -0.5018310546875, -0.394683837890625, -0.28753662109375, -0.180389404296875, -0.0732421875, 0.033905029296875, 0.14105224609375, 0.248199462890625, 0.3553466796875, 0.462493896484375, 0.56964111328125, 0.676788330078125, 0.783935546875, 0.891082763671875, 0.99822998046875, 1.105377197265625, 1.2125244140625, 1.319671630859375, 1.42681884765625, 1.533966064453125, 1.64111328125, 1.748260498046875, 1.85540771484375, 1.962554931640625, 2.0697021484375, 2.176849365234375, 2.28399658203125, 2.391143798828125, 2.498291015625, 2.605438232421875, 2.71258544921875, 2.819732666015625, 2.9268798828125, 3.034027099609375, 3.14117431640625, 3.248321533203125, 3.35546875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 18.0, 18.0, 17.0, 14.0, 20.0, 17.0, 24.0, 27.0, 29.0, 32.0, 37.0, 33.0, 42.0, 52.0, 33.0, 46.0, 50.0, 40.0, 37.0, 52.0, 34.0, 33.0, 33.0, 29.0, 24.0, 29.0, 28.0, 17.0, 12.0, 15.0, 16.0, 5.0, 7.0, 9.0, 6.0, 7.0, 7.0, 6.0, 3.0, 1.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.01171875, -2.920196533203125, -2.82867431640625, -2.737152099609375, -2.6456298828125, -2.554107666015625, -2.46258544921875, -2.371063232421875, -2.279541015625, -2.188018798828125, -2.09649658203125, -2.004974365234375, -1.9134521484375, -1.821929931640625, -1.73040771484375, -1.638885498046875, -1.54736328125, -1.455841064453125, -1.36431884765625, -1.272796630859375, -1.1812744140625, -1.089752197265625, -0.99822998046875, -0.906707763671875, -0.815185546875, -0.723663330078125, -0.63214111328125, -0.540618896484375, -0.4490966796875, -0.357574462890625, -0.26605224609375, -0.174530029296875, -0.0830078125, 0.008514404296875, 0.10003662109375, 0.191558837890625, 0.2830810546875, 0.374603271484375, 0.46612548828125, 0.557647705078125, 0.649169921875, 0.740692138671875, 0.83221435546875, 0.923736572265625, 1.0152587890625, 1.106781005859375, 1.19830322265625, 1.289825439453125, 1.38134765625, 1.472869873046875, 1.56439208984375, 1.655914306640625, 1.7474365234375, 1.838958740234375, 1.93048095703125, 2.022003173828125, 2.113525390625, 2.205047607421875, 2.29656982421875, 2.388092041015625, 2.4796142578125, 2.571136474609375, 2.66265869140625, 2.754180908203125, 2.845703125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 16.0, 15.0, 20.0, 21.0, 36.0, 48.0, 90.0, 105.0, 151.0, 239.0, 364.0, 607.0, 992.0, 1602.0, 2466.0, 4070.0, 7050.0, 11742.0, 20363.0, 34710.0, 59817.0, 97494.0, 142686.0, 175172.0, 165757.0, 124868.0, 80807.0, 48685.0, 28051.0, 16381.0, 9515.0, 5693.0, 3299.0, 2104.0, 1261.0, 789.0, 489.0, 313.0, 208.0, 152.0, 97.0, 79.0, 55.0, 24.0, 12.0, 15.0, 13.0, 10.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.063812255859375, -2.96746826171875, -2.871124267578125, -2.7747802734375, -2.678436279296875, -2.58209228515625, -2.485748291015625, -2.389404296875, -2.293060302734375, -2.19671630859375, -2.100372314453125, -2.0040283203125, -1.907684326171875, -1.81134033203125, -1.714996337890625, -1.61865234375, -1.522308349609375, -1.42596435546875, -1.329620361328125, -1.2332763671875, -1.136932373046875, -1.04058837890625, -0.944244384765625, -0.847900390625, -0.751556396484375, -0.65521240234375, -0.558868408203125, -0.4625244140625, -0.366180419921875, -0.26983642578125, -0.173492431640625, -0.0771484375, 0.019195556640625, 0.11553955078125, 0.211883544921875, 0.3082275390625, 0.404571533203125, 0.50091552734375, 0.597259521484375, 0.693603515625, 0.789947509765625, 0.88629150390625, 0.982635498046875, 1.0789794921875, 1.175323486328125, 1.27166748046875, 1.368011474609375, 1.46435546875, 1.560699462890625, 1.65704345703125, 1.753387451171875, 1.8497314453125, 1.946075439453125, 2.04241943359375, 2.138763427734375, 2.235107421875, 2.331451416015625, 2.42779541015625, 2.524139404296875, 2.6204833984375, 2.716827392578125, 2.81317138671875, 2.909515380859375, 3.005859375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 7.0, 16.0, 18.0, 18.0, 19.0, 11.0, 19.0, 20.0, 22.0, 25.0, 23.0, 23.0, 39.0, 30.0, 37.0, 38.0, 42.0, 23.0, 41.0, 33.0, 43.0, 37.0, 38.0, 39.0, 28.0, 36.0, 22.0, 17.0, 28.0, 21.0, 23.0, 24.0, 22.0, 16.0, 15.0, 14.0, 11.0, 7.0, 7.0, 9.0, 4.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5634765625, -1.5135345458984375, -1.463592529296875, -1.4136505126953125, -1.36370849609375, -1.3137664794921875, -1.263824462890625, -1.2138824462890625, -1.1639404296875, -1.1139984130859375, -1.064056396484375, -1.0141143798828125, -0.96417236328125, -0.9142303466796875, -0.864288330078125, -0.8143463134765625, -0.764404296875, -0.7144622802734375, -0.664520263671875, -0.6145782470703125, -0.56463623046875, -0.5146942138671875, -0.464752197265625, -0.4148101806640625, -0.3648681640625, -0.3149261474609375, -0.264984130859375, -0.2150421142578125, -0.16510009765625, -0.1151580810546875, -0.065216064453125, -0.0152740478515625, 0.03466796875, 0.0846099853515625, 0.134552001953125, 0.1844940185546875, 0.23443603515625, 0.2843780517578125, 0.334320068359375, 0.3842620849609375, 0.4342041015625, 0.4841461181640625, 0.534088134765625, 0.5840301513671875, 0.63397216796875, 0.6839141845703125, 0.733856201171875, 0.7837982177734375, 0.833740234375, 0.8836822509765625, 0.933624267578125, 0.9835662841796875, 1.03350830078125, 1.0834503173828125, 1.133392333984375, 1.1833343505859375, 1.2332763671875, 1.2832183837890625, 1.333160400390625, 1.3831024169921875, 1.43304443359375, 1.4829864501953125, 1.532928466796875, 1.5828704833984375, 1.6328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 21.0, 18.0, 24.0, 34.0, 50.0, 63.0, 112.0, 127.0, 202.0, 324.0, 477.0, 689.0, 1073.0, 1811.0, 3093.0, 5941.0, 11697.0, 25276.0, 56182.0, 124925.0, 234206.0, 267020.0, 167398.0, 78680.0, 35001.0, 15979.0, 7941.0, 4110.0, 2265.0, 1362.0, 798.0, 511.0, 369.0, 215.0, 155.0, 106.0, 79.0, 51.0, 37.0, 30.0, 25.0, 14.0, 17.0, 6.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.0390625, -1.9715576171875, -1.904052734375, -1.8365478515625, -1.76904296875, -1.7015380859375, -1.634033203125, -1.5665283203125, -1.4990234375, -1.4315185546875, -1.364013671875, -1.2965087890625, -1.22900390625, -1.1614990234375, -1.093994140625, -1.0264892578125, -0.958984375, -0.8914794921875, -0.823974609375, -0.7564697265625, -0.68896484375, -0.6214599609375, -0.553955078125, -0.4864501953125, -0.4189453125, -0.3514404296875, -0.283935546875, -0.2164306640625, -0.14892578125, -0.0814208984375, -0.013916015625, 0.0535888671875, 0.12109375, 0.1885986328125, 0.256103515625, 0.3236083984375, 0.39111328125, 0.4586181640625, 0.526123046875, 0.5936279296875, 0.6611328125, 0.7286376953125, 0.796142578125, 0.8636474609375, 0.93115234375, 0.9986572265625, 1.066162109375, 1.1336669921875, 1.201171875, 1.2686767578125, 1.336181640625, 1.4036865234375, 1.47119140625, 1.5386962890625, 1.606201171875, 1.6737060546875, 1.7412109375, 1.8087158203125, 1.876220703125, 1.9437255859375, 2.01123046875, 2.0787353515625, 2.146240234375, 2.2137451171875, 2.28125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 11.0, 14.0, 14.0, 30.0, 46.0, 52.0, 108.0, 100.0, 114.0, 108.0, 97.0, 82.0, 62.0, 45.0, 28.0, 28.0, 20.0, 12.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00024318695068359375, -0.0002345442771911621, -0.00022590160369873047, -0.00021725893020629883, -0.0002086162567138672, -0.00019997358322143555, -0.0001913309097290039, -0.00018268823623657227, -0.00017404556274414062, -0.00016540288925170898, -0.00015676021575927734, -0.0001481175422668457, -0.00013947486877441406, -0.00013083219528198242, -0.00012218952178955078, -0.00011354684829711914, -0.0001049041748046875, -9.626150131225586e-05, -8.761882781982422e-05, -7.897615432739258e-05, -7.033348083496094e-05, -6.16908073425293e-05, -5.3048133850097656e-05, -4.4405460357666016e-05, -3.5762786865234375e-05, -2.7120113372802734e-05, -1.8477439880371094e-05, -9.834766387939453e-06, -1.1920928955078125e-06, 7.450580596923828e-06, 1.609325408935547e-05, 2.473592758178711e-05, 3.337860107421875e-05, 4.202127456665039e-05, 5.066394805908203e-05, 5.930662155151367e-05, 6.794929504394531e-05, 7.659196853637695e-05, 8.52346420288086e-05, 9.387731552124023e-05, 0.00010251998901367188, 0.00011116266250610352, 0.00011980533599853516, 0.0001284480094909668, 0.00013709068298339844, 0.00014573335647583008, 0.00015437602996826172, 0.00016301870346069336, 0.000171661376953125, 0.00018030405044555664, 0.00018894672393798828, 0.00019758939743041992, 0.00020623207092285156, 0.0002148747444152832, 0.00022351741790771484, 0.00023216009140014648, 0.00024080276489257812, 0.00024944543838500977, 0.0002580881118774414, 0.00026673078536987305, 0.0002753734588623047, 0.00028401613235473633, 0.00029265880584716797, 0.0003013014793395996, 0.00030994415283203125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 18.0, 14.0, 26.0, 28.0, 45.0, 59.0, 73.0, 128.0, 179.0, 214.0, 318.0, 482.0, 706.0, 1073.0, 1895.0, 3305.0, 5993.0, 11601.0, 23539.0, 48466.0, 100193.0, 185684.0, 249018.0, 198971.0, 108603.0, 54002.0, 25549.0, 12781.0, 6491.0, 3562.0, 1971.0, 1223.0, 728.0, 498.0, 309.0, 202.0, 145.0, 113.0, 80.0, 71.0, 47.0, 35.0, 30.0, 28.0, 13.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.67193603515625, -1.6134033203125, -1.55487060546875, -1.496337890625, -1.43780517578125, -1.3792724609375, -1.32073974609375, -1.26220703125, -1.20367431640625, -1.1451416015625, -1.08660888671875, -1.028076171875, -0.96954345703125, -0.9110107421875, -0.85247802734375, -0.7939453125, -0.73541259765625, -0.6768798828125, -0.61834716796875, -0.559814453125, -0.50128173828125, -0.4427490234375, -0.38421630859375, -0.32568359375, -0.26715087890625, -0.2086181640625, -0.15008544921875, -0.091552734375, -0.03302001953125, 0.0255126953125, 0.08404541015625, 0.142578125, 0.20111083984375, 0.2596435546875, 0.31817626953125, 0.376708984375, 0.43524169921875, 0.4937744140625, 0.55230712890625, 0.61083984375, 0.66937255859375, 0.7279052734375, 0.78643798828125, 0.844970703125, 0.90350341796875, 0.9620361328125, 1.02056884765625, 1.0791015625, 1.13763427734375, 1.1961669921875, 1.25469970703125, 1.313232421875, 1.37176513671875, 1.4302978515625, 1.48883056640625, 1.54736328125, 1.60589599609375, 1.6644287109375, 1.72296142578125, 1.781494140625, 1.84002685546875, 1.8985595703125, 1.95709228515625, 2.015625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 5.0, 5.0, 12.0, 11.0, 11.0, 23.0, 28.0, 28.0, 30.0, 41.0, 54.0, 47.0, 42.0, 56.0, 47.0, 47.0, 65.0, 57.0, 48.0, 36.0, 42.0, 37.0, 24.0, 39.0, 32.0, 23.0, 18.0, 14.0, 8.0, 7.0, 4.0, 6.0, 9.0, 6.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.4013671875, -0.3897247314453125, -0.378082275390625, -0.3664398193359375, -0.35479736328125, -0.3431549072265625, -0.331512451171875, -0.3198699951171875, -0.3082275390625, -0.2965850830078125, -0.284942626953125, -0.2733001708984375, -0.26165771484375, -0.2500152587890625, -0.238372802734375, -0.2267303466796875, -0.215087890625, -0.2034454345703125, -0.191802978515625, -0.1801605224609375, -0.16851806640625, -0.1568756103515625, -0.145233154296875, -0.1335906982421875, -0.1219482421875, -0.1103057861328125, -0.098663330078125, -0.0870208740234375, -0.07537841796875, -0.0637359619140625, -0.052093505859375, -0.0404510498046875, -0.02880859375, -0.0171661376953125, -0.005523681640625, 0.0061187744140625, 0.01776123046875, 0.0294036865234375, 0.041046142578125, 0.0526885986328125, 0.0643310546875, 0.0759735107421875, 0.087615966796875, 0.0992584228515625, 0.11090087890625, 0.1225433349609375, 0.134185791015625, 0.1458282470703125, 0.157470703125, 0.1691131591796875, 0.180755615234375, 0.1923980712890625, 0.20404052734375, 0.2156829833984375, 0.227325439453125, 0.2389678955078125, 0.2506103515625, 0.2622528076171875, 0.273895263671875, 0.2855377197265625, 0.29718017578125, 0.3088226318359375, 0.320465087890625, 0.3321075439453125, 0.34375]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 4.0, 15.0, 13.0, 13.0, 15.0, 21.0, 33.0, 36.0, 41.0, 48.0, 75.0, 65.0, 58.0, 72.0, 88.0, 59.0, 48.0, 44.0, 55.0, 32.0, 32.0, 26.0, 16.0, 19.0, 15.0, 12.0, 9.0, 3.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.999162197113037, -5.831065654754639, -5.662968635559082, -5.494872093200684, -5.326775550842285, -5.1586785316467285, -4.99058198928833, -4.822484970092773, -4.654388427734375, -4.486291885375977, -4.31819486618042, -4.1500983238220215, -3.982001543045044, -3.8139047622680664, -3.645808219909668, -3.4777114391326904, -3.309614896774292, -3.1415181159973145, -2.973421573638916, -2.8053247928619385, -2.637228012084961, -2.4691314697265625, -2.301034688949585, -2.1329379081726074, -1.9648412466049194, -1.7967445850372314, -1.628647804260254, -1.460551142692566, -1.292454481124878, -1.1243577003479004, -0.9562610387802124, -0.7881642580032349, -0.6200675964355469, -0.4519708752632141, -0.28387418389320374, -0.11577749252319336, 0.052319228649139404, 0.22041594982147217, 0.38851261138916016, 0.5566093921661377, 0.7247060537338257, 0.8928027749061584, 1.0608994960784912, 1.2289961576461792, 1.3970928192138672, 1.5651895999908447, 1.7332862615585327, 1.9013830423355103, 2.0694797039031982, 2.237576484680176, 2.405673027038574, 2.5737698078155518, 2.7418665885925293, 2.9099631309509277, 3.0780599117279053, 3.246156692504883, 3.4142532348632812, 3.582350015640259, 3.7504465579986572, 3.9185433387756348, 4.086639881134033, 4.25473690032959, 4.422833442687988, 4.590929985046387, 4.759027004241943]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 5.0, 4.0, 11.0, 9.0, 16.0, 18.0, 9.0, 16.0, 30.0, 24.0, 24.0, 31.0, 35.0, 30.0, 30.0, 38.0, 38.0, 56.0, 43.0, 45.0, 46.0, 42.0, 29.0, 30.0, 34.0, 35.0, 34.0, 29.0, 30.0, 33.0, 20.0, 25.0, 15.0, 11.0, 12.0, 9.0, 10.0, 4.0, 10.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8219175338745117, -2.7345430850982666, -2.6471686363220215, -2.5597941875457764, -2.4724197387695312, -2.385045289993286, -2.297670841217041, -2.210296392440796, -2.122921943664551, -2.0355474948883057, -1.9481730461120605, -1.8607985973358154, -1.7734241485595703, -1.6860496997833252, -1.59867525100708, -1.511300802230835, -1.4239263534545898, -1.3365519046783447, -1.2491774559020996, -1.1618030071258545, -1.0744285583496094, -0.9870541095733643, -0.8996796607971191, -0.812305212020874, -0.7249307632446289, -0.6375563144683838, -0.5501818656921387, -0.46280741691589355, -0.37543296813964844, -0.2880585193634033, -0.2006840705871582, -0.11330962181091309, -0.02593541145324707, 0.06143903732299805, 0.14881348609924316, 0.23618793487548828, 0.3235623836517334, 0.4109368324279785, 0.49831128120422363, 0.5856857299804688, 0.6730601787567139, 0.760434627532959, 0.8478090763092041, 0.9351835250854492, 1.0225579738616943, 1.1099324226379395, 1.1973068714141846, 1.2846813201904297, 1.3720557689666748, 1.45943021774292, 1.546804666519165, 1.6341791152954102, 1.7215535640716553, 1.8089280128479004, 1.8963024616241455, 1.9836769104003906, 2.0710513591766357, 2.158425807952881, 2.245800256729126, 2.333174705505371, 2.420549154281616, 2.5079236030578613, 2.5952980518341064, 2.6826725006103516, 2.7700469493865967]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 13.0, 16.0, 20.0, 17.0, 27.0, 39.0, 77.0, 94.0, 173.0, 250.0, 392.0, 731.0, 1190.0, 1877.0, 3316.0, 5852.0, 10470.0, 19480.0, 37004.0, 76234.0, 172125.0, 430029.0, 1022466.0, 1279485.0, 665221.0, 256497.0, 107413.0, 49786.0, 24690.0, 13027.0, 6999.0, 3847.0, 2222.0, 1275.0, 738.0, 482.0, 235.0, 157.0, 98.0, 73.0, 47.0, 38.0, 20.0, 12.0, 8.0, 13.0, 5.0, 2.0, 0.0, 0.0, 1.0, 5.0], "bins": [-5.24609375, -5.09716796875, -4.9482421875, -4.79931640625, -4.650390625, -4.50146484375, -4.3525390625, -4.20361328125, -4.0546875, -3.90576171875, -3.7568359375, -3.60791015625, -3.458984375, -3.31005859375, -3.1611328125, -3.01220703125, -2.86328125, -2.71435546875, -2.5654296875, -2.41650390625, -2.267578125, -2.11865234375, -1.9697265625, -1.82080078125, -1.671875, -1.52294921875, -1.3740234375, -1.22509765625, -1.076171875, -0.92724609375, -0.7783203125, -0.62939453125, -0.48046875, -0.33154296875, -0.1826171875, -0.03369140625, 0.115234375, 0.26416015625, 0.4130859375, 0.56201171875, 0.7109375, 0.85986328125, 1.0087890625, 1.15771484375, 1.306640625, 1.45556640625, 1.6044921875, 1.75341796875, 1.90234375, 2.05126953125, 2.2001953125, 2.34912109375, 2.498046875, 2.64697265625, 2.7958984375, 2.94482421875, 3.09375, 3.24267578125, 3.3916015625, 3.54052734375, 3.689453125, 3.83837890625, 3.9873046875, 4.13623046875, 4.28515625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 4.0, 3.0, 7.0, 7.0, 16.0, 16.0, 11.0, 18.0, 19.0, 24.0, 29.0, 36.0, 25.0, 27.0, 34.0, 43.0, 54.0, 47.0, 42.0, 49.0, 48.0, 43.0, 41.0, 33.0, 35.0, 40.0, 32.0, 33.0, 27.0, 26.0, 18.0, 18.0, 22.0, 15.0, 11.0, 12.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.396484375, -2.32330322265625, -2.2501220703125, -2.17694091796875, -2.103759765625, -2.03057861328125, -1.9573974609375, -1.88421630859375, -1.81103515625, -1.73785400390625, -1.6646728515625, -1.59149169921875, -1.518310546875, -1.44512939453125, -1.3719482421875, -1.29876708984375, -1.2255859375, -1.15240478515625, -1.0792236328125, -1.00604248046875, -0.932861328125, -0.85968017578125, -0.7864990234375, -0.71331787109375, -0.64013671875, -0.56695556640625, -0.4937744140625, -0.42059326171875, -0.347412109375, -0.27423095703125, -0.2010498046875, -0.12786865234375, -0.0546875, 0.01849365234375, 0.0916748046875, 0.16485595703125, 0.238037109375, 0.31121826171875, 0.3843994140625, 0.45758056640625, 0.53076171875, 0.60394287109375, 0.6771240234375, 0.75030517578125, 0.823486328125, 0.89666748046875, 0.9698486328125, 1.04302978515625, 1.1162109375, 1.18939208984375, 1.2625732421875, 1.33575439453125, 1.408935546875, 1.48211669921875, 1.5552978515625, 1.62847900390625, 1.70166015625, 1.77484130859375, 1.8480224609375, 1.92120361328125, 1.994384765625, 2.06756591796875, 2.1407470703125, 2.21392822265625, 2.287109375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 13.0, 11.0, 26.0, 72.0, 81.0, 143.0, 220.0, 427.0, 731.0, 1440.0, 2567.0, 4874.0, 9441.0, 18633.0, 38537.0, 83064.0, 188194.0, 447615.0, 1025924.0, 1256031.0, 635381.0, 263905.0, 114014.0, 51901.0, 24866.0, 12295.0, 6323.0, 3405.0, 1850.0, 938.0, 582.0, 330.0, 169.0, 115.0, 66.0, 37.0, 24.0, 14.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.37286376953125, -5.1949462890625, -5.01702880859375, -4.839111328125, -4.66119384765625, -4.4832763671875, -4.30535888671875, -4.12744140625, -3.94952392578125, -3.7716064453125, -3.59368896484375, -3.415771484375, -3.23785400390625, -3.0599365234375, -2.88201904296875, -2.7041015625, -2.52618408203125, -2.3482666015625, -2.17034912109375, -1.992431640625, -1.81451416015625, -1.6365966796875, -1.45867919921875, -1.28076171875, -1.10284423828125, -0.9249267578125, -0.74700927734375, -0.569091796875, -0.39117431640625, -0.2132568359375, -0.03533935546875, 0.142578125, 0.32049560546875, 0.4984130859375, 0.67633056640625, 0.854248046875, 1.03216552734375, 1.2100830078125, 1.38800048828125, 1.56591796875, 1.74383544921875, 1.9217529296875, 2.09967041015625, 2.277587890625, 2.45550537109375, 2.6334228515625, 2.81134033203125, 2.9892578125, 3.16717529296875, 3.3450927734375, 3.52301025390625, 3.700927734375, 3.87884521484375, 4.0567626953125, 4.23468017578125, 4.41259765625, 4.59051513671875, 4.7684326171875, 4.94635009765625, 5.124267578125, 5.30218505859375, 5.4801025390625, 5.65802001953125, 5.8359375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 15.0, 17.0, 24.0, 21.0, 26.0, 41.0, 48.0, 87.0, 88.0, 110.0, 143.0, 177.0, 205.0, 248.0, 308.0, 295.0, 324.0, 325.0, 297.0, 226.0, 210.0, 178.0, 152.0, 104.0, 78.0, 69.0, 51.0, 44.0, 30.0, 30.0, 21.0, 12.0, 14.0, 18.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4149322509765625, -1.369903564453125, -1.3248748779296875, -1.27984619140625, -1.2348175048828125, -1.189788818359375, -1.1447601318359375, -1.0997314453125, -1.0547027587890625, -1.009674072265625, -0.9646453857421875, -0.91961669921875, -0.8745880126953125, -0.829559326171875, -0.7845306396484375, -0.739501953125, -0.6944732666015625, -0.649444580078125, -0.6044158935546875, -0.55938720703125, -0.5143585205078125, -0.469329833984375, -0.4243011474609375, -0.3792724609375, -0.3342437744140625, -0.289215087890625, -0.2441864013671875, -0.19915771484375, -0.1541290283203125, -0.109100341796875, -0.0640716552734375, -0.01904296875, 0.0259857177734375, 0.071014404296875, 0.1160430908203125, 0.16107177734375, 0.2061004638671875, 0.251129150390625, 0.2961578369140625, 0.3411865234375, 0.3862152099609375, 0.431243896484375, 0.4762725830078125, 0.52130126953125, 0.5663299560546875, 0.611358642578125, 0.6563873291015625, 0.701416015625, 0.7464447021484375, 0.791473388671875, 0.8365020751953125, 0.88153076171875, 0.9265594482421875, 0.971588134765625, 1.0166168212890625, 1.0616455078125, 1.1066741943359375, 1.151702880859375, 1.1967315673828125, 1.24176025390625, 1.2867889404296875, 1.331817626953125, 1.3768463134765625, 1.421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 2.0, 5.0, 6.0, 13.0, 12.0, 11.0, 14.0, 18.0, 24.0, 37.0, 41.0, 47.0, 55.0, 72.0, 60.0, 64.0, 67.0, 61.0, 76.0, 55.0, 49.0, 42.0, 28.0, 27.0, 25.0, 14.0, 14.0, 13.0, 8.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.115167617797852, -5.950706958770752, -5.7862467765808105, -5.621786117553711, -5.4573259353637695, -5.29286527633667, -5.1284050941467285, -4.963944435119629, -4.7994842529296875, -4.635023593902588, -4.4705634117126465, -4.306102752685547, -4.1416425704956055, -3.977181911468506, -3.8127214908599854, -3.648261070251465, -3.4838004112243652, -3.3193399906158447, -3.154879570007324, -2.9904191493988037, -2.825958728790283, -2.6614980697631836, -2.497037649154663, -2.3325772285461426, -2.168116807937622, -2.0036563873291016, -1.839195966720581, -1.674735426902771, -1.5102750062942505, -1.34581458568573, -1.18135404586792, -1.0168936252593994, -0.8524336814880371, -0.6879732608795166, -0.5235127806663513, -0.3590523302555084, -0.19459187984466553, -0.03013145923614502, 0.13432902097702026, 0.29878950119018555, 0.46324992179870605, 0.6277103424072266, 0.7921708226203918, 0.9566313028335571, 1.1210917234420776, 1.2855521440505981, 1.4500126838684082, 1.6144731044769287, 1.7789335250854492, 1.9433939456939697, 2.1078543663024902, 2.2723147869110107, 2.4367752075195312, 2.601235866546631, 2.7656962871551514, 2.930156707763672, 3.0946171283721924, 3.259077548980713, 3.4235379695892334, 3.587998390197754, 3.7524590492248535, 3.916919231414795, 4.0813798904418945, 4.245840072631836, 4.4103007316589355]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 8.0, 8.0, 4.0, 10.0, 18.0, 10.0, 16.0, 14.0, 25.0, 20.0, 32.0, 27.0, 32.0, 33.0, 44.0, 42.0, 38.0, 58.0, 25.0, 44.0, 43.0, 38.0, 40.0, 34.0, 42.0, 39.0, 25.0, 30.0, 22.0, 32.0, 21.0, 22.0, 18.0, 17.0, 15.0, 11.0, 8.0, 12.0, 3.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.7552988529205322, -2.6693832874298096, -2.583467960357666, -2.4975523948669434, -2.4116368293762207, -2.325721502304077, -2.2398059368133545, -2.153890609741211, -2.0679750442504883, -1.9820595979690552, -1.896144151687622, -1.8102285861968994, -1.7243131399154663, -1.6383976936340332, -1.5524821281433105, -1.4665666818618774, -1.3806512355804443, -1.2947357892990112, -1.2088203430175781, -1.1229047775268555, -1.0369893312454224, -0.9510738849639893, -0.8651583790779114, -0.7792428731918335, -0.6933274269104004, -0.6074119806289673, -0.5214964747428894, -0.4355809986591339, -0.3496655225753784, -0.2637500464916229, -0.17783457040786743, -0.09191906452178955, -0.006003618240356445, 0.07991185784339905, 0.16582733392715454, 0.25174281001091003, 0.3376582860946655, 0.423573762178421, 0.5094892382621765, 0.5954047441482544, 0.6813201904296875, 0.7672356367111206, 0.8531511425971985, 0.9390666484832764, 1.0249820947647095, 1.1108975410461426, 1.1968131065368652, 1.2827285528182983, 1.3686439990997314, 1.4545594453811646, 1.5404748916625977, 1.6263904571533203, 1.7123059034347534, 1.7982213497161865, 1.8841369152069092, 1.9700523614883423, 2.0559678077697754, 2.141883373260498, 2.2277987003326416, 2.3137142658233643, 2.399629592895508, 2.4855451583862305, 2.571460723876953, 2.657376289367676, 2.7432916164398193]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 15.0, 24.0, 25.0, 25.0, 51.0, 67.0, 122.0, 136.0, 235.0, 364.0, 576.0, 882.0, 1361.0, 2190.0, 3480.0, 6284.0, 10998.0, 19590.0, 36293.0, 67930.0, 128564.0, 214372.0, 230811.0, 148472.0, 80579.0, 42139.0, 22663.0, 12327.0, 7054.0, 4033.0, 2482.0, 1542.0, 985.0, 609.0, 413.0, 274.0, 189.0, 109.0, 87.0, 64.0, 38.0, 25.0, 20.0, 14.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.385498046875, -0.3731117248535156, -0.36072540283203125, -0.3483390808105469, -0.3359527587890625, -0.3235664367675781, -0.31118011474609375, -0.2987937927246094, -0.286407470703125, -0.2740211486816406, -0.26163482666015625, -0.24924850463867188, -0.2368621826171875, -0.22447586059570312, -0.21208953857421875, -0.19970321655273438, -0.18731689453125, -0.17493057250976562, -0.16254425048828125, -0.15015792846679688, -0.1377716064453125, -0.12538528442382812, -0.11299896240234375, -0.10061264038085938, -0.088226318359375, -0.07583999633789062, -0.06345367431640625, -0.051067352294921875, -0.0386810302734375, -0.026294708251953125, -0.01390838623046875, -0.001522064208984375, 0.0108642578125, 0.023250579833984375, 0.03563690185546875, 0.048023223876953125, 0.0604095458984375, 0.07279586791992188, 0.08518218994140625, 0.09756851196289062, 0.109954833984375, 0.12234115600585938, 0.13472747802734375, 0.14711380004882812, 0.1595001220703125, 0.17188644409179688, 0.18427276611328125, 0.19665908813476562, 0.20904541015625, 0.22143173217773438, 0.23381805419921875, 0.24620437622070312, 0.2585906982421875, 0.2709770202636719, 0.28336334228515625, 0.2957496643066406, 0.308135986328125, 0.3205223083496094, 0.33290863037109375, 0.3452949523925781, 0.3576812744140625, 0.3700675964355469, 0.38245391845703125, 0.3948402404785156, 0.4072265625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 7.0, 5.0, 3.0, 11.0, 10.0, 16.0, 23.0, 19.0, 20.0, 25.0, 23.0, 41.0, 35.0, 44.0, 40.0, 39.0, 47.0, 30.0, 48.0, 45.0, 52.0, 37.0, 43.0, 43.0, 32.0, 38.0, 38.0, 28.0, 24.0, 12.0, 24.0, 18.0, 16.0, 19.0, 9.0, 7.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.404296875, -3.302093505859375, -3.19989013671875, -3.097686767578125, -2.9954833984375, -2.893280029296875, -2.79107666015625, -2.688873291015625, -2.586669921875, -2.484466552734375, -2.38226318359375, -2.280059814453125, -2.1778564453125, -2.075653076171875, -1.97344970703125, -1.871246337890625, -1.76904296875, -1.666839599609375, -1.56463623046875, -1.462432861328125, -1.3602294921875, -1.258026123046875, -1.15582275390625, -1.053619384765625, -0.951416015625, -0.849212646484375, -0.74700927734375, -0.644805908203125, -0.5426025390625, -0.440399169921875, -0.33819580078125, -0.235992431640625, -0.1337890625, -0.031585693359375, 0.07061767578125, 0.172821044921875, 0.2750244140625, 0.377227783203125, 0.47943115234375, 0.581634521484375, 0.683837890625, 0.786041259765625, 0.88824462890625, 0.990447998046875, 1.0926513671875, 1.194854736328125, 1.29705810546875, 1.399261474609375, 1.50146484375, 1.603668212890625, 1.70587158203125, 1.808074951171875, 1.9102783203125, 2.012481689453125, 2.11468505859375, 2.216888427734375, 2.319091796875, 2.421295166015625, 2.52349853515625, 2.625701904296875, 2.7279052734375, 2.830108642578125, 2.93231201171875, 3.034515380859375, 3.13671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 7.0, 6.0, 10.0, 18.0, 30.0, 35.0, 33.0, 53.0, 86.0, 105.0, 153.0, 224.0, 270.0, 468.0, 767.0, 1194.0, 2007.0, 3628.0, 6792.0, 14501.0, 38870.0, 728524.0, 199926.0, 26828.0, 11178.0, 5350.0, 2858.0, 1699.0, 1018.0, 601.0, 434.0, 267.0, 172.0, 124.0, 73.0, 63.0, 45.0, 29.0, 23.0, 27.0, 16.0, 8.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.1845703125, -1.1505661010742188, -1.1165618896484375, -1.0825576782226562, -1.048553466796875, -1.0145492553710938, -0.9805450439453125, -0.9465408325195312, -0.91253662109375, -0.8785324096679688, -0.8445281982421875, -0.8105239868164062, -0.776519775390625, -0.7425155639648438, -0.7085113525390625, -0.6745071411132812, -0.6405029296875, -0.6064987182617188, -0.5724945068359375, -0.5384902954101562, -0.504486083984375, -0.47048187255859375, -0.4364776611328125, -0.40247344970703125, -0.36846923828125, -0.33446502685546875, -0.3004608154296875, -0.26645660400390625, -0.232452392578125, -0.19844818115234375, -0.1644439697265625, -0.13043975830078125, -0.096435546875, -0.06243133544921875, -0.0284271240234375, 0.00557708740234375, 0.039581298828125, 0.07358551025390625, 0.1075897216796875, 0.14159393310546875, 0.17559814453125, 0.20960235595703125, 0.2436065673828125, 0.27761077880859375, 0.311614990234375, 0.34561920166015625, 0.3796234130859375, 0.41362762451171875, 0.4476318359375, 0.48163604736328125, 0.5156402587890625, 0.5496444702148438, 0.583648681640625, 0.6176528930664062, 0.6516571044921875, 0.6856613159179688, 0.71966552734375, 0.7536697387695312, 0.7876739501953125, 0.8216781616210938, 0.855682373046875, 0.8896865844726562, 0.9236907958984375, 0.9576950073242188, 0.99169921875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 3.0, 8.0, 11.0, 14.0, 11.0, 18.0, 20.0, 21.0, 27.0, 22.0, 30.0, 31.0, 25.0, 35.0, 19.0, 38.0, 37.0, 37.0, 47.0, 39.0, 37.0, 33.0, 45.0, 36.0, 32.0, 32.0, 38.0, 27.0, 34.0, 40.0, 20.0, 14.0, 14.0, 17.0, 17.0, 12.0, 7.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.017578125, -1.958251953125, -1.89892578125, -1.839599609375, -1.7802734375, -1.720947265625, -1.66162109375, -1.602294921875, -1.54296875, -1.483642578125, -1.42431640625, -1.364990234375, -1.3056640625, -1.246337890625, -1.18701171875, -1.127685546875, -1.068359375, -1.009033203125, -0.94970703125, -0.890380859375, -0.8310546875, -0.771728515625, -0.71240234375, -0.653076171875, -0.59375, -0.534423828125, -0.47509765625, -0.415771484375, -0.3564453125, -0.297119140625, -0.23779296875, -0.178466796875, -0.119140625, -0.059814453125, -0.00048828125, 0.058837890625, 0.1181640625, 0.177490234375, 0.23681640625, 0.296142578125, 0.35546875, 0.414794921875, 0.47412109375, 0.533447265625, 0.5927734375, 0.652099609375, 0.71142578125, 0.770751953125, 0.830078125, 0.889404296875, 0.94873046875, 1.008056640625, 1.0673828125, 1.126708984375, 1.18603515625, 1.245361328125, 1.3046875, 1.364013671875, 1.42333984375, 1.482666015625, 1.5419921875, 1.601318359375, 1.66064453125, 1.719970703125, 1.779296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 14.0, 24.0, 7.0, 33.0, 31.0, 48.0, 63.0, 116.0, 171.0, 244.0, 375.0, 571.0, 935.0, 1667.0, 2980.0, 5600.0, 11065.0, 25333.0, 353166.0, 594630.0, 26702.0, 11657.0, 5597.0, 3028.0, 1676.0, 1001.0, 618.0, 391.0, 247.0, 159.0, 122.0, 78.0, 72.0, 36.0, 27.0, 17.0, 9.0, 11.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.265869140625, -0.25782012939453125, -0.2497711181640625, -0.24172210693359375, -0.233673095703125, -0.22562408447265625, -0.2175750732421875, -0.20952606201171875, -0.20147705078125, -0.19342803955078125, -0.1853790283203125, -0.17733001708984375, -0.169281005859375, -0.16123199462890625, -0.1531829833984375, -0.14513397216796875, -0.1370849609375, -0.12903594970703125, -0.1209869384765625, -0.11293792724609375, -0.104888916015625, -0.09683990478515625, -0.0887908935546875, -0.08074188232421875, -0.07269287109375, -0.06464385986328125, -0.0565948486328125, -0.04854583740234375, -0.040496826171875, -0.03244781494140625, -0.0243988037109375, -0.01634979248046875, -0.00830078125, -0.00025177001953125, 0.0077972412109375, 0.01584625244140625, 0.023895263671875, 0.03194427490234375, 0.0399932861328125, 0.04804229736328125, 0.05609130859375, 0.06414031982421875, 0.0721893310546875, 0.08023834228515625, 0.088287353515625, 0.09633636474609375, 0.1043853759765625, 0.11243438720703125, 0.1204833984375, 0.12853240966796875, 0.1365814208984375, 0.14463043212890625, 0.152679443359375, 0.16072845458984375, 0.1687774658203125, 0.17682647705078125, 0.18487548828125, 0.19292449951171875, 0.2009735107421875, 0.20902252197265625, 0.217071533203125, 0.22512054443359375, 0.2331695556640625, 0.24121856689453125, 0.249267578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 4.0, 7.0, 8.0, 18.0, 13.0, 19.0, 29.0, 29.0, 29.0, 38.0, 40.0, 42.0, 46.0, 52.0, 58.0, 44.0, 34.0, 53.0, 40.0, 32.0, 39.0, 46.0, 47.0, 27.0, 32.0, 21.0, 27.0, 21.0, 27.0, 16.0, 10.0, 12.0, 5.0, 8.0, 3.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.9848346710205078e-05, -1.9300729036331177e-05, -1.8753111362457275e-05, -1.8205493688583374e-05, -1.7657876014709473e-05, -1.711025834083557e-05, -1.656264066696167e-05, -1.601502299308777e-05, -1.5467405319213867e-05, -1.4919787645339966e-05, -1.4372169971466064e-05, -1.3824552297592163e-05, -1.3276934623718262e-05, -1.272931694984436e-05, -1.2181699275970459e-05, -1.1634081602096558e-05, -1.1086463928222656e-05, -1.0538846254348755e-05, -9.991228580474854e-06, -9.443610906600952e-06, -8.89599323272705e-06, -8.34837555885315e-06, -7.800757884979248e-06, -7.253140211105347e-06, -6.705522537231445e-06, -6.157904863357544e-06, -5.610287189483643e-06, -5.062669515609741e-06, -4.51505184173584e-06, -3.9674341678619385e-06, -3.419816493988037e-06, -2.8721988201141357e-06, -2.3245811462402344e-06, -1.776963472366333e-06, -1.2293457984924316e-06, -6.817281246185303e-07, -1.341104507446289e-07, 4.1350722312927246e-07, 9.611248970031738e-07, 1.5087425708770752e-06, 2.0563602447509766e-06, 2.603977918624878e-06, 3.1515955924987793e-06, 3.6992132663726807e-06, 4.246830940246582e-06, 4.794448614120483e-06, 5.342066287994385e-06, 5.889683961868286e-06, 6.4373016357421875e-06, 6.984919309616089e-06, 7.53253698348999e-06, 8.080154657363892e-06, 8.627772331237793e-06, 9.175390005111694e-06, 9.723007678985596e-06, 1.0270625352859497e-05, 1.0818243026733398e-05, 1.13658607006073e-05, 1.1913478374481201e-05, 1.2461096048355103e-05, 1.3008713722229004e-05, 1.3556331396102905e-05, 1.4103949069976807e-05, 1.4651566743850708e-05, 1.519918441772461e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 10.0, 10.0, 13.0, 20.0, 24.0, 48.0, 83.0, 77.0, 134.0, 207.0, 301.0, 491.0, 742.0, 1115.0, 1689.0, 2610.0, 4023.0, 6348.0, 10363.0, 16698.0, 28108.0, 48318.0, 81944.0, 135184.0, 187707.0, 186925.0, 133315.0, 81549.0, 47692.0, 27743.0, 17124.0, 10208.0, 6317.0, 3889.0, 2634.0, 1582.0, 1123.0, 692.0, 474.0, 327.0, 215.0, 150.0, 123.0, 67.0, 44.0, 26.0, 14.0, 17.0, 11.0, 5.0, 8.0, 6.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.07720947265625, -0.07486915588378906, -0.07252883911132812, -0.07018852233886719, -0.06784820556640625, -0.06550788879394531, -0.06316757202148438, -0.06082725524902344, -0.0584869384765625, -0.05614662170410156, -0.053806304931640625, -0.05146598815917969, -0.04912567138671875, -0.04678535461425781, -0.044445037841796875, -0.04210472106933594, -0.039764404296875, -0.03742408752441406, -0.035083770751953125, -0.03274345397949219, -0.03040313720703125, -0.028062820434570312, -0.025722503662109375, -0.023382186889648438, -0.0210418701171875, -0.018701553344726562, -0.016361236572265625, -0.014020919799804688, -0.01168060302734375, -0.009340286254882812, -0.006999969482421875, -0.0046596527099609375, -0.0023193359375, 2.09808349609375e-05, 0.002361297607421875, 0.0047016143798828125, 0.00704193115234375, 0.009382247924804688, 0.011722564697265625, 0.014062881469726562, 0.0164031982421875, 0.018743515014648438, 0.021083831787109375, 0.023424148559570312, 0.02576446533203125, 0.028104782104492188, 0.030445098876953125, 0.03278541564941406, 0.035125732421875, 0.03746604919433594, 0.039806365966796875, 0.04214668273925781, 0.04448699951171875, 0.04682731628417969, 0.049167633056640625, 0.05150794982910156, 0.0538482666015625, 0.05618858337402344, 0.058528900146484375, 0.06086921691894531, 0.06320953369140625, 0.06554985046386719, 0.06789016723632812, 0.07023048400878906, 0.07257080078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 11.0, 13.0, 14.0, 16.0, 19.0, 27.0, 37.0, 35.0, 48.0, 56.0, 44.0, 69.0, 68.0, 66.0, 56.0, 72.0, 48.0, 54.0, 43.0, 32.0, 36.0, 27.0, 19.0, 13.0, 16.0, 8.0, 7.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.01946711540222168, -0.01862478256225586, -0.01778244972229004, -0.01694011688232422, -0.0160977840423584, -0.015255451202392578, -0.014413118362426758, -0.013570785522460938, -0.012728452682495117, -0.011886119842529297, -0.011043787002563477, -0.010201454162597656, -0.009359121322631836, -0.008516788482666016, -0.007674455642700195, -0.006832122802734375, -0.005989789962768555, -0.005147457122802734, -0.004305124282836914, -0.0034627914428710938, -0.0026204586029052734, -0.0017781257629394531, -0.0009357929229736328, -9.34600830078125e-05, 0.0007488727569580078, 0.0015912055969238281, 0.0024335384368896484, 0.0032758712768554688, 0.004118204116821289, 0.004960536956787109, 0.00580286979675293, 0.00664520263671875, 0.00748753547668457, 0.00832986831665039, 0.009172201156616211, 0.010014533996582031, 0.010856866836547852, 0.011699199676513672, 0.012541532516479492, 0.013383865356445312, 0.014226198196411133, 0.015068531036376953, 0.015910863876342773, 0.016753196716308594, 0.017595529556274414, 0.018437862396240234, 0.019280195236206055, 0.020122528076171875, 0.020964860916137695, 0.021807193756103516, 0.022649526596069336, 0.023491859436035156, 0.024334192276000977, 0.025176525115966797, 0.026018857955932617, 0.026861190795898438, 0.027703523635864258, 0.028545856475830078, 0.0293881893157959, 0.03023052215576172, 0.03107285499572754, 0.03191518783569336, 0.03275752067565918, 0.033599853515625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 1.0, 5.0, 11.0, 11.0, 12.0, 8.0, 15.0, 22.0, 28.0, 33.0, 56.0, 39.0, 61.0, 69.0, 66.0, 63.0, 68.0, 65.0, 77.0, 54.0, 38.0, 41.0, 22.0, 27.0, 25.0, 14.0, 15.0, 11.0, 5.0, 10.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.1463704109191895, -5.979775905609131, -5.813181400299072, -5.646586894989014, -5.479991912841797, -5.313397407531738, -5.14680290222168, -4.980208396911621, -4.8136138916015625, -4.647019386291504, -4.480424880981445, -4.313830375671387, -4.147235870361328, -3.9806411266326904, -3.8140463829040527, -3.647451877593994, -3.4808573722839355, -3.314262866973877, -3.1476683616638184, -2.9810736179351807, -2.814479112625122, -2.6478846073150635, -2.481289863586426, -2.314695358276367, -2.1481008529663086, -1.98150634765625, -1.8149117231369019, -1.6483170986175537, -1.4817225933074951, -1.3151280879974365, -1.1485334634780884, -0.9819388389587402, -0.8153438568115234, -0.6487492918968201, -0.4821547269821167, -0.31556016206741333, -0.14896559715270996, 0.017628967761993408, 0.18422353267669678, 0.3508181571960449, 0.5174126625061035, 0.6840072274208069, 0.8506017923355103, 1.0171964168548584, 1.183790922164917, 1.3503854274749756, 1.5169800519943237, 1.6835746765136719, 1.8501691818237305, 2.016763687133789, 2.1833581924438477, 2.3499529361724854, 2.516547441482544, 2.6831419467926025, 2.8497366905212402, 3.016331195831299, 3.1829257011413574, 3.349520206451416, 3.5161147117614746, 3.6827094554901123, 3.849303960800171, 4.015898704528809, 4.182493209838867, 4.349087715148926, 4.515682220458984]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 6.0, 6.0, 9.0, 5.0, 9.0, 18.0, 8.0, 17.0, 13.0, 24.0, 20.0, 32.0, 28.0, 33.0, 31.0, 41.0, 43.0, 40.0, 51.0, 34.0, 46.0, 38.0, 42.0, 37.0, 35.0, 39.0, 45.0, 24.0, 30.0, 22.0, 32.0, 18.0, 26.0, 16.0, 18.0, 14.0, 11.0, 8.0, 14.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.7307229042053223, -2.6451244354248047, -2.559526205062866, -2.4739277362823486, -2.38832950592041, -2.3027310371398926, -2.217132568359375, -2.1315343379974365, -2.045936107635498, -1.96033775806427, -1.874739408493042, -1.7891409397125244, -1.703542709350586, -1.6179442405700684, -1.5323458909988403, -1.4467475414276123, -1.3611490726470947, -1.2755507230758667, -1.1899523735046387, -1.104353904724121, -1.0187556743621826, -0.9331572651863098, -0.847558856010437, -0.761960506439209, -0.676362156867981, -0.5907638072967529, -0.5051654577255249, -0.4195670485496521, -0.3339686989784241, -0.24837034940719604, -0.16277194023132324, -0.07717359066009521, 0.008424520492553711, 0.09402288496494293, 0.17962124943733215, 0.26521962881088257, 0.3508179783821106, 0.4364163279533386, 0.5220147371292114, 0.6076130867004395, 0.6932114362716675, 0.7788097858428955, 0.8644081354141235, 0.9500065445899963, 1.0356049537658691, 1.1212031841278076, 1.2068016529083252, 1.2924000024795532, 1.3779983520507812, 1.4635967016220093, 1.5491950511932373, 1.6347935199737549, 1.7203917503356934, 1.805990219116211, 1.891588568687439, 1.977186918258667, 2.0627851486206055, 2.148383617401123, 2.2339818477630615, 2.319580316543579, 2.4051785469055176, 2.490777015686035, 2.5763754844665527, 2.661973714828491, 2.747572183609009]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 19.0, 19.0, 34.0, 44.0, 71.0, 104.0, 194.0, 271.0, 435.0, 726.0, 1282.0, 2249.0, 4417.0, 8200.0, 16104.0, 31684.0, 62185.0, 114471.0, 181745.0, 217199.0, 177109.0, 109108.0, 58651.0, 29738.0, 15167.0, 7912.0, 4044.0, 2314.0, 1181.0, 726.0, 403.0, 249.0, 160.0, 103.0, 72.0, 50.0, 39.0, 19.0, 15.0, 8.0, 9.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.0390625, -3.921844482421875, -3.80462646484375, -3.687408447265625, -3.5701904296875, -3.452972412109375, -3.33575439453125, -3.218536376953125, -3.101318359375, -2.984100341796875, -2.86688232421875, -2.749664306640625, -2.6324462890625, -2.515228271484375, -2.39801025390625, -2.280792236328125, -2.16357421875, -2.046356201171875, -1.92913818359375, -1.811920166015625, -1.6947021484375, -1.577484130859375, -1.46026611328125, -1.343048095703125, -1.225830078125, -1.108612060546875, -0.99139404296875, -0.874176025390625, -0.7569580078125, -0.639739990234375, -0.52252197265625, -0.405303955078125, -0.2880859375, -0.170867919921875, -0.05364990234375, 0.063568115234375, 0.1807861328125, 0.298004150390625, 0.41522216796875, 0.532440185546875, 0.649658203125, 0.766876220703125, 0.88409423828125, 1.001312255859375, 1.1185302734375, 1.235748291015625, 1.35296630859375, 1.470184326171875, 1.58740234375, 1.704620361328125, 1.82183837890625, 1.939056396484375, 2.0562744140625, 2.173492431640625, 2.29071044921875, 2.407928466796875, 2.525146484375, 2.642364501953125, 2.75958251953125, 2.876800537109375, 2.9940185546875, 3.111236572265625, 3.22845458984375, 3.345672607421875, 3.462890625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 4.0, 13.0, 11.0, 17.0, 11.0, 20.0, 30.0, 21.0, 35.0, 33.0, 43.0, 50.0, 36.0, 53.0, 43.0, 60.0, 57.0, 51.0, 37.0, 41.0, 37.0, 46.0, 37.0, 30.0, 28.0, 19.0, 21.0, 11.0, 24.0, 19.0, 13.0, 15.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.681640625, -3.570770263671875, -3.45989990234375, -3.349029541015625, -3.2381591796875, -3.127288818359375, -3.01641845703125, -2.905548095703125, -2.794677734375, -2.683807373046875, -2.57293701171875, -2.462066650390625, -2.3511962890625, -2.240325927734375, -2.12945556640625, -2.018585205078125, -1.90771484375, -1.796844482421875, -1.68597412109375, -1.575103759765625, -1.4642333984375, -1.353363037109375, -1.24249267578125, -1.131622314453125, -1.020751953125, -0.909881591796875, -0.79901123046875, -0.688140869140625, -0.5772705078125, -0.466400146484375, -0.35552978515625, -0.244659423828125, -0.1337890625, -0.022918701171875, 0.08795166015625, 0.198822021484375, 0.3096923828125, 0.420562744140625, 0.53143310546875, 0.642303466796875, 0.753173828125, 0.864044189453125, 0.97491455078125, 1.085784912109375, 1.1966552734375, 1.307525634765625, 1.41839599609375, 1.529266357421875, 1.64013671875, 1.751007080078125, 1.86187744140625, 1.972747802734375, 2.0836181640625, 2.194488525390625, 2.30535888671875, 2.416229248046875, 2.527099609375, 2.637969970703125, 2.74884033203125, 2.859710693359375, 2.9705810546875, 3.081451416015625, 3.19232177734375, 3.303192138671875, 3.4140625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 6.0, 12.0, 16.0, 29.0, 38.0, 76.0, 104.0, 159.0, 250.0, 421.0, 712.0, 1137.0, 2021.0, 3218.0, 5919.0, 10013.0, 17492.0, 30475.0, 51204.0, 84044.0, 126125.0, 163229.0, 170057.0, 139323.0, 96736.0, 60314.0, 36081.0, 20816.0, 12020.0, 6773.0, 3811.0, 2276.0, 1414.0, 885.0, 544.0, 280.0, 189.0, 123.0, 66.0, 47.0, 41.0, 19.0, 20.0, 8.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1953125, -3.095947265625, -2.99658203125, -2.897216796875, -2.7978515625, -2.698486328125, -2.59912109375, -2.499755859375, -2.400390625, -2.301025390625, -2.20166015625, -2.102294921875, -2.0029296875, -1.903564453125, -1.80419921875, -1.704833984375, -1.60546875, -1.506103515625, -1.40673828125, -1.307373046875, -1.2080078125, -1.108642578125, -1.00927734375, -0.909912109375, -0.810546875, -0.711181640625, -0.61181640625, -0.512451171875, -0.4130859375, -0.313720703125, -0.21435546875, -0.114990234375, -0.015625, 0.083740234375, 0.18310546875, 0.282470703125, 0.3818359375, 0.481201171875, 0.58056640625, 0.679931640625, 0.779296875, 0.878662109375, 0.97802734375, 1.077392578125, 1.1767578125, 1.276123046875, 1.37548828125, 1.474853515625, 1.57421875, 1.673583984375, 1.77294921875, 1.872314453125, 1.9716796875, 2.071044921875, 2.17041015625, 2.269775390625, 2.369140625, 2.468505859375, 2.56787109375, 2.667236328125, 2.7666015625, 2.865966796875, 2.96533203125, 3.064697265625, 3.1640625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 8.0, 4.0, 9.0, 11.0, 13.0, 19.0, 14.0, 24.0, 20.0, 33.0, 20.0, 37.0, 40.0, 34.0, 42.0, 48.0, 30.0, 34.0, 41.0, 49.0, 39.0, 38.0, 45.0, 39.0, 41.0, 31.0, 36.0, 36.0, 27.0, 18.0, 20.0, 18.0, 20.0, 11.0, 9.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7509765625, -1.6909942626953125, -1.631011962890625, -1.5710296630859375, -1.51104736328125, -1.4510650634765625, -1.391082763671875, -1.3311004638671875, -1.2711181640625, -1.2111358642578125, -1.151153564453125, -1.0911712646484375, -1.03118896484375, -0.9712066650390625, -0.911224365234375, -0.8512420654296875, -0.791259765625, -0.7312774658203125, -0.671295166015625, -0.6113128662109375, -0.55133056640625, -0.4913482666015625, -0.431365966796875, -0.3713836669921875, -0.3114013671875, -0.2514190673828125, -0.191436767578125, -0.1314544677734375, -0.07147216796875, -0.0114898681640625, 0.048492431640625, 0.1084747314453125, 0.16845703125, 0.2284393310546875, 0.288421630859375, 0.3484039306640625, 0.40838623046875, 0.4683685302734375, 0.528350830078125, 0.5883331298828125, 0.6483154296875, 0.7082977294921875, 0.768280029296875, 0.8282623291015625, 0.88824462890625, 0.9482269287109375, 1.008209228515625, 1.0681915283203125, 1.128173828125, 1.1881561279296875, 1.248138427734375, 1.3081207275390625, 1.36810302734375, 1.4280853271484375, 1.488067626953125, 1.5480499267578125, 1.6080322265625, 1.6680145263671875, 1.727996826171875, 1.7879791259765625, 1.84796142578125, 1.9079437255859375, 1.967926025390625, 2.0279083251953125, 2.087890625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 5.0, 3.0, 6.0, 10.0, 11.0, 12.0, 15.0, 27.0, 30.0, 55.0, 78.0, 116.0, 123.0, 208.0, 302.0, 424.0, 621.0, 893.0, 1353.0, 2096.0, 3348.0, 5138.0, 8420.0, 13876.0, 23362.0, 40053.0, 67391.0, 107171.0, 153446.0, 177414.0, 156672.0, 110757.0, 70055.0, 42026.0, 24500.0, 14306.0, 8897.0, 5276.0, 3501.0, 2092.0, 1427.0, 974.0, 647.0, 389.0, 325.0, 205.0, 155.0, 89.0, 81.0, 55.0, 37.0, 24.0, 24.0, 12.0, 14.0, 4.0, 8.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.4140625, -1.37060546875, -1.3271484375, -1.28369140625, -1.240234375, -1.19677734375, -1.1533203125, -1.10986328125, -1.06640625, -1.02294921875, -0.9794921875, -0.93603515625, -0.892578125, -0.84912109375, -0.8056640625, -0.76220703125, -0.71875, -0.67529296875, -0.6318359375, -0.58837890625, -0.544921875, -0.50146484375, -0.4580078125, -0.41455078125, -0.37109375, -0.32763671875, -0.2841796875, -0.24072265625, -0.197265625, -0.15380859375, -0.1103515625, -0.06689453125, -0.0234375, 0.02001953125, 0.0634765625, 0.10693359375, 0.150390625, 0.19384765625, 0.2373046875, 0.28076171875, 0.32421875, 0.36767578125, 0.4111328125, 0.45458984375, 0.498046875, 0.54150390625, 0.5849609375, 0.62841796875, 0.671875, 0.71533203125, 0.7587890625, 0.80224609375, 0.845703125, 0.88916015625, 0.9326171875, 0.97607421875, 1.01953125, 1.06298828125, 1.1064453125, 1.14990234375, 1.193359375, 1.23681640625, 1.2802734375, 1.32373046875, 1.3671875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 21.0, 10.0, 27.0, 32.0, 53.0, 61.0, 86.0, 110.0, 94.0, 94.0, 91.0, 66.0, 71.0, 43.0, 28.0, 28.0, 28.0, 8.0, 10.0, 8.0, 0.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021326541900634766, -0.00020658224821090698, -0.0001998990774154663, -0.00019321590662002563, -0.00018653273582458496, -0.0001798495650291443, -0.0001731663942337036, -0.00016648322343826294, -0.00015980005264282227, -0.0001531168818473816, -0.00014643371105194092, -0.00013975054025650024, -0.00013306736946105957, -0.0001263841986656189, -0.00011970102787017822, -0.00011301785707473755, -0.00010633468627929688, -9.96515154838562e-05, -9.296834468841553e-05, -8.628517389297485e-05, -7.960200309753418e-05, -7.29188323020935e-05, -6.623566150665283e-05, -5.955249071121216e-05, -5.2869319915771484e-05, -4.618614912033081e-05, -3.950297832489014e-05, -3.281980752944946e-05, -2.613663673400879e-05, -1.9453465938568115e-05, -1.2770295143127441e-05, -6.087124347686768e-06, 5.960464477539062e-07, 7.27921724319458e-06, 1.3962388038635254e-05, 2.0645558834075928e-05, 2.73287296295166e-05, 3.4011900424957275e-05, 4.069507122039795e-05, 4.737824201583862e-05, 5.40614128112793e-05, 6.074458360671997e-05, 6.742775440216064e-05, 7.411092519760132e-05, 8.079409599304199e-05, 8.747726678848267e-05, 9.416043758392334e-05, 0.00010084360837936401, 0.00010752677917480469, 0.00011420994997024536, 0.00012089312076568604, 0.0001275762915611267, 0.00013425946235656738, 0.00014094263315200806, 0.00014762580394744873, 0.0001543089747428894, 0.00016099214553833008, 0.00016767531633377075, 0.00017435848712921143, 0.0001810416579246521, 0.00018772482872009277, 0.00019440799951553345, 0.00020109117031097412, 0.0002077743411064148, 0.00021445751190185547]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 9.0, 8.0, 22.0, 24.0, 29.0, 45.0, 64.0, 103.0, 158.0, 188.0, 296.0, 412.0, 617.0, 972.0, 1381.0, 2081.0, 3310.0, 5331.0, 8801.0, 14298.0, 24063.0, 39653.0, 64733.0, 100756.0, 140575.0, 163931.0, 154229.0, 117938.0, 78416.0, 48909.0, 29901.0, 18027.0, 10692.0, 6720.0, 4166.0, 2661.0, 1727.0, 1032.0, 700.0, 504.0, 312.0, 228.0, 145.0, 109.0, 74.0, 55.0, 42.0, 33.0, 23.0, 17.0, 12.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0], "bins": [-1.2744140625, -1.2354583740234375, -1.196502685546875, -1.1575469970703125, -1.11859130859375, -1.0796356201171875, -1.040679931640625, -1.0017242431640625, -0.9627685546875, -0.9238128662109375, -0.884857177734375, -0.8459014892578125, -0.80694580078125, -0.7679901123046875, -0.729034423828125, -0.6900787353515625, -0.651123046875, -0.6121673583984375, -0.573211669921875, -0.5342559814453125, -0.49530029296875, -0.4563446044921875, -0.417388916015625, -0.3784332275390625, -0.3394775390625, -0.3005218505859375, -0.261566162109375, -0.2226104736328125, -0.18365478515625, -0.1446990966796875, -0.105743408203125, -0.0667877197265625, -0.02783203125, 0.0111236572265625, 0.050079345703125, 0.0890350341796875, 0.12799072265625, 0.1669464111328125, 0.205902099609375, 0.2448577880859375, 0.2838134765625, 0.3227691650390625, 0.361724853515625, 0.4006805419921875, 0.43963623046875, 0.4785919189453125, 0.517547607421875, 0.5565032958984375, 0.595458984375, 0.6344146728515625, 0.673370361328125, 0.7123260498046875, 0.75128173828125, 0.7902374267578125, 0.829193115234375, 0.8681488037109375, 0.9071044921875, 0.9460601806640625, 0.985015869140625, 1.0239715576171875, 1.06292724609375, 1.1018829345703125, 1.140838623046875, 1.1797943115234375, 1.21875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 5.0, 2.0, 10.0, 10.0, 12.0, 21.0, 21.0, 21.0, 25.0, 35.0, 39.0, 40.0, 51.0, 46.0, 51.0, 48.0, 63.0, 67.0, 58.0, 51.0, 44.0, 53.0, 42.0, 31.0, 25.0, 18.0, 22.0, 16.0, 13.0, 9.0, 4.0, 13.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.31262969970703125, -0.2998199462890625, -0.28701019287109375, -0.274200439453125, -0.26139068603515625, -0.2485809326171875, -0.23577117919921875, -0.22296142578125, -0.21015167236328125, -0.1973419189453125, -0.18453216552734375, -0.171722412109375, -0.15891265869140625, -0.1461029052734375, -0.13329315185546875, -0.1204833984375, -0.10767364501953125, -0.0948638916015625, -0.08205413818359375, -0.069244384765625, -0.05643463134765625, -0.0436248779296875, -0.03081512451171875, -0.01800537109375, -0.00519561767578125, 0.0076141357421875, 0.02042388916015625, 0.033233642578125, 0.04604339599609375, 0.0588531494140625, 0.07166290283203125, 0.08447265625, 0.09728240966796875, 0.1100921630859375, 0.12290191650390625, 0.135711669921875, 0.14852142333984375, 0.1613311767578125, 0.17414093017578125, 0.18695068359375, 0.19976043701171875, 0.2125701904296875, 0.22537994384765625, 0.238189697265625, 0.25099945068359375, 0.2638092041015625, 0.27661895751953125, 0.2894287109375, 0.30223846435546875, 0.3150482177734375, 0.32785797119140625, 0.340667724609375, 0.35347747802734375, 0.3662872314453125, 0.37909698486328125, 0.39190673828125, 0.40471649169921875, 0.4175262451171875, 0.43033599853515625, 0.443145751953125, 0.45595550537109375, 0.4687652587890625, 0.48157501220703125, 0.494384765625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 7.0, 3.0, 5.0, 9.0, 9.0, 11.0, 14.0, 15.0, 33.0, 26.0, 39.0, 53.0, 43.0, 56.0, 61.0, 55.0, 59.0, 64.0, 74.0, 50.0, 45.0, 36.0, 32.0, 36.0, 38.0, 18.0, 15.0, 25.0, 11.0, 15.0, 7.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-5.586828708648682, -5.435853481292725, -5.284878253936768, -5.133902549743652, -4.982927322387695, -4.831952095031738, -4.680976867675781, -4.530001640319824, -4.379026412963867, -4.22805118560791, -4.077075958251953, -3.926100492477417, -3.775125026702881, -3.624149799346924, -3.473174571990967, -3.3221993446350098, -3.1712236404418945, -3.0202484130859375, -2.8692729473114014, -2.7182977199554443, -2.567322254180908, -2.416347026824951, -2.265371799468994, -2.114396572113037, -1.963421106338501, -1.8124457597732544, -1.6614704132080078, -1.5104951858520508, -1.3595198392868042, -1.2085444927215576, -1.0575692653656006, -0.906593918800354, -0.7556185722351074, -0.6046432256698608, -0.45366793870925903, -0.30269262194633484, -0.15171730518341064, -0.0007419586181640625, 0.15023332834243774, 0.30120861530303955, 0.45218396186828613, 0.6031593084335327, 0.7541345953941345, 0.9051098823547363, 1.056085228919983, 1.2070605754852295, 1.3580358028411865, 1.509011149406433, 1.6599864959716797, 1.8109618425369263, 1.9619371891021729, 2.11291241645813, 2.263887882232666, 2.414863109588623, 2.56583833694458, 2.716813564300537, 2.8677890300750732, 3.0187642574310303, 3.1697397232055664, 3.3207149505615234, 3.4716901779174805, 3.6226656436920166, 3.7736408710479736, 3.9246163368225098, 4.075591564178467]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 10.0, 15.0, 12.0, 13.0, 17.0, 19.0, 22.0, 32.0, 34.0, 35.0, 35.0, 52.0, 35.0, 34.0, 45.0, 43.0, 45.0, 36.0, 43.0, 41.0, 30.0, 30.0, 33.0, 39.0, 29.0, 33.0, 22.0, 22.0, 23.0, 26.0, 18.0, 14.0, 6.0, 11.0, 6.0, 10.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.960685968399048, -2.8687639236450195, -2.776841878890991, -2.684919834136963, -2.5929975509643555, -2.501075506210327, -2.409153461456299, -2.3172314167022705, -2.225309371948242, -2.133387327194214, -2.0414652824401855, -1.9495431184768677, -1.8576210737228394, -1.765699028968811, -1.6737768650054932, -1.5818548202514648, -1.4899327754974365, -1.3980107307434082, -1.3060886859893799, -1.214166522026062, -1.1222444772720337, -1.0303224325180054, -0.9384003281593323, -0.8464782238006592, -0.7545561790466309, -0.6626341342926025, -0.5707120299339294, -0.47878995537757874, -0.386867880821228, -0.2949458062648773, -0.2030237317085266, -0.11110162734985352, -0.019179821014404297, 0.07274225354194641, 0.16466432809829712, 0.2565864026546478, 0.34850847721099854, 0.44043055176734924, 0.5323526263237, 0.624274730682373, 0.7161967754364014, 0.8081188201904297, 0.9000409245491028, 0.9919630289077759, 1.0838850736618042, 1.1758071184158325, 1.2677292823791504, 1.3596513271331787, 1.451573371887207, 1.5434954166412354, 1.6354174613952637, 1.7273396253585815, 1.8192616701126099, 1.9111837148666382, 2.003105878829956, 2.0950279235839844, 2.1869499683380127, 2.278872013092041, 2.3707940578460693, 2.4627161026000977, 2.554638385772705, 2.6465604305267334, 2.7384824752807617, 2.83040452003479, 2.9223265647888184]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 9.0, 14.0, 22.0, 38.0, 44.0, 69.0, 97.0, 142.0, 208.0, 306.0, 490.0, 741.0, 1203.0, 1893.0, 3125.0, 5119.0, 8279.0, 14171.0, 23935.0, 42807.0, 78571.0, 152940.0, 323707.0, 696550.0, 1088655.0, 887205.0, 440143.0, 199750.0, 98811.0, 52476.0, 29462.0, 16860.0, 10058.0, 6035.0, 3876.0, 2351.0, 1452.0, 946.0, 609.0, 385.0, 251.0, 160.0, 114.0, 73.0, 49.0, 22.0, 15.0, 15.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.4296875, -4.2982177734375, -4.166748046875, -4.0352783203125, -3.90380859375, -3.7723388671875, -3.640869140625, -3.5093994140625, -3.3779296875, -3.2464599609375, -3.114990234375, -2.9835205078125, -2.85205078125, -2.7205810546875, -2.589111328125, -2.4576416015625, -2.326171875, -2.1947021484375, -2.063232421875, -1.9317626953125, -1.80029296875, -1.6688232421875, -1.537353515625, -1.4058837890625, -1.2744140625, -1.1429443359375, -1.011474609375, -0.8800048828125, -0.74853515625, -0.6170654296875, -0.485595703125, -0.3541259765625, -0.22265625, -0.0911865234375, 0.040283203125, 0.1717529296875, 0.30322265625, 0.4346923828125, 0.566162109375, 0.6976318359375, 0.8291015625, 0.9605712890625, 1.092041015625, 1.2235107421875, 1.35498046875, 1.4864501953125, 1.617919921875, 1.7493896484375, 1.880859375, 2.0123291015625, 2.143798828125, 2.2752685546875, 2.40673828125, 2.5382080078125, 2.669677734375, 2.8011474609375, 2.9326171875, 3.0640869140625, 3.195556640625, 3.3270263671875, 3.45849609375, 3.5899658203125, 3.721435546875, 3.8529052734375, 3.984375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 8.0, 9.0, 9.0, 14.0, 12.0, 15.0, 23.0, 15.0, 28.0, 25.0, 48.0, 27.0, 32.0, 36.0, 47.0, 38.0, 52.0, 43.0, 42.0, 40.0, 51.0, 32.0, 38.0, 44.0, 31.0, 26.0, 37.0, 27.0, 27.0, 27.0, 12.0, 17.0, 22.0, 10.0, 7.0, 6.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.185333251953125, -2.10894775390625, -2.032562255859375, -1.9561767578125, -1.879791259765625, -1.80340576171875, -1.727020263671875, -1.650634765625, -1.574249267578125, -1.49786376953125, -1.421478271484375, -1.3450927734375, -1.268707275390625, -1.19232177734375, -1.115936279296875, -1.03955078125, -0.963165283203125, -0.88677978515625, -0.810394287109375, -0.7340087890625, -0.657623291015625, -0.58123779296875, -0.504852294921875, -0.428466796875, -0.352081298828125, -0.27569580078125, -0.199310302734375, -0.1229248046875, -0.046539306640625, 0.02984619140625, 0.106231689453125, 0.1826171875, 0.259002685546875, 0.33538818359375, 0.411773681640625, 0.4881591796875, 0.564544677734375, 0.64093017578125, 0.717315673828125, 0.793701171875, 0.870086669921875, 0.94647216796875, 1.022857666015625, 1.0992431640625, 1.175628662109375, 1.25201416015625, 1.328399658203125, 1.40478515625, 1.481170654296875, 1.55755615234375, 1.633941650390625, 1.7103271484375, 1.786712646484375, 1.86309814453125, 1.939483642578125, 2.015869140625, 2.092254638671875, 2.16864013671875, 2.245025634765625, 2.3214111328125, 2.397796630859375, 2.47418212890625, 2.550567626953125, 2.626953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 4.0, 3.0, 10.0, 25.0, 34.0, 36.0, 63.0, 93.0, 155.0, 237.0, 371.0, 576.0, 795.0, 1299.0, 2028.0, 3164.0, 4988.0, 7911.0, 12729.0, 20817.0, 35333.0, 60147.0, 104826.0, 187538.0, 339999.0, 606556.0, 892892.0, 802159.0, 485024.0, 269005.0, 147852.0, 83786.0, 48648.0, 28753.0, 17371.0, 10812.0, 6585.0, 4104.0, 2647.0, 1739.0, 1148.0, 688.0, 501.0, 277.0, 190.0, 151.0, 70.0, 44.0, 39.0, 26.0, 16.0, 9.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.908203125, -3.777069091796875, -3.64593505859375, -3.514801025390625, -3.3836669921875, -3.252532958984375, -3.12139892578125, -2.990264892578125, -2.859130859375, -2.727996826171875, -2.59686279296875, -2.465728759765625, -2.3345947265625, -2.203460693359375, -2.07232666015625, -1.941192626953125, -1.81005859375, -1.678924560546875, -1.54779052734375, -1.416656494140625, -1.2855224609375, -1.154388427734375, -1.02325439453125, -0.892120361328125, -0.760986328125, -0.629852294921875, -0.49871826171875, -0.367584228515625, -0.2364501953125, -0.105316162109375, 0.02581787109375, 0.156951904296875, 0.2880859375, 0.419219970703125, 0.55035400390625, 0.681488037109375, 0.8126220703125, 0.943756103515625, 1.07489013671875, 1.206024169921875, 1.337158203125, 1.468292236328125, 1.59942626953125, 1.730560302734375, 1.8616943359375, 1.992828369140625, 2.12396240234375, 2.255096435546875, 2.38623046875, 2.517364501953125, 2.64849853515625, 2.779632568359375, 2.9107666015625, 3.041900634765625, 3.17303466796875, 3.304168701171875, 3.435302734375, 3.566436767578125, 3.69757080078125, 3.828704833984375, 3.9598388671875, 4.090972900390625, 4.22210693359375, 4.353240966796875, 4.484375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 12.0, 10.0, 11.0, 17.0, 34.0, 32.0, 39.0, 59.0, 64.0, 72.0, 119.0, 146.0, 170.0, 202.0, 216.0, 224.0, 261.0, 296.0, 314.0, 276.0, 238.0, 211.0, 191.0, 169.0, 118.0, 114.0, 96.0, 81.0, 62.0, 40.0, 43.0, 32.0, 24.0, 17.0, 12.0, 17.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3173828125, -1.2734222412109375, -1.229461669921875, -1.1855010986328125, -1.14154052734375, -1.0975799560546875, -1.053619384765625, -1.0096588134765625, -0.9656982421875, -0.9217376708984375, -0.877777099609375, -0.8338165283203125, -0.78985595703125, -0.7458953857421875, -0.701934814453125, -0.6579742431640625, -0.614013671875, -0.5700531005859375, -0.526092529296875, -0.4821319580078125, -0.43817138671875, -0.3942108154296875, -0.350250244140625, -0.3062896728515625, -0.2623291015625, -0.2183685302734375, -0.174407958984375, -0.1304473876953125, -0.08648681640625, -0.0425262451171875, 0.001434326171875, 0.0453948974609375, 0.08935546875, 0.1333160400390625, 0.177276611328125, 0.2212371826171875, 0.26519775390625, 0.3091583251953125, 0.353118896484375, 0.3970794677734375, 0.4410400390625, 0.4850006103515625, 0.528961181640625, 0.5729217529296875, 0.61688232421875, 0.6608428955078125, 0.704803466796875, 0.7487640380859375, 0.792724609375, 0.8366851806640625, 0.880645751953125, 0.9246063232421875, 0.96856689453125, 1.0125274658203125, 1.056488037109375, 1.1004486083984375, 1.1444091796875, 1.1883697509765625, 1.232330322265625, 1.2762908935546875, 1.32025146484375, 1.3642120361328125, 1.408172607421875, 1.4521331787109375, 1.49609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 8.0, 6.0, 13.0, 11.0, 8.0, 16.0, 20.0, 29.0, 43.0, 31.0, 57.0, 60.0, 65.0, 62.0, 61.0, 74.0, 58.0, 61.0, 54.0, 36.0, 40.0, 42.0, 25.0, 26.0, 14.0, 22.0, 14.0, 5.0, 4.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.3671746253967285, -6.194919109344482, -6.0226640701293945, -5.850408554077148, -5.678153038024902, -5.505897521972656, -5.333642482757568, -5.161386966705322, -4.989131927490234, -4.816876411437988, -4.6446213722229, -4.472365856170654, -4.300110340118408, -4.12785530090332, -3.955599784851074, -3.783344268798828, -3.611088752746582, -3.438833475112915, -3.266577959060669, -3.094322681427002, -2.922067165374756, -2.749811887741089, -2.577556610107422, -2.405301094055176, -2.233045816421509, -2.060790538787842, -1.8885350227355957, -1.7162797451019287, -1.5440243482589722, -1.3717689514160156, -1.1995136737823486, -1.027258276939392, -0.8550024032592773, -0.6827470064163208, -0.510491669178009, -0.33823633193969727, -0.16598093509674072, 0.00627446174621582, 0.1785297393798828, 0.35078513622283936, 0.5230405330657959, 0.6952959299087524, 0.8675512671470642, 1.039806604385376, 1.2120620012283325, 1.384317398071289, 1.556572675704956, 1.7288280725479126, 1.9010834693908691, 2.073338747024536, 2.2455942630767822, 2.417849540710449, 2.5901050567626953, 2.7623603343963623, 2.9346156120300293, 3.1068711280822754, 3.2791264057159424, 3.4513816833496094, 3.6236371994018555, 3.7958924770355225, 3.9681477546691895, 4.1404032707214355, 4.312658309936523, 4.4849138259887695, 4.657169342041016]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 8.0, 6.0, 7.0, 21.0, 16.0, 17.0, 29.0, 30.0, 31.0, 30.0, 36.0, 45.0, 38.0, 42.0, 50.0, 38.0, 40.0, 44.0, 41.0, 39.0, 49.0, 40.0, 40.0, 36.0, 31.0, 28.0, 26.0, 24.0, 21.0, 15.0, 8.0, 15.0, 13.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0973005294799805, -3.001399278640747, -2.9054980278015137, -2.8095967769622803, -2.713695526123047, -2.6177942752838135, -2.52189302444458, -2.4259917736053467, -2.3300905227661133, -2.23418927192688, -2.1382880210876465, -2.042386770248413, -1.9464855194091797, -1.8505842685699463, -1.754683017730713, -1.6587817668914795, -1.562880516052246, -1.4669792652130127, -1.3710780143737793, -1.275176763534546, -1.1792755126953125, -1.083374261856079, -0.9874730110168457, -0.8915717601776123, -0.7956705093383789, -0.6997692584991455, -0.6038680076599121, -0.5079667568206787, -0.4120655059814453, -0.3161642551422119, -0.22026300430297852, -0.12436175346374512, -0.028460264205932617, 0.06744098663330078, 0.16334223747253418, 0.2592434883117676, 0.355144739151001, 0.4510459899902344, 0.5469472408294678, 0.6428484916687012, 0.7387497425079346, 0.834650993347168, 0.9305522441864014, 1.0264534950256348, 1.1223547458648682, 1.2182559967041016, 1.314157247543335, 1.4100584983825684, 1.5059597492218018, 1.6018610000610352, 1.6977622509002686, 1.793663501739502, 1.8895647525787354, 1.9854660034179688, 2.081367254257202, 2.1772685050964355, 2.273169755935669, 2.3690710067749023, 2.4649722576141357, 2.560873508453369, 2.6567747592926025, 2.752676010131836, 2.8485772609710693, 2.9444785118103027, 3.040379762649536]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 3.0, 5.0, 0.0, 6.0, 12.0, 10.0, 28.0, 19.0, 44.0, 51.0, 58.0, 101.0, 166.0, 248.0, 319.0, 513.0, 681.0, 1042.0, 1502.0, 2376.0, 3736.0, 6187.0, 10142.0, 17913.0, 31341.0, 58191.0, 108712.0, 189956.0, 234196.0, 169738.0, 93703.0, 50399.0, 27576.0, 15303.0, 8989.0, 5470.0, 3387.0, 2103.0, 1471.0, 860.0, 648.0, 427.0, 264.0, 178.0, 147.0, 113.0, 62.0, 45.0, 43.0, 16.0, 22.0, 14.0, 9.0, 1.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.383056640625, -0.3712272644042969, -0.35939788818359375, -0.3475685119628906, -0.3357391357421875, -0.3239097595214844, -0.31208038330078125, -0.3002510070800781, -0.288421630859375, -0.2765922546386719, -0.26476287841796875, -0.2529335021972656, -0.2411041259765625, -0.22927474975585938, -0.21744537353515625, -0.20561599731445312, -0.19378662109375, -0.18195724487304688, -0.17012786865234375, -0.15829849243164062, -0.1464691162109375, -0.13463973999023438, -0.12281036376953125, -0.11098098754882812, -0.099151611328125, -0.08732223510742188, -0.07549285888671875, -0.06366348266601562, -0.0518341064453125, -0.040004730224609375, -0.02817535400390625, -0.016345977783203125, -0.0045166015625, 0.007312774658203125, 0.01914215087890625, 0.030971527099609375, 0.0428009033203125, 0.054630279541015625, 0.06645965576171875, 0.07828903198242188, 0.090118408203125, 0.10194778442382812, 0.11377716064453125, 0.12560653686523438, 0.1374359130859375, 0.14926528930664062, 0.16109466552734375, 0.17292404174804688, 0.18475341796875, 0.19658279418945312, 0.20841217041015625, 0.22024154663085938, 0.2320709228515625, 0.24390029907226562, 0.25572967529296875, 0.2675590515136719, 0.279388427734375, 0.2912178039550781, 0.30304718017578125, 0.3148765563964844, 0.3267059326171875, 0.3385353088378906, 0.35036468505859375, 0.3621940612792969, 0.3740234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 7.0, 7.0, 5.0, 5.0, 13.0, 17.0, 24.0, 24.0, 30.0, 31.0, 29.0, 34.0, 36.0, 37.0, 48.0, 46.0, 52.0, 52.0, 54.0, 47.0, 47.0, 47.0, 38.0, 42.0, 41.0, 25.0, 29.0, 19.0, 20.0, 20.0, 9.0, 11.0, 14.0, 12.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.78125, -3.666168212890625, -3.55108642578125, -3.436004638671875, -3.3209228515625, -3.205841064453125, -3.09075927734375, -2.975677490234375, -2.860595703125, -2.745513916015625, -2.63043212890625, -2.515350341796875, -2.4002685546875, -2.285186767578125, -2.17010498046875, -2.055023193359375, -1.93994140625, -1.824859619140625, -1.70977783203125, -1.594696044921875, -1.4796142578125, -1.364532470703125, -1.24945068359375, -1.134368896484375, -1.019287109375, -0.904205322265625, -0.78912353515625, -0.674041748046875, -0.5589599609375, -0.443878173828125, -0.32879638671875, -0.213714599609375, -0.0986328125, 0.016448974609375, 0.13153076171875, 0.246612548828125, 0.3616943359375, 0.476776123046875, 0.59185791015625, 0.706939697265625, 0.822021484375, 0.937103271484375, 1.05218505859375, 1.167266845703125, 1.2823486328125, 1.397430419921875, 1.51251220703125, 1.627593994140625, 1.74267578125, 1.857757568359375, 1.97283935546875, 2.087921142578125, 2.2030029296875, 2.318084716796875, 2.43316650390625, 2.548248291015625, 2.663330078125, 2.778411865234375, 2.89349365234375, 3.008575439453125, 3.1236572265625, 3.238739013671875, 3.35382080078125, 3.468902587890625, 3.583984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 11.0, 15.0, 17.0, 24.0, 31.0, 41.0, 53.0, 85.0, 117.0, 180.0, 258.0, 384.0, 581.0, 934.0, 1598.0, 2730.0, 5122.0, 10645.0, 25685.0, 164433.0, 762077.0, 42401.0, 15297.0, 6955.0, 3488.0, 2029.0, 1155.0, 723.0, 462.0, 318.0, 189.0, 138.0, 98.0, 73.0, 47.0, 31.0, 29.0, 18.0, 24.0, 12.0, 7.0, 9.0, 6.0, 4.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.006561279296875, -0.97210693359375, -0.937652587890625, -0.9031982421875, -0.868743896484375, -0.83428955078125, -0.799835205078125, -0.765380859375, -0.730926513671875, -0.69647216796875, -0.662017822265625, -0.6275634765625, -0.593109130859375, -0.55865478515625, -0.524200439453125, -0.48974609375, -0.455291748046875, -0.42083740234375, -0.386383056640625, -0.3519287109375, -0.317474365234375, -0.28302001953125, -0.248565673828125, -0.214111328125, -0.179656982421875, -0.14520263671875, -0.110748291015625, -0.0762939453125, -0.041839599609375, -0.00738525390625, 0.027069091796875, 0.0615234375, 0.095977783203125, 0.13043212890625, 0.164886474609375, 0.1993408203125, 0.233795166015625, 0.26824951171875, 0.302703857421875, 0.337158203125, 0.371612548828125, 0.40606689453125, 0.440521240234375, 0.4749755859375, 0.509429931640625, 0.54388427734375, 0.578338623046875, 0.61279296875, 0.647247314453125, 0.68170166015625, 0.716156005859375, 0.7506103515625, 0.785064697265625, 0.81951904296875, 0.853973388671875, 0.888427734375, 0.922882080078125, 0.95733642578125, 0.991790771484375, 1.0262451171875, 1.060699462890625, 1.09515380859375, 1.129608154296875, 1.1640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 2.0, 6.0, 8.0, 2.0, 8.0, 9.0, 10.0, 12.0, 24.0, 19.0, 22.0, 31.0, 41.0, 23.0, 27.0, 38.0, 30.0, 27.0, 45.0, 33.0, 32.0, 36.0, 41.0, 50.0, 44.0, 48.0, 39.0, 33.0, 33.0, 33.0, 22.0, 32.0, 22.0, 29.0, 9.0, 15.0, 6.0, 13.0, 7.0, 7.0, 6.0, 3.0, 4.0, 7.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9130859375, -1.8503875732421875, -1.787689208984375, -1.7249908447265625, -1.66229248046875, -1.5995941162109375, -1.536895751953125, -1.4741973876953125, -1.4114990234375, -1.3488006591796875, -1.286102294921875, -1.2234039306640625, -1.16070556640625, -1.0980072021484375, -1.035308837890625, -0.9726104736328125, -0.909912109375, -0.8472137451171875, -0.784515380859375, -0.7218170166015625, -0.65911865234375, -0.5964202880859375, -0.533721923828125, -0.4710235595703125, -0.4083251953125, -0.3456268310546875, -0.282928466796875, -0.2202301025390625, -0.15753173828125, -0.0948333740234375, -0.032135009765625, 0.0305633544921875, 0.09326171875, 0.1559600830078125, 0.218658447265625, 0.2813568115234375, 0.34405517578125, 0.4067535400390625, 0.469451904296875, 0.5321502685546875, 0.5948486328125, 0.6575469970703125, 0.720245361328125, 0.7829437255859375, 0.84564208984375, 0.9083404541015625, 0.971038818359375, 1.0337371826171875, 1.096435546875, 1.1591339111328125, 1.221832275390625, 1.2845306396484375, 1.34722900390625, 1.4099273681640625, 1.472625732421875, 1.5353240966796875, 1.5980224609375, 1.6607208251953125, 1.723419189453125, 1.7861175537109375, 1.84881591796875, 1.9115142822265625, 1.974212646484375, 2.0369110107421875, 2.099609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 10.0, 16.0, 20.0, 29.0, 38.0, 58.0, 84.0, 146.0, 215.0, 366.0, 482.0, 841.0, 1423.0, 2371.0, 4365.0, 8279.0, 16225.0, 38475.0, 876541.0, 57108.0, 19937.0, 9621.0, 4968.0, 2777.0, 1611.0, 912.0, 557.0, 330.0, 253.0, 161.0, 87.0, 75.0, 40.0, 33.0, 32.0, 16.0, 13.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19271469116210938, -0.18547821044921875, -0.17824172973632812, -0.1710052490234375, -0.16376876831054688, -0.15653228759765625, -0.14929580688476562, -0.142059326171875, -0.13482284545898438, -0.12758636474609375, -0.12034988403320312, -0.1131134033203125, -0.10587692260742188, -0.09864044189453125, -0.09140396118164062, -0.08416748046875, -0.07693099975585938, -0.06969451904296875, -0.062458038330078125, -0.0552215576171875, -0.047985076904296875, -0.04074859619140625, -0.033512115478515625, -0.026275634765625, -0.019039154052734375, -0.01180267333984375, -0.004566192626953125, 0.0026702880859375, 0.009906768798828125, 0.01714324951171875, 0.024379730224609375, 0.0316162109375, 0.038852691650390625, 0.04608917236328125, 0.053325653076171875, 0.0605621337890625, 0.06779861450195312, 0.07503509521484375, 0.08227157592773438, 0.089508056640625, 0.09674453735351562, 0.10398101806640625, 0.11121749877929688, 0.1184539794921875, 0.12569046020507812, 0.13292694091796875, 0.14016342163085938, 0.14739990234375, 0.15463638305664062, 0.16187286376953125, 0.16910934448242188, 0.1763458251953125, 0.18358230590820312, 0.19081878662109375, 0.19805526733398438, 0.205291748046875, 0.21252822875976562, 0.21976470947265625, 0.22700119018554688, 0.2342376708984375, 0.24147415161132812, 0.24871063232421875, 0.2559471130371094, 0.26318359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 12.0, 9.0, 10.0, 19.0, 13.0, 19.0, 36.0, 34.0, 38.0, 35.0, 40.0, 31.0, 45.0, 46.0, 51.0, 49.0, 56.0, 59.0, 37.0, 55.0, 39.0, 43.0, 34.0, 27.0, 29.0, 33.0, 12.0, 20.0, 7.0, 14.0, 10.0, 11.0, 4.0, 6.0, 10.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835067749023438e-05, -1.8231570720672607e-05, -1.7628073692321777e-05, -1.7024576663970947e-05, -1.6421079635620117e-05, -1.5817582607269287e-05, -1.5214085578918457e-05, -1.4610588550567627e-05, -1.4007091522216797e-05, -1.3403594493865967e-05, -1.2800097465515137e-05, -1.2196600437164307e-05, -1.1593103408813477e-05, -1.0989606380462646e-05, -1.0386109352111816e-05, -9.782612323760986e-06, -9.179115295410156e-06, -8.575618267059326e-06, -7.972121238708496e-06, -7.368624210357666e-06, -6.765127182006836e-06, -6.161630153656006e-06, -5.558133125305176e-06, -4.954636096954346e-06, -4.351139068603516e-06, -3.7476420402526855e-06, -3.1441450119018555e-06, -2.5406479835510254e-06, -1.9371509552001953e-06, -1.3336539268493652e-06, -7.301568984985352e-07, -1.2665987014770508e-07, 4.76837158203125e-07, 1.080334186553955e-06, 1.6838312149047852e-06, 2.2873282432556152e-06, 2.8908252716064453e-06, 3.4943222999572754e-06, 4.0978193283081055e-06, 4.7013163566589355e-06, 5.304813385009766e-06, 5.908310413360596e-06, 6.511807441711426e-06, 7.115304470062256e-06, 7.718801498413086e-06, 8.322298526763916e-06, 8.925795555114746e-06, 9.529292583465576e-06, 1.0132789611816406e-05, 1.0736286640167236e-05, 1.1339783668518066e-05, 1.1943280696868896e-05, 1.2546777725219727e-05, 1.3150274753570557e-05, 1.3753771781921387e-05, 1.4357268810272217e-05, 1.4960765838623047e-05, 1.5564262866973877e-05, 1.6167759895324707e-05, 1.6771256923675537e-05, 1.7374753952026367e-05, 1.7978250980377197e-05, 1.8581748008728027e-05, 1.9185245037078857e-05, 1.9788742065429688e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 12.0, 16.0, 30.0, 20.0, 46.0, 81.0, 91.0, 160.0, 222.0, 346.0, 503.0, 819.0, 1128.0, 1753.0, 2684.0, 4151.0, 6730.0, 10759.0, 18055.0, 30129.0, 51155.0, 86398.0, 139216.0, 190676.0, 182795.0, 126339.0, 78200.0, 46224.0, 26911.0, 16057.0, 9469.0, 6184.0, 3876.0, 2484.0, 1553.0, 1111.0, 722.0, 469.0, 319.0, 222.0, 119.0, 110.0, 77.0, 41.0, 32.0, 18.0, 14.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.07171630859375, -0.06953620910644531, -0.06735610961914062, -0.06517601013183594, -0.06299591064453125, -0.06081581115722656, -0.058635711669921875, -0.05645561218261719, -0.0542755126953125, -0.05209541320800781, -0.049915313720703125, -0.04773521423339844, -0.04555511474609375, -0.04337501525878906, -0.041194915771484375, -0.03901481628417969, -0.036834716796875, -0.03465461730957031, -0.032474517822265625, -0.030294418334960938, -0.02811431884765625, -0.025934219360351562, -0.023754119873046875, -0.021574020385742188, -0.0193939208984375, -0.017213821411132812, -0.015033721923828125, -0.012853622436523438, -0.01067352294921875, -0.008493423461914062, -0.006313323974609375, -0.0041332244873046875, -0.001953125, 0.0002269744873046875, 0.002407073974609375, 0.0045871734619140625, 0.00676727294921875, 0.008947372436523438, 0.011127471923828125, 0.013307571411132812, 0.0154876708984375, 0.017667770385742188, 0.019847869873046875, 0.022027969360351562, 0.02420806884765625, 0.026388168334960938, 0.028568267822265625, 0.030748367309570312, 0.032928466796875, 0.03510856628417969, 0.037288665771484375, 0.03946876525878906, 0.04164886474609375, 0.04382896423339844, 0.046009063720703125, 0.04818916320800781, 0.0503692626953125, 0.05254936218261719, 0.054729461669921875, 0.05690956115722656, 0.05908966064453125, 0.06126976013183594, 0.06344985961914062, 0.06562995910644531, 0.06781005859375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 1.0, 9.0, 2.0, 6.0, 10.0, 11.0, 14.0, 13.0, 17.0, 30.0, 25.0, 25.0, 41.0, 56.0, 51.0, 52.0, 62.0, 75.0, 67.0, 68.0, 62.0, 48.0, 40.0, 36.0, 30.0, 29.0, 19.0, 21.0, 21.0, 9.0, 12.0, 12.0, 5.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017608642578125, -0.016898632049560547, -0.016188621520996094, -0.01547861099243164, -0.014768600463867188, -0.014058589935302734, -0.013348579406738281, -0.012638568878173828, -0.011928558349609375, -0.011218547821044922, -0.010508537292480469, -0.009798526763916016, -0.009088516235351562, -0.00837850570678711, -0.007668495178222656, -0.006958484649658203, -0.00624847412109375, -0.005538463592529297, -0.004828453063964844, -0.004118442535400391, -0.0034084320068359375, -0.0026984214782714844, -0.0019884109497070312, -0.0012784004211425781, -0.000568389892578125, 0.00014162063598632812, 0.0008516311645507812, 0.0015616416931152344, 0.0022716522216796875, 0.0029816627502441406, 0.0036916732788085938, 0.004401683807373047, 0.0051116943359375, 0.005821704864501953, 0.006531715393066406, 0.007241725921630859, 0.007951736450195312, 0.008661746978759766, 0.009371757507324219, 0.010081768035888672, 0.010791778564453125, 0.011501789093017578, 0.012211799621582031, 0.012921810150146484, 0.013631820678710938, 0.01434183120727539, 0.015051841735839844, 0.015761852264404297, 0.01647186279296875, 0.017181873321533203, 0.017891883850097656, 0.01860189437866211, 0.019311904907226562, 0.020021915435791016, 0.02073192596435547, 0.021441936492919922, 0.022151947021484375, 0.022861957550048828, 0.02357196807861328, 0.024281978607177734, 0.024991989135742188, 0.02570199966430664, 0.026412010192871094, 0.027122020721435547, 0.02783203125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 12.0, 11.0, 8.0, 16.0, 15.0, 33.0, 41.0, 33.0, 53.0, 58.0, 67.0, 60.0, 58.0, 74.0, 65.0, 63.0, 47.0, 39.0, 35.0, 44.0, 29.0, 30.0, 13.0, 16.0, 19.0, 8.0, 2.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.321294784545898, -6.150835990905762, -5.980377197265625, -5.809918403625488, -5.639459609985352, -5.469001293182373, -5.298542499542236, -5.1280837059021, -4.957624912261963, -4.787166118621826, -4.6167073249816895, -4.446248531341553, -4.275790214538574, -4.1053314208984375, -3.934872627258301, -3.764413833618164, -3.5939550399780273, -3.4234962463378906, -3.253037452697754, -3.0825788974761963, -2.9121201038360596, -2.741661310195923, -2.5712027549743652, -2.4007439613342285, -2.230285167694092, -2.059826374053955, -1.889367699623108, -1.7189090251922607, -1.548450231552124, -1.3779914379119873, -1.2075327634811401, -1.037074089050293, -0.8666157722473145, -0.6961570382118225, -0.5256983041763306, -0.3552395701408386, -0.18478083610534668, -0.014322102069854736, 0.1561366319656372, 0.3265953063964844, 0.4970541000366211, 0.667512834072113, 0.837971568107605, 1.0084302425384521, 1.1788890361785889, 1.3493478298187256, 1.5198065042495728, 1.69026517868042, 1.8607239723205566, 2.0311827659606934, 2.20164155960083, 2.3721001148223877, 2.5425589084625244, 2.713017702102661, 2.8834762573242188, 3.0539350509643555, 3.224393844604492, 3.394852638244629, 3.5653114318847656, 3.7357699871063232, 3.90622878074646, 4.076687335968018, 4.247146129608154, 4.417604923248291, 4.588063716888428]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 11.0, 8.0, 5.0, 8.0, 20.0, 16.0, 17.0, 28.0, 29.0, 32.0, 34.0, 32.0, 48.0, 32.0, 44.0, 52.0, 39.0, 40.0, 41.0, 42.0, 40.0, 47.0, 41.0, 38.0, 39.0, 30.0, 28.0, 29.0, 23.0, 21.0, 14.0, 8.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0558407306671143, -2.9604074954986572, -2.8649744987487793, -2.7695412635803223, -2.6741080284118652, -2.578674793243408, -2.483241558074951, -2.3878085613250732, -2.292375326156616, -2.196942090988159, -2.1015090942382812, -2.006075859069824, -1.9106426239013672, -1.8152093887329102, -1.7197762727737427, -1.6243431568145752, -1.5289099216461182, -1.4334766864776611, -1.3380435705184937, -1.2426104545593262, -1.1471772193908691, -1.051743984222412, -0.9563108682632446, -0.8608776926994324, -0.7654445171356201, -0.6700113415718079, -0.5745781660079956, -0.47914499044418335, -0.3837118148803711, -0.28827863931655884, -0.19284546375274658, -0.09741228818893433, -0.0019788742065429688, 0.09345430135726929, 0.18888747692108154, 0.2843206524848938, 0.37975382804870605, 0.4751870036125183, 0.5706201791763306, 0.6660533547401428, 0.7614865303039551, 0.8569197058677673, 0.9523528814315796, 1.047785997390747, 1.143219232559204, 1.2386524677276611, 1.3340855836868286, 1.429518699645996, 1.5249519348144531, 1.6203851699829102, 1.7158182859420776, 1.8112514019012451, 1.9066846370697021, 2.002117872238159, 2.097550868988037, 2.192984104156494, 2.288417339324951, 2.383850574493408, 2.4792838096618652, 2.574716806411743, 2.6701500415802, 2.7655832767486572, 2.861016273498535, 2.956449508666992, 3.051882743835449]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 8.0, 13.0, 16.0, 20.0, 37.0, 48.0, 72.0, 86.0, 154.0, 178.0, 289.0, 527.0, 835.0, 1339.0, 2328.0, 4207.0, 7653.0, 14730.0, 28558.0, 56046.0, 104543.0, 173992.0, 219182.0, 186689.0, 116109.0, 62589.0, 31951.0, 16491.0, 8690.0, 4640.0, 2527.0, 1509.0, 871.0, 560.0, 337.0, 231.0, 143.0, 106.0, 60.0, 52.0, 35.0, 23.0, 26.0, 17.0, 9.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.90625, -3.77423095703125, -3.6422119140625, -3.51019287109375, -3.378173828125, -3.24615478515625, -3.1141357421875, -2.98211669921875, -2.85009765625, -2.71807861328125, -2.5860595703125, -2.45404052734375, -2.322021484375, -2.19000244140625, -2.0579833984375, -1.92596435546875, -1.7939453125, -1.66192626953125, -1.5299072265625, -1.39788818359375, -1.265869140625, -1.13385009765625, -1.0018310546875, -0.86981201171875, -0.73779296875, -0.60577392578125, -0.4737548828125, -0.34173583984375, -0.209716796875, -0.07769775390625, 0.0543212890625, 0.18634033203125, 0.318359375, 0.45037841796875, 0.5823974609375, 0.71441650390625, 0.846435546875, 0.97845458984375, 1.1104736328125, 1.24249267578125, 1.37451171875, 1.50653076171875, 1.6385498046875, 1.77056884765625, 1.902587890625, 2.03460693359375, 2.1666259765625, 2.29864501953125, 2.4306640625, 2.56268310546875, 2.6947021484375, 2.82672119140625, 2.958740234375, 3.09075927734375, 3.2227783203125, 3.35479736328125, 3.48681640625, 3.61883544921875, 3.7508544921875, 3.88287353515625, 4.014892578125, 4.14691162109375, 4.2789306640625, 4.41094970703125, 4.54296875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 13.0, 13.0, 7.0, 6.0, 18.0, 15.0, 17.0, 34.0, 32.0, 28.0, 35.0, 44.0, 59.0, 55.0, 49.0, 50.0, 47.0, 44.0, 49.0, 34.0, 37.0, 52.0, 36.0, 36.0, 40.0, 33.0, 23.0, 27.0, 14.0, 11.0, 14.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.702850341796875, -3.58538818359375, -3.467926025390625, -3.3504638671875, -3.233001708984375, -3.11553955078125, -2.998077392578125, -2.880615234375, -2.763153076171875, -2.64569091796875, -2.528228759765625, -2.4107666015625, -2.293304443359375, -2.17584228515625, -2.058380126953125, -1.94091796875, -1.823455810546875, -1.70599365234375, -1.588531494140625, -1.4710693359375, -1.353607177734375, -1.23614501953125, -1.118682861328125, -1.001220703125, -0.883758544921875, -0.76629638671875, -0.648834228515625, -0.5313720703125, -0.413909912109375, -0.29644775390625, -0.178985595703125, -0.0615234375, 0.055938720703125, 0.17340087890625, 0.290863037109375, 0.4083251953125, 0.525787353515625, 0.64324951171875, 0.760711669921875, 0.878173828125, 0.995635986328125, 1.11309814453125, 1.230560302734375, 1.3480224609375, 1.465484619140625, 1.58294677734375, 1.700408935546875, 1.81787109375, 1.935333251953125, 2.05279541015625, 2.170257568359375, 2.2877197265625, 2.405181884765625, 2.52264404296875, 2.640106201171875, 2.757568359375, 2.875030517578125, 2.99249267578125, 3.109954833984375, 3.2274169921875, 3.344879150390625, 3.46234130859375, 3.579803466796875, 3.697265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 14.0, 25.0, 23.0, 34.0, 76.0, 101.0, 162.0, 250.0, 361.0, 585.0, 939.0, 1433.0, 2433.0, 3960.0, 6556.0, 10943.0, 18044.0, 29653.0, 48056.0, 75590.0, 110488.0, 144316.0, 157455.0, 140941.0, 106863.0, 71906.0, 45539.0, 28269.0, 16991.0, 10344.0, 6186.0, 3871.0, 2290.0, 1451.0, 871.0, 564.0, 336.0, 210.0, 134.0, 107.0, 72.0, 42.0, 22.0, 14.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.84906005859375, -2.7489013671875, -2.64874267578125, -2.548583984375, -2.44842529296875, -2.3482666015625, -2.24810791015625, -2.14794921875, -2.04779052734375, -1.9476318359375, -1.84747314453125, -1.747314453125, -1.64715576171875, -1.5469970703125, -1.44683837890625, -1.3466796875, -1.24652099609375, -1.1463623046875, -1.04620361328125, -0.946044921875, -0.84588623046875, -0.7457275390625, -0.64556884765625, -0.54541015625, -0.44525146484375, -0.3450927734375, -0.24493408203125, -0.144775390625, -0.04461669921875, 0.0555419921875, 0.15570068359375, 0.255859375, 0.35601806640625, 0.4561767578125, 0.55633544921875, 0.656494140625, 0.75665283203125, 0.8568115234375, 0.95697021484375, 1.05712890625, 1.15728759765625, 1.2574462890625, 1.35760498046875, 1.457763671875, 1.55792236328125, 1.6580810546875, 1.75823974609375, 1.8583984375, 1.95855712890625, 2.0587158203125, 2.15887451171875, 2.259033203125, 2.35919189453125, 2.4593505859375, 2.55950927734375, 2.65966796875, 2.75982666015625, 2.8599853515625, 2.96014404296875, 3.060302734375, 3.16046142578125, 3.2606201171875, 3.36077880859375, 3.4609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 8.0, 12.0, 9.0, 14.0, 6.0, 21.0, 24.0, 23.0, 24.0, 28.0, 35.0, 32.0, 37.0, 23.0, 39.0, 38.0, 46.0, 35.0, 28.0, 44.0, 42.0, 37.0, 42.0, 35.0, 33.0, 28.0, 32.0, 29.0, 24.0, 21.0, 28.0, 22.0, 18.0, 12.0, 14.0, 9.0, 15.0, 7.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.982421875, -1.9237823486328125, -1.865142822265625, -1.8065032958984375, -1.74786376953125, -1.6892242431640625, -1.630584716796875, -1.5719451904296875, -1.5133056640625, -1.4546661376953125, -1.396026611328125, -1.3373870849609375, -1.27874755859375, -1.2201080322265625, -1.161468505859375, -1.1028289794921875, -1.044189453125, -0.9855499267578125, -0.926910400390625, -0.8682708740234375, -0.80963134765625, -0.7509918212890625, -0.692352294921875, -0.6337127685546875, -0.5750732421875, -0.5164337158203125, -0.457794189453125, -0.3991546630859375, -0.34051513671875, -0.2818756103515625, -0.223236083984375, -0.1645965576171875, -0.10595703125, -0.0473175048828125, 0.011322021484375, 0.0699615478515625, 0.12860107421875, 0.1872406005859375, 0.245880126953125, 0.3045196533203125, 0.3631591796875, 0.4217987060546875, 0.480438232421875, 0.5390777587890625, 0.59771728515625, 0.6563568115234375, 0.714996337890625, 0.7736358642578125, 0.832275390625, 0.8909149169921875, 0.949554443359375, 1.0081939697265625, 1.06683349609375, 1.1254730224609375, 1.184112548828125, 1.2427520751953125, 1.3013916015625, 1.3600311279296875, 1.418670654296875, 1.4773101806640625, 1.53594970703125, 1.5945892333984375, 1.653228759765625, 1.7118682861328125, 1.7705078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 13.0, 17.0, 37.0, 48.0, 71.0, 82.0, 150.0, 212.0, 344.0, 514.0, 786.0, 1230.0, 1936.0, 3103.0, 5057.0, 8283.0, 13801.0, 23330.0, 38852.0, 65703.0, 106052.0, 153532.0, 180513.0, 159449.0, 111562.0, 69333.0, 42114.0, 24414.0, 14730.0, 8815.0, 5416.0, 3258.0, 2064.0, 1306.0, 828.0, 551.0, 345.0, 233.0, 170.0, 83.0, 68.0, 46.0, 35.0, 24.0, 16.0, 9.0, 4.0, 8.0, 2.0, 4.0], "bins": [-1.87890625, -1.8275146484375, -1.776123046875, -1.7247314453125, -1.67333984375, -1.6219482421875, -1.570556640625, -1.5191650390625, -1.4677734375, -1.4163818359375, -1.364990234375, -1.3135986328125, -1.26220703125, -1.2108154296875, -1.159423828125, -1.1080322265625, -1.056640625, -1.0052490234375, -0.953857421875, -0.9024658203125, -0.85107421875, -0.7996826171875, -0.748291015625, -0.6968994140625, -0.6455078125, -0.5941162109375, -0.542724609375, -0.4913330078125, -0.43994140625, -0.3885498046875, -0.337158203125, -0.2857666015625, -0.234375, -0.1829833984375, -0.131591796875, -0.0802001953125, -0.02880859375, 0.0225830078125, 0.073974609375, 0.1253662109375, 0.1767578125, 0.2281494140625, 0.279541015625, 0.3309326171875, 0.38232421875, 0.4337158203125, 0.485107421875, 0.5364990234375, 0.587890625, 0.6392822265625, 0.690673828125, 0.7420654296875, 0.79345703125, 0.8448486328125, 0.896240234375, 0.9476318359375, 0.9990234375, 1.0504150390625, 1.101806640625, 1.1531982421875, 1.20458984375, 1.2559814453125, 1.307373046875, 1.3587646484375, 1.41015625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 13.0, 13.0, 23.0, 21.0, 25.0, 49.0, 53.0, 66.0, 81.0, 77.0, 94.0, 91.0, 68.0, 71.0, 58.0, 51.0, 33.0, 23.0, 22.0, 14.0, 6.0, 11.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.00028824806213378906, -0.0002803876996040344, -0.0002725273370742798, -0.00026466697454452515, -0.0002568066120147705, -0.00024894624948501587, -0.00024108588695526123, -0.0002332255244255066, -0.00022536516189575195, -0.00021750479936599731, -0.00020964443683624268, -0.00020178407430648804, -0.0001939237117767334, -0.00018606334924697876, -0.00017820298671722412, -0.00017034262418746948, -0.00016248226165771484, -0.0001546218991279602, -0.00014676153659820557, -0.00013890117406845093, -0.0001310408115386963, -0.00012318044900894165, -0.00011532008647918701, -0.00010745972394943237, -9.959936141967773e-05, -9.17389988899231e-05, -8.387863636016846e-05, -7.601827383041382e-05, -6.815791130065918e-05, -6.029754877090454e-05, -5.24371862411499e-05, -4.4576823711395264e-05, -3.6716461181640625e-05, -2.8856098651885986e-05, -2.0995736122131348e-05, -1.3135373592376709e-05, -5.27501106262207e-06, 2.5853514671325684e-06, 1.0445713996887207e-05, 1.8306076526641846e-05, 2.6166439056396484e-05, 3.402680158615112e-05, 4.188716411590576e-05, 4.97475266456604e-05, 5.760788917541504e-05, 6.546825170516968e-05, 7.332861423492432e-05, 8.118897676467896e-05, 8.90493392944336e-05, 9.690970182418823e-05, 0.00010477006435394287, 0.00011263042688369751, 0.00012049078941345215, 0.0001283511519432068, 0.00013621151447296143, 0.00014407187700271606, 0.0001519322395324707, 0.00015979260206222534, 0.00016765296459197998, 0.00017551332712173462, 0.00018337368965148926, 0.0001912340521812439, 0.00019909441471099854, 0.00020695477724075317, 0.0002148151397705078]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 10.0, 25.0, 26.0, 50.0, 72.0, 92.0, 158.0, 245.0, 344.0, 517.0, 856.0, 1313.0, 2100.0, 3571.0, 6000.0, 10058.0, 17150.0, 29353.0, 49617.0, 80332.0, 121792.0, 159255.0, 168453.0, 141575.0, 99604.0, 63163.0, 37815.0, 22357.0, 12908.0, 7695.0, 4513.0, 2849.0, 1781.0, 1039.0, 623.0, 409.0, 260.0, 170.0, 129.0, 87.0, 69.0, 36.0, 23.0, 12.0, 17.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.494140625, -1.4477996826171875, -1.401458740234375, -1.3551177978515625, -1.30877685546875, -1.2624359130859375, -1.216094970703125, -1.1697540283203125, -1.1234130859375, -1.0770721435546875, -1.030731201171875, -0.9843902587890625, -0.93804931640625, -0.8917083740234375, -0.845367431640625, -0.7990264892578125, -0.752685546875, -0.7063446044921875, -0.660003662109375, -0.6136627197265625, -0.56732177734375, -0.5209808349609375, -0.474639892578125, -0.4282989501953125, -0.3819580078125, -0.3356170654296875, -0.289276123046875, -0.2429351806640625, -0.19659423828125, -0.1502532958984375, -0.103912353515625, -0.0575714111328125, -0.01123046875, 0.0351104736328125, 0.081451416015625, 0.1277923583984375, 0.17413330078125, 0.2204742431640625, 0.266815185546875, 0.3131561279296875, 0.3594970703125, 0.4058380126953125, 0.452178955078125, 0.4985198974609375, 0.54486083984375, 0.5912017822265625, 0.637542724609375, 0.6838836669921875, 0.730224609375, 0.7765655517578125, 0.822906494140625, 0.8692474365234375, 0.91558837890625, 0.9619293212890625, 1.008270263671875, 1.0546112060546875, 1.1009521484375, 1.1472930908203125, 1.193634033203125, 1.2399749755859375, 1.28631591796875, 1.3326568603515625, 1.378997802734375, 1.4253387451171875, 1.4716796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 4.0, 8.0, 14.0, 16.0, 16.0, 12.0, 23.0, 23.0, 29.0, 33.0, 40.0, 37.0, 45.0, 36.0, 56.0, 60.0, 54.0, 46.0, 35.0, 38.0, 50.0, 40.0, 33.0, 24.0, 43.0, 22.0, 20.0, 22.0, 12.0, 18.0, 16.0, 16.0, 4.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.41796875, -0.40587615966796875, -0.3937835693359375, -0.38169097900390625, -0.369598388671875, -0.35750579833984375, -0.3454132080078125, -0.33332061767578125, -0.32122802734375, -0.30913543701171875, -0.2970428466796875, -0.28495025634765625, -0.272857666015625, -0.26076507568359375, -0.2486724853515625, -0.23657989501953125, -0.2244873046875, -0.21239471435546875, -0.2003021240234375, -0.18820953369140625, -0.176116943359375, -0.16402435302734375, -0.1519317626953125, -0.13983917236328125, -0.12774658203125, -0.11565399169921875, -0.1035614013671875, -0.09146881103515625, -0.079376220703125, -0.06728363037109375, -0.0551910400390625, -0.04309844970703125, -0.031005859375, -0.01891326904296875, -0.0068206787109375, 0.00527191162109375, 0.017364501953125, 0.02945709228515625, 0.0415496826171875, 0.05364227294921875, 0.06573486328125, 0.07782745361328125, 0.0899200439453125, 0.10201263427734375, 0.114105224609375, 0.12619781494140625, 0.1382904052734375, 0.15038299560546875, 0.1624755859375, 0.17456817626953125, 0.1866607666015625, 0.19875335693359375, 0.210845947265625, 0.22293853759765625, 0.2350311279296875, 0.24712371826171875, 0.25921630859375, 0.27130889892578125, 0.2834014892578125, 0.29549407958984375, 0.307586669921875, 0.31967926025390625, 0.3317718505859375, 0.34386444091796875, 0.35595703125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 4.0, 11.0, 15.0, 18.0, 11.0, 30.0, 24.0, 35.0, 47.0, 44.0, 41.0, 48.0, 60.0, 67.0, 61.0, 60.0, 55.0, 52.0, 45.0, 38.0, 39.0, 28.0, 32.0, 20.0, 21.0, 17.0, 9.0, 8.0, 10.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.835660457611084, -5.679697513580322, -5.523734092712402, -5.367771148681641, -5.211808204650879, -5.055845260620117, -4.899881839752197, -4.7439188957214355, -4.587955951690674, -4.431993007659912, -4.276029586791992, -4.1200666427612305, -3.9641036987304688, -3.808140516281128, -3.652177333831787, -3.4962143898010254, -3.3402512073516846, -3.1842880249023438, -3.028325080871582, -2.872361898422241, -2.7163989543914795, -2.5604357719421387, -2.404472827911377, -2.248509645462036, -2.0925464630126953, -1.936583399772644, -1.7806203365325928, -1.624657154083252, -1.4686942100524902, -1.3127310276031494, -1.1567679643630981, -1.0008049011230469, -0.8448419570922852, -0.6888788938522339, -0.5329158306121826, -0.3769527077674866, -0.2209896445274353, -0.06502658128738403, 0.09093654155731201, 0.24689960479736328, 0.40286266803741455, 0.5588257312774658, 0.7147887945175171, 0.8707519173622131, 1.0267150402069092, 1.182677984237671, 1.3386411666870117, 1.494604229927063, 1.6505672931671143, 1.8065303564071655, 1.9624934196472168, 2.1184566020965576, 2.2744195461273193, 2.43038272857666, 2.586345672607422, 2.7423088550567627, 2.8982720375061035, 3.0542352199554443, 3.210198163986206, 3.366161346435547, 3.5221242904663086, 3.6780874729156494, 3.8340506553649902, 3.990013599395752, 4.145976543426514]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 13.0, 7.0, 17.0, 11.0, 24.0, 21.0, 22.0, 36.0, 24.0, 29.0, 50.0, 37.0, 34.0, 49.0, 38.0, 39.0, 40.0, 50.0, 49.0, 49.0, 40.0, 33.0, 42.0, 41.0, 29.0, 30.0, 32.0, 15.0, 15.0, 17.0, 16.0, 12.0, 5.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.170156955718994, -3.067443609237671, -2.9647302627563477, -2.8620171546936035, -2.7593038082122803, -2.656590461730957, -2.553877353668213, -2.4511640071868896, -2.3484506607055664, -2.245737314224243, -2.14302396774292, -2.040310859680176, -1.9375975131988525, -1.8348841667175293, -1.7321709394454956, -1.629457712173462, -1.5267443656921387, -1.4240310192108154, -1.3213177919387817, -1.218604564666748, -1.1158912181854248, -1.0131778717041016, -0.9104646444320679, -0.8077513575553894, -0.7050380706787109, -0.6023247838020325, -0.499611496925354, -0.39689821004867554, -0.29418492317199707, -0.1914716362953186, -0.08875834941864014, 0.01395493745803833, 0.1166682243347168, 0.21938151121139526, 0.32209479808807373, 0.4248080849647522, 0.5275213718414307, 0.6302346587181091, 0.7329479455947876, 0.8356612324714661, 0.9383745193481445, 1.0410878658294678, 1.1438010931015015, 1.2465143203735352, 1.3492276668548584, 1.4519410133361816, 1.5546542406082153, 1.657367467880249, 1.7600808143615723, 1.8627941608428955, 1.9655073881149292, 2.068220615386963, 2.170933961868286, 2.2736473083496094, 2.3763604164123535, 2.4790737628936768, 2.581787109375, 2.6845004558563232, 2.7872138023376465, 2.8899269104003906, 2.992640256881714, 3.095353603363037, 3.1980667114257812, 3.3007800579071045, 3.4034934043884277]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 16.0, 16.0, 43.0, 44.0, 86.0, 111.0, 202.0, 286.0, 484.0, 756.0, 1274.0, 2215.0, 3810.0, 6365.0, 11388.0, 21134.0, 39471.0, 78288.0, 164794.0, 378402.0, 875783.0, 1241154.0, 755101.0, 318865.0, 142245.0, 70221.0, 36453.0, 19397.0, 10816.0, 6202.0, 3603.0, 2109.0, 1197.0, 746.0, 477.0, 229.0, 180.0, 100.0, 66.0, 58.0, 26.0, 17.0, 12.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-5.765625, -5.602783203125, -5.43994140625, -5.277099609375, -5.1142578125, -4.951416015625, -4.78857421875, -4.625732421875, -4.462890625, -4.300048828125, -4.13720703125, -3.974365234375, -3.8115234375, -3.648681640625, -3.48583984375, -3.322998046875, -3.16015625, -2.997314453125, -2.83447265625, -2.671630859375, -2.5087890625, -2.345947265625, -2.18310546875, -2.020263671875, -1.857421875, -1.694580078125, -1.53173828125, -1.368896484375, -1.2060546875, -1.043212890625, -0.88037109375, -0.717529296875, -0.5546875, -0.391845703125, -0.22900390625, -0.066162109375, 0.0966796875, 0.259521484375, 0.42236328125, 0.585205078125, 0.748046875, 0.910888671875, 1.07373046875, 1.236572265625, 1.3994140625, 1.562255859375, 1.72509765625, 1.887939453125, 2.05078125, 2.213623046875, 2.37646484375, 2.539306640625, 2.7021484375, 2.864990234375, 3.02783203125, 3.190673828125, 3.353515625, 3.516357421875, 3.67919921875, 3.842041015625, 4.0048828125, 4.167724609375, 4.33056640625, 4.493408203125, 4.65625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 8.0, 11.0, 16.0, 13.0, 23.0, 19.0, 21.0, 43.0, 42.0, 39.0, 45.0, 37.0, 31.0, 38.0, 37.0, 38.0, 49.0, 46.0, 32.0, 37.0, 45.0, 32.0, 38.0, 30.0, 25.0, 38.0, 28.0, 15.0, 17.0, 16.0, 11.0, 15.0, 14.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.2755126953125, -2.197509765625, -2.1195068359375, -2.04150390625, -1.9635009765625, -1.885498046875, -1.8074951171875, -1.7294921875, -1.6514892578125, -1.573486328125, -1.4954833984375, -1.41748046875, -1.3394775390625, -1.261474609375, -1.1834716796875, -1.10546875, -1.0274658203125, -0.949462890625, -0.8714599609375, -0.79345703125, -0.7154541015625, -0.637451171875, -0.5594482421875, -0.4814453125, -0.4034423828125, -0.325439453125, -0.2474365234375, -0.16943359375, -0.0914306640625, -0.013427734375, 0.0645751953125, 0.142578125, 0.2205810546875, 0.298583984375, 0.3765869140625, 0.45458984375, 0.5325927734375, 0.610595703125, 0.6885986328125, 0.7666015625, 0.8446044921875, 0.922607421875, 1.0006103515625, 1.07861328125, 1.1566162109375, 1.234619140625, 1.3126220703125, 1.390625, 1.4686279296875, 1.546630859375, 1.6246337890625, 1.70263671875, 1.7806396484375, 1.858642578125, 1.9366455078125, 2.0146484375, 2.0926513671875, 2.170654296875, 2.2486572265625, 2.32666015625, 2.4046630859375, 2.482666015625, 2.5606689453125, 2.638671875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 9.0, 11.0, 19.0, 24.0, 27.0, 61.0, 79.0, 141.0, 181.0, 297.0, 431.0, 762.0, 1120.0, 1889.0, 3063.0, 5076.0, 8818.0, 15040.0, 26468.0, 47707.0, 88342.0, 168847.0, 331070.0, 645560.0, 1021185.0, 858423.0, 463513.0, 235836.0, 122099.0, 64387.0, 35416.0, 19837.0, 11300.0, 6691.0, 3947.0, 2438.0, 1568.0, 896.0, 584.0, 389.0, 236.0, 178.0, 90.0, 76.0, 44.0, 38.0, 17.0, 16.0, 11.0, 10.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-5.375, -5.21087646484375, -5.0467529296875, -4.88262939453125, -4.718505859375, -4.55438232421875, -4.3902587890625, -4.22613525390625, -4.06201171875, -3.89788818359375, -3.7337646484375, -3.56964111328125, -3.405517578125, -3.24139404296875, -3.0772705078125, -2.91314697265625, -2.7490234375, -2.58489990234375, -2.4207763671875, -2.25665283203125, -2.092529296875, -1.92840576171875, -1.7642822265625, -1.60015869140625, -1.43603515625, -1.27191162109375, -1.1077880859375, -0.94366455078125, -0.779541015625, -0.61541748046875, -0.4512939453125, -0.28717041015625, -0.123046875, 0.04107666015625, 0.2052001953125, 0.36932373046875, 0.533447265625, 0.69757080078125, 0.8616943359375, 1.02581787109375, 1.18994140625, 1.35406494140625, 1.5181884765625, 1.68231201171875, 1.846435546875, 2.01055908203125, 2.1746826171875, 2.33880615234375, 2.5029296875, 2.66705322265625, 2.8311767578125, 2.99530029296875, 3.159423828125, 3.32354736328125, 3.4876708984375, 3.65179443359375, 3.81591796875, 3.98004150390625, 4.1441650390625, 4.30828857421875, 4.472412109375, 4.63653564453125, 4.8006591796875, 4.96478271484375, 5.12890625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 6.0, 9.0, 7.0, 11.0, 12.0, 11.0, 14.0, 25.0, 35.0, 44.0, 46.0, 61.0, 73.0, 96.0, 118.0, 129.0, 160.0, 175.0, 181.0, 206.0, 219.0, 256.0, 248.0, 267.0, 224.0, 211.0, 183.0, 162.0, 124.0, 129.0, 100.0, 86.0, 75.0, 83.0, 54.0, 46.0, 29.0, 28.0, 28.0, 27.0, 8.0, 21.0, 11.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.345703125, -1.3045654296875, -1.263427734375, -1.2222900390625, -1.18115234375, -1.1400146484375, -1.098876953125, -1.0577392578125, -1.0166015625, -0.9754638671875, -0.934326171875, -0.8931884765625, -0.85205078125, -0.8109130859375, -0.769775390625, -0.7286376953125, -0.6875, -0.6463623046875, -0.605224609375, -0.5640869140625, -0.52294921875, -0.4818115234375, -0.440673828125, -0.3995361328125, -0.3583984375, -0.3172607421875, -0.276123046875, -0.2349853515625, -0.19384765625, -0.1527099609375, -0.111572265625, -0.0704345703125, -0.029296875, 0.0118408203125, 0.052978515625, 0.0941162109375, 0.13525390625, 0.1763916015625, 0.217529296875, 0.2586669921875, 0.2998046875, 0.3409423828125, 0.382080078125, 0.4232177734375, 0.46435546875, 0.5054931640625, 0.546630859375, 0.5877685546875, 0.62890625, 0.6700439453125, 0.711181640625, 0.7523193359375, 0.79345703125, 0.8345947265625, 0.875732421875, 0.9168701171875, 0.9580078125, 0.9991455078125, 1.040283203125, 1.0814208984375, 1.12255859375, 1.1636962890625, 1.204833984375, 1.2459716796875, 1.287109375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 5.0, 5.0, 9.0, 10.0, 10.0, 12.0, 14.0, 23.0, 25.0, 36.0, 36.0, 59.0, 61.0, 66.0, 52.0, 50.0, 71.0, 61.0, 48.0, 59.0, 49.0, 38.0, 34.0, 31.0, 25.0, 26.0, 20.0, 14.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.294163227081299, -6.114944934844971, -5.935727119445801, -5.756508827209473, -5.5772905349731445, -5.398072242736816, -5.218853950500488, -5.039636135101318, -4.86041784286499, -4.681199550628662, -4.501981735229492, -4.322763442993164, -4.143545150756836, -3.964326858520508, -3.785108804702759, -3.6058907508850098, -3.4266724586486816, -3.2474541664123535, -3.0682361125946045, -2.8890180587768555, -2.7097997665405273, -2.530581474304199, -2.35136342048645, -2.172145366668701, -1.992927074432373, -1.8137089014053345, -1.634490728378296, -1.4552725553512573, -1.2760543823242188, -1.0968362092971802, -0.9176180362701416, -0.738399863243103, -0.5591816902160645, -0.3799635171890259, -0.2007453441619873, -0.02152717113494873, 0.15769100189208984, 0.3369091749191284, 0.516127347946167, 0.6953455209732056, 0.8745636940002441, 1.0537818670272827, 1.2330000400543213, 1.4122182130813599, 1.5914363861083984, 1.770654559135437, 1.9498727321624756, 2.1290907859802246, 2.3083090782165527, 2.487527370452881, 2.66674542427063, 2.845963478088379, 3.025181770324707, 3.204400062561035, 3.383618116378784, 3.562836170196533, 3.7420544624328613, 3.9212727546691895, 4.100490570068359, 4.2797088623046875, 4.458927154541016, 4.638145446777344, 4.817363739013672, 4.996581554412842, 5.17579984664917]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 9.0, 9.0, 19.0, 19.0, 16.0, 22.0, 32.0, 31.0, 29.0, 31.0, 38.0, 33.0, 47.0, 50.0, 51.0, 43.0, 51.0, 56.0, 40.0, 52.0, 42.0, 34.0, 32.0, 28.0, 32.0, 28.0, 23.0, 14.0, 18.0, 14.0, 15.0, 10.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8257391452789307, -2.721311092376709, -2.6168832778930664, -2.5124552249908447, -2.408027410507202, -2.3035993576049805, -2.199171543121338, -2.094743490219116, -1.990315556526184, -1.885887622833252, -1.7814596891403198, -1.6770317554473877, -1.572603702545166, -1.4681758880615234, -1.3637478351593018, -1.2593199014663696, -1.1548919677734375, -1.0504640340805054, -0.9460361003875732, -0.8416081070899963, -0.7371801733970642, -0.6327522397041321, -0.5283242464065552, -0.42389631271362305, -0.3194683790206909, -0.2150404304265976, -0.11061248183250427, -0.006184518337249756, 0.09824341535568237, 0.2026713490486145, 0.3070993423461914, 0.41152727603912354, 0.5159552097320557, 0.6203831434249878, 0.7248110771179199, 0.8292390704154968, 0.933667004108429, 1.0380949974060059, 1.142522931098938, 1.2469508647918701, 1.3513787984848022, 1.4558067321777344, 1.5602346658706665, 1.6646625995635986, 1.7690906524658203, 1.873518466949463, 1.9779465198516846, 2.0823745727539062, 2.186802387237549, 2.2912304401397705, 2.395658254623413, 2.5000863075256348, 2.6045141220092773, 2.708942174911499, 2.8133702278137207, 2.9177980422973633, 3.022225856781006, 3.1266539096832275, 3.23108172416687, 3.335509777069092, 3.4399375915527344, 3.544365644454956, 3.6487936973571777, 3.7532215118408203, 3.857649564743042]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 7.0, 15.0, 11.0, 29.0, 19.0, 41.0, 73.0, 95.0, 167.0, 203.0, 349.0, 560.0, 956.0, 1402.0, 2401.0, 3986.0, 7075.0, 12682.0, 23314.0, 43146.0, 82809.0, 153315.0, 228697.0, 210711.0, 128128.0, 68089.0, 36107.0, 19007.0, 10236.0, 6021.0, 3391.0, 2122.0, 1231.0, 746.0, 488.0, 297.0, 205.0, 127.0, 81.0, 53.0, 59.0, 27.0, 21.0, 15.0, 11.0, 4.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0], "bins": [-0.44970703125, -0.4364204406738281, -0.42313385009765625, -0.4098472595214844, -0.3965606689453125, -0.3832740783691406, -0.36998748779296875, -0.3567008972167969, -0.343414306640625, -0.3301277160644531, -0.31684112548828125, -0.3035545349121094, -0.2902679443359375, -0.2769813537597656, -0.26369476318359375, -0.2504081726074219, -0.23712158203125, -0.22383499145507812, -0.21054840087890625, -0.19726181030273438, -0.1839752197265625, -0.17068862915039062, -0.15740203857421875, -0.14411544799804688, -0.130828857421875, -0.11754226684570312, -0.10425567626953125, -0.09096908569335938, -0.0776824951171875, -0.06439590454101562, -0.05110931396484375, -0.037822723388671875, -0.0245361328125, -0.011249542236328125, 0.00203704833984375, 0.015323638916015625, 0.0286102294921875, 0.041896820068359375, 0.05518341064453125, 0.06847000122070312, 0.081756591796875, 0.09504318237304688, 0.10832977294921875, 0.12161636352539062, 0.1349029541015625, 0.14818954467773438, 0.16147613525390625, 0.17476272583007812, 0.18804931640625, 0.20133590698242188, 0.21462249755859375, 0.22790908813476562, 0.2411956787109375, 0.2544822692871094, 0.26776885986328125, 0.2810554504394531, 0.294342041015625, 0.3076286315917969, 0.32091522216796875, 0.3342018127441406, 0.3474884033203125, 0.3607749938964844, 0.37406158447265625, 0.3873481750488281, 0.400634765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 9.0, 20.0, 14.0, 15.0, 20.0, 26.0, 23.0, 34.0, 32.0, 39.0, 39.0, 48.0, 50.0, 48.0, 57.0, 37.0, 47.0, 52.0, 47.0, 37.0, 37.0, 33.0, 39.0, 23.0, 28.0, 26.0, 17.0, 15.0, 10.0, 21.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.31640625, -3.19927978515625, -3.0821533203125, -2.96502685546875, -2.847900390625, -2.73077392578125, -2.6136474609375, -2.49652099609375, -2.37939453125, -2.26226806640625, -2.1451416015625, -2.02801513671875, -1.910888671875, -1.79376220703125, -1.6766357421875, -1.55950927734375, -1.4423828125, -1.32525634765625, -1.2081298828125, -1.09100341796875, -0.973876953125, -0.85675048828125, -0.7396240234375, -0.62249755859375, -0.50537109375, -0.38824462890625, -0.2711181640625, -0.15399169921875, -0.036865234375, 0.08026123046875, 0.1973876953125, 0.31451416015625, 0.431640625, 0.54876708984375, 0.6658935546875, 0.78302001953125, 0.900146484375, 1.01727294921875, 1.1343994140625, 1.25152587890625, 1.36865234375, 1.48577880859375, 1.6029052734375, 1.72003173828125, 1.837158203125, 1.95428466796875, 2.0714111328125, 2.18853759765625, 2.3056640625, 2.42279052734375, 2.5399169921875, 2.65704345703125, 2.774169921875, 2.89129638671875, 3.0084228515625, 3.12554931640625, 3.24267578125, 3.35980224609375, 3.4769287109375, 3.59405517578125, 3.711181640625, 3.82830810546875, 3.9454345703125, 4.06256103515625, 4.1796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 6.0, 19.0, 17.0, 25.0, 35.0, 40.0, 52.0, 96.0, 136.0, 179.0, 275.0, 431.0, 609.0, 1067.0, 1705.0, 2979.0, 5700.0, 11524.0, 26487.0, 182752.0, 740534.0, 41758.0, 15393.0, 7187.0, 3820.0, 2191.0, 1231.0, 747.0, 465.0, 337.0, 203.0, 169.0, 107.0, 72.0, 49.0, 43.0, 24.0, 23.0, 11.0, 4.0, 10.0, 12.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0251617431640625, -0.988800048828125, -0.9524383544921875, -0.91607666015625, -0.8797149658203125, -0.843353271484375, -0.8069915771484375, -0.7706298828125, -0.7342681884765625, -0.697906494140625, -0.6615447998046875, -0.62518310546875, -0.5888214111328125, -0.552459716796875, -0.5160980224609375, -0.479736328125, -0.4433746337890625, -0.407012939453125, -0.3706512451171875, -0.33428955078125, -0.2979278564453125, -0.261566162109375, -0.2252044677734375, -0.1888427734375, -0.1524810791015625, -0.116119384765625, -0.0797576904296875, -0.04339599609375, -0.0070343017578125, 0.029327392578125, 0.0656890869140625, 0.10205078125, 0.1384124755859375, 0.174774169921875, 0.2111358642578125, 0.24749755859375, 0.2838592529296875, 0.320220947265625, 0.3565826416015625, 0.3929443359375, 0.4293060302734375, 0.465667724609375, 0.5020294189453125, 0.53839111328125, 0.5747528076171875, 0.611114501953125, 0.6474761962890625, 0.683837890625, 0.7201995849609375, 0.756561279296875, 0.7929229736328125, 0.82928466796875, 0.8656463623046875, 0.902008056640625, 0.9383697509765625, 0.9747314453125, 1.0110931396484375, 1.047454833984375, 1.0838165283203125, 1.12017822265625, 1.1565399169921875, 1.192901611328125, 1.2292633056640625, 1.265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 4.0, 7.0, 9.0, 13.0, 16.0, 23.0, 26.0, 17.0, 21.0, 23.0, 24.0, 31.0, 31.0, 43.0, 36.0, 33.0, 43.0, 34.0, 36.0, 40.0, 45.0, 31.0, 29.0, 34.0, 36.0, 21.0, 22.0, 33.0, 21.0, 25.0, 27.0, 21.0, 29.0, 14.0, 22.0, 11.0, 10.0, 10.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.884765625, -1.824188232421875, -1.76361083984375, -1.703033447265625, -1.6424560546875, -1.581878662109375, -1.52130126953125, -1.460723876953125, -1.400146484375, -1.339569091796875, -1.27899169921875, -1.218414306640625, -1.1578369140625, -1.097259521484375, -1.03668212890625, -0.976104736328125, -0.91552734375, -0.854949951171875, -0.79437255859375, -0.733795166015625, -0.6732177734375, -0.612640380859375, -0.55206298828125, -0.491485595703125, -0.430908203125, -0.370330810546875, -0.30975341796875, -0.249176025390625, -0.1885986328125, -0.128021240234375, -0.06744384765625, -0.006866455078125, 0.0537109375, 0.114288330078125, 0.17486572265625, 0.235443115234375, 0.2960205078125, 0.356597900390625, 0.41717529296875, 0.477752685546875, 0.538330078125, 0.598907470703125, 0.65948486328125, 0.720062255859375, 0.7806396484375, 0.841217041015625, 0.90179443359375, 0.962371826171875, 1.02294921875, 1.083526611328125, 1.14410400390625, 1.204681396484375, 1.2652587890625, 1.325836181640625, 1.38641357421875, 1.446990966796875, 1.507568359375, 1.568145751953125, 1.62872314453125, 1.689300537109375, 1.7498779296875, 1.810455322265625, 1.87103271484375, 1.931610107421875, 1.9921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 11.0, 20.0, 21.0, 22.0, 33.0, 62.0, 96.0, 130.0, 201.0, 329.0, 599.0, 1273.0, 2577.0, 5747.0, 14199.0, 43392.0, 910998.0, 43654.0, 14214.0, 5740.0, 2471.0, 1180.0, 623.0, 298.0, 220.0, 131.0, 69.0, 71.0, 41.0, 32.0, 15.0, 13.0, 12.0, 13.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.355224609375, -0.3435783386230469, -0.33193206787109375, -0.3202857971191406, -0.3086395263671875, -0.2969932556152344, -0.28534698486328125, -0.2737007141113281, -0.262054443359375, -0.2504081726074219, -0.23876190185546875, -0.22711563110351562, -0.2154693603515625, -0.20382308959960938, -0.19217681884765625, -0.18053054809570312, -0.16888427734375, -0.15723800659179688, -0.14559173583984375, -0.13394546508789062, -0.1222991943359375, -0.11065292358398438, -0.09900665283203125, -0.08736038208007812, -0.075714111328125, -0.06406784057617188, -0.05242156982421875, -0.040775299072265625, -0.0291290283203125, -0.017482757568359375, -0.00583648681640625, 0.005809783935546875, 0.0174560546875, 0.029102325439453125, 0.04074859619140625, 0.052394866943359375, 0.0640411376953125, 0.07568740844726562, 0.08733367919921875, 0.09897994995117188, 0.110626220703125, 0.12227249145507812, 0.13391876220703125, 0.14556503295898438, 0.1572113037109375, 0.16885757446289062, 0.18050384521484375, 0.19215011596679688, 0.20379638671875, 0.21544265747070312, 0.22708892822265625, 0.23873519897460938, 0.2503814697265625, 0.2620277404785156, 0.27367401123046875, 0.2853202819824219, 0.296966552734375, 0.3086128234863281, 0.32025909423828125, 0.3319053649902344, 0.3435516357421875, 0.3551979064941406, 0.36684417724609375, 0.3784904479980469, 0.39013671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 6.0, 4.0, 7.0, 10.0, 7.0, 12.0, 22.0, 21.0, 23.0, 10.0, 31.0, 42.0, 42.0, 42.0, 51.0, 53.0, 47.0, 47.0, 40.0, 44.0, 49.0, 50.0, 41.0, 49.0, 36.0, 28.0, 28.0, 27.0, 25.0, 21.0, 21.0, 10.0, 9.0, 7.0, 8.0, 5.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.919269561767578e-05, -1.848861575126648e-05, -1.7784535884857178e-05, -1.7080456018447876e-05, -1.6376376152038574e-05, -1.5672296285629272e-05, -1.496821641921997e-05, -1.4264136552810669e-05, -1.3560056686401367e-05, -1.2855976819992065e-05, -1.2151896953582764e-05, -1.1447817087173462e-05, -1.074373722076416e-05, -1.0039657354354858e-05, -9.335577487945557e-06, -8.631497621536255e-06, -7.927417755126953e-06, -7.223337888717651e-06, -6.51925802230835e-06, -5.815178155899048e-06, -5.111098289489746e-06, -4.407018423080444e-06, -3.7029385566711426e-06, -2.998858690261841e-06, -2.294778823852539e-06, -1.5906989574432373e-06, -8.866190910339355e-07, -1.825392246246338e-07, 5.21540641784668e-07, 1.2256205081939697e-06, 1.9297003746032715e-06, 2.6337802410125732e-06, 3.337860107421875e-06, 4.041939973831177e-06, 4.7460198402404785e-06, 5.45009970664978e-06, 6.154179573059082e-06, 6.858259439468384e-06, 7.5623393058776855e-06, 8.266419172286987e-06, 8.970499038696289e-06, 9.67457890510559e-06, 1.0378658771514893e-05, 1.1082738637924194e-05, 1.1786818504333496e-05, 1.2490898370742798e-05, 1.31949782371521e-05, 1.3899058103561401e-05, 1.4603137969970703e-05, 1.5307217836380005e-05, 1.6011297702789307e-05, 1.671537756919861e-05, 1.741945743560791e-05, 1.8123537302017212e-05, 1.8827617168426514e-05, 1.9531697034835815e-05, 2.0235776901245117e-05, 2.093985676765442e-05, 2.164393663406372e-05, 2.2348016500473022e-05, 2.3052096366882324e-05, 2.3756176233291626e-05, 2.4460256099700928e-05, 2.516433596611023e-05, 2.586841583251953e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 4.0, 12.0, 11.0, 27.0, 48.0, 61.0, 69.0, 114.0, 172.0, 244.0, 390.0, 620.0, 944.0, 1456.0, 2407.0, 4113.0, 7465.0, 14539.0, 30390.0, 63271.0, 131567.0, 234075.0, 251944.0, 154522.0, 75717.0, 36287.0, 17279.0, 8816.0, 4819.0, 2615.0, 1566.0, 1015.0, 667.0, 418.0, 274.0, 182.0, 134.0, 85.0, 56.0, 40.0, 33.0, 24.0, 21.0, 7.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10455322265625, -0.10108184814453125, -0.0976104736328125, -0.09413909912109375, -0.090667724609375, -0.08719635009765625, -0.0837249755859375, -0.08025360107421875, -0.0767822265625, -0.07331085205078125, -0.0698394775390625, -0.06636810302734375, -0.062896728515625, -0.05942535400390625, -0.0559539794921875, -0.05248260498046875, -0.04901123046875, -0.04553985595703125, -0.0420684814453125, -0.03859710693359375, -0.035125732421875, -0.03165435791015625, -0.0281829833984375, -0.02471160888671875, -0.021240234375, -0.01776885986328125, -0.0142974853515625, -0.01082611083984375, -0.007354736328125, -0.00388336181640625, -0.0004119873046875, 0.00305938720703125, 0.00653076171875, 0.01000213623046875, 0.0134735107421875, 0.01694488525390625, 0.020416259765625, 0.02388763427734375, 0.0273590087890625, 0.03083038330078125, 0.0343017578125, 0.03777313232421875, 0.0412445068359375, 0.04471588134765625, 0.048187255859375, 0.05165863037109375, 0.0551300048828125, 0.05860137939453125, 0.06207275390625, 0.06554412841796875, 0.0690155029296875, 0.07248687744140625, 0.075958251953125, 0.07942962646484375, 0.0829010009765625, 0.08637237548828125, 0.08984375, 0.09331512451171875, 0.0967864990234375, 0.10025787353515625, 0.103729248046875, 0.10720062255859375, 0.1106719970703125, 0.11414337158203125, 0.11761474609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 10.0, 9.0, 11.0, 10.0, 18.0, 24.0, 28.0, 23.0, 31.0, 43.0, 53.0, 70.0, 54.0, 72.0, 70.0, 76.0, 55.0, 50.0, 47.0, 36.0, 37.0, 31.0, 30.0, 19.0, 6.0, 16.0, 14.0, 11.0, 6.0, 4.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.023162841796875, -0.022449970245361328, -0.021737098693847656, -0.021024227142333984, -0.020311355590820312, -0.01959848403930664, -0.01888561248779297, -0.018172740936279297, -0.017459869384765625, -0.016746997833251953, -0.01603412628173828, -0.01532125473022461, -0.014608383178710938, -0.013895511627197266, -0.013182640075683594, -0.012469768524169922, -0.01175689697265625, -0.011044025421142578, -0.010331153869628906, -0.009618282318115234, -0.008905410766601562, -0.00819253921508789, -0.007479667663574219, -0.006766796112060547, -0.006053924560546875, -0.005341053009033203, -0.004628181457519531, -0.003915309906005859, -0.0032024383544921875, -0.0024895668029785156, -0.0017766952514648438, -0.0010638236999511719, -0.0003509521484375, 0.0003619194030761719, 0.0010747909545898438, 0.0017876625061035156, 0.0025005340576171875, 0.0032134056091308594, 0.003926277160644531, 0.004639148712158203, 0.005352020263671875, 0.006064891815185547, 0.006777763366699219, 0.007490634918212891, 0.008203506469726562, 0.008916378021240234, 0.009629249572753906, 0.010342121124267578, 0.01105499267578125, 0.011767864227294922, 0.012480735778808594, 0.013193607330322266, 0.013906478881835938, 0.01461935043334961, 0.015332221984863281, 0.016045093536376953, 0.016757965087890625, 0.017470836639404297, 0.01818370819091797, 0.01889657974243164, 0.019609451293945312, 0.020322322845458984, 0.021035194396972656, 0.021748065948486328, 0.0224609375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 7.0, 8.0, 9.0, 11.0, 12.0, 17.0, 22.0, 26.0, 38.0, 44.0, 54.0, 59.0, 62.0, 55.0, 58.0, 64.0, 62.0, 47.0, 60.0, 43.0, 42.0, 34.0, 29.0, 24.0, 26.0, 18.0, 13.0, 6.0, 14.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.235409736633301, -6.057042121887207, -5.878674507141113, -5.7003068923950195, -5.521938800811768, -5.343571186065674, -5.16520357131958, -4.986835956573486, -4.808467864990234, -4.630100250244141, -4.451732635498047, -4.273365020751953, -4.094996929168701, -3.9166293144226074, -3.7382616996765137, -3.55989408493042, -3.381526470184326, -3.2031588554382324, -3.0247910022735596, -2.846423387527466, -2.668055534362793, -2.489687919616699, -2.3113203048706055, -2.1329526901245117, -1.9545848369598389, -1.7762171030044556, -1.5978493690490723, -1.4194817543029785, -1.2411140203475952, -1.062746286392212, -0.8843786716461182, -0.7060109376907349, -0.5276436805725098, -0.34927597641944885, -0.17090827226638794, 0.007459402084350586, 0.1858271360397339, 0.3641948699951172, 0.5425624847412109, 0.7209302186965942, 0.8992979526519775, 1.0776656866073608, 1.2560334205627441, 1.434401035308838, 1.6127687692642212, 1.7911365032196045, 1.9695041179656982, 2.147871971130371, 2.326239585876465, 2.5046072006225586, 2.6829750537872314, 2.861342668533325, 3.039710521697998, 3.218078136444092, 3.3964457511901855, 3.5748133659362793, 3.753181219100952, 3.931548833847046, 4.109916687011719, 4.2882843017578125, 4.466651916503906, 4.64501953125, 4.823387145996094, 5.001755237579346, 5.1801228523254395]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 9.0, 18.0, 19.0, 16.0, 24.0, 31.0, 34.0, 26.0, 31.0, 38.0, 33.0, 49.0, 51.0, 48.0, 44.0, 52.0, 52.0, 43.0, 51.0, 45.0, 32.0, 31.0, 28.0, 35.0, 27.0, 20.0, 14.0, 18.0, 16.0, 14.0, 9.0, 5.0, 9.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8157401084899902, -2.711730480194092, -2.6077210903167725, -2.503711462020874, -2.3997018337249756, -2.2956924438476562, -2.191682815551758, -2.0876731872558594, -1.983663558959961, -1.879654049873352, -1.7756444215774536, -1.6716349124908447, -1.5676252841949463, -1.4636157751083374, -1.3596062660217285, -1.25559663772583, -1.1515871286392212, -1.0475776195526123, -0.9435679912567139, -0.839558482170105, -0.7355488538742065, -0.6315393447875977, -0.527529776096344, -0.42352020740509033, -0.31951063871383667, -0.215501070022583, -0.11149151623249054, -0.007481962442398071, 0.09652760624885559, 0.20053714513778687, 0.3045467138290405, 0.4085562825202942, 0.5125658512115479, 0.6165754199028015, 0.7205849885940552, 0.8245944976806641, 0.9286041259765625, 1.0326136350631714, 1.1366231441497803, 1.2406327724456787, 1.3446424007415771, 1.448651909828186, 1.5526615381240845, 1.6566710472106934, 1.7606806755065918, 1.8646901845932007, 1.9686996936798096, 2.072709321975708, 2.1767187118530273, 2.280728340148926, 2.384737730026245, 2.4887473583221436, 2.592756986618042, 2.6967663764953613, 2.8007760047912598, 2.904785633087158, 3.0087952613830566, 3.112804889678955, 3.2168142795562744, 3.320823907852173, 3.4248335361480713, 3.5288429260253906, 3.632852554321289, 3.7368621826171875, 3.840871810913086]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 12.0, 20.0, 24.0, 40.0, 53.0, 90.0, 125.0, 227.0, 332.0, 529.0, 873.0, 1415.0, 2474.0, 4032.0, 6827.0, 12076.0, 20930.0, 36091.0, 61282.0, 97814.0, 142192.0, 173167.0, 164146.0, 124003.0, 81323.0, 49345.0, 29206.0, 16275.0, 9745.0, 5517.0, 3275.0, 1987.0, 1169.0, 726.0, 455.0, 291.0, 172.0, 111.0, 64.0, 46.0, 23.0, 23.0, 14.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.790924072265625, -3.67169189453125, -3.552459716796875, -3.4332275390625, -3.313995361328125, -3.19476318359375, -3.075531005859375, -2.956298828125, -2.837066650390625, -2.71783447265625, -2.598602294921875, -2.4793701171875, -2.360137939453125, -2.24090576171875, -2.121673583984375, -2.00244140625, -1.883209228515625, -1.76397705078125, -1.644744873046875, -1.5255126953125, -1.406280517578125, -1.28704833984375, -1.167816162109375, -1.048583984375, -0.929351806640625, -0.81011962890625, -0.690887451171875, -0.5716552734375, -0.452423095703125, -0.33319091796875, -0.213958740234375, -0.0947265625, 0.024505615234375, 0.14373779296875, 0.262969970703125, 0.3822021484375, 0.501434326171875, 0.62066650390625, 0.739898681640625, 0.859130859375, 0.978363037109375, 1.09759521484375, 1.216827392578125, 1.3360595703125, 1.455291748046875, 1.57452392578125, 1.693756103515625, 1.81298828125, 1.932220458984375, 2.05145263671875, 2.170684814453125, 2.2899169921875, 2.409149169921875, 2.52838134765625, 2.647613525390625, 2.766845703125, 2.886077880859375, 3.00531005859375, 3.124542236328125, 3.2437744140625, 3.363006591796875, 3.48223876953125, 3.601470947265625, 3.720703125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 9.0, 3.0, 8.0, 11.0, 14.0, 18.0, 18.0, 26.0, 29.0, 30.0, 21.0, 38.0, 52.0, 40.0, 43.0, 55.0, 54.0, 55.0, 34.0, 51.0, 47.0, 43.0, 45.0, 31.0, 20.0, 28.0, 26.0, 31.0, 24.0, 12.0, 24.0, 14.0, 14.0, 8.0, 2.0, 4.0, 3.0, 6.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.86016845703125, -2.7437744140625, -2.62738037109375, -2.510986328125, -2.39459228515625, -2.2781982421875, -2.16180419921875, -2.04541015625, -1.92901611328125, -1.8126220703125, -1.69622802734375, -1.579833984375, -1.46343994140625, -1.3470458984375, -1.23065185546875, -1.1142578125, -0.99786376953125, -0.8814697265625, -0.76507568359375, -0.648681640625, -0.53228759765625, -0.4158935546875, -0.29949951171875, -0.18310546875, -0.06671142578125, 0.0496826171875, 0.16607666015625, 0.282470703125, 0.39886474609375, 0.5152587890625, 0.63165283203125, 0.748046875, 0.86444091796875, 0.9808349609375, 1.09722900390625, 1.213623046875, 1.33001708984375, 1.4464111328125, 1.56280517578125, 1.67919921875, 1.79559326171875, 1.9119873046875, 2.02838134765625, 2.144775390625, 2.26116943359375, 2.3775634765625, 2.49395751953125, 2.6103515625, 2.72674560546875, 2.8431396484375, 2.95953369140625, 3.075927734375, 3.19232177734375, 3.3087158203125, 3.42510986328125, 3.54150390625, 3.65789794921875, 3.7742919921875, 3.89068603515625, 4.007080078125, 4.12347412109375, 4.2398681640625, 4.35626220703125, 4.47265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 12.0, 20.0, 26.0, 28.0, 43.0, 65.0, 85.0, 154.0, 245.0, 349.0, 523.0, 774.0, 1231.0, 1861.0, 2889.0, 4620.0, 7302.0, 11528.0, 18090.0, 28905.0, 44232.0, 65097.0, 92252.0, 119702.0, 136225.0, 134579.0, 114807.0, 87747.0, 61337.0, 40765.0, 26589.0, 17063.0, 10668.0, 6680.0, 4378.0, 2692.0, 1714.0, 1159.0, 716.0, 467.0, 294.0, 223.0, 137.0, 88.0, 58.0, 43.0, 33.0, 17.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0], "bins": [-3.322265625, -3.22430419921875, -3.1263427734375, -3.02838134765625, -2.930419921875, -2.83245849609375, -2.7344970703125, -2.63653564453125, -2.53857421875, -2.44061279296875, -2.3426513671875, -2.24468994140625, -2.146728515625, -2.04876708984375, -1.9508056640625, -1.85284423828125, -1.7548828125, -1.65692138671875, -1.5589599609375, -1.46099853515625, -1.363037109375, -1.26507568359375, -1.1671142578125, -1.06915283203125, -0.97119140625, -0.87322998046875, -0.7752685546875, -0.67730712890625, -0.579345703125, -0.48138427734375, -0.3834228515625, -0.28546142578125, -0.1875, -0.08953857421875, 0.0084228515625, 0.10638427734375, 0.204345703125, 0.30230712890625, 0.4002685546875, 0.49822998046875, 0.59619140625, 0.69415283203125, 0.7921142578125, 0.89007568359375, 0.988037109375, 1.08599853515625, 1.1839599609375, 1.28192138671875, 1.3798828125, 1.47784423828125, 1.5758056640625, 1.67376708984375, 1.771728515625, 1.86968994140625, 1.9676513671875, 2.06561279296875, 2.16357421875, 2.26153564453125, 2.3594970703125, 2.45745849609375, 2.555419921875, 2.65338134765625, 2.7513427734375, 2.84930419921875, 2.947265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 9.0, 9.0, 10.0, 10.0, 20.0, 11.0, 26.0, 25.0, 25.0, 23.0, 24.0, 40.0, 33.0, 37.0, 40.0, 54.0, 41.0, 52.0, 37.0, 45.0, 40.0, 45.0, 44.0, 34.0, 28.0, 37.0, 25.0, 25.0, 26.0, 23.0, 15.0, 19.0, 17.0, 10.0, 7.0, 9.0, 4.0, 3.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.00927734375, -1.9462890625, -1.88330078125, -1.8203125, -1.75732421875, -1.6943359375, -1.63134765625, -1.568359375, -1.50537109375, -1.4423828125, -1.37939453125, -1.31640625, -1.25341796875, -1.1904296875, -1.12744140625, -1.064453125, -1.00146484375, -0.9384765625, -0.87548828125, -0.8125, -0.74951171875, -0.6865234375, -0.62353515625, -0.560546875, -0.49755859375, -0.4345703125, -0.37158203125, -0.30859375, -0.24560546875, -0.1826171875, -0.11962890625, -0.056640625, 0.00634765625, 0.0693359375, 0.13232421875, 0.1953125, 0.25830078125, 0.3212890625, 0.38427734375, 0.447265625, 0.51025390625, 0.5732421875, 0.63623046875, 0.69921875, 0.76220703125, 0.8251953125, 0.88818359375, 0.951171875, 1.01416015625, 1.0771484375, 1.14013671875, 1.203125, 1.26611328125, 1.3291015625, 1.39208984375, 1.455078125, 1.51806640625, 1.5810546875, 1.64404296875, 1.70703125, 1.77001953125, 1.8330078125, 1.89599609375, 1.958984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 7.0, 12.0, 11.0, 10.0, 14.0, 32.0, 34.0, 45.0, 81.0, 124.0, 157.0, 217.0, 401.0, 606.0, 988.0, 1742.0, 3163.0, 5625.0, 10762.0, 21424.0, 44809.0, 96186.0, 184453.0, 255022.0, 205278.0, 111501.0, 53145.0, 25262.0, 12495.0, 6380.0, 3491.0, 1999.0, 1111.0, 709.0, 422.0, 250.0, 185.0, 121.0, 75.0, 60.0, 43.0, 29.0, 25.0, 15.0, 6.0, 8.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.046875, -2.94732666015625, -2.8477783203125, -2.74822998046875, -2.648681640625, -2.54913330078125, -2.4495849609375, -2.35003662109375, -2.25048828125, -2.15093994140625, -2.0513916015625, -1.95184326171875, -1.852294921875, -1.75274658203125, -1.6531982421875, -1.55364990234375, -1.4541015625, -1.35455322265625, -1.2550048828125, -1.15545654296875, -1.055908203125, -0.95635986328125, -0.8568115234375, -0.75726318359375, -0.65771484375, -0.55816650390625, -0.4586181640625, -0.35906982421875, -0.259521484375, -0.15997314453125, -0.0604248046875, 0.03912353515625, 0.138671875, 0.23822021484375, 0.3377685546875, 0.43731689453125, 0.536865234375, 0.63641357421875, 0.7359619140625, 0.83551025390625, 0.93505859375, 1.03460693359375, 1.1341552734375, 1.23370361328125, 1.333251953125, 1.43280029296875, 1.5323486328125, 1.63189697265625, 1.7314453125, 1.83099365234375, 1.9305419921875, 2.03009033203125, 2.129638671875, 2.22918701171875, 2.3287353515625, 2.42828369140625, 2.52783203125, 2.62738037109375, 2.7269287109375, 2.82647705078125, 2.926025390625, 3.02557373046875, 3.1251220703125, 3.22467041015625, 3.32421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 9.0, 5.0, 12.0, 11.0, 9.0, 29.0, 22.0, 29.0, 25.0, 44.0, 55.0, 46.0, 62.0, 68.0, 64.0, 61.0, 50.0, 56.0, 65.0, 50.0, 28.0, 29.0, 26.0, 35.0, 25.0, 17.0, 15.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00030684471130371094, -0.00029884278774261475, -0.00029084086418151855, -0.00028283894062042236, -0.00027483701705932617, -0.00026683509349823, -0.0002588331699371338, -0.0002508312463760376, -0.0002428293228149414, -0.00023482739925384521, -0.00022682547569274902, -0.00021882355213165283, -0.00021082162857055664, -0.00020281970500946045, -0.00019481778144836426, -0.00018681585788726807, -0.00017881393432617188, -0.00017081201076507568, -0.0001628100872039795, -0.0001548081636428833, -0.0001468062400817871, -0.00013880431652069092, -0.00013080239295959473, -0.00012280046939849854, -0.00011479854583740234, -0.00010679662227630615, -9.879469871520996e-05, -9.079277515411377e-05, -8.279085159301758e-05, -7.478892803192139e-05, -6.67870044708252e-05, -5.8785080909729004e-05, -5.078315734863281e-05, -4.278123378753662e-05, -3.477931022644043e-05, -2.6777386665344238e-05, -1.8775463104248047e-05, -1.0773539543151855e-05, -2.771615982055664e-06, 5.230307579040527e-06, 1.3232231140136719e-05, 2.123415470123291e-05, 2.92360782623291e-05, 3.723800182342529e-05, 4.5239925384521484e-05, 5.3241848945617676e-05, 6.124377250671387e-05, 6.924569606781006e-05, 7.724761962890625e-05, 8.524954319000244e-05, 9.325146675109863e-05, 0.00010125339031219482, 0.00010925531387329102, 0.00011725723743438721, 0.0001252591609954834, 0.0001332610845565796, 0.00014126300811767578, 0.00014926493167877197, 0.00015726685523986816, 0.00016526877880096436, 0.00017327070236206055, 0.00018127262592315674, 0.00018927454948425293, 0.00019727647304534912, 0.0002052783966064453]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 4.0, 9.0, 8.0, 20.0, 37.0, 40.0, 73.0, 105.0, 137.0, 196.0, 286.0, 400.0, 670.0, 910.0, 1323.0, 2050.0, 3372.0, 5287.0, 8774.0, 14711.0, 24881.0, 42966.0, 72442.0, 116576.0, 162893.0, 179438.0, 152219.0, 103734.0, 63055.0, 36560.0, 21576.0, 12761.0, 7594.0, 4787.0, 2942.0, 1956.0, 1276.0, 834.0, 535.0, 378.0, 227.0, 159.0, 107.0, 85.0, 52.0, 37.0, 28.0, 14.0, 8.0, 8.0, 6.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.021484375, -1.95703125, -1.892578125, -1.828125, -1.763671875, -1.69921875, -1.634765625, -1.5703125, -1.505859375, -1.44140625, -1.376953125, -1.3125, -1.248046875, -1.18359375, -1.119140625, -1.0546875, -0.990234375, -0.92578125, -0.861328125, -0.796875, -0.732421875, -0.66796875, -0.603515625, -0.5390625, -0.474609375, -0.41015625, -0.345703125, -0.28125, -0.216796875, -0.15234375, -0.087890625, -0.0234375, 0.041015625, 0.10546875, 0.169921875, 0.234375, 0.298828125, 0.36328125, 0.427734375, 0.4921875, 0.556640625, 0.62109375, 0.685546875, 0.75, 0.814453125, 0.87890625, 0.943359375, 1.0078125, 1.072265625, 1.13671875, 1.201171875, 1.265625, 1.330078125, 1.39453125, 1.458984375, 1.5234375, 1.587890625, 1.65234375, 1.716796875, 1.78125, 1.845703125, 1.91015625, 1.974609375, 2.0390625, 2.103515625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 11.0, 21.0, 15.0, 27.0, 30.0, 37.0, 44.0, 43.0, 50.0, 55.0, 64.0, 46.0, 46.0, 67.0, 53.0, 49.0, 47.0, 34.0, 28.0, 24.0, 26.0, 16.0, 30.0, 18.0, 11.0, 8.0, 15.0, 7.0, 2.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.48014068603515625, -0.4622344970703125, -0.44432830810546875, -0.426422119140625, -0.40851593017578125, -0.3906097412109375, -0.37270355224609375, -0.35479736328125, -0.33689117431640625, -0.3189849853515625, -0.30107879638671875, -0.283172607421875, -0.26526641845703125, -0.2473602294921875, -0.22945404052734375, -0.2115478515625, -0.19364166259765625, -0.1757354736328125, -0.15782928466796875, -0.139923095703125, -0.12201690673828125, -0.1041107177734375, -0.08620452880859375, -0.06829833984375, -0.05039215087890625, -0.0324859619140625, -0.01457977294921875, 0.003326416015625, 0.02123260498046875, 0.0391387939453125, 0.05704498291015625, 0.074951171875, 0.09285736083984375, 0.1107635498046875, 0.12866973876953125, 0.146575927734375, 0.16448211669921875, 0.1823883056640625, 0.20029449462890625, 0.21820068359375, 0.23610687255859375, 0.2540130615234375, 0.27191925048828125, 0.289825439453125, 0.30773162841796875, 0.3256378173828125, 0.34354400634765625, 0.3614501953125, 0.37935638427734375, 0.3972625732421875, 0.41516876220703125, 0.433074951171875, 0.45098114013671875, 0.4688873291015625, 0.48679351806640625, 0.50469970703125, 0.5226058959960938, 0.5405120849609375, 0.5584182739257812, 0.576324462890625, 0.5942306518554688, 0.6121368408203125, 0.6300430297851562, 0.64794921875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 4.0, 10.0, 3.0, 8.0, 9.0, 20.0, 28.0, 24.0, 27.0, 48.0, 41.0, 55.0, 79.0, 61.0, 67.0, 68.0, 63.0, 54.0, 54.0, 52.0, 45.0, 29.0, 30.0, 33.0, 20.0, 13.0, 11.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.87745475769043, -6.682534217834473, -6.487614154815674, -6.292694091796875, -6.097773551940918, -5.902853012084961, -5.707932949066162, -5.513012886047363, -5.318092346191406, -5.123171806335449, -4.92825174331665, -4.733331680297852, -4.5384111404418945, -4.3434906005859375, -4.148570537567139, -3.9536502361297607, -3.758729934692383, -3.563809633255005, -3.368889331817627, -3.173969030380249, -2.979048728942871, -2.784128427505493, -2.5892081260681152, -2.3942878246307373, -2.1993675231933594, -2.0044472217559814, -1.8095269203186035, -1.6146066188812256, -1.4196863174438477, -1.2247660160064697, -1.0298457145690918, -0.8349254131317139, -0.6400055885314941, -0.4450852870941162, -0.2501649856567383, -0.05524468421936035, 0.13967561721801758, 0.3345959186553955, 0.5295162200927734, 0.7244365215301514, 0.9193568229675293, 1.1142771244049072, 1.3091974258422852, 1.504117727279663, 1.699038028717041, 1.893958330154419, 2.088878631591797, 2.283798933029175, 2.4787192344665527, 2.6736395359039307, 2.8685598373413086, 3.0634801387786865, 3.2584004402160645, 3.4533207416534424, 3.6482410430908203, 3.8431613445281982, 4.038081645965576, 4.233001708984375, 4.427922248840332, 4.622842788696289, 4.817762851715088, 5.012682914733887, 5.207603454589844, 5.402523994445801, 5.5974440574646]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 1.0, 5.0, 8.0, 8.0, 7.0, 8.0, 14.0, 18.0, 20.0, 23.0, 22.0, 26.0, 30.0, 39.0, 40.0, 34.0, 46.0, 46.0, 40.0, 53.0, 39.0, 41.0, 51.0, 38.0, 49.0, 48.0, 37.0, 22.0, 33.0, 32.0, 17.0, 22.0, 18.0, 11.0, 7.0, 11.0, 16.0, 7.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7863235473632812, -2.684755325317383, -2.5831868648529053, -2.481618642807007, -2.3800504207611084, -2.278481960296631, -2.1769137382507324, -2.075345516204834, -1.973777174949646, -1.872208833694458, -1.7706406116485596, -1.6690722703933716, -1.5675039291381836, -1.4659357070922852, -1.3643673658370972, -1.2627990245819092, -1.1612308025360107, -1.0596624612808228, -0.9580942392349243, -0.8565258979797363, -0.7549576163291931, -0.6533893346786499, -0.5518209934234619, -0.4502527117729187, -0.3486844301223755, -0.24711613357067108, -0.14554783701896667, -0.043979525566101074, 0.05758875608444214, 0.15915703773498535, 0.26072537899017334, 0.36229366064071655, 0.46386218070983887, 0.5654304623603821, 0.6669987440109253, 0.7685670852661133, 0.8701353669166565, 0.9717036485671997, 1.0732719898223877, 1.1748402118682861, 1.2764085531234741, 1.377976894378662, 1.4795451164245605, 1.5811134576797485, 1.6826817989349365, 1.784250020980835, 1.885818362236023, 1.987386703491211, 2.0889549255371094, 2.190523147583008, 2.2920916080474854, 2.393659830093384, 2.4952280521392822, 2.5967965126037598, 2.698364734649658, 2.7999329566955566, 2.901501178741455, 3.0030694007873535, 3.104637861251831, 3.2062060832977295, 3.307774305343628, 3.4093427658081055, 3.510910987854004, 3.6124792098999023, 3.71404767036438]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 11.0, 19.0, 40.0, 50.0, 80.0, 95.0, 177.0, 304.0, 451.0, 689.0, 1173.0, 1966.0, 3338.0, 5759.0, 10773.0, 19930.0, 38882.0, 80806.0, 180652.0, 443372.0, 1048086.0, 1265552.0, 629651.0, 248653.0, 107323.0, 50746.0, 25285.0, 13305.0, 7206.0, 3990.0, 2330.0, 1407.0, 833.0, 519.0, 312.0, 166.0, 127.0, 78.0, 52.0, 28.0, 19.0, 18.0, 10.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.65625, -6.4615478515625, -6.266845703125, -6.0721435546875, -5.87744140625, -5.6827392578125, -5.488037109375, -5.2933349609375, -5.0986328125, -4.9039306640625, -4.709228515625, -4.5145263671875, -4.31982421875, -4.1251220703125, -3.930419921875, -3.7357177734375, -3.541015625, -3.3463134765625, -3.151611328125, -2.9569091796875, -2.76220703125, -2.5675048828125, -2.372802734375, -2.1781005859375, -1.9833984375, -1.7886962890625, -1.593994140625, -1.3992919921875, -1.20458984375, -1.0098876953125, -0.815185546875, -0.6204833984375, -0.42578125, -0.2310791015625, -0.036376953125, 0.1583251953125, 0.35302734375, 0.5477294921875, 0.742431640625, 0.9371337890625, 1.1318359375, 1.3265380859375, 1.521240234375, 1.7159423828125, 1.91064453125, 2.1053466796875, 2.300048828125, 2.4947509765625, 2.689453125, 2.8841552734375, 3.078857421875, 3.2735595703125, 3.46826171875, 3.6629638671875, 3.857666015625, 4.0523681640625, 4.2470703125, 4.4417724609375, 4.636474609375, 4.8311767578125, 5.02587890625, 5.2205810546875, 5.415283203125, 5.6099853515625, 5.8046875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 8.0, 7.0, 9.0, 11.0, 19.0, 10.0, 17.0, 18.0, 18.0, 23.0, 29.0, 29.0, 32.0, 36.0, 36.0, 30.0, 44.0, 35.0, 41.0, 48.0, 49.0, 39.0, 48.0, 39.0, 29.0, 43.0, 31.0, 22.0, 29.0, 24.0, 22.0, 20.0, 15.0, 12.0, 16.0, 5.0, 5.0, 14.0, 5.0, 2.0, 1.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.498046875, -2.420623779296875, -2.34320068359375, -2.265777587890625, -2.1883544921875, -2.110931396484375, -2.03350830078125, -1.956085205078125, -1.878662109375, -1.801239013671875, -1.72381591796875, -1.646392822265625, -1.5689697265625, -1.491546630859375, -1.41412353515625, -1.336700439453125, -1.25927734375, -1.181854248046875, -1.10443115234375, -1.027008056640625, -0.9495849609375, -0.872161865234375, -0.79473876953125, -0.717315673828125, -0.639892578125, -0.562469482421875, -0.48504638671875, -0.407623291015625, -0.3302001953125, -0.252777099609375, -0.17535400390625, -0.097930908203125, -0.0205078125, 0.056915283203125, 0.13433837890625, 0.211761474609375, 0.2891845703125, 0.366607666015625, 0.44403076171875, 0.521453857421875, 0.598876953125, 0.676300048828125, 0.75372314453125, 0.831146240234375, 0.9085693359375, 0.985992431640625, 1.06341552734375, 1.140838623046875, 1.21826171875, 1.295684814453125, 1.37310791015625, 1.450531005859375, 1.5279541015625, 1.605377197265625, 1.68280029296875, 1.760223388671875, 1.837646484375, 1.915069580078125, 1.99249267578125, 2.069915771484375, 2.1473388671875, 2.224761962890625, 2.30218505859375, 2.379608154296875, 2.45703125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 16.0, 25.0, 33.0, 72.0, 99.0, 150.0, 227.0, 428.0, 812.0, 1431.0, 2934.0, 6001.0, 12799.0, 28523.0, 68899.0, 176384.0, 474941.0, 1196802.0, 1323308.0, 554368.0, 205584.0, 79689.0, 32864.0, 14430.0, 6668.0, 3138.0, 1616.0, 885.0, 440.0, 276.0, 150.0, 106.0, 62.0, 39.0, 31.0, 12.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.833984375, -8.55859375, -8.283203125, -8.0078125, -7.732421875, -7.45703125, -7.181640625, -6.90625, -6.630859375, -6.35546875, -6.080078125, -5.8046875, -5.529296875, -5.25390625, -4.978515625, -4.703125, -4.427734375, -4.15234375, -3.876953125, -3.6015625, -3.326171875, -3.05078125, -2.775390625, -2.5, -2.224609375, -1.94921875, -1.673828125, -1.3984375, -1.123046875, -0.84765625, -0.572265625, -0.296875, -0.021484375, 0.25390625, 0.529296875, 0.8046875, 1.080078125, 1.35546875, 1.630859375, 1.90625, 2.181640625, 2.45703125, 2.732421875, 3.0078125, 3.283203125, 3.55859375, 3.833984375, 4.109375, 4.384765625, 4.66015625, 4.935546875, 5.2109375, 5.486328125, 5.76171875, 6.037109375, 6.3125, 6.587890625, 6.86328125, 7.138671875, 7.4140625, 7.689453125, 7.96484375, 8.240234375, 8.515625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 1.0, 4.0, 5.0, 13.0, 14.0, 23.0, 38.0, 51.0, 61.0, 83.0, 127.0, 164.0, 177.0, 221.0, 285.0, 318.0, 394.0, 319.0, 345.0, 302.0, 259.0, 198.0, 159.0, 118.0, 105.0, 75.0, 74.0, 49.0, 32.0, 20.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7333984375, -1.6670379638671875, -1.600677490234375, -1.5343170166015625, -1.46795654296875, -1.4015960693359375, -1.335235595703125, -1.2688751220703125, -1.2025146484375, -1.1361541748046875, -1.069793701171875, -1.0034332275390625, -0.93707275390625, -0.8707122802734375, -0.804351806640625, -0.7379913330078125, -0.671630859375, -0.6052703857421875, -0.538909912109375, -0.4725494384765625, -0.40618896484375, -0.3398284912109375, -0.273468017578125, -0.2071075439453125, -0.1407470703125, -0.0743865966796875, -0.008026123046875, 0.0583343505859375, 0.12469482421875, 0.1910552978515625, 0.257415771484375, 0.3237762451171875, 0.39013671875, 0.4564971923828125, 0.522857666015625, 0.5892181396484375, 0.65557861328125, 0.7219390869140625, 0.788299560546875, 0.8546600341796875, 0.9210205078125, 0.9873809814453125, 1.053741455078125, 1.1201019287109375, 1.18646240234375, 1.2528228759765625, 1.319183349609375, 1.3855438232421875, 1.451904296875, 1.5182647705078125, 1.584625244140625, 1.6509857177734375, 1.71734619140625, 1.7837066650390625, 1.850067138671875, 1.9164276123046875, 1.9827880859375, 2.0491485595703125, 2.115509033203125, 2.1818695068359375, 2.24822998046875, 2.3145904541015625, 2.380950927734375, 2.4473114013671875, 2.513671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 2.0, 4.0, 8.0, 9.0, 13.0, 7.0, 16.0, 29.0, 33.0, 45.0, 49.0, 61.0, 73.0, 85.0, 83.0, 70.0, 67.0, 61.0, 71.0, 53.0, 44.0, 25.0, 23.0, 15.0, 22.0, 9.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.248263359069824, -7.997119426727295, -7.745975971221924, -7.4948320388793945, -7.243688106536865, -6.992544174194336, -6.741400718688965, -6.4902567863464355, -6.239112854003906, -5.987968921661377, -5.736825466156006, -5.485681533813477, -5.234537601470947, -4.983393669128418, -4.732250213623047, -4.481106281280518, -4.2299628257751465, -3.9788191318511963, -3.727675199508667, -3.476531505584717, -3.2253875732421875, -2.9742438793182373, -2.723100185394287, -2.471956253051758, -2.2208125591278076, -1.9696687459945679, -1.7185249328613281, -1.467381238937378, -1.2162374258041382, -0.9650936126708984, -0.7139499187469482, -0.4628061056137085, -0.21166181564331055, 0.03948196768760681, 0.29062575101852417, 0.5417695045471191, 0.7929133176803589, 1.0440571308135986, 1.2952008247375488, 1.5463446378707886, 1.7974884510040283, 2.0486321449279785, 2.299776077270508, 2.550919771194458, 2.802063465118408, 3.0532073974609375, 3.3043510913848877, 3.555494785308838, 3.806638717651367, 4.0577826499938965, 4.308926105499268, 4.560070037841797, 4.811213970184326, 5.0623579025268555, 5.313501358032227, 5.564645290374756, 5.815789222717285, 6.0669331550598145, 6.3180766105651855, 6.569220542907715, 6.820364475250244, 7.071508407592773, 7.3226518630981445, 7.573795795440674, 7.824939250946045]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 15.0, 15.0, 24.0, 12.0, 22.0, 20.0, 25.0, 29.0, 27.0, 28.0, 38.0, 28.0, 41.0, 38.0, 37.0, 47.0, 43.0, 39.0, 46.0, 41.0, 42.0, 25.0, 47.0, 32.0, 35.0, 25.0, 20.0, 22.0, 24.0, 20.0, 6.0, 13.0, 10.0, 7.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.2820608615875244, -3.1809041500091553, -3.079747438430786, -2.978590965270996, -2.877434253692627, -2.776277542114258, -2.6751208305358887, -2.5739641189575195, -2.4728074073791504, -2.3716506958007812, -2.270493984222412, -2.169337272644043, -2.068180799484253, -1.9670240879058838, -1.8658673763275146, -1.7647106647491455, -1.6635541915893555, -1.5623974800109863, -1.4612408876419067, -1.3600841760635376, -1.258927583694458, -1.1577708721160889, -1.0566141605377197, -0.9554575085639954, -0.854300856590271, -0.7531442046165466, -0.6519875526428223, -0.5508308410644531, -0.44967418909072876, -0.3485175371170044, -0.24736082553863525, -0.1462041735649109, -0.04504728317260742, 0.05610938370227814, 0.1572660505771637, 0.25842273235321045, 0.3595793843269348, 0.4607360363006592, 0.5618927478790283, 0.6630493998527527, 0.764206051826477, 0.8653627038002014, 0.9665193557739258, 1.067676067352295, 1.168832778930664, 1.2699893712997437, 1.3711460828781128, 1.4723026752471924, 1.5734593868255615, 1.6746160984039307, 1.7757726907730103, 1.8769294023513794, 1.978085994720459, 2.079242706298828, 2.1803994178771973, 2.2815561294555664, 2.3827128410339355, 2.4838695526123047, 2.585026264190674, 2.686182975769043, 2.787339448928833, 2.888496160507202, 2.9896528720855713, 3.0908095836639404, 3.1919660568237305]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 10.0, 18.0, 26.0, 27.0, 59.0, 60.0, 101.0, 114.0, 196.0, 313.0, 509.0, 817.0, 1165.0, 1964.0, 3270.0, 5236.0, 9006.0, 14918.0, 26220.0, 45632.0, 80808.0, 138262.0, 204980.0, 200141.0, 133296.0, 76715.0, 43756.0, 24497.0, 14343.0, 8424.0, 5240.0, 3171.0, 1925.0, 1179.0, 742.0, 473.0, 329.0, 198.0, 134.0, 99.0, 54.0, 44.0, 22.0, 23.0, 10.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.57177734375, -0.5544281005859375, -0.537078857421875, -0.5197296142578125, -0.50238037109375, -0.4850311279296875, -0.467681884765625, -0.4503326416015625, -0.4329833984375, -0.4156341552734375, -0.398284912109375, -0.3809356689453125, -0.36358642578125, -0.3462371826171875, -0.328887939453125, -0.3115386962890625, -0.294189453125, -0.2768402099609375, -0.259490966796875, -0.2421417236328125, -0.22479248046875, -0.2074432373046875, -0.190093994140625, -0.1727447509765625, -0.1553955078125, -0.1380462646484375, -0.120697021484375, -0.1033477783203125, -0.08599853515625, -0.0686492919921875, -0.051300048828125, -0.0339508056640625, -0.0166015625, 0.0007476806640625, 0.018096923828125, 0.0354461669921875, 0.05279541015625, 0.0701446533203125, 0.087493896484375, 0.1048431396484375, 0.1221923828125, 0.1395416259765625, 0.156890869140625, 0.1742401123046875, 0.19158935546875, 0.2089385986328125, 0.226287841796875, 0.2436370849609375, 0.260986328125, 0.2783355712890625, 0.295684814453125, 0.3130340576171875, 0.33038330078125, 0.3477325439453125, 0.365081787109375, 0.3824310302734375, 0.3997802734375, 0.4171295166015625, 0.434478759765625, 0.4518280029296875, 0.46917724609375, 0.4865264892578125, 0.503875732421875, 0.5212249755859375, 0.53857421875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 0.0, 6.0, 6.0, 6.0, 7.0, 6.0, 11.0, 19.0, 20.0, 21.0, 17.0, 26.0, 30.0, 21.0, 33.0, 32.0, 42.0, 42.0, 36.0, 49.0, 36.0, 54.0, 39.0, 35.0, 55.0, 32.0, 40.0, 40.0, 33.0, 28.0, 35.0, 18.0, 26.0, 25.0, 17.0, 10.0, 7.0, 8.0, 12.0, 5.0, 5.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.927734375, -3.80401611328125, -3.6802978515625, -3.55657958984375, -3.432861328125, -3.30914306640625, -3.1854248046875, -3.06170654296875, -2.93798828125, -2.81427001953125, -2.6905517578125, -2.56683349609375, -2.443115234375, -2.31939697265625, -2.1956787109375, -2.07196044921875, -1.9482421875, -1.82452392578125, -1.7008056640625, -1.57708740234375, -1.453369140625, -1.32965087890625, -1.2059326171875, -1.08221435546875, -0.95849609375, -0.83477783203125, -0.7110595703125, -0.58734130859375, -0.463623046875, -0.33990478515625, -0.2161865234375, -0.09246826171875, 0.03125, 0.15496826171875, 0.2786865234375, 0.40240478515625, 0.526123046875, 0.64984130859375, 0.7735595703125, 0.89727783203125, 1.02099609375, 1.14471435546875, 1.2684326171875, 1.39215087890625, 1.515869140625, 1.63958740234375, 1.7633056640625, 1.88702392578125, 2.0107421875, 2.13446044921875, 2.2581787109375, 2.38189697265625, 2.505615234375, 2.62933349609375, 2.7530517578125, 2.87677001953125, 3.00048828125, 3.12420654296875, 3.2479248046875, 3.37164306640625, 3.495361328125, 3.61907958984375, 3.7427978515625, 3.86651611328125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 14.0, 17.0, 18.0, 24.0, 47.0, 70.0, 85.0, 136.0, 185.0, 365.0, 466.0, 825.0, 1350.0, 2400.0, 4730.0, 9987.0, 24910.0, 261490.0, 688507.0, 29650.0, 11258.0, 5381.0, 2715.0, 1478.0, 932.0, 533.0, 375.0, 206.0, 133.0, 80.0, 54.0, 38.0, 34.0, 23.0, 11.0, 11.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.07025146484375, -2.0057373046875, -1.94122314453125, -1.876708984375, -1.81219482421875, -1.7476806640625, -1.68316650390625, -1.61865234375, -1.55413818359375, -1.4896240234375, -1.42510986328125, -1.360595703125, -1.29608154296875, -1.2315673828125, -1.16705322265625, -1.1025390625, -1.03802490234375, -0.9735107421875, -0.90899658203125, -0.844482421875, -0.77996826171875, -0.7154541015625, -0.65093994140625, -0.58642578125, -0.52191162109375, -0.4573974609375, -0.39288330078125, -0.328369140625, -0.26385498046875, -0.1993408203125, -0.13482666015625, -0.0703125, -0.00579833984375, 0.0587158203125, 0.12322998046875, 0.187744140625, 0.25225830078125, 0.3167724609375, 0.38128662109375, 0.44580078125, 0.51031494140625, 0.5748291015625, 0.63934326171875, 0.703857421875, 0.76837158203125, 0.8328857421875, 0.89739990234375, 0.9619140625, 1.02642822265625, 1.0909423828125, 1.15545654296875, 1.219970703125, 1.28448486328125, 1.3489990234375, 1.41351318359375, 1.47802734375, 1.54254150390625, 1.6070556640625, 1.67156982421875, 1.736083984375, 1.80059814453125, 1.8651123046875, 1.92962646484375, 1.994140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 1.0, 5.0, 8.0, 7.0, 14.0, 15.0, 24.0, 17.0, 20.0, 18.0, 31.0, 33.0, 30.0, 29.0, 46.0, 30.0, 43.0, 43.0, 38.0, 38.0, 51.0, 36.0, 44.0, 34.0, 43.0, 36.0, 27.0, 29.0, 31.0, 28.0, 24.0, 21.0, 15.0, 24.0, 23.0, 6.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.29986572265625, -2.2149658203125, -2.13006591796875, -2.045166015625, -1.96026611328125, -1.8753662109375, -1.79046630859375, -1.70556640625, -1.62066650390625, -1.5357666015625, -1.45086669921875, -1.365966796875, -1.28106689453125, -1.1961669921875, -1.11126708984375, -1.0263671875, -0.94146728515625, -0.8565673828125, -0.77166748046875, -0.686767578125, -0.60186767578125, -0.5169677734375, -0.43206787109375, -0.34716796875, -0.26226806640625, -0.1773681640625, -0.09246826171875, -0.007568359375, 0.07733154296875, 0.1622314453125, 0.24713134765625, 0.33203125, 0.41693115234375, 0.5018310546875, 0.58673095703125, 0.671630859375, 0.75653076171875, 0.8414306640625, 0.92633056640625, 1.01123046875, 1.09613037109375, 1.1810302734375, 1.26593017578125, 1.350830078125, 1.43572998046875, 1.5206298828125, 1.60552978515625, 1.6904296875, 1.77532958984375, 1.8602294921875, 1.94512939453125, 2.030029296875, 2.11492919921875, 2.1998291015625, 2.28472900390625, 2.36962890625, 2.45452880859375, 2.5394287109375, 2.62432861328125, 2.709228515625, 2.79412841796875, 2.8790283203125, 2.96392822265625, 3.048828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 7.0, 7.0, 9.0, 12.0, 19.0, 25.0, 36.0, 56.0, 100.0, 165.0, 286.0, 555.0, 1031.0, 2299.0, 5529.0, 21362.0, 955108.0, 47272.0, 8579.0, 3148.0, 1372.0, 663.0, 384.0, 200.0, 121.0, 80.0, 45.0, 32.0, 26.0, 6.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1837615966796875, -1.143890380859375, -1.1040191650390625, -1.06414794921875, -1.0242767333984375, -0.984405517578125, -0.9445343017578125, -0.9046630859375, -0.8647918701171875, -0.824920654296875, -0.7850494384765625, -0.74517822265625, -0.7053070068359375, -0.665435791015625, -0.6255645751953125, -0.585693359375, -0.5458221435546875, -0.505950927734375, -0.4660797119140625, -0.42620849609375, -0.3863372802734375, -0.346466064453125, -0.3065948486328125, -0.2667236328125, -0.2268524169921875, -0.186981201171875, -0.1471099853515625, -0.10723876953125, -0.0673675537109375, -0.027496337890625, 0.0123748779296875, 0.05224609375, 0.0921173095703125, 0.131988525390625, 0.1718597412109375, 0.21173095703125, 0.2516021728515625, 0.291473388671875, 0.3313446044921875, 0.3712158203125, 0.4110870361328125, 0.450958251953125, 0.4908294677734375, 0.53070068359375, 0.5705718994140625, 0.610443115234375, 0.6503143310546875, 0.690185546875, 0.7300567626953125, 0.769927978515625, 0.8097991943359375, 0.84967041015625, 0.8895416259765625, 0.929412841796875, 0.9692840576171875, 1.0091552734375, 1.0490264892578125, 1.088897705078125, 1.1287689208984375, 1.16864013671875, 1.2085113525390625, 1.248382568359375, 1.2882537841796875, 1.328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 8.0, 5.0, 15.0, 7.0, 27.0, 25.0, 37.0, 39.0, 48.0, 87.0, 105.0, 80.0, 102.0, 83.0, 84.0, 53.0, 42.0, 28.0, 24.0, 12.0, 13.0, 3.0, 6.0, 7.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.310773849487305e-05, -5.1544979214668274e-05, -4.99822199344635e-05, -4.841946065425873e-05, -4.6856701374053955e-05, -4.529394209384918e-05, -4.373118281364441e-05, -4.2168423533439636e-05, -4.060566425323486e-05, -3.904290497303009e-05, -3.748014569282532e-05, -3.5917386412620544e-05, -3.435462713241577e-05, -3.2791867852211e-05, -3.1229108572006226e-05, -2.9666349291801453e-05, -2.810359001159668e-05, -2.6540830731391907e-05, -2.4978071451187134e-05, -2.341531217098236e-05, -2.1852552890777588e-05, -2.0289793610572815e-05, -1.8727034330368042e-05, -1.716427505016327e-05, -1.5601515769958496e-05, -1.4038756489753723e-05, -1.247599720954895e-05, -1.0913237929344177e-05, -9.350478649139404e-06, -7.787719368934631e-06, -6.224960088729858e-06, -4.6622008085250854e-06, -3.0994415283203125e-06, -1.5366822481155396e-06, 2.60770320892334e-08, 1.5888363122940063e-06, 3.1515955924987793e-06, 4.714354872703552e-06, 6.277114152908325e-06, 7.839873433113098e-06, 9.402632713317871e-06, 1.0965391993522644e-05, 1.2528151273727417e-05, 1.409091055393219e-05, 1.5653669834136963e-05, 1.7216429114341736e-05, 1.877918839454651e-05, 2.0341947674751282e-05, 2.1904706954956055e-05, 2.3467466235160828e-05, 2.50302255153656e-05, 2.6592984795570374e-05, 2.8155744075775146e-05, 2.971850335597992e-05, 3.128126263618469e-05, 3.2844021916389465e-05, 3.440678119659424e-05, 3.596954047679901e-05, 3.7532299757003784e-05, 3.909505903720856e-05, 4.065781831741333e-05, 4.22205775976181e-05, 4.3783336877822876e-05, 4.534609615802765e-05, 4.690885543823242e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 5.0, 22.0, 9.0, 16.0, 25.0, 24.0, 69.0, 107.0, 181.0, 322.0, 660.0, 1488.0, 3548.0, 8403.0, 23075.0, 85470.0, 627280.0, 233607.0, 41141.0, 13444.0, 5321.0, 2246.0, 1002.0, 495.0, 242.0, 130.0, 70.0, 46.0, 38.0, 19.0, 11.0, 13.0, 3.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7175750732421875, -0.693450927734375, -0.6693267822265625, -0.64520263671875, -0.6210784912109375, -0.596954345703125, -0.5728302001953125, -0.5487060546875, -0.5245819091796875, -0.500457763671875, -0.4763336181640625, -0.45220947265625, -0.4280853271484375, -0.403961181640625, -0.3798370361328125, -0.355712890625, -0.3315887451171875, -0.307464599609375, -0.2833404541015625, -0.25921630859375, -0.2350921630859375, -0.210968017578125, -0.1868438720703125, -0.1627197265625, -0.1385955810546875, -0.114471435546875, -0.0903472900390625, -0.06622314453125, -0.0420989990234375, -0.017974853515625, 0.0061492919921875, 0.0302734375, 0.0543975830078125, 0.078521728515625, 0.1026458740234375, 0.12677001953125, 0.1508941650390625, 0.175018310546875, 0.1991424560546875, 0.2232666015625, 0.2473907470703125, 0.271514892578125, 0.2956390380859375, 0.31976318359375, 0.3438873291015625, 0.368011474609375, 0.3921356201171875, 0.416259765625, 0.4403839111328125, 0.464508056640625, 0.4886322021484375, 0.51275634765625, 0.5368804931640625, 0.561004638671875, 0.5851287841796875, 0.6092529296875, 0.6333770751953125, 0.657501220703125, 0.6816253662109375, 0.70574951171875, 0.7298736572265625, 0.753997802734375, 0.7781219482421875, 0.80224609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 6.0, 7.0, 7.0, 19.0, 23.0, 34.0, 42.0, 76.0, 105.0, 176.0, 164.0, 107.0, 62.0, 40.0, 17.0, 23.0, 21.0, 12.0, 8.0, 7.0, 11.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07769775390625, -0.07398700714111328, -0.07027626037597656, -0.06656551361083984, -0.06285476684570312, -0.059144020080566406, -0.05543327331542969, -0.05172252655029297, -0.04801177978515625, -0.04430103302001953, -0.04059028625488281, -0.036879539489746094, -0.033168792724609375, -0.029458045959472656, -0.025747299194335938, -0.02203655242919922, -0.0183258056640625, -0.014615058898925781, -0.010904312133789062, -0.007193565368652344, -0.003482818603515625, 0.00022792816162109375, 0.0039386749267578125, 0.007649421691894531, 0.01136016845703125, 0.015070915222167969, 0.018781661987304688, 0.022492408752441406, 0.026203155517578125, 0.029913902282714844, 0.03362464904785156, 0.03733539581298828, 0.041046142578125, 0.04475688934326172, 0.04846763610839844, 0.052178382873535156, 0.055889129638671875, 0.059599876403808594, 0.06331062316894531, 0.06702136993408203, 0.07073211669921875, 0.07444286346435547, 0.07815361022949219, 0.0818643569946289, 0.08557510375976562, 0.08928585052490234, 0.09299659729003906, 0.09670734405517578, 0.1004180908203125, 0.10412883758544922, 0.10783958435058594, 0.11155033111572266, 0.11526107788085938, 0.1189718246459961, 0.12268257141113281, 0.12639331817626953, 0.13010406494140625, 0.13381481170654297, 0.1375255584716797, 0.1412363052368164, 0.14494705200195312, 0.14865779876708984, 0.15236854553222656, 0.15607929229736328, 0.1597900390625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 7.0, 9.0, 10.0, 12.0, 13.0, 16.0, 38.0, 31.0, 50.0, 52.0, 58.0, 86.0, 76.0, 73.0, 78.0, 68.0, 59.0, 69.0, 47.0, 41.0, 21.0, 21.0, 16.0, 17.0, 10.0, 4.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.105216026306152, -7.8560895919799805, -7.60696268081665, -7.3578362464904785, -7.108709812164307, -6.859582901000977, -6.610456466674805, -6.361330032348633, -6.112203598022461, -5.863077163696289, -5.613950252532959, -5.364823818206787, -5.115697383880615, -4.866570472717285, -4.617444038391113, -4.368317604064941, -4.1191911697387695, -3.8700644969940186, -3.6209380626678467, -3.3718113899230957, -3.122684955596924, -2.873558282852173, -2.624431610107422, -2.37530517578125, -2.12617826461792, -1.8770517110824585, -1.627925157546997, -1.378798484802246, -1.1296720504760742, -0.8805453777313232, -0.6314188241958618, -0.3822922706604004, -0.13316583633422852, 0.1159607321023941, 0.3650873005390167, 0.6142138838768005, 0.863340437412262, 1.1124670505523682, 1.3615936040878296, 1.610720157623291, 1.8598467111587524, 2.108973264694214, 2.358099937438965, 2.6072263717651367, 2.8563530445098877, 3.1054797172546387, 3.3546061515808105, 3.6037325859069824, 3.8528592586517334, 4.101985931396484, 4.351112365722656, 4.600238800048828, 4.849365711212158, 5.09849214553833, 5.347618579864502, 5.596745491027832, 5.845871925354004, 6.094998359680176, 6.344125270843506, 6.593251705169678, 6.84237813949585, 7.09150505065918, 7.340631484985352, 7.589757919311523, 7.838884353637695]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 0.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 15.0, 17.0, 22.0, 16.0, 16.0, 26.0, 27.0, 27.0, 32.0, 35.0, 33.0, 34.0, 39.0, 39.0, 44.0, 41.0, 41.0, 47.0, 42.0, 43.0, 28.0, 40.0, 39.0, 37.0, 21.0, 23.0, 20.0, 26.0, 17.0, 15.0, 14.0, 8.0, 6.0, 7.0, 10.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.305217981338501, -3.2046446800231934, -3.1040713787078857, -3.003498077392578, -2.9029247760772705, -2.802351474761963, -2.7017784118652344, -2.6012048721313477, -2.500631809234619, -2.4000585079193115, -2.299485206604004, -2.1989119052886963, -2.0983386039733887, -1.997765302658081, -1.897192120552063, -1.7966188192367554, -1.6960453987121582, -1.5954720973968506, -1.494898796081543, -1.3943254947662354, -1.2937521934509277, -1.1931788921356201, -1.092605710029602, -0.9920324087142944, -0.8914591073989868, -0.7908858060836792, -0.6903125047683716, -0.5897392630577087, -0.4891659617424011, -0.3885926604270935, -0.28801941871643066, -0.18744611740112305, -0.08687257766723633, 0.013700708746910095, 0.11427399516105652, 0.21484726667404175, 0.31542056798934937, 0.415993869304657, 0.5165671110153198, 0.6171404123306274, 0.7177137136459351, 0.8182870149612427, 0.9188603162765503, 1.0194334983825684, 1.120006799697876, 1.2205801010131836, 1.3211534023284912, 1.4217267036437988, 1.5223000049591064, 1.622873306274414, 1.7234466075897217, 1.8240199089050293, 1.924593210220337, 2.0251665115356445, 2.125739574432373, 2.2263131141662598, 2.3268861770629883, 2.427459478378296, 2.5280327796936035, 2.628606081008911, 2.7291793823242188, 2.8297526836395264, 2.930325984954834, 3.0308990478515625, 3.131472587585449]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 3.0, 7.0, 16.0, 11.0, 17.0, 27.0, 37.0, 49.0, 56.0, 92.0, 132.0, 229.0, 274.0, 476.0, 605.0, 938.0, 1464.0, 2226.0, 3529.0, 5716.0, 9156.0, 15202.0, 25115.0, 42293.0, 68367.0, 106208.0, 147140.0, 168990.0, 151587.0, 111618.0, 72786.0, 44754.0, 26745.0, 15905.0, 9821.0, 5957.0, 3861.0, 2372.0, 1532.0, 1068.0, 677.0, 460.0, 314.0, 222.0, 146.0, 114.0, 84.0, 48.0, 35.0, 20.0, 16.0, 9.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.4921875, -4.349853515625, -4.20751953125, -4.065185546875, -3.9228515625, -3.780517578125, -3.63818359375, -3.495849609375, -3.353515625, -3.211181640625, -3.06884765625, -2.926513671875, -2.7841796875, -2.641845703125, -2.49951171875, -2.357177734375, -2.21484375, -2.072509765625, -1.93017578125, -1.787841796875, -1.6455078125, -1.503173828125, -1.36083984375, -1.218505859375, -1.076171875, -0.933837890625, -0.79150390625, -0.649169921875, -0.5068359375, -0.364501953125, -0.22216796875, -0.079833984375, 0.0625, 0.204833984375, 0.34716796875, 0.489501953125, 0.6318359375, 0.774169921875, 0.91650390625, 1.058837890625, 1.201171875, 1.343505859375, 1.48583984375, 1.628173828125, 1.7705078125, 1.912841796875, 2.05517578125, 2.197509765625, 2.33984375, 2.482177734375, 2.62451171875, 2.766845703125, 2.9091796875, 3.051513671875, 3.19384765625, 3.336181640625, 3.478515625, 3.620849609375, 3.76318359375, 3.905517578125, 4.0478515625, 4.190185546875, 4.33251953125, 4.474853515625, 4.6171875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 5.0, 11.0, 14.0, 9.0, 15.0, 19.0, 18.0, 19.0, 20.0, 29.0, 36.0, 24.0, 29.0, 27.0, 32.0, 27.0, 39.0, 31.0, 43.0, 41.0, 45.0, 54.0, 40.0, 50.0, 38.0, 28.0, 29.0, 23.0, 28.0, 27.0, 18.0, 19.0, 8.0, 13.0, 16.0, 11.0, 8.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.501953125, -3.39642333984375, -3.2908935546875, -3.18536376953125, -3.079833984375, -2.97430419921875, -2.8687744140625, -2.76324462890625, -2.65771484375, -2.55218505859375, -2.4466552734375, -2.34112548828125, -2.235595703125, -2.13006591796875, -2.0245361328125, -1.91900634765625, -1.8134765625, -1.70794677734375, -1.6024169921875, -1.49688720703125, -1.391357421875, -1.28582763671875, -1.1802978515625, -1.07476806640625, -0.96923828125, -0.86370849609375, -0.7581787109375, -0.65264892578125, -0.547119140625, -0.44158935546875, -0.3360595703125, -0.23052978515625, -0.125, -0.01947021484375, 0.0860595703125, 0.19158935546875, 0.297119140625, 0.40264892578125, 0.5081787109375, 0.61370849609375, 0.71923828125, 0.82476806640625, 0.9302978515625, 1.03582763671875, 1.141357421875, 1.24688720703125, 1.3524169921875, 1.45794677734375, 1.5634765625, 1.66900634765625, 1.7745361328125, 1.88006591796875, 1.985595703125, 2.09112548828125, 2.1966552734375, 2.30218505859375, 2.40771484375, 2.51324462890625, 2.6187744140625, 2.72430419921875, 2.829833984375, 2.93536376953125, 3.0408935546875, 3.14642333984375, 3.251953125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 14.0, 12.0, 25.0, 32.0, 48.0, 81.0, 151.0, 209.0, 330.0, 594.0, 1126.0, 1953.0, 4001.0, 8456.0, 18459.0, 41836.0, 94849.0, 187946.0, 264318.0, 214442.0, 114779.0, 51821.0, 22810.0, 10072.0, 4797.0, 2410.0, 1243.0, 683.0, 425.0, 230.0, 140.0, 92.0, 50.0, 39.0, 23.0, 17.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.421875, -7.19439697265625, -6.9669189453125, -6.73944091796875, -6.511962890625, -6.28448486328125, -6.0570068359375, -5.82952880859375, -5.60205078125, -5.37457275390625, -5.1470947265625, -4.91961669921875, -4.692138671875, -4.46466064453125, -4.2371826171875, -4.00970458984375, -3.7822265625, -3.55474853515625, -3.3272705078125, -3.09979248046875, -2.872314453125, -2.64483642578125, -2.4173583984375, -2.18988037109375, -1.96240234375, -1.73492431640625, -1.5074462890625, -1.27996826171875, -1.052490234375, -0.82501220703125, -0.5975341796875, -0.37005615234375, -0.142578125, 0.08489990234375, 0.3123779296875, 0.53985595703125, 0.767333984375, 0.99481201171875, 1.2222900390625, 1.44976806640625, 1.67724609375, 1.90472412109375, 2.1322021484375, 2.35968017578125, 2.587158203125, 2.81463623046875, 3.0421142578125, 3.26959228515625, 3.4970703125, 3.72454833984375, 3.9520263671875, 4.17950439453125, 4.406982421875, 4.63446044921875, 4.8619384765625, 5.08941650390625, 5.31689453125, 5.54437255859375, 5.7718505859375, 5.99932861328125, 6.226806640625, 6.45428466796875, 6.6817626953125, 6.90924072265625, 7.13671875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 13.0, 7.0, 16.0, 19.0, 18.0, 14.0, 21.0, 17.0, 21.0, 48.0, 36.0, 40.0, 28.0, 40.0, 38.0, 53.0, 42.0, 48.0, 33.0, 39.0, 41.0, 35.0, 31.0, 32.0, 25.0, 33.0, 28.0, 21.0, 23.0, 26.0, 20.0, 10.0, 12.0, 11.0, 8.0, 5.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.85528564453125, -1.7886962890625, -1.72210693359375, -1.655517578125, -1.58892822265625, -1.5223388671875, -1.45574951171875, -1.38916015625, -1.32257080078125, -1.2559814453125, -1.18939208984375, -1.122802734375, -1.05621337890625, -0.9896240234375, -0.92303466796875, -0.8564453125, -0.78985595703125, -0.7232666015625, -0.65667724609375, -0.590087890625, -0.52349853515625, -0.4569091796875, -0.39031982421875, -0.32373046875, -0.25714111328125, -0.1905517578125, -0.12396240234375, -0.057373046875, 0.00921630859375, 0.0758056640625, 0.14239501953125, 0.208984375, 0.27557373046875, 0.3421630859375, 0.40875244140625, 0.475341796875, 0.54193115234375, 0.6085205078125, 0.67510986328125, 0.74169921875, 0.80828857421875, 0.8748779296875, 0.94146728515625, 1.008056640625, 1.07464599609375, 1.1412353515625, 1.20782470703125, 1.2744140625, 1.34100341796875, 1.4075927734375, 1.47418212890625, 1.540771484375, 1.60736083984375, 1.6739501953125, 1.74053955078125, 1.80712890625, 1.87371826171875, 1.9403076171875, 2.00689697265625, 2.073486328125, 2.14007568359375, 2.2066650390625, 2.27325439453125, 2.33984375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 13.0, 8.0, 11.0, 9.0, 15.0, 26.0, 26.0, 41.0, 69.0, 70.0, 99.0, 141.0, 168.0, 260.0, 332.0, 497.0, 613.0, 985.0, 1625.0, 2539.0, 4540.0, 8783.0, 18724.0, 44677.0, 119183.0, 286370.0, 317309.0, 143425.0, 52867.0, 21650.0, 10164.0, 5049.0, 2819.0, 1731.0, 1139.0, 692.0, 532.0, 348.0, 268.0, 192.0, 126.0, 93.0, 79.0, 62.0, 37.0, 46.0, 25.0, 25.0, 15.0, 13.0, 13.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.734375, -5.56109619140625, -5.3878173828125, -5.21453857421875, -5.041259765625, -4.86798095703125, -4.6947021484375, -4.52142333984375, -4.34814453125, -4.17486572265625, -4.0015869140625, -3.82830810546875, -3.655029296875, -3.48175048828125, -3.3084716796875, -3.13519287109375, -2.9619140625, -2.78863525390625, -2.6153564453125, -2.44207763671875, -2.268798828125, -2.09552001953125, -1.9222412109375, -1.74896240234375, -1.57568359375, -1.40240478515625, -1.2291259765625, -1.05584716796875, -0.882568359375, -0.70928955078125, -0.5360107421875, -0.36273193359375, -0.189453125, -0.01617431640625, 0.1571044921875, 0.33038330078125, 0.503662109375, 0.67694091796875, 0.8502197265625, 1.02349853515625, 1.19677734375, 1.37005615234375, 1.5433349609375, 1.71661376953125, 1.889892578125, 2.06317138671875, 2.2364501953125, 2.40972900390625, 2.5830078125, 2.75628662109375, 2.9295654296875, 3.10284423828125, 3.276123046875, 3.44940185546875, 3.6226806640625, 3.79595947265625, 3.96923828125, 4.14251708984375, 4.3157958984375, 4.48907470703125, 4.662353515625, 4.83563232421875, 5.0089111328125, 5.18218994140625, 5.35546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 20.0, 9.0, 25.0, 31.0, 54.0, 85.0, 110.0, 138.0, 154.0, 110.0, 71.0, 59.0, 37.0, 23.0, 14.0, 14.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006833076477050781, -0.0006625279784202576, -0.000641748309135437, -0.0006209686398506165, -0.0006001889705657959, -0.0005794093012809753, -0.0005586296319961548, -0.0005378499627113342, -0.0005170702934265137, -0.0004962906241416931, -0.00047551095485687256, -0.000454731285572052, -0.00043395161628723145, -0.0004131719470024109, -0.00039239227771759033, -0.0003716126084327698, -0.0003508329391479492, -0.00033005326986312866, -0.0003092736005783081, -0.00028849393129348755, -0.000267714262008667, -0.00024693459272384644, -0.00022615492343902588, -0.00020537525415420532, -0.00018459558486938477, -0.0001638159155845642, -0.00014303624629974365, -0.0001222565770149231, -0.00010147690773010254, -8.069723844528198e-05, -5.9917569160461426e-05, -3.913789987564087e-05, -1.8358230590820312e-05, 2.421438694000244e-06, 2.32011079788208e-05, 4.398077726364136e-05, 6.476044654846191e-05, 8.554011583328247e-05, 0.00010631978511810303, 0.00012709945440292358, 0.00014787912368774414, 0.0001686587929725647, 0.00018943846225738525, 0.0002102181315422058, 0.00023099780082702637, 0.0002517774701118469, 0.0002725571393966675, 0.00029333680868148804, 0.0003141164779663086, 0.00033489614725112915, 0.0003556758165359497, 0.00037645548582077026, 0.0003972351551055908, 0.0004180148243904114, 0.00043879449367523193, 0.0004595741629600525, 0.00048035383224487305, 0.0005011335015296936, 0.0005219131708145142, 0.0005426928400993347, 0.0005634725093841553, 0.0005842521786689758, 0.0006050318479537964, 0.0006258115172386169, 0.0006465911865234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 10.0, 20.0, 27.0, 47.0, 63.0, 110.0, 169.0, 221.0, 344.0, 467.0, 781.0, 1120.0, 1814.0, 2909.0, 4899.0, 9390.0, 20101.0, 46905.0, 115079.0, 240959.0, 291260.0, 175709.0, 74743.0, 30369.0, 13818.0, 6906.0, 3791.0, 2257.0, 1418.0, 972.0, 642.0, 395.0, 249.0, 170.0, 121.0, 86.0, 60.0, 45.0, 27.0, 17.0, 14.0, 16.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.2620849609375, -4.125732421875, -3.9893798828125, -3.85302734375, -3.7166748046875, -3.580322265625, -3.4439697265625, -3.3076171875, -3.1712646484375, -3.034912109375, -2.8985595703125, -2.76220703125, -2.6258544921875, -2.489501953125, -2.3531494140625, -2.216796875, -2.0804443359375, -1.944091796875, -1.8077392578125, -1.67138671875, -1.5350341796875, -1.398681640625, -1.2623291015625, -1.1259765625, -0.9896240234375, -0.853271484375, -0.7169189453125, -0.58056640625, -0.4442138671875, -0.307861328125, -0.1715087890625, -0.03515625, 0.1011962890625, 0.237548828125, 0.3739013671875, 0.51025390625, 0.6466064453125, 0.782958984375, 0.9193115234375, 1.0556640625, 1.1920166015625, 1.328369140625, 1.4647216796875, 1.60107421875, 1.7374267578125, 1.873779296875, 2.0101318359375, 2.146484375, 2.2828369140625, 2.419189453125, 2.5555419921875, 2.69189453125, 2.8282470703125, 2.964599609375, 3.1009521484375, 3.2373046875, 3.3736572265625, 3.510009765625, 3.6463623046875, 3.78271484375, 3.9190673828125, 4.055419921875, 4.1917724609375, 4.328125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 14.0, 15.0, 46.0, 47.0, 85.0, 87.0, 128.0, 143.0, 120.0, 102.0, 79.0, 37.0, 31.0, 16.0, 18.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.84930419921875, -1.7923583984375, -1.73541259765625, -1.678466796875, -1.62152099609375, -1.5645751953125, -1.50762939453125, -1.45068359375, -1.39373779296875, -1.3367919921875, -1.27984619140625, -1.222900390625, -1.16595458984375, -1.1090087890625, -1.05206298828125, -0.9951171875, -0.93817138671875, -0.8812255859375, -0.82427978515625, -0.767333984375, -0.71038818359375, -0.6534423828125, -0.59649658203125, -0.53955078125, -0.48260498046875, -0.4256591796875, -0.36871337890625, -0.311767578125, -0.25482177734375, -0.1978759765625, -0.14093017578125, -0.083984375, -0.02703857421875, 0.0299072265625, 0.08685302734375, 0.143798828125, 0.20074462890625, 0.2576904296875, 0.31463623046875, 0.37158203125, 0.42852783203125, 0.4854736328125, 0.54241943359375, 0.599365234375, 0.65631103515625, 0.7132568359375, 0.77020263671875, 0.8271484375, 0.88409423828125, 0.9410400390625, 0.99798583984375, 1.054931640625, 1.11187744140625, 1.1688232421875, 1.22576904296875, 1.28271484375, 1.33966064453125, 1.3966064453125, 1.45355224609375, 1.510498046875, 1.56744384765625, 1.6243896484375, 1.68133544921875, 1.73828125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 14.0, 19.0, 23.0, 31.0, 38.0, 47.0, 61.0, 73.0, 99.0, 90.0, 75.0, 89.0, 64.0, 51.0, 47.0, 45.0, 34.0, 28.0, 16.0, 9.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25886344909668, -7.984199047088623, -7.709534645080566, -7.43487024307251, -7.160205841064453, -6.8855414390563965, -6.61087703704834, -6.336212158203125, -6.061548233032227, -5.78688383102417, -5.512219429016113, -5.237555027008057, -4.962890625, -4.688226222991943, -4.413561820983887, -4.138896942138672, -3.8642325401306152, -3.5895681381225586, -3.314903736114502, -3.0402393341064453, -2.7655749320983887, -2.490910530090332, -2.2162458896636963, -1.9415814876556396, -1.666917085647583, -1.3922526836395264, -1.1175882816314697, -0.8429237604141235, -0.5682593584060669, -0.29359495639801025, -0.018930435180664062, 0.2557339668273926, 0.5303983688354492, 0.8050627708435059, 1.0797271728515625, 1.3543916940689087, 1.6290560960769653, 1.903720498085022, 2.178385019302368, 2.453049421310425, 2.7277138233184814, 3.002378225326538, 3.2770426273345947, 3.5517072677612305, 3.826371669769287, 4.101036071777344, 4.3757004737854, 4.650364875793457, 4.925029277801514, 5.19969367980957, 5.474358081817627, 5.749022483825684, 6.02368688583374, 6.298351287841797, 6.573016166687012, 6.84768009185791, 7.122344970703125, 7.397009372711182, 7.671673774719238, 7.946338176727295, 8.221002578735352, 8.495667457580566, 8.770331382751465, 9.04499626159668, 9.319660186767578]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 10.0, 11.0, 9.0, 12.0, 10.0, 25.0, 15.0, 11.0, 18.0, 23.0, 21.0, 34.0, 37.0, 41.0, 31.0, 37.0, 34.0, 48.0, 36.0, 39.0, 33.0, 39.0, 40.0, 42.0, 31.0, 31.0, 23.0, 31.0, 27.0, 22.0, 18.0, 28.0, 14.0, 15.0, 18.0, 10.0, 10.0, 8.0, 15.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.2262632846832275, -3.127998113632202, -3.0297329425811768, -2.9314680099487305, -2.833202838897705, -2.7349376678466797, -2.6366724967956543, -2.538407325744629, -2.4401421546936035, -2.341876983642578, -2.2436118125915527, -2.1453466415405273, -2.047081708908081, -1.9488165378570557, -1.8505513668060303, -1.7522861957550049, -1.6540212631225586, -1.5557560920715332, -1.4574910402297974, -1.359225869178772, -1.2609608173370361, -1.1626956462860107, -1.0644304752349854, -0.9661653637886047, -0.8679002523422241, -0.7696351408958435, -0.6713700294494629, -0.5731048583984375, -0.4748397469520569, -0.37657463550567627, -0.2783094644546509, -0.18004435300827026, -0.08177924156188965, 0.01648588478565216, 0.11475101113319397, 0.21301615238189697, 0.3112812638282776, 0.4095463752746582, 0.5078115463256836, 0.6060766577720642, 0.7043417692184448, 0.8026068806648254, 0.900871992111206, 0.9991371631622314, 1.0974023342132568, 1.1956673860549927, 1.293932557106018, 1.392197608947754, 1.4904627799987793, 1.5887279510498047, 1.6869930028915405, 1.785258173942566, 1.8835232257843018, 1.9817883968353271, 2.0800535678863525, 2.178318738937378, 2.276583671569824, 2.3748488426208496, 2.473114013671875, 2.5713791847229004, 2.6696441173553467, 2.767909288406372, 2.8661744594573975, 2.964439630508423, 3.0627048015594482]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 5.0, 13.0, 16.0, 16.0, 25.0, 36.0, 47.0, 59.0, 107.0, 145.0, 247.0, 312.0, 554.0, 794.0, 1213.0, 2057.0, 3362.0, 5814.0, 10099.0, 17516.0, 33247.0, 64025.0, 131685.0, 292347.0, 679873.0, 1176654.0, 954166.0, 441214.0, 191189.0, 88546.0, 44364.0, 23435.0, 13165.0, 7239.0, 4164.0, 2525.0, 1531.0, 910.0, 602.0, 340.0, 237.0, 126.0, 98.0, 53.0, 34.0, 21.0, 15.0, 20.0, 10.0, 2.0, 2.0, 4.0, 2.0, 3.0], "bins": [-7.33203125, -7.12689208984375, -6.9217529296875, -6.71661376953125, -6.511474609375, -6.30633544921875, -6.1011962890625, -5.89605712890625, -5.69091796875, -5.48577880859375, -5.2806396484375, -5.07550048828125, -4.870361328125, -4.66522216796875, -4.4600830078125, -4.25494384765625, -4.0498046875, -3.84466552734375, -3.6395263671875, -3.43438720703125, -3.229248046875, -3.02410888671875, -2.8189697265625, -2.61383056640625, -2.40869140625, -2.20355224609375, -1.9984130859375, -1.79327392578125, -1.588134765625, -1.38299560546875, -1.1778564453125, -0.97271728515625, -0.767578125, -0.56243896484375, -0.3572998046875, -0.15216064453125, 0.052978515625, 0.25811767578125, 0.4632568359375, 0.66839599609375, 0.87353515625, 1.07867431640625, 1.2838134765625, 1.48895263671875, 1.694091796875, 1.89923095703125, 2.1043701171875, 2.30950927734375, 2.5146484375, 2.71978759765625, 2.9249267578125, 3.13006591796875, 3.335205078125, 3.54034423828125, 3.7454833984375, 3.95062255859375, 4.15576171875, 4.36090087890625, 4.5660400390625, 4.77117919921875, 4.976318359375, 5.18145751953125, 5.3865966796875, 5.59173583984375, 5.796875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 9.0, 12.0, 10.0, 6.0, 11.0, 19.0, 17.0, 18.0, 18.0, 28.0, 34.0, 35.0, 28.0, 47.0, 36.0, 44.0, 39.0, 38.0, 46.0, 45.0, 41.0, 40.0, 44.0, 38.0, 38.0, 33.0, 33.0, 23.0, 24.0, 21.0, 13.0, 17.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-3.37890625, -3.284576416015625, -3.19024658203125, -3.095916748046875, -3.0015869140625, -2.907257080078125, -2.81292724609375, -2.718597412109375, -2.624267578125, -2.529937744140625, -2.43560791015625, -2.341278076171875, -2.2469482421875, -2.152618408203125, -2.05828857421875, -1.963958740234375, -1.86962890625, -1.775299072265625, -1.68096923828125, -1.586639404296875, -1.4923095703125, -1.397979736328125, -1.30364990234375, -1.209320068359375, -1.114990234375, -1.020660400390625, -0.92633056640625, -0.832000732421875, -0.7376708984375, -0.643341064453125, -0.54901123046875, -0.454681396484375, -0.3603515625, -0.266021728515625, -0.17169189453125, -0.077362060546875, 0.0169677734375, 0.111297607421875, 0.20562744140625, 0.299957275390625, 0.394287109375, 0.488616943359375, 0.58294677734375, 0.677276611328125, 0.7716064453125, 0.865936279296875, 0.96026611328125, 1.054595947265625, 1.14892578125, 1.243255615234375, 1.33758544921875, 1.431915283203125, 1.5262451171875, 1.620574951171875, 1.71490478515625, 1.809234619140625, 1.903564453125, 1.997894287109375, 2.09222412109375, 2.186553955078125, 2.2808837890625, 2.375213623046875, 2.46954345703125, 2.563873291015625, 2.658203125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 10.0, 16.0, 18.0, 27.0, 53.0, 61.0, 121.0, 165.0, 234.0, 379.0, 574.0, 871.0, 1430.0, 2467.0, 4080.0, 7048.0, 12610.0, 23141.0, 44878.0, 89764.0, 187086.0, 400990.0, 825705.0, 1146397.0, 751888.0, 356572.0, 167262.0, 80713.0, 40437.0, 21336.0, 11641.0, 6467.0, 3779.0, 2219.0, 1423.0, 897.0, 532.0, 341.0, 210.0, 150.0, 99.0, 57.0, 44.0, 20.0, 17.0, 16.0, 9.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.87890625, -7.63592529296875, -7.3929443359375, -7.14996337890625, -6.906982421875, -6.66400146484375, -6.4210205078125, -6.17803955078125, -5.93505859375, -5.69207763671875, -5.4490966796875, -5.20611572265625, -4.963134765625, -4.72015380859375, -4.4771728515625, -4.23419189453125, -3.9912109375, -3.74822998046875, -3.5052490234375, -3.26226806640625, -3.019287109375, -2.77630615234375, -2.5333251953125, -2.29034423828125, -2.04736328125, -1.80438232421875, -1.5614013671875, -1.31842041015625, -1.075439453125, -0.83245849609375, -0.5894775390625, -0.34649658203125, -0.103515625, 0.13946533203125, 0.3824462890625, 0.62542724609375, 0.868408203125, 1.11138916015625, 1.3543701171875, 1.59735107421875, 1.84033203125, 2.08331298828125, 2.3262939453125, 2.56927490234375, 2.812255859375, 3.05523681640625, 3.2982177734375, 3.54119873046875, 3.7841796875, 4.02716064453125, 4.2701416015625, 4.51312255859375, 4.756103515625, 4.99908447265625, 5.2420654296875, 5.48504638671875, 5.72802734375, 5.97100830078125, 6.2139892578125, 6.45697021484375, 6.699951171875, 6.94293212890625, 7.1859130859375, 7.42889404296875, 7.671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 4.0, 4.0, 13.0, 5.0, 15.0, 22.0, 12.0, 26.0, 42.0, 35.0, 58.0, 69.0, 85.0, 124.0, 136.0, 225.0, 226.0, 238.0, 298.0, 284.0, 281.0, 289.0, 281.0, 253.0, 207.0, 161.0, 147.0, 125.0, 101.0, 88.0, 51.0, 36.0, 33.0, 26.0, 17.0, 13.0, 14.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.375, -2.3098297119140625, -2.244659423828125, -2.1794891357421875, -2.11431884765625, -2.0491485595703125, -1.983978271484375, -1.9188079833984375, -1.8536376953125, -1.7884674072265625, -1.723297119140625, -1.6581268310546875, -1.59295654296875, -1.5277862548828125, -1.462615966796875, -1.3974456787109375, -1.332275390625, -1.2671051025390625, -1.201934814453125, -1.1367645263671875, -1.07159423828125, -1.0064239501953125, -0.941253662109375, -0.8760833740234375, -0.8109130859375, -0.7457427978515625, -0.680572509765625, -0.6154022216796875, -0.55023193359375, -0.4850616455078125, -0.419891357421875, -0.3547210693359375, -0.28955078125, -0.2243804931640625, -0.159210205078125, -0.0940399169921875, -0.02886962890625, 0.0363006591796875, 0.101470947265625, 0.1666412353515625, 0.2318115234375, 0.2969818115234375, 0.362152099609375, 0.4273223876953125, 0.49249267578125, 0.5576629638671875, 0.622833251953125, 0.6880035400390625, 0.753173828125, 0.8183441162109375, 0.883514404296875, 0.9486846923828125, 1.01385498046875, 1.0790252685546875, 1.144195556640625, 1.2093658447265625, 1.2745361328125, 1.3397064208984375, 1.404876708984375, 1.4700469970703125, 1.53521728515625, 1.6003875732421875, 1.665557861328125, 1.7307281494140625, 1.7958984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 15.0, 10.0, 11.0, 21.0, 21.0, 40.0, 43.0, 51.0, 54.0, 72.0, 72.0, 81.0, 73.0, 82.0, 77.0, 61.0, 60.0, 40.0, 40.0, 24.0, 10.0, 9.0, 10.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.115337371826172, -9.808186531066895, -9.501035690307617, -9.19388484954834, -8.886734008789062, -8.579583168029785, -8.272432327270508, -7.965281963348389, -7.658131122589111, -7.350980281829834, -7.043829441070557, -6.736678600311279, -6.42952823638916, -6.122377395629883, -5.8152265548706055, -5.508075714111328, -5.200924873352051, -4.893774032592773, -4.586623191833496, -4.279472351074219, -3.9723217487335205, -3.665170907974243, -3.358020305633545, -3.0508694648742676, -2.7437186241149902, -2.436567783355713, -2.1294169425964355, -1.8222663402557373, -1.51511549949646, -1.2079646587371826, -0.9008139371871948, -0.593663215637207, -0.2865133285522461, 0.020637452602386475, 0.32778823375701904, 0.6349390149116516, 0.9420897960662842, 1.2492406368255615, 1.5563913583755493, 1.863542079925537, 2.1706929206848145, 2.477843761444092, 2.784994602203369, 3.0921452045440674, 3.3992960453033447, 3.706446886062622, 4.01359748840332, 4.320748329162598, 4.627899169921875, 4.935050010681152, 5.24220085144043, 5.549351692199707, 5.856502532958984, 6.163653373718262, 6.470803737640381, 6.777954578399658, 7.0851054191589355, 7.392256259918213, 7.69940710067749, 8.00655746459961, 8.313708305358887, 8.620859146118164, 8.928009986877441, 9.235160827636719, 9.542311668395996]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 3.0, 7.0, 5.0, 4.0, 11.0, 26.0, 19.0, 18.0, 14.0, 13.0, 36.0, 34.0, 36.0, 29.0, 32.0, 34.0, 35.0, 32.0, 42.0, 43.0, 24.0, 36.0, 50.0, 46.0, 35.0, 38.0, 26.0, 30.0, 26.0, 32.0, 26.0, 19.0, 21.0, 19.0, 16.0, 10.0, 9.0, 7.0, 11.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.426629066467285, -3.315779209136963, -3.2049291133880615, -3.09407901763916, -2.983229160308838, -2.8723793029785156, -2.7615292072296143, -2.650679111480713, -2.5398292541503906, -2.4289793968200684, -2.318129301071167, -2.2072792053222656, -2.0964293479919434, -1.9855793714523315, -1.8747293949127197, -1.763879418373108, -1.653029441833496, -1.5421794652938843, -1.4313294887542725, -1.3204795122146606, -1.2096295356750488, -1.098779559135437, -0.9879295825958252, -0.8770796060562134, -0.7662296295166016, -0.6553796529769897, -0.5445296764373779, -0.4336796998977661, -0.3228297233581543, -0.21197974681854248, -0.10112977027893066, 0.009720206260681152, 0.12057018280029297, 0.23142015933990479, 0.3422701358795166, 0.4531201124191284, 0.5639700889587402, 0.674820065498352, 0.7856700420379639, 0.8965200185775757, 1.0073699951171875, 1.1182199716567993, 1.2290699481964111, 1.339919924736023, 1.4507699012756348, 1.5616198778152466, 1.6724698543548584, 1.7833198308944702, 1.894169807434082, 2.0050196647644043, 2.1158697605133057, 2.226719856262207, 2.3375697135925293, 2.4484195709228516, 2.559269666671753, 2.6701197624206543, 2.7809696197509766, 2.891819477081299, 3.0026695728302, 3.1135196685791016, 3.224369525909424, 3.335219383239746, 3.4460694789886475, 3.556919574737549, 3.667769432067871]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 14.0, 16.0, 18.0, 32.0, 41.0, 71.0, 91.0, 136.0, 198.0, 294.0, 443.0, 736.0, 1210.0, 1979.0, 3407.0, 6287.0, 11134.0, 21249.0, 41730.0, 83827.0, 164038.0, 258373.0, 214263.0, 117138.0, 58207.0, 29122.0, 15020.0, 8018.0, 4530.0, 2634.0, 1575.0, 943.0, 603.0, 373.0, 263.0, 167.0, 130.0, 70.0, 45.0, 30.0, 14.0, 20.0, 16.0, 12.0, 11.0, 6.0, 9.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7426071166992188, -0.7176361083984375, -0.6926651000976562, -0.667694091796875, -0.6427230834960938, -0.6177520751953125, -0.5927810668945312, -0.56781005859375, -0.5428390502929688, -0.5178680419921875, -0.49289703369140625, -0.467926025390625, -0.44295501708984375, -0.4179840087890625, -0.39301300048828125, -0.3680419921875, -0.34307098388671875, -0.3180999755859375, -0.29312896728515625, -0.268157958984375, -0.24318695068359375, -0.2182159423828125, -0.19324493408203125, -0.16827392578125, -0.14330291748046875, -0.1183319091796875, -0.09336090087890625, -0.068389892578125, -0.04341888427734375, -0.0184478759765625, 0.00652313232421875, 0.031494140625, 0.05646514892578125, 0.0814361572265625, 0.10640716552734375, 0.131378173828125, 0.15634918212890625, 0.1813201904296875, 0.20629119873046875, 0.23126220703125, 0.25623321533203125, 0.2812042236328125, 0.30617523193359375, 0.331146240234375, 0.35611724853515625, 0.3810882568359375, 0.40605926513671875, 0.4310302734375, 0.45600128173828125, 0.4809722900390625, 0.5059432983398438, 0.530914306640625, 0.5558853149414062, 0.5808563232421875, 0.6058273315429688, 0.63079833984375, 0.6557693481445312, 0.6807403564453125, 0.7057113647460938, 0.730682373046875, 0.7556533813476562, 0.7806243896484375, 0.8055953979492188, 0.83056640625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 8.0, 5.0, 7.0, 5.0, 9.0, 8.0, 5.0, 15.0, 19.0, 21.0, 23.0, 23.0, 28.0, 29.0, 31.0, 41.0, 35.0, 31.0, 38.0, 42.0, 36.0, 48.0, 41.0, 49.0, 38.0, 47.0, 33.0, 31.0, 37.0, 35.0, 34.0, 26.0, 25.0, 14.0, 19.0, 14.0, 13.0, 7.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.14031982421875, -3.9993896484375, -3.85845947265625, -3.717529296875, -3.57659912109375, -3.4356689453125, -3.29473876953125, -3.15380859375, -3.01287841796875, -2.8719482421875, -2.73101806640625, -2.590087890625, -2.44915771484375, -2.3082275390625, -2.16729736328125, -2.0263671875, -1.88543701171875, -1.7445068359375, -1.60357666015625, -1.462646484375, -1.32171630859375, -1.1807861328125, -1.03985595703125, -0.89892578125, -0.75799560546875, -0.6170654296875, -0.47613525390625, -0.335205078125, -0.19427490234375, -0.0533447265625, 0.08758544921875, 0.228515625, 0.36944580078125, 0.5103759765625, 0.65130615234375, 0.792236328125, 0.93316650390625, 1.0740966796875, 1.21502685546875, 1.35595703125, 1.49688720703125, 1.6378173828125, 1.77874755859375, 1.919677734375, 2.06060791015625, 2.2015380859375, 2.34246826171875, 2.4833984375, 2.62432861328125, 2.7652587890625, 2.90618896484375, 3.047119140625, 3.18804931640625, 3.3289794921875, 3.46990966796875, 3.61083984375, 3.75177001953125, 3.8927001953125, 4.03363037109375, 4.174560546875, 4.31549072265625, 4.4564208984375, 4.59735107421875, 4.73828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 9.0, 13.0, 16.0, 25.0, 43.0, 44.0, 69.0, 112.0, 129.0, 238.0, 449.0, 676.0, 1269.0, 2475.0, 5431.0, 13705.0, 52133.0, 897394.0, 50158.0, 13562.0, 5152.0, 2446.0, 1218.0, 669.0, 402.0, 214.0, 156.0, 94.0, 58.0, 48.0, 38.0, 19.0, 17.0, 17.0, 15.0, 6.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.791015625, -2.705108642578125, -2.61920166015625, -2.533294677734375, -2.4473876953125, -2.361480712890625, -2.27557373046875, -2.189666748046875, -2.103759765625, -2.017852783203125, -1.93194580078125, -1.846038818359375, -1.7601318359375, -1.674224853515625, -1.58831787109375, -1.502410888671875, -1.41650390625, -1.330596923828125, -1.24468994140625, -1.158782958984375, -1.0728759765625, -0.986968994140625, -0.90106201171875, -0.815155029296875, -0.729248046875, -0.643341064453125, -0.55743408203125, -0.471527099609375, -0.3856201171875, -0.299713134765625, -0.21380615234375, -0.127899169921875, -0.0419921875, 0.043914794921875, 0.12982177734375, 0.215728759765625, 0.3016357421875, 0.387542724609375, 0.47344970703125, 0.559356689453125, 0.645263671875, 0.731170654296875, 0.81707763671875, 0.902984619140625, 0.9888916015625, 1.074798583984375, 1.16070556640625, 1.246612548828125, 1.33251953125, 1.418426513671875, 1.50433349609375, 1.590240478515625, 1.6761474609375, 1.762054443359375, 1.84796142578125, 1.933868408203125, 2.019775390625, 2.105682373046875, 2.19158935546875, 2.277496337890625, 2.3634033203125, 2.449310302734375, 2.53521728515625, 2.621124267578125, 2.70703125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 13.0, 11.0, 25.0, 22.0, 25.0, 32.0, 28.0, 44.0, 45.0, 53.0, 53.0, 55.0, 46.0, 69.0, 59.0, 62.0, 42.0, 49.0, 41.0, 35.0, 42.0, 31.0, 28.0, 16.0, 21.0, 10.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.638580322265625, -3.51348876953125, -3.388397216796875, -3.2633056640625, -3.138214111328125, -3.01312255859375, -2.888031005859375, -2.762939453125, -2.637847900390625, -2.51275634765625, -2.387664794921875, -2.2625732421875, -2.137481689453125, -2.01239013671875, -1.887298583984375, -1.76220703125, -1.637115478515625, -1.51202392578125, -1.386932373046875, -1.2618408203125, -1.136749267578125, -1.01165771484375, -0.886566162109375, -0.761474609375, -0.636383056640625, -0.51129150390625, -0.386199951171875, -0.2611083984375, -0.136016845703125, -0.01092529296875, 0.114166259765625, 0.2392578125, 0.364349365234375, 0.48944091796875, 0.614532470703125, 0.7396240234375, 0.864715576171875, 0.98980712890625, 1.114898681640625, 1.239990234375, 1.365081787109375, 1.49017333984375, 1.615264892578125, 1.7403564453125, 1.865447998046875, 1.99053955078125, 2.115631103515625, 2.24072265625, 2.365814208984375, 2.49090576171875, 2.615997314453125, 2.7410888671875, 2.866180419921875, 2.99127197265625, 3.116363525390625, 3.241455078125, 3.366546630859375, 3.49163818359375, 3.616729736328125, 3.7418212890625, 3.866912841796875, 3.99200439453125, 4.117095947265625, 4.2421875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 15.0, 15.0, 13.0, 23.0, 32.0, 50.0, 56.0, 108.0, 159.0, 247.0, 408.0, 744.0, 2176.0, 19853.0, 1011205.0, 10197.0, 1571.0, 644.0, 388.0, 182.0, 146.0, 80.0, 70.0, 37.0, 34.0, 22.0, 23.0, 13.0, 6.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.095703125, -3.00823974609375, -2.9207763671875, -2.83331298828125, -2.745849609375, -2.65838623046875, -2.5709228515625, -2.48345947265625, -2.39599609375, -2.30853271484375, -2.2210693359375, -2.13360595703125, -2.046142578125, -1.95867919921875, -1.8712158203125, -1.78375244140625, -1.6962890625, -1.60882568359375, -1.5213623046875, -1.43389892578125, -1.346435546875, -1.25897216796875, -1.1715087890625, -1.08404541015625, -0.99658203125, -0.90911865234375, -0.8216552734375, -0.73419189453125, -0.646728515625, -0.55926513671875, -0.4718017578125, -0.38433837890625, -0.296875, -0.20941162109375, -0.1219482421875, -0.03448486328125, 0.052978515625, 0.14044189453125, 0.2279052734375, 0.31536865234375, 0.40283203125, 0.49029541015625, 0.5777587890625, 0.66522216796875, 0.752685546875, 0.84014892578125, 0.9276123046875, 1.01507568359375, 1.1025390625, 1.19000244140625, 1.2774658203125, 1.36492919921875, 1.452392578125, 1.53985595703125, 1.6273193359375, 1.71478271484375, 1.80224609375, 1.88970947265625, 1.9771728515625, 2.06463623046875, 2.152099609375, 2.23956298828125, 2.3270263671875, 2.41448974609375, 2.501953125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 17.0, 39.0, 76.0, 125.0, 176.0, 175.0, 138.0, 115.0, 67.0, 19.0, 14.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.392333984375e-05, -8.132774382829666e-05, -7.873214781284332e-05, -7.613655179738998e-05, -7.354095578193665e-05, -7.094535976648331e-05, -6.834976375102997e-05, -6.575416773557663e-05, -6.315857172012329e-05, -6.056297570466995e-05, -5.7967379689216614e-05, -5.5371783673763275e-05, -5.2776187658309937e-05, -5.01805916428566e-05, -4.758499562740326e-05, -4.498939961194992e-05, -4.239380359649658e-05, -3.9798207581043243e-05, -3.7202611565589905e-05, -3.4607015550136566e-05, -3.201141953468323e-05, -2.941582351922989e-05, -2.682022750377655e-05, -2.422463148832321e-05, -2.1629035472869873e-05, -1.9033439457416534e-05, -1.6437843441963196e-05, -1.3842247426509857e-05, -1.1246651411056519e-05, -8.65105539560318e-06, -6.055459380149841e-06, -3.4598633646965027e-06, -8.642673492431641e-07, 1.7313286662101746e-06, 4.326924681663513e-06, 6.922520697116852e-06, 9.51811671257019e-06, 1.2113712728023529e-05, 1.4709308743476868e-05, 1.7304904758930206e-05, 1.9900500774383545e-05, 2.2496096789836884e-05, 2.5091692805290222e-05, 2.768728882074356e-05, 3.02828848361969e-05, 3.287848085165024e-05, 3.547407686710358e-05, 3.8069672882556915e-05, 4.0665268898010254e-05, 4.326086491346359e-05, 4.585646092891693e-05, 4.845205694437027e-05, 5.104765295982361e-05, 5.364324897527695e-05, 5.6238844990730286e-05, 5.8834441006183624e-05, 6.143003702163696e-05, 6.40256330370903e-05, 6.662122905254364e-05, 6.921682506799698e-05, 7.181242108345032e-05, 7.440801709890366e-05, 7.7003613114357e-05, 7.959920912981033e-05, 8.219480514526367e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 14.0, 20.0, 26.0, 38.0, 68.0, 73.0, 109.0, 187.0, 264.0, 363.0, 581.0, 943.0, 1483.0, 2454.0, 3903.0, 7155.0, 30454.0, 570994.0, 390410.0, 22574.0, 6585.0, 3690.0, 2240.0, 1390.0, 858.0, 558.0, 361.0, 243.0, 151.0, 92.0, 74.0, 70.0, 26.0, 26.0, 20.0, 15.0, 11.0, 2.0, 7.0, 2.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.8053665161132812, -0.7743072509765625, -0.7432479858398438, -0.712188720703125, -0.6811294555664062, -0.6500701904296875, -0.6190109252929688, -0.58795166015625, -0.5568923950195312, -0.5258331298828125, -0.49477386474609375, -0.463714599609375, -0.43265533447265625, -0.4015960693359375, -0.37053680419921875, -0.3394775390625, -0.30841827392578125, -0.2773590087890625, -0.24629974365234375, -0.215240478515625, -0.18418121337890625, -0.1531219482421875, -0.12206268310546875, -0.09100341796875, -0.05994415283203125, -0.0288848876953125, 0.00217437744140625, 0.033233642578125, 0.06429290771484375, 0.0953521728515625, 0.12641143798828125, 0.157470703125, 0.18852996826171875, 0.2195892333984375, 0.25064849853515625, 0.281707763671875, 0.31276702880859375, 0.3438262939453125, 0.37488555908203125, 0.40594482421875, 0.43700408935546875, 0.4680633544921875, 0.49912261962890625, 0.530181884765625, 0.5612411499023438, 0.5923004150390625, 0.6233596801757812, 0.6544189453125, 0.6854782104492188, 0.7165374755859375, 0.7475967407226562, 0.778656005859375, 0.8097152709960938, 0.8407745361328125, 0.8718338012695312, 0.90289306640625, 0.9339523315429688, 0.9650115966796875, 0.9960708618164062, 1.027130126953125, 1.0581893920898438, 1.0892486572265625, 1.1203079223632812, 1.1513671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 28.0, 46.0, 59.0, 137.0, 220.0, 205.0, 126.0, 56.0, 31.0, 20.0, 10.0, 7.0, 5.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1239013671875, -0.11959648132324219, -0.11529159545898438, -0.11098670959472656, -0.10668182373046875, -0.10237693786621094, -0.09807205200195312, -0.09376716613769531, -0.0894622802734375, -0.08515739440917969, -0.08085250854492188, -0.07654762268066406, -0.07224273681640625, -0.06793785095214844, -0.06363296508789062, -0.05932807922363281, -0.055023193359375, -0.05071830749511719, -0.046413421630859375, -0.04210853576660156, -0.03780364990234375, -0.03349876403808594, -0.029193878173828125, -0.024888992309570312, -0.0205841064453125, -0.016279220581054688, -0.011974334716796875, -0.0076694488525390625, -0.00336456298828125, 0.0009403228759765625, 0.005245208740234375, 0.009550094604492188, 0.01385498046875, 0.018159866333007812, 0.022464752197265625, 0.026769638061523438, 0.03107452392578125, 0.03537940979003906, 0.039684295654296875, 0.04398918151855469, 0.0482940673828125, 0.05259895324707031, 0.056903839111328125, 0.06120872497558594, 0.06551361083984375, 0.06981849670410156, 0.07412338256835938, 0.07842826843261719, 0.082733154296875, 0.08703804016113281, 0.09134292602539062, 0.09564781188964844, 0.09995269775390625, 0.10425758361816406, 0.10856246948242188, 0.11286735534667969, 0.1171722412109375, 0.12147712707519531, 0.12578201293945312, 0.13008689880371094, 0.13439178466796875, 0.13869667053222656, 0.14300155639648438, 0.1473064422607422, 0.151611328125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 10.0, 12.0, 12.0, 17.0, 22.0, 23.0, 56.0, 42.0, 59.0, 54.0, 77.0, 82.0, 70.0, 92.0, 66.0, 56.0, 67.0, 49.0, 41.0, 27.0, 19.0, 8.0, 11.0, 6.0, 11.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75455093383789, -9.4525728225708, -9.150594711303711, -8.848617553710938, -8.546639442443848, -8.244661331176758, -7.942683219909668, -7.640705108642578, -7.3387274742126465, -7.036749362945557, -6.734771728515625, -6.432793617248535, -6.130815505981445, -5.828837871551514, -5.526859760284424, -5.224882125854492, -4.922904014587402, -4.6209259033203125, -4.318948268890381, -4.016970157623291, -3.7149922847747803, -3.4130144119262695, -3.1110363006591797, -2.809058427810669, -2.507080554962158, -2.2051026821136475, -1.9031246900558472, -1.6011466979980469, -1.2991688251495361, -0.9971909523010254, -0.6952129602432251, -0.3932349681854248, -0.09125709533691406, 0.21072083711624146, 0.512698769569397, 0.8146767020225525, 1.116654634475708, 1.4186325073242188, 1.720610499382019, 2.0225884914398193, 2.32456636428833, 2.626544237136841, 2.9285221099853516, 3.2305002212524414, 3.532478094100952, 3.834455966949463, 4.136434078216553, 4.438411712646484, 4.740389823913574, 5.042367935180664, 5.344345569610596, 5.6463236808776855, 5.948301315307617, 6.250279426574707, 6.552257537841797, 6.854235649108887, 7.156213283538818, 7.458191394805908, 7.76016902923584, 8.06214714050293, 8.36412525177002, 8.66610336303711, 8.968080520629883, 9.270058631896973, 9.572036743164062]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 8.0, 5.0, 5.0, 6.0, 8.0, 19.0, 23.0, 18.0, 16.0, 18.0, 21.0, 36.0, 38.0, 25.0, 39.0, 31.0, 31.0, 40.0, 34.0, 43.0, 30.0, 34.0, 39.0, 52.0, 40.0, 32.0, 37.0, 24.0, 28.0, 29.0, 28.0, 25.0, 20.0, 17.0, 14.0, 17.0, 8.0, 7.0, 11.0, 7.0, 8.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.446017265319824, -3.3359527587890625, -3.225888252258301, -3.115823745727539, -3.0057590007781982, -2.8956944942474365, -2.785629987716675, -2.675565481185913, -2.5655007362365723, -2.4554362297058105, -2.345371723175049, -2.235307216644287, -2.1252424716949463, -2.0151779651641846, -1.9051134586334229, -1.7950489521026611, -1.6849844455718994, -1.5749199390411377, -1.4648553133010864, -1.3547908067703247, -1.2447261810302734, -1.1346616744995117, -1.02459716796875, -0.9145326018333435, -0.804468035697937, -0.6944034695625305, -0.584338903427124, -0.4742743968963623, -0.3642098307609558, -0.2541452646255493, -0.1440807580947876, -0.034016191959381104, 0.07604837417602539, 0.1861129254102707, 0.296177476644516, 0.4062420129776001, 0.5163065791130066, 0.6263711452484131, 0.7364356517791748, 0.8465002179145813, 0.9565647840499878, 1.0666292905807495, 1.1766939163208008, 1.2867584228515625, 1.3968229293823242, 1.5068875551223755, 1.6169520616531372, 1.7270166873931885, 1.8370811939239502, 1.947145700454712, 2.0572102069854736, 2.1672749519348145, 2.277339458465576, 2.387403964996338, 2.4974684715270996, 2.6075329780578613, 2.717597484588623, 2.8276619911193848, 2.9377264976501465, 3.047791004180908, 3.157855749130249, 3.2679202556610107, 3.3779847621917725, 3.488049268722534, 3.598114013671875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 22.0, 32.0, 37.0, 54.0, 60.0, 119.0, 187.0, 249.0, 400.0, 555.0, 818.0, 1322.0, 1912.0, 2958.0, 4451.0, 6910.0, 10695.0, 16877.0, 25965.0, 40191.0, 61249.0, 88925.0, 120059.0, 142063.0, 141763.0, 119038.0, 88131.0, 60305.0, 39904.0, 26167.0, 16648.0, 10709.0, 6814.0, 4439.0, 2849.0, 1887.0, 1222.0, 897.0, 523.0, 388.0, 245.0, 167.0, 125.0, 84.0, 39.0, 32.0, 30.0, 16.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0], "bins": [-4.40625, -4.276611328125, -4.14697265625, -4.017333984375, -3.8876953125, -3.758056640625, -3.62841796875, -3.498779296875, -3.369140625, -3.239501953125, -3.10986328125, -2.980224609375, -2.8505859375, -2.720947265625, -2.59130859375, -2.461669921875, -2.33203125, -2.202392578125, -2.07275390625, -1.943115234375, -1.8134765625, -1.683837890625, -1.55419921875, -1.424560546875, -1.294921875, -1.165283203125, -1.03564453125, -0.906005859375, -0.7763671875, -0.646728515625, -0.51708984375, -0.387451171875, -0.2578125, -0.128173828125, 0.00146484375, 0.131103515625, 0.2607421875, 0.390380859375, 0.52001953125, 0.649658203125, 0.779296875, 0.908935546875, 1.03857421875, 1.168212890625, 1.2978515625, 1.427490234375, 1.55712890625, 1.686767578125, 1.81640625, 1.946044921875, 2.07568359375, 2.205322265625, 2.3349609375, 2.464599609375, 2.59423828125, 2.723876953125, 2.853515625, 2.983154296875, 3.11279296875, 3.242431640625, 3.3720703125, 3.501708984375, 3.63134765625, 3.760986328125, 3.890625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 13.0, 1.0, 6.0, 11.0, 5.0, 12.0, 12.0, 14.0, 21.0, 22.0, 24.0, 24.0, 26.0, 34.0, 36.0, 32.0, 36.0, 35.0, 43.0, 62.0, 38.0, 39.0, 37.0, 48.0, 52.0, 33.0, 49.0, 38.0, 26.0, 23.0, 25.0, 21.0, 19.0, 15.0, 13.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.6484375, -4.510986328125, -4.37353515625, -4.236083984375, -4.0986328125, -3.961181640625, -3.82373046875, -3.686279296875, -3.548828125, -3.411376953125, -3.27392578125, -3.136474609375, -2.9990234375, -2.861572265625, -2.72412109375, -2.586669921875, -2.44921875, -2.311767578125, -2.17431640625, -2.036865234375, -1.8994140625, -1.761962890625, -1.62451171875, -1.487060546875, -1.349609375, -1.212158203125, -1.07470703125, -0.937255859375, -0.7998046875, -0.662353515625, -0.52490234375, -0.387451171875, -0.25, -0.112548828125, 0.02490234375, 0.162353515625, 0.2998046875, 0.437255859375, 0.57470703125, 0.712158203125, 0.849609375, 0.987060546875, 1.12451171875, 1.261962890625, 1.3994140625, 1.536865234375, 1.67431640625, 1.811767578125, 1.94921875, 2.086669921875, 2.22412109375, 2.361572265625, 2.4990234375, 2.636474609375, 2.77392578125, 2.911376953125, 3.048828125, 3.186279296875, 3.32373046875, 3.461181640625, 3.5986328125, 3.736083984375, 3.87353515625, 4.010986328125, 4.1484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 9.0, 13.0, 22.0, 29.0, 45.0, 68.0, 102.0, 173.0, 279.0, 424.0, 616.0, 993.0, 1589.0, 2614.0, 4251.0, 7126.0, 11392.0, 18983.0, 31565.0, 50035.0, 77443.0, 112062.0, 143136.0, 154231.0, 138012.0, 104939.0, 70884.0, 45713.0, 27609.0, 17314.0, 10427.0, 6368.0, 3800.0, 2285.0, 1470.0, 915.0, 563.0, 368.0, 221.0, 156.0, 104.0, 72.0, 37.0, 30.0, 24.0, 14.0, 10.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.83203125, -4.682861328125, -4.53369140625, -4.384521484375, -4.2353515625, -4.086181640625, -3.93701171875, -3.787841796875, -3.638671875, -3.489501953125, -3.34033203125, -3.191162109375, -3.0419921875, -2.892822265625, -2.74365234375, -2.594482421875, -2.4453125, -2.296142578125, -2.14697265625, -1.997802734375, -1.8486328125, -1.699462890625, -1.55029296875, -1.401123046875, -1.251953125, -1.102783203125, -0.95361328125, -0.804443359375, -0.6552734375, -0.506103515625, -0.35693359375, -0.207763671875, -0.05859375, 0.090576171875, 0.23974609375, 0.388916015625, 0.5380859375, 0.687255859375, 0.83642578125, 0.985595703125, 1.134765625, 1.283935546875, 1.43310546875, 1.582275390625, 1.7314453125, 1.880615234375, 2.02978515625, 2.178955078125, 2.328125, 2.477294921875, 2.62646484375, 2.775634765625, 2.9248046875, 3.073974609375, 3.22314453125, 3.372314453125, 3.521484375, 3.670654296875, 3.81982421875, 3.968994140625, 4.1181640625, 4.267333984375, 4.41650390625, 4.565673828125, 4.71484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 17.0, 15.0, 16.0, 19.0, 21.0, 28.0, 26.0, 38.0, 26.0, 40.0, 49.0, 38.0, 32.0, 52.0, 39.0, 49.0, 38.0, 48.0, 43.0, 40.0, 34.0, 41.0, 38.0, 43.0, 31.0, 16.0, 27.0, 13.0, 18.0, 7.0, 10.0, 8.0, 5.0, 11.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.271484375, -3.175506591796875, -3.07952880859375, -2.983551025390625, -2.8875732421875, -2.791595458984375, -2.69561767578125, -2.599639892578125, -2.503662109375, -2.407684326171875, -2.31170654296875, -2.215728759765625, -2.1197509765625, -2.023773193359375, -1.92779541015625, -1.831817626953125, -1.73583984375, -1.639862060546875, -1.54388427734375, -1.447906494140625, -1.3519287109375, -1.255950927734375, -1.15997314453125, -1.063995361328125, -0.968017578125, -0.872039794921875, -0.77606201171875, -0.680084228515625, -0.5841064453125, -0.488128662109375, -0.39215087890625, -0.296173095703125, -0.2001953125, -0.104217529296875, -0.00823974609375, 0.087738037109375, 0.1837158203125, 0.279693603515625, 0.37567138671875, 0.471649169921875, 0.567626953125, 0.663604736328125, 0.75958251953125, 0.855560302734375, 0.9515380859375, 1.047515869140625, 1.14349365234375, 1.239471435546875, 1.33544921875, 1.431427001953125, 1.52740478515625, 1.623382568359375, 1.7193603515625, 1.815338134765625, 1.91131591796875, 2.007293701171875, 2.103271484375, 2.199249267578125, 2.29522705078125, 2.391204833984375, 2.4871826171875, 2.583160400390625, 2.67913818359375, 2.775115966796875, 2.87109375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 13.0, 16.0, 28.0, 27.0, 47.0, 67.0, 98.0, 159.0, 195.0, 354.0, 542.0, 858.0, 1336.0, 2265.0, 3787.0, 6321.0, 10573.0, 17449.0, 29972.0, 50559.0, 85677.0, 134924.0, 180383.0, 179871.0, 134459.0, 84977.0, 50242.0, 29424.0, 17702.0, 10349.0, 6125.0, 3733.0, 2325.0, 1389.0, 832.0, 498.0, 335.0, 214.0, 132.0, 97.0, 58.0, 31.0, 36.0, 21.0, 20.0, 6.0, 9.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.804901123046875, -2.71722412109375, -2.629547119140625, -2.5418701171875, -2.454193115234375, -2.36651611328125, -2.278839111328125, -2.191162109375, -2.103485107421875, -2.01580810546875, -1.928131103515625, -1.8404541015625, -1.752777099609375, -1.66510009765625, -1.577423095703125, -1.48974609375, -1.402069091796875, -1.31439208984375, -1.226715087890625, -1.1390380859375, -1.051361083984375, -0.96368408203125, -0.876007080078125, -0.788330078125, -0.700653076171875, -0.61297607421875, -0.525299072265625, -0.4376220703125, -0.349945068359375, -0.26226806640625, -0.174591064453125, -0.0869140625, 0.000762939453125, 0.08843994140625, 0.176116943359375, 0.2637939453125, 0.351470947265625, 0.43914794921875, 0.526824951171875, 0.614501953125, 0.702178955078125, 0.78985595703125, 0.877532958984375, 0.9652099609375, 1.052886962890625, 1.14056396484375, 1.228240966796875, 1.31591796875, 1.403594970703125, 1.49127197265625, 1.578948974609375, 1.6666259765625, 1.754302978515625, 1.84197998046875, 1.929656982421875, 2.017333984375, 2.105010986328125, 2.19268798828125, 2.280364990234375, 2.3680419921875, 2.455718994140625, 2.54339599609375, 2.631072998046875, 2.71875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 9.0, 4.0, 20.0, 23.0, 31.0, 45.0, 41.0, 73.0, 78.0, 123.0, 109.0, 101.0, 87.0, 73.0, 53.0, 41.0, 28.0, 15.0, 11.0, 14.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0007257461547851562, -0.00070919468998909, -0.0006926432251930237, -0.0006760917603969574, -0.0006595402956008911, -0.0006429888308048248, -0.0006264373660087585, -0.0006098859012126923, -0.000593334436416626, -0.0005767829716205597, -0.0005602315068244934, -0.0005436800420284271, -0.0005271285772323608, -0.0005105771124362946, -0.0004940256476402283, -0.000477474182844162, -0.0004609227180480957, -0.0004443712532520294, -0.00042781978845596313, -0.00041126832365989685, -0.00039471685886383057, -0.0003781653940677643, -0.000361613929271698, -0.0003450624644756317, -0.00032851099967956543, -0.00031195953488349915, -0.00029540807008743286, -0.0002788566052913666, -0.0002623051404953003, -0.000245753675699234, -0.00022920221090316772, -0.00021265074610710144, -0.00019609928131103516, -0.00017954781651496887, -0.0001629963517189026, -0.0001464448869228363, -0.00012989342212677002, -0.00011334195733070374, -9.679049253463745e-05, -8.023902773857117e-05, -6.368756294250488e-05, -4.71360981464386e-05, -3.0584633350372314e-05, -1.403316855430603e-05, 2.518296241760254e-06, 1.9069761037826538e-05, 3.562122583389282e-05, 5.2172690629959106e-05, 6.872415542602539e-05, 8.527562022209167e-05, 0.00010182708501815796, 0.00011837854981422424, 0.00013493001461029053, 0.0001514814794063568, 0.0001680329442024231, 0.00018458440899848938, 0.00020113587379455566, 0.00021768733859062195, 0.00023423880338668823, 0.0002507902681827545, 0.0002673417329788208, 0.0002838931977748871, 0.00030044466257095337, 0.00031699612736701965, 0.00033354759216308594]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 9.0, 13.0, 15.0, 24.0, 28.0, 37.0, 58.0, 83.0, 115.0, 187.0, 241.0, 364.0, 518.0, 745.0, 1063.0, 1677.0, 2717.0, 4129.0, 6904.0, 11707.0, 19952.0, 34439.0, 59247.0, 97491.0, 147145.0, 182001.0, 168438.0, 121741.0, 76860.0, 45198.0, 26272.0, 15101.0, 8984.0, 5507.0, 3204.0, 2084.0, 1360.0, 885.0, 630.0, 426.0, 267.0, 207.0, 147.0, 111.0, 60.0, 47.0, 40.0, 29.0, 18.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.607421875, -2.519775390625, -2.43212890625, -2.344482421875, -2.2568359375, -2.169189453125, -2.08154296875, -1.993896484375, -1.90625, -1.818603515625, -1.73095703125, -1.643310546875, -1.5556640625, -1.468017578125, -1.38037109375, -1.292724609375, -1.205078125, -1.117431640625, -1.02978515625, -0.942138671875, -0.8544921875, -0.766845703125, -0.67919921875, -0.591552734375, -0.50390625, -0.416259765625, -0.32861328125, -0.240966796875, -0.1533203125, -0.065673828125, 0.02197265625, 0.109619140625, 0.197265625, 0.284912109375, 0.37255859375, 0.460205078125, 0.5478515625, 0.635498046875, 0.72314453125, 0.810791015625, 0.8984375, 0.986083984375, 1.07373046875, 1.161376953125, 1.2490234375, 1.336669921875, 1.42431640625, 1.511962890625, 1.599609375, 1.687255859375, 1.77490234375, 1.862548828125, 1.9501953125, 2.037841796875, 2.12548828125, 2.213134765625, 2.30078125, 2.388427734375, 2.47607421875, 2.563720703125, 2.6513671875, 2.739013671875, 2.82666015625, 2.914306640625, 3.001953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 9.0, 13.0, 18.0, 16.0, 16.0, 28.0, 26.0, 37.0, 45.0, 51.0, 36.0, 51.0, 51.0, 52.0, 65.0, 53.0, 43.0, 41.0, 43.0, 30.0, 33.0, 29.0, 23.0, 29.0, 20.0, 22.0, 13.0, 17.0, 6.0, 9.0, 10.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-0.7255859375, -0.7011795043945312, -0.6767730712890625, -0.6523666381835938, -0.627960205078125, -0.6035537719726562, -0.5791473388671875, -0.5547409057617188, -0.53033447265625, -0.5059280395507812, -0.4815216064453125, -0.45711517333984375, -0.432708740234375, -0.40830230712890625, -0.3838958740234375, -0.35948944091796875, -0.3350830078125, -0.31067657470703125, -0.2862701416015625, -0.26186370849609375, -0.237457275390625, -0.21305084228515625, -0.1886444091796875, -0.16423797607421875, -0.13983154296875, -0.11542510986328125, -0.0910186767578125, -0.06661224365234375, -0.042205810546875, -0.01779937744140625, 0.0066070556640625, 0.03101348876953125, 0.055419921875, 0.07982635498046875, 0.1042327880859375, 0.12863922119140625, 0.153045654296875, 0.17745208740234375, 0.2018585205078125, 0.22626495361328125, 0.25067138671875, 0.27507781982421875, 0.2994842529296875, 0.32389068603515625, 0.348297119140625, 0.37270355224609375, 0.3971099853515625, 0.42151641845703125, 0.4459228515625, 0.47032928466796875, 0.4947357177734375, 0.5191421508789062, 0.543548583984375, 0.5679550170898438, 0.5923614501953125, 0.6167678833007812, 0.64117431640625, 0.6655807495117188, 0.6899871826171875, 0.7143936157226562, 0.738800048828125, 0.7632064819335938, 0.7876129150390625, 0.8120193481445312, 0.83642578125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 12.0, 10.0, 27.0, 38.0, 31.0, 37.0, 50.0, 68.0, 76.0, 84.0, 85.0, 75.0, 61.0, 57.0, 55.0, 57.0, 45.0, 26.0, 21.0, 18.0, 18.0, 10.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.24628734588623, -9.950932502746582, -9.655576705932617, -9.360221862792969, -9.064866065979004, -8.769511222839355, -8.47415542602539, -8.178800582885742, -7.8834452629089355, -7.588089942932129, -7.292734622955322, -6.997379302978516, -6.702024459838867, -6.406668663024902, -6.111313819885254, -5.815958499908447, -5.520603179931641, -5.225247859954834, -4.929892539978027, -4.634537220001221, -4.339181900024414, -4.043827056884766, -3.748471736907959, -3.4531164169311523, -3.1577610969543457, -2.862405776977539, -2.5670504570007324, -2.271695375442505, -1.9763400554656982, -1.6809847354888916, -1.3856295347213745, -1.0902743339538574, -0.7949199676513672, -0.4995647072792053, -0.20420944690704346, 0.09114581346511841, 0.3865010738372803, 0.6818563938140869, 0.977211594581604, 1.272566795349121, 1.5679221153259277, 1.8632774353027344, 2.158632755279541, 2.4539878368377686, 2.749343156814575, 3.044698476791382, 3.3400535583496094, 3.635408878326416, 3.9307641983032227, 4.226119518280029, 4.521474838256836, 4.816830158233643, 5.112185478210449, 5.407540321350098, 5.702895641326904, 5.998250961303711, 6.293606281280518, 6.588961601257324, 6.884316921234131, 7.1796722412109375, 7.475027084350586, 7.770382881164551, 8.0657377243042, 8.361093521118164, 8.656448364257812]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 9.0, 9.0, 9.0, 15.0, 20.0, 14.0, 28.0, 15.0, 22.0, 25.0, 37.0, 32.0, 38.0, 44.0, 56.0, 28.0, 40.0, 37.0, 34.0, 38.0, 41.0, 30.0, 40.0, 42.0, 42.0, 29.0, 26.0, 21.0, 28.0, 24.0, 24.0, 10.0, 11.0, 11.0, 7.0, 16.0, 6.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9239768981933594, -3.804469347000122, -3.6849617958068848, -3.5654542446136475, -3.44594669342041, -3.326439380645752, -3.2069315910339355, -3.0874242782592773, -2.96791672706604, -2.8484091758728027, -2.7289016246795654, -2.609394073486328, -2.489886522293091, -2.3703789710998535, -2.2508716583251953, -2.131364107131958, -2.0118565559387207, -1.8923490047454834, -1.772841453552246, -1.6533339023590088, -1.533826470375061, -1.4143189191818237, -1.2948113679885864, -1.1753039360046387, -1.0557961463928223, -0.936288595199585, -0.8167811036109924, -0.6972735524177551, -0.5777660608291626, -0.4582585096359253, -0.338750958442688, -0.21924346685409546, -0.09973597526550293, 0.019771553575992584, 0.1392790824174881, 0.2587866187095642, 0.3782941401004791, 0.49780166149139404, 0.6173092126846313, 0.7368167042732239, 0.8563242554664612, 0.9758318066596985, 1.095339298248291, 1.2148468494415283, 1.3343544006347656, 1.453861951828003, 1.5733695030212402, 1.692876935005188, 1.8123844861984253, 1.9318920373916626, 2.0513994693756104, 2.1709070205688477, 2.290414571762085, 2.4099221229553223, 2.5294296741485596, 2.648937225341797, 2.768444776535034, 2.8879523277282715, 3.007459878921509, 3.126967430114746, 3.2464749813079834, 3.3659825325012207, 3.485489845275879, 3.604997396469116, 3.7245049476623535]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 7.0, 3.0, 8.0, 9.0, 14.0, 20.0, 31.0, 37.0, 61.0, 77.0, 107.0, 150.0, 223.0, 291.0, 451.0, 617.0, 940.0, 1371.0, 1972.0, 3029.0, 4739.0, 7350.0, 11924.0, 19351.0, 32823.0, 57676.0, 106448.0, 207877.0, 424379.0, 787195.0, 982918.0, 721523.0, 389529.0, 196682.0, 101068.0, 54841.0, 30738.0, 18364.0, 10899.0, 6698.0, 4113.0, 2701.0, 1721.0, 1091.0, 742.0, 453.0, 308.0, 264.0, 150.0, 113.0, 63.0, 44.0, 28.0, 22.0, 17.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0], "bins": [-6.46875, -6.2752685546875, -6.081787109375, -5.8883056640625, -5.69482421875, -5.5013427734375, -5.307861328125, -5.1143798828125, -4.9208984375, -4.7274169921875, -4.533935546875, -4.3404541015625, -4.14697265625, -3.9534912109375, -3.760009765625, -3.5665283203125, -3.373046875, -3.1795654296875, -2.986083984375, -2.7926025390625, -2.59912109375, -2.4056396484375, -2.212158203125, -2.0186767578125, -1.8251953125, -1.6317138671875, -1.438232421875, -1.2447509765625, -1.05126953125, -0.8577880859375, -0.664306640625, -0.4708251953125, -0.27734375, -0.0838623046875, 0.109619140625, 0.3031005859375, 0.49658203125, 0.6900634765625, 0.883544921875, 1.0770263671875, 1.2705078125, 1.4639892578125, 1.657470703125, 1.8509521484375, 2.04443359375, 2.2379150390625, 2.431396484375, 2.6248779296875, 2.818359375, 3.0118408203125, 3.205322265625, 3.3988037109375, 3.59228515625, 3.7857666015625, 3.979248046875, 4.1727294921875, 4.3662109375, 4.5596923828125, 4.753173828125, 4.9466552734375, 5.14013671875, 5.3336181640625, 5.527099609375, 5.7205810546875, 5.9140625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 9.0, 3.0, 14.0, 12.0, 16.0, 15.0, 18.0, 20.0, 24.0, 25.0, 29.0, 28.0, 24.0, 36.0, 42.0, 39.0, 31.0, 47.0, 47.0, 46.0, 43.0, 41.0, 43.0, 40.0, 36.0, 39.0, 30.0, 23.0, 28.0, 19.0, 25.0, 21.0, 9.0, 11.0, 19.0, 11.0, 4.0, 5.0, 7.0, 4.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.99609375, -3.88427734375, -3.7724609375, -3.66064453125, -3.548828125, -3.43701171875, -3.3251953125, -3.21337890625, -3.1015625, -2.98974609375, -2.8779296875, -2.76611328125, -2.654296875, -2.54248046875, -2.4306640625, -2.31884765625, -2.20703125, -2.09521484375, -1.9833984375, -1.87158203125, -1.759765625, -1.64794921875, -1.5361328125, -1.42431640625, -1.3125, -1.20068359375, -1.0888671875, -0.97705078125, -0.865234375, -0.75341796875, -0.6416015625, -0.52978515625, -0.41796875, -0.30615234375, -0.1943359375, -0.08251953125, 0.029296875, 0.14111328125, 0.2529296875, 0.36474609375, 0.4765625, 0.58837890625, 0.7001953125, 0.81201171875, 0.923828125, 1.03564453125, 1.1474609375, 1.25927734375, 1.37109375, 1.48291015625, 1.5947265625, 1.70654296875, 1.818359375, 1.93017578125, 2.0419921875, 2.15380859375, 2.265625, 2.37744140625, 2.4892578125, 2.60107421875, 2.712890625, 2.82470703125, 2.9365234375, 3.04833984375, 3.16015625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 12.0, 15.0, 13.0, 25.0, 28.0, 50.0, 73.0, 115.0, 164.0, 228.0, 363.0, 556.0, 834.0, 1284.0, 2089.0, 3413.0, 5844.0, 9992.0, 17945.0, 33616.0, 64398.0, 132007.0, 282463.0, 608761.0, 1078765.0, 978982.0, 506131.0, 234500.0, 110668.0, 54696.0, 28570.0, 15682.0, 8684.0, 5143.0, 3079.0, 1853.0, 1116.0, 734.0, 477.0, 316.0, 203.0, 126.0, 98.0, 55.0, 40.0, 21.0, 15.0, 15.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.1484375, -8.8614501953125, -8.574462890625, -8.2874755859375, -8.00048828125, -7.7135009765625, -7.426513671875, -7.1395263671875, -6.8525390625, -6.5655517578125, -6.278564453125, -5.9915771484375, -5.70458984375, -5.4176025390625, -5.130615234375, -4.8436279296875, -4.556640625, -4.2696533203125, -3.982666015625, -3.6956787109375, -3.40869140625, -3.1217041015625, -2.834716796875, -2.5477294921875, -2.2607421875, -1.9737548828125, -1.686767578125, -1.3997802734375, -1.11279296875, -0.8258056640625, -0.538818359375, -0.2518310546875, 0.03515625, 0.3221435546875, 0.609130859375, 0.8961181640625, 1.18310546875, 1.4700927734375, 1.757080078125, 2.0440673828125, 2.3310546875, 2.6180419921875, 2.905029296875, 3.1920166015625, 3.47900390625, 3.7659912109375, 4.052978515625, 4.3399658203125, 4.626953125, 4.9139404296875, 5.200927734375, 5.4879150390625, 5.77490234375, 6.0618896484375, 6.348876953125, 6.6358642578125, 6.9228515625, 7.2098388671875, 7.496826171875, 7.7838134765625, 8.07080078125, 8.3577880859375, 8.644775390625, 8.9317626953125, 9.21875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 3.0, 9.0, 18.0, 17.0, 33.0, 34.0, 46.0, 44.0, 86.0, 86.0, 131.0, 192.0, 209.0, 238.0, 302.0, 355.0, 340.0, 308.0, 303.0, 266.0, 218.0, 199.0, 152.0, 111.0, 103.0, 70.0, 37.0, 40.0, 30.0, 21.0, 22.0, 13.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.422119140625, -2.33447265625, -2.246826171875, -2.1591796875, -2.071533203125, -1.98388671875, -1.896240234375, -1.80859375, -1.720947265625, -1.63330078125, -1.545654296875, -1.4580078125, -1.370361328125, -1.28271484375, -1.195068359375, -1.107421875, -1.019775390625, -0.93212890625, -0.844482421875, -0.7568359375, -0.669189453125, -0.58154296875, -0.493896484375, -0.40625, -0.318603515625, -0.23095703125, -0.143310546875, -0.0556640625, 0.031982421875, 0.11962890625, 0.207275390625, 0.294921875, 0.382568359375, 0.47021484375, 0.557861328125, 0.6455078125, 0.733154296875, 0.82080078125, 0.908447265625, 0.99609375, 1.083740234375, 1.17138671875, 1.259033203125, 1.3466796875, 1.434326171875, 1.52197265625, 1.609619140625, 1.697265625, 1.784912109375, 1.87255859375, 1.960205078125, 2.0478515625, 2.135498046875, 2.22314453125, 2.310791015625, 2.3984375, 2.486083984375, 2.57373046875, 2.661376953125, 2.7490234375, 2.836669921875, 2.92431640625, 3.011962890625, 3.099609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 5.0, 7.0, 15.0, 12.0, 22.0, 25.0, 28.0, 36.0, 40.0, 39.0, 60.0, 45.0, 80.0, 60.0, 61.0, 62.0, 47.0, 54.0, 50.0, 54.0, 42.0, 31.0, 28.0, 20.0, 8.0, 15.0, 11.0, 10.0, 8.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.099714279174805, -9.812762260437012, -9.525810241699219, -9.238858222961426, -8.951906204223633, -8.66495418548584, -8.378002166748047, -8.091050148010254, -7.804098129272461, -7.517146110534668, -7.230194091796875, -6.943242073059082, -6.656290054321289, -6.369338035583496, -6.082386016845703, -5.79543399810791, -5.508482456207275, -5.221530437469482, -4.9345784187316895, -4.6476263999938965, -4.3606743812561035, -4.0737223625183105, -3.7867705821990967, -3.4998185634613037, -3.2128665447235107, -2.9259145259857178, -2.638962507247925, -2.352010726928711, -2.065058708190918, -1.7781065702438354, -1.491154670715332, -1.204202651977539, -0.9172506332397461, -0.6302986145019531, -0.34334665536880493, -0.05639469623565674, 0.23055732250213623, 0.5175093412399292, 0.8044612407684326, 1.0914132595062256, 1.3783652782440186, 1.6653172969818115, 1.9522693157196045, 2.2392210960388184, 2.5261731147766113, 2.8131251335144043, 3.1000771522521973, 3.3870291709899902, 3.673981189727783, 3.960933208465576, 4.247885227203369, 4.534837245941162, 4.821789264678955, 5.108741283416748, 5.395692825317383, 5.682644844055176, 5.969596862792969, 6.256548881530762, 6.543500900268555, 6.830452919006348, 7.117404937744141, 7.404356956481934, 7.691308975219727, 7.9782609939575195, 8.265213012695312]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 9.0, 3.0, 5.0, 7.0, 3.0, 6.0, 5.0, 15.0, 10.0, 9.0, 14.0, 20.0, 12.0, 30.0, 29.0, 28.0, 25.0, 32.0, 38.0, 38.0, 36.0, 33.0, 48.0, 46.0, 42.0, 34.0, 44.0, 36.0, 33.0, 32.0, 24.0, 26.0, 29.0, 18.0, 25.0, 24.0, 17.0, 22.0, 13.0, 15.0, 13.0, 10.0, 8.0, 9.0, 8.0, 6.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.151684284210205, -4.021500587463379, -3.891317367553711, -3.761133909225464, -3.630950450897217, -3.5007667541503906, -3.3705832958221436, -3.2403998374938965, -3.1102163791656494, -2.9800329208374023, -2.8498494625091553, -2.719666004180908, -2.589482307434082, -2.459299087524414, -2.329115390777588, -2.198931932449341, -2.0687484741210938, -1.9385650157928467, -1.8083815574645996, -1.678197979927063, -1.548014521598816, -1.4178310632705688, -1.2876474857330322, -1.1574640274047852, -1.027280569076538, -0.897097110748291, -0.7669135928153992, -0.6367300748825073, -0.5065466165542603, -0.3763631582260132, -0.24617964029312134, -0.11599612236022949, 0.014186859130859375, 0.14437034726142883, 0.2745538353919983, 0.40473732352256775, 0.5349208116531372, 0.6651042699813843, 0.7952877879142761, 0.925471305847168, 1.055654764175415, 1.185838222503662, 1.3160216808319092, 1.4462052583694458, 1.5763887166976929, 1.70657217502594, 1.8367557525634766, 1.9669392108917236, 2.0971226692199707, 2.2273061275482178, 2.357489585876465, 2.487673044204712, 2.617856502532959, 2.748040199279785, 2.8782236576080322, 3.0084071159362793, 3.1385905742645264, 3.2687740325927734, 3.3989574909210205, 3.5291409492492676, 3.6593246459960938, 3.7895078659057617, 3.919691562652588, 4.049875259399414, 4.180058479309082]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 6.0, 2.0, 10.0, 6.0, 19.0, 26.0, 42.0, 44.0, 62.0, 108.0, 158.0, 213.0, 268.0, 441.0, 581.0, 846.0, 1275.0, 1816.0, 2732.0, 4201.0, 6381.0, 10235.0, 15982.0, 25995.0, 42906.0, 70851.0, 114449.0, 163230.0, 181465.0, 147856.0, 98468.0, 60346.0, 36313.0, 22060.0, 13696.0, 8754.0, 5533.0, 3530.0, 2448.0, 1635.0, 1135.0, 728.0, 539.0, 356.0, 227.0, 149.0, 124.0, 106.0, 60.0, 47.0, 39.0, 27.0, 11.0, 14.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.5869140625, -0.5681838989257812, -0.5494537353515625, -0.5307235717773438, -0.511993408203125, -0.49326324462890625, -0.4745330810546875, -0.45580291748046875, -0.43707275390625, -0.41834259033203125, -0.3996124267578125, -0.38088226318359375, -0.362152099609375, -0.34342193603515625, -0.3246917724609375, -0.30596160888671875, -0.2872314453125, -0.26850128173828125, -0.2497711181640625, -0.23104095458984375, -0.212310791015625, -0.19358062744140625, -0.1748504638671875, -0.15612030029296875, -0.13739013671875, -0.11865997314453125, -0.0999298095703125, -0.08119964599609375, -0.062469482421875, -0.04373931884765625, -0.0250091552734375, -0.00627899169921875, 0.012451171875, 0.03118133544921875, 0.0499114990234375, 0.06864166259765625, 0.087371826171875, 0.10610198974609375, 0.1248321533203125, 0.14356231689453125, 0.16229248046875, 0.18102264404296875, 0.1997528076171875, 0.21848297119140625, 0.237213134765625, 0.25594329833984375, 0.2746734619140625, 0.29340362548828125, 0.3121337890625, 0.33086395263671875, 0.3495941162109375, 0.36832427978515625, 0.387054443359375, 0.40578460693359375, 0.4245147705078125, 0.44324493408203125, 0.46197509765625, 0.48070526123046875, 0.4994354248046875, 0.5181655883789062, 0.536895751953125, 0.5556259155273438, 0.5743560791015625, 0.5930862426757812, 0.61181640625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 7.0, 5.0, 7.0, 4.0, 8.0, 9.0, 8.0, 11.0, 15.0, 19.0, 17.0, 26.0, 33.0, 24.0, 32.0, 32.0, 31.0, 42.0, 52.0, 37.0, 38.0, 40.0, 40.0, 31.0, 36.0, 33.0, 51.0, 33.0, 28.0, 29.0, 29.0, 25.0, 25.0, 19.0, 15.0, 18.0, 10.0, 15.0, 8.0, 6.0, 8.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.7890625, -4.63934326171875, -4.4896240234375, -4.33990478515625, -4.190185546875, -4.04046630859375, -3.8907470703125, -3.74102783203125, -3.59130859375, -3.44158935546875, -3.2918701171875, -3.14215087890625, -2.992431640625, -2.84271240234375, -2.6929931640625, -2.54327392578125, -2.3935546875, -2.24383544921875, -2.0941162109375, -1.94439697265625, -1.794677734375, -1.64495849609375, -1.4952392578125, -1.34552001953125, -1.19580078125, -1.04608154296875, -0.8963623046875, -0.74664306640625, -0.596923828125, -0.44720458984375, -0.2974853515625, -0.14776611328125, 0.001953125, 0.15167236328125, 0.3013916015625, 0.45111083984375, 0.600830078125, 0.75054931640625, 0.9002685546875, 1.04998779296875, 1.19970703125, 1.34942626953125, 1.4991455078125, 1.64886474609375, 1.798583984375, 1.94830322265625, 2.0980224609375, 2.24774169921875, 2.3974609375, 2.54718017578125, 2.6968994140625, 2.84661865234375, 2.996337890625, 3.14605712890625, 3.2957763671875, 3.44549560546875, 3.59521484375, 3.74493408203125, 3.8946533203125, 4.04437255859375, 4.194091796875, 4.34381103515625, 4.4935302734375, 4.64324951171875, 4.79296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 7.0, 8.0, 18.0, 22.0, 11.0, 36.0, 46.0, 55.0, 98.0, 138.0, 160.0, 268.0, 396.0, 651.0, 998.0, 1736.0, 2881.0, 5357.0, 10900.0, 25517.0, 179614.0, 750312.0, 38827.0, 14608.0, 6812.0, 3675.0, 2056.0, 1149.0, 777.0, 422.0, 300.0, 204.0, 151.0, 99.0, 79.0, 49.0, 36.0, 26.0, 11.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.037109375, -1.97381591796875, -1.9105224609375, -1.84722900390625, -1.783935546875, -1.72064208984375, -1.6573486328125, -1.59405517578125, -1.53076171875, -1.46746826171875, -1.4041748046875, -1.34088134765625, -1.277587890625, -1.21429443359375, -1.1510009765625, -1.08770751953125, -1.0244140625, -0.96112060546875, -0.8978271484375, -0.83453369140625, -0.771240234375, -0.70794677734375, -0.6446533203125, -0.58135986328125, -0.51806640625, -0.45477294921875, -0.3914794921875, -0.32818603515625, -0.264892578125, -0.20159912109375, -0.1383056640625, -0.07501220703125, -0.01171875, 0.05157470703125, 0.1148681640625, 0.17816162109375, 0.241455078125, 0.30474853515625, 0.3680419921875, 0.43133544921875, 0.49462890625, 0.55792236328125, 0.6212158203125, 0.68450927734375, 0.747802734375, 0.81109619140625, 0.8743896484375, 0.93768310546875, 1.0009765625, 1.06427001953125, 1.1275634765625, 1.19085693359375, 1.254150390625, 1.31744384765625, 1.3807373046875, 1.44403076171875, 1.50732421875, 1.57061767578125, 1.6339111328125, 1.69720458984375, 1.760498046875, 1.82379150390625, 1.8870849609375, 1.95037841796875, 2.013671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 4.0, 11.0, 5.0, 11.0, 10.0, 14.0, 16.0, 22.0, 30.0, 23.0, 26.0, 28.0, 29.0, 48.0, 33.0, 39.0, 40.0, 52.0, 43.0, 41.0, 48.0, 38.0, 38.0, 47.0, 37.0, 40.0, 35.0, 23.0, 30.0, 29.0, 23.0, 18.0, 19.0, 10.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3984375, -3.2872314453125, -3.176025390625, -3.0648193359375, -2.95361328125, -2.8424072265625, -2.731201171875, -2.6199951171875, -2.5087890625, -2.3975830078125, -2.286376953125, -2.1751708984375, -2.06396484375, -1.9527587890625, -1.841552734375, -1.7303466796875, -1.619140625, -1.5079345703125, -1.396728515625, -1.2855224609375, -1.17431640625, -1.0631103515625, -0.951904296875, -0.8406982421875, -0.7294921875, -0.6182861328125, -0.507080078125, -0.3958740234375, -0.28466796875, -0.1734619140625, -0.062255859375, 0.0489501953125, 0.16015625, 0.2713623046875, 0.382568359375, 0.4937744140625, 0.60498046875, 0.7161865234375, 0.827392578125, 0.9385986328125, 1.0498046875, 1.1610107421875, 1.272216796875, 1.3834228515625, 1.49462890625, 1.6058349609375, 1.717041015625, 1.8282470703125, 1.939453125, 2.0506591796875, 2.161865234375, 2.2730712890625, 2.38427734375, 2.4954833984375, 2.606689453125, 2.7178955078125, 2.8291015625, 2.9403076171875, 3.051513671875, 3.1627197265625, 3.27392578125, 3.3851318359375, 3.496337890625, 3.6075439453125, 3.71875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 10.0, 10.0, 15.0, 14.0, 25.0, 41.0, 49.0, 67.0, 93.0, 146.0, 225.0, 313.0, 469.0, 794.0, 1199.0, 1960.0, 3468.0, 6175.0, 11469.0, 24630.0, 238272.0, 702039.0, 28225.0, 12712.0, 6578.0, 3704.0, 2114.0, 1348.0, 783.0, 500.0, 315.0, 238.0, 161.0, 112.0, 81.0, 55.0, 32.0, 37.0, 19.0, 10.0, 9.0, 7.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4335823059082031, -0.41916656494140625, -0.4047508239746094, -0.3903350830078125, -0.3759193420410156, -0.36150360107421875, -0.3470878601074219, -0.332672119140625, -0.3182563781738281, -0.30384063720703125, -0.2894248962402344, -0.2750091552734375, -0.2605934143066406, -0.24617767333984375, -0.23176193237304688, -0.21734619140625, -0.20293045043945312, -0.18851470947265625, -0.17409896850585938, -0.1596832275390625, -0.14526748657226562, -0.13085174560546875, -0.11643600463867188, -0.102020263671875, -0.08760452270507812, -0.07318878173828125, -0.058773040771484375, -0.0443572998046875, -0.029941558837890625, -0.01552581787109375, -0.001110076904296875, 0.0133056640625, 0.027721405029296875, 0.04213714599609375, 0.056552886962890625, 0.0709686279296875, 0.08538436889648438, 0.09980010986328125, 0.11421585083007812, 0.128631591796875, 0.14304733276367188, 0.15746307373046875, 0.17187881469726562, 0.1862945556640625, 0.20071029663085938, 0.21512603759765625, 0.22954177856445312, 0.24395751953125, 0.2583732604980469, 0.27278900146484375, 0.2872047424316406, 0.3016204833984375, 0.3160362243652344, 0.33045196533203125, 0.3448677062988281, 0.359283447265625, 0.3736991882324219, 0.38811492919921875, 0.4025306701660156, 0.4169464111328125, 0.4313621520996094, 0.44577789306640625, 0.4601936340332031, 0.474609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 12.0, 12.0, 12.0, 25.0, 20.0, 22.0, 22.0, 30.0, 19.0, 21.0, 34.0, 22.0, 37.0, 34.0, 41.0, 50.0, 61.0, 35.0, 41.0, 34.0, 33.0, 34.0, 46.0, 23.0, 36.0, 33.0, 28.0, 22.0, 19.0, 17.0, 13.0, 17.0, 15.0, 8.0, 8.0, 4.0, 9.0, 9.0, 6.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6987323760986328e-05, -1.6470439732074738e-05, -1.5953555703163147e-05, -1.5436671674251556e-05, -1.4919787645339966e-05, -1.4402903616428375e-05, -1.3886019587516785e-05, -1.3369135558605194e-05, -1.2852251529693604e-05, -1.2335367500782013e-05, -1.1818483471870422e-05, -1.1301599442958832e-05, -1.0784715414047241e-05, -1.026783138513565e-05, -9.75094735622406e-06, -9.23406332731247e-06, -8.717179298400879e-06, -8.200295269489288e-06, -7.683411240577698e-06, -7.166527211666107e-06, -6.649643182754517e-06, -6.132759153842926e-06, -5.6158751249313354e-06, -5.098991096019745e-06, -4.582107067108154e-06, -4.065223038196564e-06, -3.548339009284973e-06, -3.0314549803733826e-06, -2.514570951461792e-06, -1.9976869225502014e-06, -1.4808028936386108e-06, -9.639188647270203e-07, -4.470348358154297e-07, 6.984919309616089e-08, 5.867332220077515e-07, 1.103617250919342e-06, 1.6205012798309326e-06, 2.137385308742523e-06, 2.6542693376541138e-06, 3.1711533665657043e-06, 3.688037395477295e-06, 4.2049214243888855e-06, 4.721805453300476e-06, 5.238689482212067e-06, 5.755573511123657e-06, 6.272457540035248e-06, 6.789341568946838e-06, 7.306225597858429e-06, 7.82310962677002e-06, 8.33999365568161e-06, 8.8568776845932e-06, 9.373761713504791e-06, 9.890645742416382e-06, 1.0407529771327972e-05, 1.0924413800239563e-05, 1.1441297829151154e-05, 1.1958181858062744e-05, 1.2475065886974335e-05, 1.2991949915885925e-05, 1.3508833944797516e-05, 1.4025717973709106e-05, 1.4542602002620697e-05, 1.5059486031532288e-05, 1.5576370060443878e-05, 1.609325408935547e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 17.0, 12.0, 18.0, 24.0, 32.0, 39.0, 75.0, 93.0, 114.0, 196.0, 232.0, 383.0, 574.0, 990.0, 1698.0, 3086.0, 6042.0, 12936.0, 29452.0, 73571.0, 184243.0, 330250.0, 235627.0, 97502.0, 38291.0, 16435.0, 7595.0, 3792.0, 2024.0, 1065.0, 697.0, 435.0, 289.0, 200.0, 136.0, 111.0, 79.0, 54.0, 34.0, 26.0, 24.0, 17.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.2635078430175781, -0.25431060791015625, -0.24511337280273438, -0.2359161376953125, -0.22671890258789062, -0.21752166748046875, -0.20832443237304688, -0.199127197265625, -0.18992996215820312, -0.18073272705078125, -0.17153549194335938, -0.1623382568359375, -0.15314102172851562, -0.14394378662109375, -0.13474655151367188, -0.12554931640625, -0.11635208129882812, -0.10715484619140625, -0.09795761108398438, -0.0887603759765625, -0.07956314086914062, -0.07036590576171875, -0.061168670654296875, -0.051971435546875, -0.042774200439453125, -0.03357696533203125, -0.024379730224609375, -0.0151824951171875, -0.005985260009765625, 0.00321197509765625, 0.012409210205078125, 0.0216064453125, 0.030803680419921875, 0.04000091552734375, 0.049198150634765625, 0.0583953857421875, 0.06759262084960938, 0.07678985595703125, 0.08598709106445312, 0.095184326171875, 0.10438156127929688, 0.11357879638671875, 0.12277603149414062, 0.1319732666015625, 0.14117050170898438, 0.15036773681640625, 0.15956497192382812, 0.16876220703125, 0.17795944213867188, 0.18715667724609375, 0.19635391235351562, 0.2055511474609375, 0.21474838256835938, 0.22394561767578125, 0.23314285278320312, 0.242340087890625, 0.2515373229980469, 0.26073455810546875, 0.2699317932128906, 0.2791290283203125, 0.2883262634277344, 0.29752349853515625, 0.3067207336425781, 0.31591796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 8.0, 5.0, 13.0, 20.0, 22.0, 26.0, 54.0, 67.0, 99.0, 106.0, 115.0, 124.0, 94.0, 83.0, 46.0, 47.0, 25.0, 15.0, 13.0, 2.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061859130859375, -0.05942106246948242, -0.056982994079589844, -0.054544925689697266, -0.05210685729980469, -0.04966878890991211, -0.04723072052001953, -0.04479265213012695, -0.042354583740234375, -0.0399165153503418, -0.03747844696044922, -0.03504037857055664, -0.03260231018066406, -0.030164241790771484, -0.027726173400878906, -0.025288105010986328, -0.02285003662109375, -0.020411968231201172, -0.017973899841308594, -0.015535831451416016, -0.013097763061523438, -0.01065969467163086, -0.008221626281738281, -0.005783557891845703, -0.003345489501953125, -0.0009074211120605469, 0.0015306472778320312, 0.003968715667724609, 0.0064067840576171875, 0.008844852447509766, 0.011282920837402344, 0.013720989227294922, 0.0161590576171875, 0.018597126007080078, 0.021035194396972656, 0.023473262786865234, 0.025911331176757812, 0.02834939956665039, 0.03078746795654297, 0.03322553634643555, 0.035663604736328125, 0.0381016731262207, 0.04053974151611328, 0.04297780990600586, 0.04541587829589844, 0.047853946685791016, 0.050292015075683594, 0.05273008346557617, 0.05516815185546875, 0.05760622024536133, 0.060044288635253906, 0.062482357025146484, 0.06492042541503906, 0.06735849380493164, 0.06979656219482422, 0.0722346305847168, 0.07467269897460938, 0.07711076736450195, 0.07954883575439453, 0.08198690414428711, 0.08442497253417969, 0.08686304092407227, 0.08930110931396484, 0.09173917770385742, 0.09417724609375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 6.0, 10.0, 16.0, 14.0, 31.0, 28.0, 31.0, 41.0, 35.0, 56.0, 46.0, 87.0, 55.0, 64.0, 63.0, 51.0, 46.0, 61.0, 46.0, 53.0, 28.0, 31.0, 17.0, 11.0, 12.0, 11.0, 10.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.182402610778809, -9.894397735595703, -9.606393814086914, -9.318388938903809, -9.030384063720703, -8.742380142211914, -8.454375267028809, -8.166370391845703, -7.878365993499756, -7.590361595153809, -7.302356719970703, -7.014352321624756, -6.726347923278809, -6.438343048095703, -6.150338649749756, -5.862334251403809, -5.574329376220703, -5.286324977874756, -4.99832010269165, -4.710315704345703, -4.422310829162598, -4.13430643081665, -3.846302032470703, -3.5582973957061768, -3.2702927589416504, -2.982288122177124, -2.6942834854125977, -2.4062790870666504, -2.118274450302124, -1.8302698135375977, -1.5422652959823608, -1.254260778427124, -0.9662561416625977, -0.6782515645027161, -0.3902469873428345, -0.10224241018295288, 0.1857621669769287, 0.4737668037414551, 0.7617713212966919, 1.0497758388519287, 1.337780475616455, 1.6257851123809814, 1.9137896299362183, 2.201794147491455, 2.4897987842559814, 2.777803421020508, 3.065807819366455, 3.3538124561309814, 3.641817092895508, 3.929821729660034, 4.2178263664245605, 4.505830764770508, 4.793835639953613, 5.0818400382995605, 5.369844436645508, 5.657849311828613, 5.9458537101745605, 6.233858108520508, 6.521862983703613, 6.8098673820495605, 7.097871780395508, 7.385876655578613, 7.6738810539245605, 7.961885452270508, 8.249890327453613]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 2.0, 9.0, 3.0, 4.0, 8.0, 3.0, 6.0, 6.0, 16.0, 10.0, 10.0, 11.0, 20.0, 16.0, 29.0, 33.0, 25.0, 24.0, 36.0, 34.0, 38.0, 39.0, 34.0, 46.0, 45.0, 43.0, 34.0, 44.0, 34.0, 33.0, 33.0, 22.0, 28.0, 26.0, 19.0, 28.0, 21.0, 17.0, 21.0, 12.0, 13.0, 15.0, 9.0, 10.0, 12.0, 6.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.1361870765686035, -4.00673770904541, -3.877288818359375, -3.7478396892547607, -3.6183905601501465, -3.488941192626953, -3.359492063522339, -3.2300429344177246, -3.1005938053131104, -2.971144676208496, -2.841695547103882, -2.7122464179992676, -2.582797050476074, -2.453348159790039, -2.3238987922668457, -2.1944496631622314, -2.065000534057617, -1.935551404953003, -1.8061022758483887, -1.6766530275344849, -1.5472038984298706, -1.4177547693252563, -1.2883055210113525, -1.1588563919067383, -1.029407262802124, -0.8999581336975098, -0.7705089449882507, -0.6410597562789917, -0.5116106271743774, -0.3821614980697632, -0.25271230936050415, -0.12326312065124512, 0.006186008453369141, 0.1356351673603058, 0.26508432626724243, 0.3945334851741791, 0.5239826440811157, 0.65343177318573, 0.782880961894989, 0.912330150604248, 1.0417792797088623, 1.1712284088134766, 1.3006775379180908, 1.4301267862319946, 1.5595759153366089, 1.6890250444412231, 1.818474292755127, 1.9479234218597412, 2.0773725509643555, 2.2068216800689697, 2.336270809173584, 2.4657199382781982, 2.5951690673828125, 2.724618434906006, 2.85406756401062, 2.9835166931152344, 3.1129658222198486, 3.242414951324463, 3.371864080429077, 3.5013132095336914, 3.6307625770568848, 3.76021146774292, 3.8896608352661133, 4.019109725952148, 4.148559093475342]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 19.0, 25.0, 33.0, 42.0, 64.0, 57.0, 114.0, 175.0, 268.0, 406.0, 712.0, 1014.0, 1707.0, 2667.0, 4659.0, 7978.0, 13929.0, 25387.0, 45505.0, 79442.0, 127644.0, 174814.0, 185014.0, 148215.0, 96972.0, 57415.0, 32039.0, 17849.0, 9801.0, 5817.0, 3311.0, 2002.0, 1195.0, 729.0, 492.0, 352.0, 215.0, 133.0, 89.0, 85.0, 52.0, 30.0, 19.0, 20.0, 8.0, 12.0, 5.0, 9.0, 3.0, 1.0, 2.0, 0.0, 4.0], "bins": [-7.02734375, -6.815673828125, -6.60400390625, -6.392333984375, -6.1806640625, -5.968994140625, -5.75732421875, -5.545654296875, -5.333984375, -5.122314453125, -4.91064453125, -4.698974609375, -4.4873046875, -4.275634765625, -4.06396484375, -3.852294921875, -3.640625, -3.428955078125, -3.21728515625, -3.005615234375, -2.7939453125, -2.582275390625, -2.37060546875, -2.158935546875, -1.947265625, -1.735595703125, -1.52392578125, -1.312255859375, -1.1005859375, -0.888916015625, -0.67724609375, -0.465576171875, -0.25390625, -0.042236328125, 0.16943359375, 0.381103515625, 0.5927734375, 0.804443359375, 1.01611328125, 1.227783203125, 1.439453125, 1.651123046875, 1.86279296875, 2.074462890625, 2.2861328125, 2.497802734375, 2.70947265625, 2.921142578125, 3.1328125, 3.344482421875, 3.55615234375, 3.767822265625, 3.9794921875, 4.191162109375, 4.40283203125, 4.614501953125, 4.826171875, 5.037841796875, 5.24951171875, 5.461181640625, 5.6728515625, 5.884521484375, 6.09619140625, 6.307861328125, 6.51953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 9.0, 15.0, 7.0, 9.0, 11.0, 12.0, 18.0, 11.0, 13.0, 22.0, 26.0, 29.0, 20.0, 42.0, 35.0, 29.0, 33.0, 40.0, 36.0, 41.0, 48.0, 41.0, 47.0, 33.0, 40.0, 32.0, 30.0, 32.0, 27.0, 35.0, 35.0, 22.0, 22.0, 18.0, 13.0, 11.0, 7.0, 8.0, 12.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75390625, -4.598388671875, -4.44287109375, -4.287353515625, -4.1318359375, -3.976318359375, -3.82080078125, -3.665283203125, -3.509765625, -3.354248046875, -3.19873046875, -3.043212890625, -2.8876953125, -2.732177734375, -2.57666015625, -2.421142578125, -2.265625, -2.110107421875, -1.95458984375, -1.799072265625, -1.6435546875, -1.488037109375, -1.33251953125, -1.177001953125, -1.021484375, -0.865966796875, -0.71044921875, -0.554931640625, -0.3994140625, -0.243896484375, -0.08837890625, 0.067138671875, 0.22265625, 0.378173828125, 0.53369140625, 0.689208984375, 0.8447265625, 1.000244140625, 1.15576171875, 1.311279296875, 1.466796875, 1.622314453125, 1.77783203125, 1.933349609375, 2.0888671875, 2.244384765625, 2.39990234375, 2.555419921875, 2.7109375, 2.866455078125, 3.02197265625, 3.177490234375, 3.3330078125, 3.488525390625, 3.64404296875, 3.799560546875, 3.955078125, 4.110595703125, 4.26611328125, 4.421630859375, 4.5771484375, 4.732666015625, 4.88818359375, 5.043701171875, 5.19921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 3.0, 12.0, 12.0, 26.0, 38.0, 41.0, 83.0, 117.0, 166.0, 240.0, 440.0, 670.0, 1071.0, 1735.0, 2806.0, 4538.0, 7433.0, 12606.0, 20684.0, 35068.0, 58236.0, 92629.0, 135269.0, 166747.0, 163167.0, 127013.0, 84877.0, 53045.0, 31620.0, 19023.0, 11494.0, 6874.0, 4020.0, 2524.0, 1553.0, 985.0, 605.0, 355.0, 255.0, 145.0, 113.0, 64.0, 54.0, 38.0, 18.0, 14.0, 8.0, 2.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.16796875, -5.9683837890625, -5.768798828125, -5.5692138671875, -5.36962890625, -5.1700439453125, -4.970458984375, -4.7708740234375, -4.5712890625, -4.3717041015625, -4.172119140625, -3.9725341796875, -3.77294921875, -3.5733642578125, -3.373779296875, -3.1741943359375, -2.974609375, -2.7750244140625, -2.575439453125, -2.3758544921875, -2.17626953125, -1.9766845703125, -1.777099609375, -1.5775146484375, -1.3779296875, -1.1783447265625, -0.978759765625, -0.7791748046875, -0.57958984375, -0.3800048828125, -0.180419921875, 0.0191650390625, 0.21875, 0.4183349609375, 0.617919921875, 0.8175048828125, 1.01708984375, 1.2166748046875, 1.416259765625, 1.6158447265625, 1.8154296875, 2.0150146484375, 2.214599609375, 2.4141845703125, 2.61376953125, 2.8133544921875, 3.012939453125, 3.2125244140625, 3.412109375, 3.6116943359375, 3.811279296875, 4.0108642578125, 4.21044921875, 4.4100341796875, 4.609619140625, 4.8092041015625, 5.0087890625, 5.2083740234375, 5.407958984375, 5.6075439453125, 5.80712890625, 6.0067138671875, 6.206298828125, 6.4058837890625, 6.60546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 5.0, 10.0, 15.0, 14.0, 30.0, 19.0, 27.0, 27.0, 27.0, 31.0, 42.0, 33.0, 42.0, 38.0, 54.0, 32.0, 51.0, 54.0, 53.0, 45.0, 38.0, 37.0, 30.0, 36.0, 38.0, 29.0, 23.0, 31.0, 14.0, 11.0, 7.0, 10.0, 8.0, 5.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.105865478515625, -2.99688720703125, -2.887908935546875, -2.7789306640625, -2.669952392578125, -2.56097412109375, -2.451995849609375, -2.343017578125, -2.234039306640625, -2.12506103515625, -2.016082763671875, -1.9071044921875, -1.798126220703125, -1.68914794921875, -1.580169677734375, -1.47119140625, -1.362213134765625, -1.25323486328125, -1.144256591796875, -1.0352783203125, -0.926300048828125, -0.81732177734375, -0.708343505859375, -0.599365234375, -0.490386962890625, -0.38140869140625, -0.272430419921875, -0.1634521484375, -0.054473876953125, 0.05450439453125, 0.163482666015625, 0.2724609375, 0.381439208984375, 0.49041748046875, 0.599395751953125, 0.7083740234375, 0.817352294921875, 0.92633056640625, 1.035308837890625, 1.144287109375, 1.253265380859375, 1.36224365234375, 1.471221923828125, 1.5802001953125, 1.689178466796875, 1.79815673828125, 1.907135009765625, 2.01611328125, 2.125091552734375, 2.23406982421875, 2.343048095703125, 2.4520263671875, 2.561004638671875, 2.66998291015625, 2.778961181640625, 2.887939453125, 2.996917724609375, 3.10589599609375, 3.214874267578125, 3.3238525390625, 3.432830810546875, 3.54180908203125, 3.650787353515625, 3.759765625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 13.0, 17.0, 32.0, 26.0, 65.0, 83.0, 97.0, 175.0, 212.0, 340.0, 494.0, 752.0, 1098.0, 1646.0, 2646.0, 4428.0, 7786.0, 14356.0, 28377.0, 55497.0, 106157.0, 179049.0, 224345.0, 184406.0, 112044.0, 58383.0, 29914.0, 15389.0, 8034.0, 4672.0, 2737.0, 1777.0, 1129.0, 764.0, 514.0, 334.0, 250.0, 150.0, 131.0, 74.0, 51.0, 35.0, 29.0, 21.0, 11.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.57421875, -4.43365478515625, -4.2930908203125, -4.15252685546875, -4.011962890625, -3.87139892578125, -3.7308349609375, -3.59027099609375, -3.44970703125, -3.30914306640625, -3.1685791015625, -3.02801513671875, -2.887451171875, -2.74688720703125, -2.6063232421875, -2.46575927734375, -2.3251953125, -2.18463134765625, -2.0440673828125, -1.90350341796875, -1.762939453125, -1.62237548828125, -1.4818115234375, -1.34124755859375, -1.20068359375, -1.06011962890625, -0.9195556640625, -0.77899169921875, -0.638427734375, -0.49786376953125, -0.3572998046875, -0.21673583984375, -0.076171875, 0.06439208984375, 0.2049560546875, 0.34552001953125, 0.486083984375, 0.62664794921875, 0.7672119140625, 0.90777587890625, 1.04833984375, 1.18890380859375, 1.3294677734375, 1.47003173828125, 1.610595703125, 1.75115966796875, 1.8917236328125, 2.03228759765625, 2.1728515625, 2.31341552734375, 2.4539794921875, 2.59454345703125, 2.735107421875, 2.87567138671875, 3.0162353515625, 3.15679931640625, 3.29736328125, 3.43792724609375, 3.5784912109375, 3.71905517578125, 3.859619140625, 4.00018310546875, 4.1407470703125, 4.28131103515625, 4.421875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 14.0, 10.0, 14.0, 25.0, 25.0, 34.0, 47.0, 41.0, 40.0, 58.0, 71.0, 83.0, 83.0, 74.0, 69.0, 40.0, 49.0, 43.0, 39.0, 24.0, 24.0, 16.0, 11.0, 8.0, 11.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005197525024414062, -0.0005041398108005524, -0.0004885271191596985, -0.0004729144275188446, -0.0004573017358779907, -0.00044168904423713684, -0.00042607635259628296, -0.0004104636609554291, -0.0003948509693145752, -0.0003792382776737213, -0.00036362558603286743, -0.00034801289439201355, -0.00033240020275115967, -0.0003167875111103058, -0.0003011748194694519, -0.000285562127828598, -0.00026994943618774414, -0.00025433674454689026, -0.00023872405290603638, -0.0002231113612651825, -0.0002074986696243286, -0.00019188597798347473, -0.00017627328634262085, -0.00016066059470176697, -0.00014504790306091309, -0.0001294352114200592, -0.00011382251977920532, -9.820982813835144e-05, -8.259713649749756e-05, -6.698444485664368e-05, -5.1371753215789795e-05, -3.575906157493591e-05, -2.014636993408203e-05, -4.533678293228149e-06, 1.1079013347625732e-05, 2.6691704988479614e-05, 4.2304396629333496e-05, 5.791708827018738e-05, 7.352977991104126e-05, 8.914247155189514e-05, 0.00010475516319274902, 0.0001203678548336029, 0.0001359805464744568, 0.00015159323811531067, 0.00016720592975616455, 0.00018281862139701843, 0.00019843131303787231, 0.0002140440046787262, 0.00022965669631958008, 0.00024526938796043396, 0.00026088207960128784, 0.0002764947712421417, 0.0002921074628829956, 0.0003077201545238495, 0.00032333284616470337, 0.00033894553780555725, 0.00035455822944641113, 0.000370170921087265, 0.0003857836127281189, 0.0004013963043689728, 0.00041700899600982666, 0.00043262168765068054, 0.0004482343792915344, 0.0004638470709323883, 0.0004794597625732422]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 19.0, 27.0, 30.0, 49.0, 88.0, 107.0, 150.0, 247.0, 416.0, 715.0, 1137.0, 2080.0, 3430.0, 6237.0, 11128.0, 20595.0, 37928.0, 69040.0, 119976.0, 180420.0, 204659.0, 161519.0, 101581.0, 57202.0, 31049.0, 17123.0, 9342.0, 5015.0, 2944.0, 1638.0, 1028.0, 567.0, 374.0, 239.0, 159.0, 93.0, 54.0, 47.0, 40.0, 16.0, 5.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.46875, -4.334716796875, -4.20068359375, -4.066650390625, -3.9326171875, -3.798583984375, -3.66455078125, -3.530517578125, -3.396484375, -3.262451171875, -3.12841796875, -2.994384765625, -2.8603515625, -2.726318359375, -2.59228515625, -2.458251953125, -2.32421875, -2.190185546875, -2.05615234375, -1.922119140625, -1.7880859375, -1.654052734375, -1.52001953125, -1.385986328125, -1.251953125, -1.117919921875, -0.98388671875, -0.849853515625, -0.7158203125, -0.581787109375, -0.44775390625, -0.313720703125, -0.1796875, -0.045654296875, 0.08837890625, 0.222412109375, 0.3564453125, 0.490478515625, 0.62451171875, 0.758544921875, 0.892578125, 1.026611328125, 1.16064453125, 1.294677734375, 1.4287109375, 1.562744140625, 1.69677734375, 1.830810546875, 1.96484375, 2.098876953125, 2.23291015625, 2.366943359375, 2.5009765625, 2.635009765625, 2.76904296875, 2.903076171875, 3.037109375, 3.171142578125, 3.30517578125, 3.439208984375, 3.5732421875, 3.707275390625, 3.84130859375, 3.975341796875, 4.109375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 8.0, 10.0, 13.0, 9.0, 19.0, 26.0, 31.0, 29.0, 45.0, 33.0, 65.0, 71.0, 55.0, 76.0, 95.0, 71.0, 53.0, 52.0, 46.0, 45.0, 32.0, 31.0, 24.0, 20.0, 6.0, 9.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.442626953125, -1.39990234375, -1.357177734375, -1.314453125, -1.271728515625, -1.22900390625, -1.186279296875, -1.1435546875, -1.100830078125, -1.05810546875, -1.015380859375, -0.97265625, -0.929931640625, -0.88720703125, -0.844482421875, -0.8017578125, -0.759033203125, -0.71630859375, -0.673583984375, -0.630859375, -0.588134765625, -0.54541015625, -0.502685546875, -0.4599609375, -0.417236328125, -0.37451171875, -0.331787109375, -0.2890625, -0.246337890625, -0.20361328125, -0.160888671875, -0.1181640625, -0.075439453125, -0.03271484375, 0.010009765625, 0.052734375, 0.095458984375, 0.13818359375, 0.180908203125, 0.2236328125, 0.266357421875, 0.30908203125, 0.351806640625, 0.39453125, 0.437255859375, 0.47998046875, 0.522705078125, 0.5654296875, 0.608154296875, 0.65087890625, 0.693603515625, 0.736328125, 0.779052734375, 0.82177734375, 0.864501953125, 0.9072265625, 0.949951171875, 0.99267578125, 1.035400390625, 1.078125, 1.120849609375, 1.16357421875, 1.206298828125, 1.2490234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0, 2.0, 10.0, 6.0, 12.0, 15.0, 10.0, 28.0, 28.0, 28.0, 33.0, 43.0, 52.0, 60.0, 58.0, 68.0, 83.0, 56.0, 57.0, 41.0, 56.0, 46.0, 51.0, 30.0, 29.0, 21.0, 18.0, 18.0, 7.0, 10.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.874255180358887, -10.578197479248047, -10.282139778137207, -9.986083030700684, -9.690025329589844, -9.393967628479004, -9.097909927368164, -8.801852226257324, -8.505794525146484, -8.209736824035645, -7.913679599761963, -7.617621898651123, -7.321564674377441, -7.025506973266602, -6.729449272155762, -6.433391571044922, -6.137334823608398, -5.841277122497559, -5.545219898223877, -5.249162197113037, -4.9531049728393555, -4.657047271728516, -4.360989570617676, -4.064931869506836, -3.7688746452331543, -3.4728171825408936, -3.176759719848633, -2.880702018737793, -2.5846445560455322, -2.2885870933532715, -1.9925295114517212, -1.696471929550171, -1.4004154205322266, -1.1043579578399658, -0.8083003759384155, -0.51224285364151, -0.2161853313446045, 0.07987213134765625, 0.37592971324920654, 0.6719872951507568, 0.9680447578430176, 1.2641022205352783, 1.5601598024368286, 1.856217384338379, 2.1522748470306396, 2.4483323097229004, 2.7443900108337402, 3.040447473526001, 3.3365049362182617, 3.6325623989105225, 3.928619861602783, 4.224677562713623, 4.520734786987305, 4.8167924880981445, 5.112850189208984, 5.408907890319824, 5.704965114593506, 6.001022815704346, 6.297080039978027, 6.593137741088867, 6.889195442199707, 7.185252666473389, 7.4813103675842285, 7.77736759185791, 8.07342529296875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 2.0, 4.0, 7.0, 11.0, 6.0, 8.0, 10.0, 6.0, 18.0, 19.0, 25.0, 22.0, 22.0, 20.0, 34.0, 36.0, 31.0, 36.0, 39.0, 29.0, 36.0, 50.0, 34.0, 39.0, 37.0, 31.0, 38.0, 33.0, 27.0, 40.0, 25.0, 27.0, 27.0, 24.0, 16.0, 23.0, 19.0, 14.0, 13.0, 16.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.142911911010742, -4.009039402008057, -3.87516713142395, -3.7412946224212646, -3.607422351837158, -3.4735498428344727, -3.339677333831787, -3.2058050632476807, -3.071932792663574, -2.9380602836608887, -2.8041880130767822, -2.6703155040740967, -2.5364432334899902, -2.4025707244873047, -2.268698215484619, -2.1348259449005127, -2.000953435897827, -1.8670810461044312, -1.7332086563110352, -1.5993361473083496, -1.4654638767242432, -1.3315913677215576, -1.1977189779281616, -1.0638465881347656, -0.9299741983413696, -0.7961018085479736, -0.6622294187545776, -0.5283569693565369, -0.39448457956314087, -0.2606121897697449, -0.1267397403717041, 0.0071326494216918945, 0.1410050392150879, 0.2748774290084839, 0.40874984860420227, 0.5426222681999207, 0.6764946579933167, 0.8103670477867126, 0.9442394971847534, 1.0781118869781494, 1.2119842767715454, 1.3458566665649414, 1.4797290563583374, 1.6136014461517334, 1.747473955154419, 1.8813462257385254, 2.015218734741211, 2.1490912437438965, 2.282963514328003, 2.4168360233306885, 2.550708293914795, 2.6845808029174805, 2.818453073501587, 2.9523255825042725, 3.086197853088379, 3.2200703620910645, 3.35394287109375, 3.4878153800964355, 3.621687650680542, 3.7555601596832275, 3.889432430267334, 4.0233049392700195, 4.157177448272705, 4.291049957275391, 4.424921989440918]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 10.0, 5.0, 9.0, 16.0, 22.0, 32.0, 27.0, 62.0, 73.0, 86.0, 150.0, 204.0, 299.0, 450.0, 663.0, 979.0, 1325.0, 1994.0, 3184.0, 4951.0, 7593.0, 12099.0, 19811.0, 33513.0, 59410.0, 110323.0, 215070.0, 432020.0, 779920.0, 964544.0, 718553.0, 392933.0, 197792.0, 102662.0, 54736.0, 31188.0, 18141.0, 11046.0, 6529.0, 4201.0, 2636.0, 1789.0, 1159.0, 679.0, 480.0, 321.0, 215.0, 122.0, 106.0, 53.0, 36.0, 22.0, 14.0, 14.0, 8.0, 6.0, 6.0, 2.0, 2.0], "bins": [-8.328125, -8.086181640625, -7.84423828125, -7.602294921875, -7.3603515625, -7.118408203125, -6.87646484375, -6.634521484375, -6.392578125, -6.150634765625, -5.90869140625, -5.666748046875, -5.4248046875, -5.182861328125, -4.94091796875, -4.698974609375, -4.45703125, -4.215087890625, -3.97314453125, -3.731201171875, -3.4892578125, -3.247314453125, -3.00537109375, -2.763427734375, -2.521484375, -2.279541015625, -2.03759765625, -1.795654296875, -1.5537109375, -1.311767578125, -1.06982421875, -0.827880859375, -0.5859375, -0.343994140625, -0.10205078125, 0.139892578125, 0.3818359375, 0.623779296875, 0.86572265625, 1.107666015625, 1.349609375, 1.591552734375, 1.83349609375, 2.075439453125, 2.3173828125, 2.559326171875, 2.80126953125, 3.043212890625, 3.28515625, 3.527099609375, 3.76904296875, 4.010986328125, 4.2529296875, 4.494873046875, 4.73681640625, 4.978759765625, 5.220703125, 5.462646484375, 5.70458984375, 5.946533203125, 6.1884765625, 6.430419921875, 6.67236328125, 6.914306640625, 7.15625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 10.0, 6.0, 7.0, 8.0, 10.0, 21.0, 16.0, 16.0, 32.0, 22.0, 30.0, 27.0, 28.0, 32.0, 43.0, 36.0, 43.0, 33.0, 49.0, 41.0, 50.0, 42.0, 22.0, 41.0, 40.0, 31.0, 28.0, 36.0, 31.0, 10.0, 28.0, 19.0, 19.0, 17.0, 22.0, 10.0, 9.0, 6.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.7890625, -4.65057373046875, -4.5120849609375, -4.37359619140625, -4.235107421875, -4.09661865234375, -3.9581298828125, -3.81964111328125, -3.68115234375, -3.54266357421875, -3.4041748046875, -3.26568603515625, -3.127197265625, -2.98870849609375, -2.8502197265625, -2.71173095703125, -2.5732421875, -2.43475341796875, -2.2962646484375, -2.15777587890625, -2.019287109375, -1.88079833984375, -1.7423095703125, -1.60382080078125, -1.46533203125, -1.32684326171875, -1.1883544921875, -1.04986572265625, -0.911376953125, -0.77288818359375, -0.6343994140625, -0.49591064453125, -0.357421875, -0.21893310546875, -0.0804443359375, 0.05804443359375, 0.196533203125, 0.33502197265625, 0.4735107421875, 0.61199951171875, 0.75048828125, 0.88897705078125, 1.0274658203125, 1.16595458984375, 1.304443359375, 1.44293212890625, 1.5814208984375, 1.71990966796875, 1.8583984375, 1.99688720703125, 2.1353759765625, 2.27386474609375, 2.412353515625, 2.55084228515625, 2.6893310546875, 2.82781982421875, 2.96630859375, 3.10479736328125, 3.2432861328125, 3.38177490234375, 3.520263671875, 3.65875244140625, 3.7972412109375, 3.93572998046875, 4.07421875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 17.0, 19.0, 29.0, 34.0, 43.0, 63.0, 109.0, 187.0, 238.0, 344.0, 507.0, 824.0, 1332.0, 2191.0, 3676.0, 6625.0, 11721.0, 21771.0, 41167.0, 81328.0, 165938.0, 346884.0, 709091.0, 1100995.0, 851249.0, 431657.0, 206066.0, 99782.0, 50291.0, 26501.0, 14321.0, 7879.0, 4516.0, 2560.0, 1613.0, 991.0, 595.0, 357.0, 254.0, 163.0, 111.0, 75.0, 59.0, 33.0, 27.0, 9.0, 9.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-11.7890625, -11.427978515625, -11.06689453125, -10.705810546875, -10.3447265625, -9.983642578125, -9.62255859375, -9.261474609375, -8.900390625, -8.539306640625, -8.17822265625, -7.817138671875, -7.4560546875, -7.094970703125, -6.73388671875, -6.372802734375, -6.01171875, -5.650634765625, -5.28955078125, -4.928466796875, -4.5673828125, -4.206298828125, -3.84521484375, -3.484130859375, -3.123046875, -2.761962890625, -2.40087890625, -2.039794921875, -1.6787109375, -1.317626953125, -0.95654296875, -0.595458984375, -0.234375, 0.126708984375, 0.48779296875, 0.848876953125, 1.2099609375, 1.571044921875, 1.93212890625, 2.293212890625, 2.654296875, 3.015380859375, 3.37646484375, 3.737548828125, 4.0986328125, 4.459716796875, 4.82080078125, 5.181884765625, 5.54296875, 5.904052734375, 6.26513671875, 6.626220703125, 6.9873046875, 7.348388671875, 7.70947265625, 8.070556640625, 8.431640625, 8.792724609375, 9.15380859375, 9.514892578125, 9.8759765625, 10.237060546875, 10.59814453125, 10.959228515625, 11.3203125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 12.0, 5.0, 12.0, 14.0, 16.0, 33.0, 31.0, 48.0, 36.0, 61.0, 83.0, 90.0, 98.0, 121.0, 157.0, 179.0, 207.0, 223.0, 266.0, 239.0, 276.0, 259.0, 257.0, 214.0, 200.0, 188.0, 163.0, 106.0, 102.0, 81.0, 60.0, 62.0, 33.0, 25.0, 24.0, 20.0, 8.0, 17.0, 7.0, 11.0, 9.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.479583740234375, -2.38885498046875, -2.298126220703125, -2.2073974609375, -2.116668701171875, -2.02593994140625, -1.935211181640625, -1.844482421875, -1.753753662109375, -1.66302490234375, -1.572296142578125, -1.4815673828125, -1.390838623046875, -1.30010986328125, -1.209381103515625, -1.11865234375, -1.027923583984375, -0.93719482421875, -0.846466064453125, -0.7557373046875, -0.665008544921875, -0.57427978515625, -0.483551025390625, -0.392822265625, -0.302093505859375, -0.21136474609375, -0.120635986328125, -0.0299072265625, 0.060821533203125, 0.15155029296875, 0.242279052734375, 0.3330078125, 0.423736572265625, 0.51446533203125, 0.605194091796875, 0.6959228515625, 0.786651611328125, 0.87738037109375, 0.968109130859375, 1.058837890625, 1.149566650390625, 1.24029541015625, 1.331024169921875, 1.4217529296875, 1.512481689453125, 1.60321044921875, 1.693939208984375, 1.78466796875, 1.875396728515625, 1.96612548828125, 2.056854248046875, 2.1475830078125, 2.238311767578125, 2.32904052734375, 2.419769287109375, 2.510498046875, 2.601226806640625, 2.69195556640625, 2.782684326171875, 2.8734130859375, 2.964141845703125, 3.05487060546875, 3.145599365234375, 3.236328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 5.0, 8.0, 6.0, 6.0, 12.0, 11.0, 18.0, 20.0, 26.0, 36.0, 28.0, 31.0, 39.0, 52.0, 51.0, 60.0, 63.0, 70.0, 51.0, 64.0, 49.0, 59.0, 49.0, 19.0, 22.0, 28.0, 29.0, 16.0, 16.0, 15.0, 4.0, 4.0, 10.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.572054862976074, -11.243688583374023, -10.915321350097656, -10.586955070495605, -10.258587837219238, -9.930221557617188, -9.60185432434082, -9.27348804473877, -8.945120811462402, -8.616754531860352, -8.288387298583984, -7.960020542144775, -7.631653785705566, -7.303287029266357, -6.974920272827148, -6.646553993225098, -6.318187236785889, -5.98982048034668, -5.661453723907471, -5.333086967468262, -5.004720211029053, -4.676353454589844, -4.347987174987793, -4.019619941711426, -3.691253423690796, -3.362886667251587, -3.034519910812378, -2.706153392791748, -2.377786636352539, -2.04941987991333, -1.721053123474121, -1.392686367034912, -1.0643196105957031, -0.7359528541564941, -0.40758615732192993, -0.07921946048736572, 0.24914729595184326, 0.5775140523910522, 0.9058806896209717, 1.2342474460601807, 1.5626142024993896, 1.8909809589385986, 2.2193477153778076, 2.5477142333984375, 2.8760809898376465, 3.2044477462768555, 3.5328145027160645, 3.8611812591552734, 4.189548015594482, 4.517914772033691, 4.8462815284729, 5.174648284912109, 5.503015041351318, 5.831381797790527, 6.159748077392578, 6.488115310668945, 6.816481590270996, 7.144848346710205, 7.473215103149414, 7.801581859588623, 8.129948616027832, 8.458314895629883, 8.78668212890625, 9.1150484085083, 9.443415641784668]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 8.0, 8.0, 5.0, 4.0, 14.0, 13.0, 18.0, 20.0, 16.0, 16.0, 24.0, 18.0, 22.0, 34.0, 25.0, 23.0, 27.0, 34.0, 33.0, 43.0, 41.0, 33.0, 33.0, 36.0, 29.0, 30.0, 28.0, 34.0, 35.0, 28.0, 21.0, 30.0, 19.0, 18.0, 13.0, 23.0, 18.0, 16.0, 16.0, 11.0, 15.0, 9.0, 12.0, 10.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.13959264755249, -4.986419677734375, -4.83324670791626, -4.6800737380981445, -4.5269012451171875, -4.373728275299072, -4.220555305480957, -4.067382335662842, -3.9142093658447266, -3.7610363960266113, -3.607863664627075, -3.45469069480896, -3.3015177249908447, -3.1483449935913086, -2.9951720237731934, -2.841999053955078, -2.688826322555542, -2.5356533527374268, -2.3824806213378906, -2.2293076515197754, -2.07613468170166, -1.9229618310928345, -1.7697889804840088, -1.6166160106658936, -1.4634431600570679, -1.3102703094482422, -1.157097339630127, -1.0039244890213013, -0.8507515788078308, -0.6975786685943604, -0.5444058179855347, -0.39123284816741943, -0.23805999755859375, -0.08488710224628448, 0.06828579306602478, 0.22145867347717285, 0.3746315836906433, 0.5278044939041138, 0.6809773445129395, 0.8341503143310547, 0.9873231649398804, 1.140496015548706, 1.2936689853668213, 1.446841835975647, 1.6000146865844727, 1.753187656402588, 1.9063605070114136, 2.0595335960388184, 2.2127063274383545, 2.3658792972564697, 2.519052028656006, 2.672224998474121, 2.8253979682922363, 2.9785709381103516, 3.1317436695098877, 3.284916639328003, 3.438089370727539, 3.5912623405456543, 3.7444350719451904, 3.8976080417633057, 4.050780773162842, 4.203953742980957, 4.357126712799072, 4.5102996826171875, 4.663472652435303]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 14.0, 29.0, 40.0, 49.0, 92.0, 110.0, 173.0, 253.0, 470.0, 630.0, 1037.0, 1560.0, 2389.0, 4061.0, 6665.0, 11178.0, 18844.0, 32728.0, 56465.0, 96404.0, 156026.0, 202654.0, 177368.0, 115041.0, 68073.0, 39233.0, 22682.0, 13437.0, 7867.0, 4834.0, 2965.0, 1765.0, 1146.0, 781.0, 493.0, 300.0, 227.0, 149.0, 101.0, 64.0, 43.0, 26.0, 19.0, 18.0, 13.0, 6.0, 8.0, 4.0, 2.0, 1.0], "bins": [-0.91796875, -0.8922348022460938, -0.8665008544921875, -0.8407669067382812, -0.815032958984375, -0.7892990112304688, -0.7635650634765625, -0.7378311157226562, -0.71209716796875, -0.6863632202148438, -0.6606292724609375, -0.6348953247070312, -0.609161376953125, -0.5834274291992188, -0.5576934814453125, -0.5319595336914062, -0.5062255859375, -0.48049163818359375, -0.4547576904296875, -0.42902374267578125, -0.403289794921875, -0.37755584716796875, -0.3518218994140625, -0.32608795166015625, -0.30035400390625, -0.27462005615234375, -0.2488861083984375, -0.22315216064453125, -0.197418212890625, -0.17168426513671875, -0.1459503173828125, -0.12021636962890625, -0.094482421875, -0.06874847412109375, -0.0430145263671875, -0.01728057861328125, 0.008453369140625, 0.03418731689453125, 0.0599212646484375, 0.08565521240234375, 0.11138916015625, 0.13712310791015625, 0.1628570556640625, 0.18859100341796875, 0.214324951171875, 0.24005889892578125, 0.2657928466796875, 0.29152679443359375, 0.3172607421875, 0.34299468994140625, 0.3687286376953125, 0.39446258544921875, 0.420196533203125, 0.44593048095703125, 0.4716644287109375, 0.49739837646484375, 0.52313232421875, 0.5488662719726562, 0.5746002197265625, 0.6003341674804688, 0.626068115234375, 0.6518020629882812, 0.6775360107421875, 0.7032699584960938, 0.72900390625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 6.0, 8.0, 7.0, 8.0, 13.0, 12.0, 11.0, 22.0, 28.0, 23.0, 27.0, 19.0, 42.0, 30.0, 43.0, 32.0, 41.0, 43.0, 44.0, 37.0, 48.0, 37.0, 38.0, 42.0, 49.0, 33.0, 22.0, 30.0, 29.0, 23.0, 22.0, 20.0, 18.0, 17.0, 17.0, 10.0, 4.0, 10.0, 8.0, 4.0, 9.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.5234375, -7.3131103515625, -7.102783203125, -6.8924560546875, -6.68212890625, -6.4718017578125, -6.261474609375, -6.0511474609375, -5.8408203125, -5.6304931640625, -5.420166015625, -5.2098388671875, -4.99951171875, -4.7891845703125, -4.578857421875, -4.3685302734375, -4.158203125, -3.9478759765625, -3.737548828125, -3.5272216796875, -3.31689453125, -3.1065673828125, -2.896240234375, -2.6859130859375, -2.4755859375, -2.2652587890625, -2.054931640625, -1.8446044921875, -1.63427734375, -1.4239501953125, -1.213623046875, -1.0032958984375, -0.79296875, -0.5826416015625, -0.372314453125, -0.1619873046875, 0.04833984375, 0.2586669921875, 0.468994140625, 0.6793212890625, 0.8896484375, 1.0999755859375, 1.310302734375, 1.5206298828125, 1.73095703125, 1.9412841796875, 2.151611328125, 2.3619384765625, 2.572265625, 2.7825927734375, 2.992919921875, 3.2032470703125, 3.41357421875, 3.6239013671875, 3.834228515625, 4.0445556640625, 4.2548828125, 4.4652099609375, 4.675537109375, 4.8858642578125, 5.09619140625, 5.3065185546875, 5.516845703125, 5.7271728515625, 5.9375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 3.0, 8.0, 10.0, 19.0, 22.0, 27.0, 53.0, 53.0, 83.0, 106.0, 139.0, 264.0, 351.0, 526.0, 802.0, 1377.0, 2189.0, 4128.0, 7812.0, 16988.0, 50588.0, 816532.0, 102395.0, 22325.0, 9926.0, 4868.0, 2684.0, 1497.0, 941.0, 558.0, 425.0, 267.0, 162.0, 132.0, 81.0, 55.0, 41.0, 37.0, 23.0, 19.0, 9.0, 8.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4512939453125, -2.371337890625, -2.2913818359375, -2.21142578125, -2.1314697265625, -2.051513671875, -1.9715576171875, -1.8916015625, -1.8116455078125, -1.731689453125, -1.6517333984375, -1.57177734375, -1.4918212890625, -1.411865234375, -1.3319091796875, -1.251953125, -1.1719970703125, -1.092041015625, -1.0120849609375, -0.93212890625, -0.8521728515625, -0.772216796875, -0.6922607421875, -0.6123046875, -0.5323486328125, -0.452392578125, -0.3724365234375, -0.29248046875, -0.2125244140625, -0.132568359375, -0.0526123046875, 0.02734375, 0.1072998046875, 0.187255859375, 0.2672119140625, 0.34716796875, 0.4271240234375, 0.507080078125, 0.5870361328125, 0.6669921875, 0.7469482421875, 0.826904296875, 0.9068603515625, 0.98681640625, 1.0667724609375, 1.146728515625, 1.2266845703125, 1.306640625, 1.3865966796875, 1.466552734375, 1.5465087890625, 1.62646484375, 1.7064208984375, 1.786376953125, 1.8663330078125, 1.9462890625, 2.0262451171875, 2.106201171875, 2.1861572265625, 2.26611328125, 2.3460693359375, 2.426025390625, 2.5059814453125, 2.5859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 1.0, 7.0, 6.0, 5.0, 6.0, 7.0, 11.0, 13.0, 15.0, 9.0, 11.0, 20.0, 16.0, 23.0, 29.0, 24.0, 35.0, 36.0, 33.0, 40.0, 44.0, 33.0, 38.0, 36.0, 45.0, 30.0, 28.0, 40.0, 38.0, 28.0, 24.0, 38.0, 33.0, 31.0, 33.0, 22.0, 24.0, 15.0, 10.0, 7.0, 14.0, 7.0, 3.0, 7.0, 8.0, 5.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.03515625, -3.90655517578125, -3.7779541015625, -3.64935302734375, -3.520751953125, -3.39215087890625, -3.2635498046875, -3.13494873046875, -3.00634765625, -2.87774658203125, -2.7491455078125, -2.62054443359375, -2.491943359375, -2.36334228515625, -2.2347412109375, -2.10614013671875, -1.9775390625, -1.84893798828125, -1.7203369140625, -1.59173583984375, -1.463134765625, -1.33453369140625, -1.2059326171875, -1.07733154296875, -0.94873046875, -0.82012939453125, -0.6915283203125, -0.56292724609375, -0.434326171875, -0.30572509765625, -0.1771240234375, -0.04852294921875, 0.080078125, 0.20867919921875, 0.3372802734375, 0.46588134765625, 0.594482421875, 0.72308349609375, 0.8516845703125, 0.98028564453125, 1.10888671875, 1.23748779296875, 1.3660888671875, 1.49468994140625, 1.623291015625, 1.75189208984375, 1.8804931640625, 2.00909423828125, 2.1376953125, 2.26629638671875, 2.3948974609375, 2.52349853515625, 2.652099609375, 2.78070068359375, 2.9093017578125, 3.03790283203125, 3.16650390625, 3.29510498046875, 3.4237060546875, 3.55230712890625, 3.680908203125, 3.80950927734375, 3.9381103515625, 4.06671142578125, 4.1953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 11.0, 9.0, 13.0, 18.0, 35.0, 55.0, 65.0, 118.0, 153.0, 248.0, 414.0, 706.0, 1324.0, 2252.0, 4563.0, 9439.0, 21576.0, 117965.0, 836681.0, 29034.0, 11716.0, 5515.0, 2841.0, 1541.0, 847.0, 481.0, 293.0, 196.0, 114.0, 98.0, 65.0, 47.0, 36.0, 23.0, 10.0, 12.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66845703125, -0.6476669311523438, -0.6268768310546875, -0.6060867309570312, -0.585296630859375, -0.5645065307617188, -0.5437164306640625, -0.5229263305664062, -0.50213623046875, -0.48134613037109375, -0.4605560302734375, -0.43976593017578125, -0.418975830078125, -0.39818572998046875, -0.3773956298828125, -0.35660552978515625, -0.3358154296875, -0.31502532958984375, -0.2942352294921875, -0.27344512939453125, -0.252655029296875, -0.23186492919921875, -0.2110748291015625, -0.19028472900390625, -0.16949462890625, -0.14870452880859375, -0.1279144287109375, -0.10712432861328125, -0.086334228515625, -0.06554412841796875, -0.0447540283203125, -0.02396392822265625, -0.003173828125, 0.01761627197265625, 0.0384063720703125, 0.05919647216796875, 0.079986572265625, 0.10077667236328125, 0.1215667724609375, 0.14235687255859375, 0.16314697265625, 0.18393707275390625, 0.2047271728515625, 0.22551727294921875, 0.246307373046875, 0.26709747314453125, 0.2878875732421875, 0.30867767333984375, 0.3294677734375, 0.35025787353515625, 0.3710479736328125, 0.39183807373046875, 0.412628173828125, 0.43341827392578125, 0.4542083740234375, 0.47499847412109375, 0.49578857421875, 0.5165786743164062, 0.5373687744140625, 0.5581588745117188, 0.578948974609375, 0.5997390747070312, 0.6205291748046875, 0.6413192749023438, 0.662109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 15.0, 17.0, 13.0, 21.0, 24.0, 25.0, 25.0, 46.0, 46.0, 48.0, 49.0, 45.0, 57.0, 57.0, 42.0, 41.0, 59.0, 43.0, 43.0, 46.0, 42.0, 27.0, 23.0, 12.0, 17.0, 18.0, 19.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5153160095214844e-05, -2.4388544261455536e-05, -2.3623928427696228e-05, -2.285931259393692e-05, -2.2094696760177612e-05, -2.1330080926418304e-05, -2.0565465092658997e-05, -1.980084925889969e-05, -1.903623342514038e-05, -1.8271617591381073e-05, -1.7507001757621765e-05, -1.6742385923862457e-05, -1.597777009010315e-05, -1.5213154256343842e-05, -1.4448538422584534e-05, -1.3683922588825226e-05, -1.2919306755065918e-05, -1.215469092130661e-05, -1.1390075087547302e-05, -1.0625459253787994e-05, -9.860843420028687e-06, -9.096227586269379e-06, -8.33161175251007e-06, -7.566995918750763e-06, -6.802380084991455e-06, -6.037764251232147e-06, -5.273148417472839e-06, -4.5085325837135315e-06, -3.7439167499542236e-06, -2.9793009161949158e-06, -2.214685082435608e-06, -1.4500692486763e-06, -6.854534149169922e-07, 7.916241884231567e-08, 8.437782526016235e-07, 1.6083940863609314e-06, 2.3730099201202393e-06, 3.137625753879547e-06, 3.902241587638855e-06, 4.666857421398163e-06, 5.431473255157471e-06, 6.1960890889167786e-06, 6.9607049226760864e-06, 7.725320756435394e-06, 8.489936590194702e-06, 9.25455242395401e-06, 1.0019168257713318e-05, 1.0783784091472626e-05, 1.1548399925231934e-05, 1.2313015758991241e-05, 1.307763159275055e-05, 1.3842247426509857e-05, 1.4606863260269165e-05, 1.5371479094028473e-05, 1.613609492778778e-05, 1.690071076154709e-05, 1.7665326595306396e-05, 1.8429942429065704e-05, 1.9194558262825012e-05, 1.995917409658432e-05, 2.0723789930343628e-05, 2.1488405764102936e-05, 2.2253021597862244e-05, 2.301763743162155e-05, 2.378225326538086e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 9.0, 4.0, 8.0, 17.0, 26.0, 49.0, 51.0, 99.0, 124.0, 219.0, 365.0, 535.0, 767.0, 1373.0, 2315.0, 3917.0, 7228.0, 13765.0, 28143.0, 62424.0, 146939.0, 294495.0, 262961.0, 120809.0, 51378.0, 23819.0, 11801.0, 6078.0, 3493.0, 1993.0, 1196.0, 775.0, 474.0, 322.0, 195.0, 131.0, 92.0, 59.0, 36.0, 25.0, 11.0, 4.0, 9.0, 7.0, 9.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3133697509765625, -0.302520751953125, -0.2916717529296875, -0.28082275390625, -0.2699737548828125, -0.259124755859375, -0.2482757568359375, -0.2374267578125, -0.2265777587890625, -0.215728759765625, -0.2048797607421875, -0.19403076171875, -0.1831817626953125, -0.172332763671875, -0.1614837646484375, -0.150634765625, -0.1397857666015625, -0.128936767578125, -0.1180877685546875, -0.10723876953125, -0.0963897705078125, -0.085540771484375, -0.0746917724609375, -0.0638427734375, -0.0529937744140625, -0.042144775390625, -0.0312957763671875, -0.02044677734375, -0.0095977783203125, 0.001251220703125, 0.0121002197265625, 0.02294921875, 0.0337982177734375, 0.044647216796875, 0.0554962158203125, 0.06634521484375, 0.0771942138671875, 0.088043212890625, 0.0988922119140625, 0.1097412109375, 0.1205902099609375, 0.131439208984375, 0.1422882080078125, 0.15313720703125, 0.1639862060546875, 0.174835205078125, 0.1856842041015625, 0.196533203125, 0.2073822021484375, 0.218231201171875, 0.2290802001953125, 0.23992919921875, 0.2507781982421875, 0.261627197265625, 0.2724761962890625, 0.2833251953125, 0.2941741943359375, 0.305023193359375, 0.3158721923828125, 0.32672119140625, 0.3375701904296875, 0.348419189453125, 0.3592681884765625, 0.3701171875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 6.0, 3.0, 10.0, 6.0, 9.0, 8.0, 22.0, 12.0, 20.0, 17.0, 31.0, 29.0, 39.0, 61.0, 57.0, 71.0, 71.0, 61.0, 68.0, 62.0, 55.0, 48.0, 47.0, 37.0, 29.0, 24.0, 23.0, 15.0, 7.0, 10.0, 10.0, 6.0, 5.0, 7.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0751953125, -0.07299518585205078, -0.07079505920410156, -0.06859493255615234, -0.06639480590820312, -0.0641946792602539, -0.06199455261230469, -0.05979442596435547, -0.05759429931640625, -0.05539417266845703, -0.05319404602050781, -0.050993919372558594, -0.048793792724609375, -0.046593666076660156, -0.04439353942871094, -0.04219341278076172, -0.0399932861328125, -0.03779315948486328, -0.03559303283691406, -0.033392906188964844, -0.031192779541015625, -0.028992652893066406, -0.026792526245117188, -0.02459239959716797, -0.02239227294921875, -0.02019214630126953, -0.017992019653320312, -0.015791893005371094, -0.013591766357421875, -0.011391639709472656, -0.009191513061523438, -0.006991386413574219, -0.004791259765625, -0.0025911331176757812, -0.0003910064697265625, 0.0018091201782226562, 0.004009246826171875, 0.006209373474121094, 0.008409500122070312, 0.010609626770019531, 0.01280975341796875, 0.015009880065917969, 0.017210006713867188, 0.019410133361816406, 0.021610260009765625, 0.023810386657714844, 0.026010513305664062, 0.02821063995361328, 0.0304107666015625, 0.03261089324951172, 0.03481101989746094, 0.037011146545410156, 0.039211273193359375, 0.041411399841308594, 0.04361152648925781, 0.04581165313720703, 0.04801177978515625, 0.05021190643310547, 0.05241203308105469, 0.054612159729003906, 0.056812286376953125, 0.059012413024902344, 0.06121253967285156, 0.06341266632080078, 0.06561279296875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 10.0, 19.0, 27.0, 28.0, 33.0, 27.0, 36.0, 56.0, 46.0, 62.0, 50.0, 73.0, 59.0, 55.0, 57.0, 55.0, 57.0, 31.0, 24.0, 21.0, 27.0, 20.0, 16.0, 16.0, 10.0, 4.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.313261985778809, -10.98647403717041, -10.659685134887695, -10.332897186279297, -10.006109237670898, -9.6793212890625, -9.352532386779785, -9.025744438171387, -8.698955535888672, -8.372167587280273, -8.045378684997559, -7.71859073638916, -7.391802787780762, -7.065014362335205, -6.738225936889648, -6.41143798828125, -6.084650039672852, -5.757861614227295, -5.4310736656188965, -5.10428524017334, -4.777497291564941, -4.450708866119385, -4.123920440673828, -3.7971322536468506, -3.470344066619873, -3.1435558795928955, -2.816767692565918, -2.4899792671203613, -2.163191080093384, -1.8364028930664062, -1.5096145868301392, -1.182826280593872, -0.8560390472412109, -0.5292508006095886, -0.2024625539779663, 0.124325692653656, 0.4511139392852783, 0.7779021263122559, 1.104690432548523, 1.43147873878479, 1.7582669258117676, 2.085055112838745, 2.4118432998657227, 2.7386317253112793, 3.065419912338257, 3.3922080993652344, 3.718996524810791, 4.045784950256348, 4.372572898864746, 4.699361324310303, 5.026149272918701, 5.352937698364258, 5.679725646972656, 6.006514072418213, 6.3333024978637695, 6.660090446472168, 6.986878871917725, 7.313667297363281, 7.64045524597168, 7.967243671417236, 8.294032096862793, 8.620820045471191, 8.94760799407959, 9.274396896362305, 9.601184844970703]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 7.0, 9.0, 5.0, 2.0, 15.0, 12.0, 19.0, 21.0, 17.0, 13.0, 21.0, 20.0, 25.0, 28.0, 26.0, 22.0, 30.0, 30.0, 37.0, 42.0, 38.0, 36.0, 33.0, 36.0, 29.0, 34.0, 22.0, 34.0, 36.0, 28.0, 21.0, 27.0, 25.0, 16.0, 14.0, 22.0, 15.0, 19.0, 20.0, 8.0, 15.0, 11.0, 10.0, 12.0, 6.0, 9.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.119045257568359, -4.966975212097168, -4.814905166625977, -4.662835121154785, -4.510765075683594, -4.358695030212402, -4.206624984741211, -4.0545549392700195, -3.9024851322174072, -3.750415086746216, -3.5983450412750244, -3.446274995803833, -3.2942051887512207, -3.1421351432800293, -2.990065097808838, -2.8379950523376465, -2.685925006866455, -2.5338549613952637, -2.3817849159240723, -2.229714870452881, -2.0776448249816895, -1.9255748987197876, -1.7735049724578857, -1.6214349269866943, -1.469364881515503, -1.3172948360443115, -1.1652247905731201, -1.0131548643112183, -0.8610848188400269, -0.7090147733688354, -0.5569447875022888, -0.4048748016357422, -0.2528042793273926, -0.10073426365852356, 0.05133575201034546, 0.20340576767921448, 0.3554757833480835, 0.5075458288192749, 0.6596158146858215, 0.8116858005523682, 0.9637558460235596, 1.115825891494751, 1.2678959369659424, 1.4199658632278442, 1.5720359086990356, 1.724105954170227, 1.876175880432129, 2.0282459259033203, 2.1803159713745117, 2.332386016845703, 2.4844560623168945, 2.636526107788086, 2.7885961532592773, 2.9406661987304688, 3.092736005783081, 3.2448060512542725, 3.396876096725464, 3.5489461421966553, 3.7010161876678467, 3.853086233139038, 4.00515604019165, 4.157226085662842, 4.309296131134033, 4.461366176605225, 4.613436222076416]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 11.0, 11.0, 18.0, 28.0, 32.0, 46.0, 80.0, 136.0, 219.0, 374.0, 593.0, 1094.0, 1967.0, 3370.0, 6079.0, 11233.0, 19925.0, 35497.0, 62672.0, 104269.0, 155483.0, 187211.0, 168896.0, 119638.0, 73788.0, 42559.0, 23549.0, 13176.0, 7212.0, 4024.0, 2235.0, 1310.0, 729.0, 415.0, 250.0, 171.0, 84.0, 50.0, 36.0, 22.0, 21.0, 14.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.92620849609375, -6.6844482421875, -6.44268798828125, -6.200927734375, -5.95916748046875, -5.7174072265625, -5.47564697265625, -5.23388671875, -4.99212646484375, -4.7503662109375, -4.50860595703125, -4.266845703125, -4.02508544921875, -3.7833251953125, -3.54156494140625, -3.2998046875, -3.05804443359375, -2.8162841796875, -2.57452392578125, -2.332763671875, -2.09100341796875, -1.8492431640625, -1.60748291015625, -1.36572265625, -1.12396240234375, -0.8822021484375, -0.64044189453125, -0.398681640625, -0.15692138671875, 0.0848388671875, 0.32659912109375, 0.568359375, 0.81011962890625, 1.0518798828125, 1.29364013671875, 1.535400390625, 1.77716064453125, 2.0189208984375, 2.26068115234375, 2.50244140625, 2.74420166015625, 2.9859619140625, 3.22772216796875, 3.469482421875, 3.71124267578125, 3.9530029296875, 4.19476318359375, 4.4365234375, 4.67828369140625, 4.9200439453125, 5.16180419921875, 5.403564453125, 5.64532470703125, 5.8870849609375, 6.12884521484375, 6.37060546875, 6.61236572265625, 6.8541259765625, 7.09588623046875, 7.337646484375, 7.57940673828125, 7.8211669921875, 8.06292724609375, 8.3046875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 12.0, 7.0, 8.0, 7.0, 7.0, 16.0, 14.0, 27.0, 26.0, 19.0, 26.0, 28.0, 30.0, 37.0, 39.0, 37.0, 33.0, 34.0, 43.0, 44.0, 34.0, 33.0, 48.0, 34.0, 25.0, 30.0, 32.0, 27.0, 29.0, 27.0, 25.0, 18.0, 21.0, 8.0, 20.0, 15.0, 17.0, 14.0, 7.0, 15.0, 5.0, 6.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.8671875, -6.67791748046875, -6.4886474609375, -6.29937744140625, -6.110107421875, -5.92083740234375, -5.7315673828125, -5.54229736328125, -5.35302734375, -5.16375732421875, -4.9744873046875, -4.78521728515625, -4.595947265625, -4.40667724609375, -4.2174072265625, -4.02813720703125, -3.8388671875, -3.64959716796875, -3.4603271484375, -3.27105712890625, -3.081787109375, -2.89251708984375, -2.7032470703125, -2.51397705078125, -2.32470703125, -2.13543701171875, -1.9461669921875, -1.75689697265625, -1.567626953125, -1.37835693359375, -1.1890869140625, -0.99981689453125, -0.810546875, -0.62127685546875, -0.4320068359375, -0.24273681640625, -0.053466796875, 0.13580322265625, 0.3250732421875, 0.51434326171875, 0.70361328125, 0.89288330078125, 1.0821533203125, 1.27142333984375, 1.460693359375, 1.64996337890625, 1.8392333984375, 2.02850341796875, 2.2177734375, 2.40704345703125, 2.5963134765625, 2.78558349609375, 2.974853515625, 3.16412353515625, 3.3533935546875, 3.54266357421875, 3.73193359375, 3.92120361328125, 4.1104736328125, 4.29974365234375, 4.489013671875, 4.67828369140625, 4.8675537109375, 5.05682373046875, 5.24609375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 18.0, 34.0, 48.0, 63.0, 109.0, 165.0, 276.0, 400.0, 716.0, 1155.0, 1851.0, 3214.0, 5309.0, 9093.0, 15274.0, 26332.0, 44347.0, 72750.0, 109939.0, 149336.0, 166615.0, 149622.0, 110471.0, 72296.0, 44598.0, 26383.0, 15645.0, 9049.0, 5433.0, 3067.0, 1904.0, 1165.0, 687.0, 440.0, 281.0, 187.0, 103.0, 46.0, 36.0, 29.0, 21.0, 17.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.21246337890625, -6.9835205078125, -6.75457763671875, -6.525634765625, -6.29669189453125, -6.0677490234375, -5.83880615234375, -5.60986328125, -5.38092041015625, -5.1519775390625, -4.92303466796875, -4.694091796875, -4.46514892578125, -4.2362060546875, -4.00726318359375, -3.7783203125, -3.54937744140625, -3.3204345703125, -3.09149169921875, -2.862548828125, -2.63360595703125, -2.4046630859375, -2.17572021484375, -1.94677734375, -1.71783447265625, -1.4888916015625, -1.25994873046875, -1.031005859375, -0.80206298828125, -0.5731201171875, -0.34417724609375, -0.115234375, 0.11370849609375, 0.3426513671875, 0.57159423828125, 0.800537109375, 1.02947998046875, 1.2584228515625, 1.48736572265625, 1.71630859375, 1.94525146484375, 2.1741943359375, 2.40313720703125, 2.632080078125, 2.86102294921875, 3.0899658203125, 3.31890869140625, 3.5478515625, 3.77679443359375, 4.0057373046875, 4.23468017578125, 4.463623046875, 4.69256591796875, 4.9215087890625, 5.15045166015625, 5.37939453125, 5.60833740234375, 5.8372802734375, 6.06622314453125, 6.295166015625, 6.52410888671875, 6.7530517578125, 6.98199462890625, 7.2109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 12.0, 21.0, 19.0, 20.0, 26.0, 34.0, 25.0, 23.0, 35.0, 52.0, 39.0, 42.0, 53.0, 47.0, 48.0, 53.0, 30.0, 41.0, 39.0, 40.0, 37.0, 38.0, 29.0, 36.0, 19.0, 20.0, 15.0, 14.0, 12.0, 14.0, 6.0, 7.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -3.99932861328125, -3.8541259765625, -3.70892333984375, -3.563720703125, -3.41851806640625, -3.2733154296875, -3.12811279296875, -2.98291015625, -2.83770751953125, -2.6925048828125, -2.54730224609375, -2.402099609375, -2.25689697265625, -2.1116943359375, -1.96649169921875, -1.8212890625, -1.67608642578125, -1.5308837890625, -1.38568115234375, -1.240478515625, -1.09527587890625, -0.9500732421875, -0.80487060546875, -0.65966796875, -0.51446533203125, -0.3692626953125, -0.22406005859375, -0.078857421875, 0.06634521484375, 0.2115478515625, 0.35675048828125, 0.501953125, 0.64715576171875, 0.7923583984375, 0.93756103515625, 1.082763671875, 1.22796630859375, 1.3731689453125, 1.51837158203125, 1.66357421875, 1.80877685546875, 1.9539794921875, 2.09918212890625, 2.244384765625, 2.38958740234375, 2.5347900390625, 2.67999267578125, 2.8251953125, 2.97039794921875, 3.1156005859375, 3.26080322265625, 3.406005859375, 3.55120849609375, 3.6964111328125, 3.84161376953125, 3.98681640625, 4.13201904296875, 4.2772216796875, 4.42242431640625, 4.567626953125, 4.71282958984375, 4.8580322265625, 5.00323486328125, 5.1484375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 12.0, 21.0, 31.0, 42.0, 45.0, 92.0, 124.0, 200.0, 327.0, 432.0, 655.0, 1007.0, 1561.0, 2324.0, 3715.0, 5504.0, 8906.0, 14205.0, 23116.0, 38822.0, 64578.0, 104458.0, 152241.0, 178155.0, 158649.0, 111552.0, 69447.0, 41606.0, 24913.0, 15100.0, 9473.0, 5980.0, 3899.0, 2519.0, 1598.0, 1109.0, 754.0, 478.0, 330.0, 211.0, 121.0, 81.0, 49.0, 42.0, 30.0, 18.0, 12.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.711883544921875, -3.58197021484375, -3.452056884765625, -3.3221435546875, -3.192230224609375, -3.06231689453125, -2.932403564453125, -2.802490234375, -2.672576904296875, -2.54266357421875, -2.412750244140625, -2.2828369140625, -2.152923583984375, -2.02301025390625, -1.893096923828125, -1.76318359375, -1.633270263671875, -1.50335693359375, -1.373443603515625, -1.2435302734375, -1.113616943359375, -0.98370361328125, -0.853790283203125, -0.723876953125, -0.593963623046875, -0.46405029296875, -0.334136962890625, -0.2042236328125, -0.074310302734375, 0.05560302734375, 0.185516357421875, 0.3154296875, 0.445343017578125, 0.57525634765625, 0.705169677734375, 0.8350830078125, 0.964996337890625, 1.09490966796875, 1.224822998046875, 1.354736328125, 1.484649658203125, 1.61456298828125, 1.744476318359375, 1.8743896484375, 2.004302978515625, 2.13421630859375, 2.264129638671875, 2.39404296875, 2.523956298828125, 2.65386962890625, 2.783782958984375, 2.9136962890625, 3.043609619140625, 3.17352294921875, 3.303436279296875, 3.433349609375, 3.563262939453125, 3.69317626953125, 3.823089599609375, 3.9530029296875, 4.082916259765625, 4.21282958984375, 4.342742919921875, 4.47265625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 4.0, 5.0, 11.0, 9.0, 11.0, 10.0, 19.0, 15.0, 24.0, 21.0, 40.0, 39.0, 57.0, 69.0, 67.0, 60.0, 85.0, 56.0, 58.0, 63.0, 53.0, 52.0, 28.0, 26.0, 29.0, 10.0, 10.0, 11.0, 12.0, 2.0, 5.0, 2.0, 5.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044417381286621094, -0.0004290081560611725, -0.00041384249925613403, -0.0003986768424510956, -0.00038351118564605713, -0.0003683455288410187, -0.0003531798720359802, -0.00033801421523094177, -0.0003228485584259033, -0.00030768290162086487, -0.0002925172448158264, -0.00027735158801078796, -0.0002621859312057495, -0.00024702027440071106, -0.0002318546175956726, -0.00021668896079063416, -0.0002015233039855957, -0.00018635764718055725, -0.0001711919903755188, -0.00015602633357048035, -0.0001408606767654419, -0.00012569501996040344, -0.00011052936315536499, -9.536370635032654e-05, -8.019804954528809e-05, -6.503239274024963e-05, -4.986673593521118e-05, -3.470107913017273e-05, -1.9535422325134277e-05, -4.369765520095825e-06, 1.0795891284942627e-05, 2.596154808998108e-05, 4.112720489501953e-05, 5.6292861700057983e-05, 7.145851850509644e-05, 8.662417531013489e-05, 0.00010178983211517334, 0.00011695548892021179, 0.00013212114572525024, 0.0001472868025302887, 0.00016245245933532715, 0.0001776181161403656, 0.00019278377294540405, 0.0002079494297504425, 0.00022311508655548096, 0.0002382807433605194, 0.00025344640016555786, 0.0002686120569705963, 0.00028377771377563477, 0.0002989433705806732, 0.00031410902738571167, 0.0003292746841907501, 0.0003444403409957886, 0.000359605997800827, 0.0003747716546058655, 0.00038993731141090393, 0.0004051029682159424, 0.00042026862502098083, 0.0004354342818260193, 0.00045059993863105774, 0.0004657655954360962, 0.00048093125224113464, 0.0004960969090461731, 0.0005112625658512115, 0.00052642822265625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 14.0, 13.0, 27.0, 30.0, 34.0, 62.0, 107.0, 152.0, 239.0, 347.0, 480.0, 733.0, 1084.0, 1682.0, 2468.0, 3764.0, 5687.0, 9102.0, 14129.0, 22737.0, 37551.0, 62621.0, 99865.0, 143623.0, 171579.0, 158655.0, 117086.0, 74692.0, 44953.0, 27425.0, 16827.0, 10654.0, 6884.0, 4489.0, 2919.0, 1957.0, 1255.0, 889.0, 546.0, 393.0, 270.0, 173.0, 119.0, 77.0, 44.0, 35.0, 23.0, 16.0, 15.0, 4.0, 4.0, 4.0, 5.0, 1.0, 4.0, 3.0], "bins": [-4.2734375, -4.1427001953125, -4.011962890625, -3.8812255859375, -3.75048828125, -3.6197509765625, -3.489013671875, -3.3582763671875, -3.2275390625, -3.0968017578125, -2.966064453125, -2.8353271484375, -2.70458984375, -2.5738525390625, -2.443115234375, -2.3123779296875, -2.181640625, -2.0509033203125, -1.920166015625, -1.7894287109375, -1.65869140625, -1.5279541015625, -1.397216796875, -1.2664794921875, -1.1357421875, -1.0050048828125, -0.874267578125, -0.7435302734375, -0.61279296875, -0.4820556640625, -0.351318359375, -0.2205810546875, -0.08984375, 0.0408935546875, 0.171630859375, 0.3023681640625, 0.43310546875, 0.5638427734375, 0.694580078125, 0.8253173828125, 0.9560546875, 1.0867919921875, 1.217529296875, 1.3482666015625, 1.47900390625, 1.6097412109375, 1.740478515625, 1.8712158203125, 2.001953125, 2.1326904296875, 2.263427734375, 2.3941650390625, 2.52490234375, 2.6556396484375, 2.786376953125, 2.9171142578125, 3.0478515625, 3.1785888671875, 3.309326171875, 3.4400634765625, 3.57080078125, 3.7015380859375, 3.832275390625, 3.9630126953125, 4.09375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 9.0, 8.0, 8.0, 18.0, 18.0, 13.0, 18.0, 17.0, 23.0, 15.0, 28.0, 26.0, 33.0, 37.0, 53.0, 51.0, 52.0, 52.0, 52.0, 41.0, 48.0, 39.0, 49.0, 41.0, 26.0, 33.0, 24.0, 22.0, 25.0, 16.0, 14.0, 13.0, 17.0, 9.0, 8.0, 10.0, 7.0, 1.0, 8.0, 3.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.138671875, -1.1033935546875, -1.068115234375, -1.0328369140625, -0.99755859375, -0.9622802734375, -0.927001953125, -0.8917236328125, -0.8564453125, -0.8211669921875, -0.785888671875, -0.7506103515625, -0.71533203125, -0.6800537109375, -0.644775390625, -0.6094970703125, -0.57421875, -0.5389404296875, -0.503662109375, -0.4683837890625, -0.43310546875, -0.3978271484375, -0.362548828125, -0.3272705078125, -0.2919921875, -0.2567138671875, -0.221435546875, -0.1861572265625, -0.15087890625, -0.1156005859375, -0.080322265625, -0.0450439453125, -0.009765625, 0.0255126953125, 0.060791015625, 0.0960693359375, 0.13134765625, 0.1666259765625, 0.201904296875, 0.2371826171875, 0.2724609375, 0.3077392578125, 0.343017578125, 0.3782958984375, 0.41357421875, 0.4488525390625, 0.484130859375, 0.5194091796875, 0.5546875, 0.5899658203125, 0.625244140625, 0.6605224609375, 0.69580078125, 0.7310791015625, 0.766357421875, 0.8016357421875, 0.8369140625, 0.8721923828125, 0.907470703125, 0.9427490234375, 0.97802734375, 1.0133056640625, 1.048583984375, 1.0838623046875, 1.119140625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 8.0, 20.0, 11.0, 26.0, 26.0, 27.0, 23.0, 34.0, 35.0, 53.0, 47.0, 57.0, 59.0, 64.0, 47.0, 61.0, 63.0, 55.0, 45.0, 28.0, 34.0, 29.0, 24.0, 17.0, 12.0, 10.0, 12.0, 14.0, 4.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.41679859161377, -11.084955215454102, -10.753110885620117, -10.42126750946045, -10.089423179626465, -9.757579803466797, -9.425735473632812, -9.093892097473145, -8.762048721313477, -8.430205345153809, -8.098361015319824, -7.766517639160156, -7.43467378616333, -7.102829933166504, -6.770986080169678, -6.439142227172852, -6.107298374176025, -5.775454521179199, -5.443610668182373, -5.111766815185547, -4.779923439025879, -4.448079586029053, -4.116235733032227, -3.7843921184539795, -3.4525482654571533, -3.120704412460327, -2.78886079788208, -2.457016944885254, -2.1251730918884277, -1.7933294773101807, -1.4614856243133545, -1.1296420097351074, -0.7977981567382812, -0.46595439314842224, -0.13411062955856323, 0.19773316383361816, 0.5295768976211548, 0.8614206314086914, 1.1932644844055176, 1.5251080989837646, 1.8569519519805908, 2.188795804977417, 2.520639419555664, 2.8524832725524902, 3.1843271255493164, 3.5161707401275635, 3.8480145931243896, 4.179858207702637, 4.511702060699463, 4.843545913696289, 5.175389766693115, 5.507233619689941, 5.839076995849609, 6.1709208488464355, 6.502764701843262, 6.83460807800293, 7.166452407836914, 7.49829626083374, 7.830140113830566, 8.161983489990234, 8.493827819824219, 8.825671195983887, 9.157514572143555, 9.489358901977539, 9.821202278137207]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 5.0, 1.0, 10.0, 6.0, 6.0, 5.0, 20.0, 18.0, 18.0, 22.0, 24.0, 27.0, 33.0, 31.0, 37.0, 35.0, 36.0, 30.0, 31.0, 37.0, 30.0, 36.0, 51.0, 35.0, 43.0, 33.0, 47.0, 29.0, 33.0, 22.0, 24.0, 23.0, 19.0, 34.0, 20.0, 15.0, 18.0, 8.0, 7.0, 9.0, 2.0, 10.0, 4.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.380634307861328, -6.1947736740112305, -6.008913040161133, -5.823052406311035, -5.6371917724609375, -5.45133113861084, -5.265470504760742, -5.0796098709106445, -4.893749237060547, -4.707888603210449, -4.522027969360352, -4.336167335510254, -4.150306701660156, -3.9644460678100586, -3.77858567237854, -3.5927250385284424, -3.406864643096924, -3.221004009246826, -3.0351433753967285, -2.849282741546631, -2.663422107696533, -2.4775614738464355, -2.291701078414917, -2.1058404445648193, -1.9199798107147217, -1.734119176864624, -1.5482585430145264, -1.3623980283737183, -1.1765373945236206, -0.990676760673523, -0.8048162460327148, -0.6189556121826172, -0.43309497833251953, -0.24723437428474426, -0.061373770236968994, 0.12448680400848389, 0.31034743785858154, 0.4962080717086792, 0.6820685863494873, 0.867929220199585, 1.0537898540496826, 1.2396504878997803, 1.425511121749878, 1.611371636390686, 1.7972322702407837, 1.9830929040908813, 2.1689534187316895, 2.354814052581787, 2.5406746864318848, 2.7265353202819824, 2.91239595413208, 3.0982565879821777, 3.2841172218322754, 3.469977855682373, 3.6558382511138916, 3.8416988849639893, 4.027559280395508, 4.2134199142456055, 4.399280548095703, 4.585141181945801, 4.771001815795898, 4.956862449645996, 5.142723083496094, 5.328583717346191, 5.514444351196289]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 4.0, 11.0, 15.0, 21.0, 31.0, 54.0, 64.0, 87.0, 125.0, 213.0, 296.0, 488.0, 697.0, 1075.0, 1804.0, 2888.0, 4842.0, 8173.0, 14624.0, 26999.0, 52506.0, 110249.0, 248436.0, 582123.0, 1091528.0, 1051196.0, 547900.0, 236433.0, 105534.0, 50073.0, 25167.0, 13317.0, 7149.0, 4223.0, 2433.0, 1412.0, 794.0, 478.0, 324.0, 203.0, 120.0, 81.0, 32.0, 25.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.671875, -13.2916259765625, -12.911376953125, -12.5311279296875, -12.15087890625, -11.7706298828125, -11.390380859375, -11.0101318359375, -10.6298828125, -10.2496337890625, -9.869384765625, -9.4891357421875, -9.10888671875, -8.7286376953125, -8.348388671875, -7.9681396484375, -7.587890625, -7.2076416015625, -6.827392578125, -6.4471435546875, -6.06689453125, -5.6866455078125, -5.306396484375, -4.9261474609375, -4.5458984375, -4.1656494140625, -3.785400390625, -3.4051513671875, -3.02490234375, -2.6446533203125, -2.264404296875, -1.8841552734375, -1.50390625, -1.1236572265625, -0.743408203125, -0.3631591796875, 0.01708984375, 0.3973388671875, 0.777587890625, 1.1578369140625, 1.5380859375, 1.9183349609375, 2.298583984375, 2.6788330078125, 3.05908203125, 3.4393310546875, 3.819580078125, 4.1998291015625, 4.580078125, 4.9603271484375, 5.340576171875, 5.7208251953125, 6.10107421875, 6.4813232421875, 6.861572265625, 7.2418212890625, 7.6220703125, 8.0023193359375, 8.382568359375, 8.7628173828125, 9.14306640625, 9.5233154296875, 9.903564453125, 10.2838134765625, 10.6640625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 12.0, 14.0, 13.0, 13.0, 11.0, 14.0, 21.0, 26.0, 29.0, 25.0, 32.0, 42.0, 33.0, 35.0, 30.0, 35.0, 39.0, 46.0, 42.0, 37.0, 35.0, 38.0, 30.0, 27.0, 27.0, 31.0, 25.0, 19.0, 25.0, 23.0, 22.0, 18.0, 12.0, 11.0, 14.0, 13.0, 8.0, 5.0, 8.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2828369140625, -5.120361328125, -4.9578857421875, -4.79541015625, -4.6329345703125, -4.470458984375, -4.3079833984375, -4.1455078125, -3.9830322265625, -3.820556640625, -3.6580810546875, -3.49560546875, -3.3331298828125, -3.170654296875, -3.0081787109375, -2.845703125, -2.6832275390625, -2.520751953125, -2.3582763671875, -2.19580078125, -2.0333251953125, -1.870849609375, -1.7083740234375, -1.5458984375, -1.3834228515625, -1.220947265625, -1.0584716796875, -0.89599609375, -0.7335205078125, -0.571044921875, -0.4085693359375, -0.24609375, -0.0836181640625, 0.078857421875, 0.2413330078125, 0.40380859375, 0.5662841796875, 0.728759765625, 0.8912353515625, 1.0537109375, 1.2161865234375, 1.378662109375, 1.5411376953125, 1.70361328125, 1.8660888671875, 2.028564453125, 2.1910400390625, 2.353515625, 2.5159912109375, 2.678466796875, 2.8409423828125, 3.00341796875, 3.1658935546875, 3.328369140625, 3.4908447265625, 3.6533203125, 3.8157958984375, 3.978271484375, 4.1407470703125, 4.30322265625, 4.4656982421875, 4.628173828125, 4.7906494140625, 4.953125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 8.0, 6.0, 12.0, 20.0, 32.0, 56.0, 73.0, 124.0, 192.0, 303.0, 480.0, 780.0, 1281.0, 2081.0, 3533.0, 6419.0, 11118.0, 21092.0, 39984.0, 79870.0, 166077.0, 358955.0, 748727.0, 1125971.0, 837055.0, 410500.0, 190017.0, 91025.0, 45022.0, 23714.0, 12904.0, 6999.0, 3882.0, 2381.0, 1409.0, 837.0, 458.0, 351.0, 214.0, 111.0, 77.0, 46.0, 32.0, 20.0, 15.0, 12.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-16.59375, -16.114013671875, -15.63427734375, -15.154541015625, -14.6748046875, -14.195068359375, -13.71533203125, -13.235595703125, -12.755859375, -12.276123046875, -11.79638671875, -11.316650390625, -10.8369140625, -10.357177734375, -9.87744140625, -9.397705078125, -8.91796875, -8.438232421875, -7.95849609375, -7.478759765625, -6.9990234375, -6.519287109375, -6.03955078125, -5.559814453125, -5.080078125, -4.600341796875, -4.12060546875, -3.640869140625, -3.1611328125, -2.681396484375, -2.20166015625, -1.721923828125, -1.2421875, -0.762451171875, -0.28271484375, 0.197021484375, 0.6767578125, 1.156494140625, 1.63623046875, 2.115966796875, 2.595703125, 3.075439453125, 3.55517578125, 4.034912109375, 4.5146484375, 4.994384765625, 5.47412109375, 5.953857421875, 6.43359375, 6.913330078125, 7.39306640625, 7.872802734375, 8.3525390625, 8.832275390625, 9.31201171875, 9.791748046875, 10.271484375, 10.751220703125, 11.23095703125, 11.710693359375, 12.1904296875, 12.670166015625, 13.14990234375, 13.629638671875, 14.109375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 14.0, 16.0, 34.0, 34.0, 28.0, 52.0, 72.0, 94.0, 121.0, 137.0, 151.0, 183.0, 223.0, 272.0, 299.0, 313.0, 263.0, 266.0, 262.0, 206.0, 198.0, 167.0, 140.0, 125.0, 80.0, 62.0, 52.0, 35.0, 32.0, 26.0, 16.0, 21.0, 12.0, 11.0, 10.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0792236328125, -3.947509765625, -3.8157958984375, -3.68408203125, -3.5523681640625, -3.420654296875, -3.2889404296875, -3.1572265625, -3.0255126953125, -2.893798828125, -2.7620849609375, -2.63037109375, -2.4986572265625, -2.366943359375, -2.2352294921875, -2.103515625, -1.9718017578125, -1.840087890625, -1.7083740234375, -1.57666015625, -1.4449462890625, -1.313232421875, -1.1815185546875, -1.0498046875, -0.9180908203125, -0.786376953125, -0.6546630859375, -0.52294921875, -0.3912353515625, -0.259521484375, -0.1278076171875, 0.00390625, 0.1356201171875, 0.267333984375, 0.3990478515625, 0.53076171875, 0.6624755859375, 0.794189453125, 0.9259033203125, 1.0576171875, 1.1893310546875, 1.321044921875, 1.4527587890625, 1.58447265625, 1.7161865234375, 1.847900390625, 1.9796142578125, 2.111328125, 2.2430419921875, 2.374755859375, 2.5064697265625, 2.63818359375, 2.7698974609375, 2.901611328125, 3.0333251953125, 3.1650390625, 3.2967529296875, 3.428466796875, 3.5601806640625, 3.69189453125, 3.8236083984375, 3.955322265625, 4.0870361328125, 4.21875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 8.0, 13.0, 11.0, 13.0, 18.0, 26.0, 16.0, 37.0, 43.0, 32.0, 50.0, 48.0, 58.0, 68.0, 59.0, 66.0, 68.0, 48.0, 37.0, 59.0, 40.0, 39.0, 23.0, 25.0, 17.0, 19.0, 11.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.37887191772461, -16.9278564453125, -16.47684097290039, -16.02582550048828, -15.574809074401855, -15.123793601989746, -14.672778129577637, -14.221762657165527, -13.770747184753418, -13.319731712341309, -12.8687162399292, -12.417699813842773, -11.966684341430664, -11.515668869018555, -11.064653396606445, -10.613637924194336, -10.162622451782227, -9.711606979370117, -9.260591506958008, -8.809576034545898, -8.358559608459473, -7.907544136047363, -7.456528663635254, -7.0055131912231445, -6.554496765136719, -6.103481292724609, -5.652465343475342, -5.201449871063232, -4.750434398651123, -4.2994184494018555, -3.848402976989746, -3.3973875045776367, -2.9463720321655273, -2.495356321334839, -2.0443408489227295, -1.593325138092041, -1.142309546470642, -0.6912939548492432, -0.2402782440185547, 0.2107372283935547, 0.6617529392242432, 1.112768530845642, 1.563784122467041, 2.0147998332977295, 2.465815544128418, 2.9168310165405273, 3.367846727371216, 3.818862199783325, 4.269877910614014, 4.720893383026123, 5.171909332275391, 5.6229248046875, 6.073940277099609, 6.524955749511719, 6.975971698760986, 7.426987171173096, 7.878003120422363, 8.329018592834473, 8.780034065246582, 9.231050491333008, 9.682065963745117, 10.133081436157227, 10.584096908569336, 11.035112380981445, 11.486127853393555]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 6.0, 4.0, 7.0, 8.0, 11.0, 11.0, 18.0, 18.0, 18.0, 12.0, 18.0, 22.0, 24.0, 37.0, 29.0, 29.0, 41.0, 34.0, 33.0, 36.0, 28.0, 33.0, 33.0, 39.0, 31.0, 41.0, 34.0, 42.0, 34.0, 31.0, 28.0, 21.0, 24.0, 19.0, 17.0, 15.0, 16.0, 20.0, 8.0, 11.0, 10.0, 12.0, 10.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0], "bins": [-7.343834400177002, -7.12726354598999, -6.910693168640137, -6.694122314453125, -6.4775519371032715, -6.26098108291626, -6.044410705566406, -5.8278398513793945, -5.611269474029541, -5.394698619842529, -5.178128242492676, -4.961557388305664, -4.7449870109558105, -4.528416156768799, -4.311845779418945, -4.095274925231934, -3.878704309463501, -3.6621336936950684, -3.4455630779266357, -3.228992462158203, -3.0124218463897705, -2.795851230621338, -2.579280376434326, -2.3627099990844727, -2.146139144897461, -1.9295685291290283, -1.7129979133605957, -1.496427297592163, -1.2798566818237305, -1.0632859468460083, -0.8467153310775757, -0.6301447153091431, -0.41357421875, -0.1970035880804062, 0.019567042589187622, 0.23613768815994263, 0.45270830392837524, 0.6692789793014526, 0.8858495950698853, 1.1024202108383179, 1.3189908266067505, 1.535561442375183, 1.7521320581436157, 1.968702793121338, 2.1852734088897705, 2.401844024658203, 2.6184146404266357, 2.8349852561950684, 3.051555871963501, 3.2681264877319336, 3.484697103500366, 3.701267719268799, 3.9178383350372314, 4.134408950805664, 4.350979804992676, 4.567550182342529, 4.784121036529541, 5.000691890716553, 5.217262268066406, 5.433833122253418, 5.6504034996032715, 5.866974353790283, 6.083544731140137, 6.300115585327148, 6.516685962677002]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 17.0, 26.0, 27.0, 43.0, 64.0, 102.0, 175.0, 210.0, 316.0, 468.0, 685.0, 1092.0, 1593.0, 2548.0, 3999.0, 6271.0, 9946.0, 16721.0, 27556.0, 45570.0, 75839.0, 121276.0, 172044.0, 183135.0, 142427.0, 92294.0, 56112.0, 33848.0, 20600.0, 12627.0, 7567.0, 4736.0, 3000.0, 1975.0, 1211.0, 767.0, 512.0, 370.0, 231.0, 169.0, 124.0, 85.0, 55.0, 33.0, 29.0, 23.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.91796875, -0.8875732421875, -0.857177734375, -0.8267822265625, -0.79638671875, -0.7659912109375, -0.735595703125, -0.7052001953125, -0.6748046875, -0.6444091796875, -0.614013671875, -0.5836181640625, -0.55322265625, -0.5228271484375, -0.492431640625, -0.4620361328125, -0.431640625, -0.4012451171875, -0.370849609375, -0.3404541015625, -0.31005859375, -0.2796630859375, -0.249267578125, -0.2188720703125, -0.1884765625, -0.1580810546875, -0.127685546875, -0.0972900390625, -0.06689453125, -0.0364990234375, -0.006103515625, 0.0242919921875, 0.0546875, 0.0850830078125, 0.115478515625, 0.1458740234375, 0.17626953125, 0.2066650390625, 0.237060546875, 0.2674560546875, 0.2978515625, 0.3282470703125, 0.358642578125, 0.3890380859375, 0.41943359375, 0.4498291015625, 0.480224609375, 0.5106201171875, 0.541015625, 0.5714111328125, 0.601806640625, 0.6322021484375, 0.66259765625, 0.6929931640625, 0.723388671875, 0.7537841796875, 0.7841796875, 0.8145751953125, 0.844970703125, 0.8753662109375, 0.90576171875, 0.9361572265625, 0.966552734375, 0.9969482421875, 1.02734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 4.0, 4.0, 16.0, 15.0, 17.0, 25.0, 16.0, 29.0, 25.0, 31.0, 33.0, 42.0, 30.0, 48.0, 42.0, 51.0, 44.0, 51.0, 40.0, 47.0, 41.0, 44.0, 53.0, 34.0, 28.0, 30.0, 23.0, 26.0, 24.0, 15.0, 19.0, 12.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.1968994140625, -9.885986328125, -9.5750732421875, -9.26416015625, -8.9532470703125, -8.642333984375, -8.3314208984375, -8.0205078125, -7.7095947265625, -7.398681640625, -7.0877685546875, -6.77685546875, -6.4659423828125, -6.155029296875, -5.8441162109375, -5.533203125, -5.2222900390625, -4.911376953125, -4.6004638671875, -4.28955078125, -3.9786376953125, -3.667724609375, -3.3568115234375, -3.0458984375, -2.7349853515625, -2.424072265625, -2.1131591796875, -1.80224609375, -1.4913330078125, -1.180419921875, -0.8695068359375, -0.55859375, -0.2476806640625, 0.063232421875, 0.3741455078125, 0.68505859375, 0.9959716796875, 1.306884765625, 1.6177978515625, 1.9287109375, 2.2396240234375, 2.550537109375, 2.8614501953125, 3.17236328125, 3.4832763671875, 3.794189453125, 4.1051025390625, 4.416015625, 4.7269287109375, 5.037841796875, 5.3487548828125, 5.65966796875, 5.9705810546875, 6.281494140625, 6.5924072265625, 6.9033203125, 7.2142333984375, 7.525146484375, 7.8360595703125, 8.14697265625, 8.4578857421875, 8.768798828125, 9.0797119140625, 9.390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 12.0, 14.0, 12.0, 25.0, 25.0, 41.0, 35.0, 59.0, 66.0, 104.0, 138.0, 213.0, 261.0, 402.0, 599.0, 870.0, 1377.0, 2170.0, 3759.0, 6720.0, 13175.0, 30256.0, 280944.0, 633917.0, 38925.0, 15295.0, 7669.0, 4309.0, 2452.0, 1553.0, 984.0, 621.0, 468.0, 280.0, 229.0, 156.0, 91.0, 89.0, 72.0, 36.0, 33.0, 27.0, 22.0, 14.0, 6.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0], "bins": [-2.84765625, -2.76416015625, -2.6806640625, -2.59716796875, -2.513671875, -2.43017578125, -2.3466796875, -2.26318359375, -2.1796875, -2.09619140625, -2.0126953125, -1.92919921875, -1.845703125, -1.76220703125, -1.6787109375, -1.59521484375, -1.51171875, -1.42822265625, -1.3447265625, -1.26123046875, -1.177734375, -1.09423828125, -1.0107421875, -0.92724609375, -0.84375, -0.76025390625, -0.6767578125, -0.59326171875, -0.509765625, -0.42626953125, -0.3427734375, -0.25927734375, -0.17578125, -0.09228515625, -0.0087890625, 0.07470703125, 0.158203125, 0.24169921875, 0.3251953125, 0.40869140625, 0.4921875, 0.57568359375, 0.6591796875, 0.74267578125, 0.826171875, 0.90966796875, 0.9931640625, 1.07666015625, 1.16015625, 1.24365234375, 1.3271484375, 1.41064453125, 1.494140625, 1.57763671875, 1.6611328125, 1.74462890625, 1.828125, 1.91162109375, 1.9951171875, 2.07861328125, 2.162109375, 2.24560546875, 2.3291015625, 2.41259765625, 2.49609375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 11.0, 8.0, 9.0, 9.0, 13.0, 10.0, 13.0, 15.0, 22.0, 6.0, 26.0, 22.0, 31.0, 25.0, 25.0, 47.0, 48.0, 28.0, 38.0, 27.0, 40.0, 38.0, 39.0, 41.0, 40.0, 41.0, 44.0, 27.0, 30.0, 31.0, 29.0, 33.0, 19.0, 19.0, 17.0, 7.0, 19.0, 11.0, 19.0, 8.0, 4.0, 7.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.26171875, -5.0987548828125, -4.935791015625, -4.7728271484375, -4.60986328125, -4.4468994140625, -4.283935546875, -4.1209716796875, -3.9580078125, -3.7950439453125, -3.632080078125, -3.4691162109375, -3.30615234375, -3.1431884765625, -2.980224609375, -2.8172607421875, -2.654296875, -2.4913330078125, -2.328369140625, -2.1654052734375, -2.00244140625, -1.8394775390625, -1.676513671875, -1.5135498046875, -1.3505859375, -1.1876220703125, -1.024658203125, -0.8616943359375, -0.69873046875, -0.5357666015625, -0.372802734375, -0.2098388671875, -0.046875, 0.1160888671875, 0.279052734375, 0.4420166015625, 0.60498046875, 0.7679443359375, 0.930908203125, 1.0938720703125, 1.2568359375, 1.4197998046875, 1.582763671875, 1.7457275390625, 1.90869140625, 2.0716552734375, 2.234619140625, 2.3975830078125, 2.560546875, 2.7235107421875, 2.886474609375, 3.0494384765625, 3.21240234375, 3.3753662109375, 3.538330078125, 3.7012939453125, 3.8642578125, 4.0272216796875, 4.190185546875, 4.3531494140625, 4.51611328125, 4.6790771484375, 4.842041015625, 5.0050048828125, 5.16796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 4.0, 15.0, 18.0, 29.0, 33.0, 55.0, 90.0, 117.0, 171.0, 253.0, 412.0, 611.0, 994.0, 1569.0, 2456.0, 4125.0, 6970.0, 12179.0, 23249.0, 98181.0, 823942.0, 33855.0, 16390.0, 9158.0, 5221.0, 3060.0, 1937.0, 1233.0, 767.0, 467.0, 339.0, 203.0, 139.0, 100.0, 54.0, 43.0, 31.0, 26.0, 19.0, 4.0, 11.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.465576171875, -0.4501762390136719, -0.43477630615234375, -0.4193763732910156, -0.4039764404296875, -0.3885765075683594, -0.37317657470703125, -0.3577766418457031, -0.342376708984375, -0.3269767761230469, -0.31157684326171875, -0.2961769104003906, -0.2807769775390625, -0.2653770446777344, -0.24997711181640625, -0.23457717895507812, -0.21917724609375, -0.20377731323242188, -0.18837738037109375, -0.17297744750976562, -0.1575775146484375, -0.14217758178710938, -0.12677764892578125, -0.11137771606445312, -0.095977783203125, -0.08057785034179688, -0.06517791748046875, -0.049777984619140625, -0.0343780517578125, -0.018978118896484375, -0.00357818603515625, 0.011821746826171875, 0.0272216796875, 0.042621612548828125, 0.05802154541015625, 0.07342147827148438, 0.0888214111328125, 0.10422134399414062, 0.11962127685546875, 0.13502120971679688, 0.150421142578125, 0.16582107543945312, 0.18122100830078125, 0.19662094116210938, 0.2120208740234375, 0.22742080688476562, 0.24282073974609375, 0.2582206726074219, 0.27362060546875, 0.2890205383300781, 0.30442047119140625, 0.3198204040527344, 0.3352203369140625, 0.3506202697753906, 0.36602020263671875, 0.3814201354980469, 0.396820068359375, 0.4122200012207031, 0.42761993408203125, 0.4430198669433594, 0.4584197998046875, 0.4738197326660156, 0.48921966552734375, 0.5046195983886719, 0.52001953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 7.0, 7.0, 6.0, 9.0, 8.0, 10.0, 16.0, 23.0, 22.0, 16.0, 19.0, 22.0, 22.0, 32.0, 36.0, 45.0, 32.0, 43.0, 31.0, 34.0, 37.0, 53.0, 35.0, 48.0, 62.0, 35.0, 34.0, 25.0, 39.0, 36.0, 19.0, 19.0, 12.0, 19.0, 16.0, 10.0, 10.0, 9.0, 9.0, 6.0, 8.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7583370208740234e-05, -1.7012469470500946e-05, -1.6441568732261658e-05, -1.587066799402237e-05, -1.529976725578308e-05, -1.4728866517543793e-05, -1.4157965779304504e-05, -1.3587065041065216e-05, -1.3016164302825928e-05, -1.244526356458664e-05, -1.1874362826347351e-05, -1.1303462088108063e-05, -1.0732561349868774e-05, -1.0161660611629486e-05, -9.590759873390198e-06, -9.01985913515091e-06, -8.448958396911621e-06, -7.878057658672333e-06, -7.3071569204330444e-06, -6.736256182193756e-06, -6.165355443954468e-06, -5.5944547057151794e-06, -5.023553967475891e-06, -4.452653229236603e-06, -3.8817524909973145e-06, -3.310851752758026e-06, -2.739951014518738e-06, -2.1690502762794495e-06, -1.5981495380401611e-06, -1.0272487998008728e-06, -4.5634806156158447e-07, 1.1455267667770386e-07, 6.854534149169922e-07, 1.2563541531562805e-06, 1.8272548913955688e-06, 2.398155629634857e-06, 2.9690563678741455e-06, 3.539957106113434e-06, 4.110857844352722e-06, 4.6817585825920105e-06, 5.252659320831299e-06, 5.823560059070587e-06, 6.3944607973098755e-06, 6.965361535549164e-06, 7.536262273788452e-06, 8.10716301202774e-06, 8.678063750267029e-06, 9.248964488506317e-06, 9.819865226745605e-06, 1.0390765964984894e-05, 1.0961666703224182e-05, 1.153256744146347e-05, 1.2103468179702759e-05, 1.2674368917942047e-05, 1.3245269656181335e-05, 1.3816170394420624e-05, 1.4387071132659912e-05, 1.49579718708992e-05, 1.552887260913849e-05, 1.6099773347377777e-05, 1.6670674085617065e-05, 1.7241574823856354e-05, 1.7812475562095642e-05, 1.838337630033493e-05, 1.895427703857422e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 19.0, 20.0, 40.0, 47.0, 65.0, 121.0, 148.0, 251.0, 414.0, 726.0, 1065.0, 1753.0, 2887.0, 4837.0, 7960.0, 13180.0, 21982.0, 37826.0, 63538.0, 104205.0, 156781.0, 189929.0, 162804.0, 110136.0, 68472.0, 40116.0, 23640.0, 13861.0, 8478.0, 5084.0, 3160.0, 1912.0, 1134.0, 680.0, 416.0, 315.0, 181.0, 124.0, 92.0, 55.0, 24.0, 17.0, 15.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.24658203125, -0.23923492431640625, -0.2318878173828125, -0.22454071044921875, -0.217193603515625, -0.20984649658203125, -0.2024993896484375, -0.19515228271484375, -0.18780517578125, -0.18045806884765625, -0.1731109619140625, -0.16576385498046875, -0.158416748046875, -0.15106964111328125, -0.1437225341796875, -0.13637542724609375, -0.1290283203125, -0.12168121337890625, -0.1143341064453125, -0.10698699951171875, -0.099639892578125, -0.09229278564453125, -0.0849456787109375, -0.07759857177734375, -0.07025146484375, -0.06290435791015625, -0.0555572509765625, -0.04821014404296875, -0.040863037109375, -0.03351593017578125, -0.0261688232421875, -0.01882171630859375, -0.011474609375, -0.00412750244140625, 0.0032196044921875, 0.01056671142578125, 0.017913818359375, 0.02526092529296875, 0.0326080322265625, 0.03995513916015625, 0.04730224609375, 0.05464935302734375, 0.0619964599609375, 0.06934356689453125, 0.076690673828125, 0.08403778076171875, 0.0913848876953125, 0.09873199462890625, 0.1060791015625, 0.11342620849609375, 0.1207733154296875, 0.12812042236328125, 0.135467529296875, 0.14281463623046875, 0.1501617431640625, 0.15750885009765625, 0.16485595703125, 0.17220306396484375, 0.1795501708984375, 0.18689727783203125, 0.194244384765625, 0.20159149169921875, 0.2089385986328125, 0.21628570556640625, 0.2236328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 7.0, 7.0, 13.0, 20.0, 19.0, 22.0, 26.0, 35.0, 52.0, 56.0, 56.0, 65.0, 52.0, 63.0, 69.0, 56.0, 50.0, 52.0, 43.0, 31.0, 42.0, 27.0, 24.0, 18.0, 16.0, 19.0, 11.0, 12.0, 3.0, 4.0, 8.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08172607421875, -0.07924365997314453, -0.07676124572753906, -0.0742788314819336, -0.07179641723632812, -0.06931400299072266, -0.06683158874511719, -0.06434917449951172, -0.06186676025390625, -0.05938434600830078, -0.05690193176269531, -0.054419517517089844, -0.051937103271484375, -0.049454689025878906, -0.04697227478027344, -0.04448986053466797, -0.0420074462890625, -0.03952503204345703, -0.03704261779785156, -0.034560203552246094, -0.032077789306640625, -0.029595375061035156, -0.027112960815429688, -0.02463054656982422, -0.02214813232421875, -0.01966571807861328, -0.017183303833007812, -0.014700889587402344, -0.012218475341796875, -0.009736061096191406, -0.0072536468505859375, -0.004771232604980469, -0.002288818359375, 0.00019359588623046875, 0.0026760101318359375, 0.005158424377441406, 0.007640838623046875, 0.010123252868652344, 0.012605667114257812, 0.015088081359863281, 0.01757049560546875, 0.02005290985107422, 0.022535324096679688, 0.025017738342285156, 0.027500152587890625, 0.029982566833496094, 0.03246498107910156, 0.03494739532470703, 0.0374298095703125, 0.03991222381591797, 0.04239463806152344, 0.044877052307128906, 0.047359466552734375, 0.049841880798339844, 0.05232429504394531, 0.05480670928955078, 0.05728912353515625, 0.05977153778076172, 0.06225395202636719, 0.06473636627197266, 0.06721878051757812, 0.0697011947631836, 0.07218360900878906, 0.07466602325439453, 0.0771484375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 6.0, 9.0, 7.0, 11.0, 11.0, 15.0, 16.0, 21.0, 20.0, 29.0, 38.0, 37.0, 51.0, 41.0, 59.0, 60.0, 69.0, 53.0, 73.0, 56.0, 40.0, 56.0, 44.0, 40.0, 25.0, 27.0, 22.0, 14.0, 13.0, 11.0, 8.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-17.484338760375977, -17.033742904663086, -16.583148956298828, -16.132553100585938, -15.681957244873047, -15.231362342834473, -14.780767440795898, -14.330171585083008, -13.879576683044434, -13.42898178100586, -12.978385925292969, -12.527791023254395, -12.07719612121582, -11.62660026550293, -11.176005363464355, -10.725410461425781, -10.27481460571289, -9.824219703674316, -9.373623847961426, -8.923028945922852, -8.472433090209961, -8.021838188171387, -7.5712432861328125, -7.12064790725708, -6.670052528381348, -6.219457149505615, -5.768861770629883, -5.318266868591309, -4.867671489715576, -4.417076110839844, -3.9664809703826904, -3.515885829925537, -3.0652894973754883, -2.614694118499756, -2.1640989780426025, -1.7135037183761597, -1.2629084587097168, -0.8123130798339844, -0.36171793937683105, 0.08887720108032227, 0.5394725799560547, 0.9900678396224976, 1.4406630992889404, 1.8912583589553833, 2.341853618621826, 2.7924489974975586, 3.243044137954712, 3.6936392784118652, 4.144234657287598, 4.59483003616333, 5.0454254150390625, 5.496020317077637, 5.946615695953369, 6.397211074829102, 6.847805976867676, 7.298401355743408, 7.748996734619141, 8.199591636657715, 8.650187492370605, 9.10078239440918, 9.55137825012207, 10.001973152160645, 10.452568054199219, 10.90316390991211, 11.353758811950684]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 5.0, 6.0, 9.0, 11.0, 8.0, 16.0, 19.0, 18.0, 13.0, 17.0, 22.0, 25.0, 33.0, 34.0, 27.0, 36.0, 38.0, 36.0, 31.0, 31.0, 34.0, 30.0, 35.0, 34.0, 43.0, 32.0, 44.0, 33.0, 29.0, 35.0, 19.0, 24.0, 22.0, 16.0, 15.0, 15.0, 20.0, 7.0, 14.0, 10.0, 11.0, 12.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0], "bins": [-7.346375942230225, -7.1301188468933105, -6.913861274719238, -6.697604179382324, -6.48134708404541, -6.265089511871338, -6.048832416534424, -5.832574844360352, -5.6163177490234375, -5.400060653686523, -5.183803081512451, -4.967545986175537, -4.751288890838623, -4.535031318664551, -4.318774223327637, -4.102517127990723, -3.8862597942352295, -3.6700024604797363, -3.4537453651428223, -3.237488031387329, -3.021230697631836, -2.804973602294922, -2.5887162685394287, -2.3724589347839355, -2.1562018394470215, -1.9399446249008179, -1.7236872911453247, -1.507430076599121, -1.291172742843628, -1.0749155282974243, -0.8586583137512207, -0.6424009799957275, -0.4261436462402344, -0.20988638699054718, 0.006370872259140015, 0.22262811660766602, 0.4388853907585144, 0.6551426649093628, 0.8713998794555664, 1.0876572132110596, 1.3039144277572632, 1.5201716423034668, 1.73642897605896, 1.9526861906051636, 2.168943405151367, 2.3852007389068604, 2.6014580726623535, 2.8177151679992676, 3.0339725017547607, 3.250229835510254, 3.466486930847168, 3.682744264602661, 3.8990015983581543, 4.115258693695068, 4.331516265869141, 4.547773361206055, 4.764030456542969, 4.980287551879883, 5.196545124053955, 5.412802219390869, 5.629059314727783, 5.8453168869018555, 6.0615739822387695, 6.277831077575684, 6.494088649749756]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 7.0, 12.0, 9.0, 15.0, 27.0, 38.0, 54.0, 95.0, 171.0, 216.0, 327.0, 537.0, 832.0, 1340.0, 2107.0, 3418.0, 5432.0, 9032.0, 14908.0, 24689.0, 40779.0, 66387.0, 102621.0, 142483.0, 163895.0, 152142.0, 116363.0, 77741.0, 47921.0, 29417.0, 17544.0, 10856.0, 6448.0, 3930.0, 2448.0, 1617.0, 945.0, 643.0, 399.0, 242.0, 150.0, 110.0, 70.0, 53.0, 28.0, 18.0, 15.0, 8.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-8.9140625, -8.6492919921875, -8.384521484375, -8.1197509765625, -7.85498046875, -7.5902099609375, -7.325439453125, -7.0606689453125, -6.7958984375, -6.5311279296875, -6.266357421875, -6.0015869140625, -5.73681640625, -5.4720458984375, -5.207275390625, -4.9425048828125, -4.677734375, -4.4129638671875, -4.148193359375, -3.8834228515625, -3.61865234375, -3.3538818359375, -3.089111328125, -2.8243408203125, -2.5595703125, -2.2947998046875, -2.030029296875, -1.7652587890625, -1.50048828125, -1.2357177734375, -0.970947265625, -0.7061767578125, -0.44140625, -0.1766357421875, 0.088134765625, 0.3529052734375, 0.61767578125, 0.8824462890625, 1.147216796875, 1.4119873046875, 1.6767578125, 1.9415283203125, 2.206298828125, 2.4710693359375, 2.73583984375, 3.0006103515625, 3.265380859375, 3.5301513671875, 3.794921875, 4.0596923828125, 4.324462890625, 4.5892333984375, 4.85400390625, 5.1187744140625, 5.383544921875, 5.6483154296875, 5.9130859375, 6.1778564453125, 6.442626953125, 6.7073974609375, 6.97216796875, 7.2369384765625, 7.501708984375, 7.7664794921875, 8.03125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 3.0, 12.0, 4.0, 6.0, 11.0, 11.0, 23.0, 17.0, 18.0, 21.0, 24.0, 33.0, 34.0, 32.0, 33.0, 24.0, 34.0, 41.0, 29.0, 46.0, 49.0, 33.0, 38.0, 32.0, 35.0, 35.0, 29.0, 29.0, 35.0, 24.0, 28.0, 23.0, 22.0, 15.0, 18.0, 9.0, 14.0, 9.0, 11.0, 7.0, 9.0, 2.0, 5.0, 8.0, 5.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0], "bins": [-7.91796875, -7.6763916015625, -7.434814453125, -7.1932373046875, -6.95166015625, -6.7100830078125, -6.468505859375, -6.2269287109375, -5.9853515625, -5.7437744140625, -5.502197265625, -5.2606201171875, -5.01904296875, -4.7774658203125, -4.535888671875, -4.2943115234375, -4.052734375, -3.8111572265625, -3.569580078125, -3.3280029296875, -3.08642578125, -2.8448486328125, -2.603271484375, -2.3616943359375, -2.1201171875, -1.8785400390625, -1.636962890625, -1.3953857421875, -1.15380859375, -0.9122314453125, -0.670654296875, -0.4290771484375, -0.1875, 0.0540771484375, 0.295654296875, 0.5372314453125, 0.77880859375, 1.0203857421875, 1.261962890625, 1.5035400390625, 1.7451171875, 1.9866943359375, 2.228271484375, 2.4698486328125, 2.71142578125, 2.9530029296875, 3.194580078125, 3.4361572265625, 3.677734375, 3.9193115234375, 4.160888671875, 4.4024658203125, 4.64404296875, 4.8856201171875, 5.127197265625, 5.3687744140625, 5.6103515625, 5.8519287109375, 6.093505859375, 6.3350830078125, 6.57666015625, 6.8182373046875, 7.059814453125, 7.3013916015625, 7.54296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 13.0, 17.0, 27.0, 48.0, 88.0, 178.0, 286.0, 424.0, 826.0, 1364.0, 2463.0, 4261.0, 7702.0, 14269.0, 25728.0, 46444.0, 82109.0, 133880.0, 181475.0, 187777.0, 146015.0, 93441.0, 53451.0, 29680.0, 16181.0, 9036.0, 4965.0, 2734.0, 1529.0, 884.0, 507.0, 324.0, 180.0, 90.0, 63.0, 36.0, 17.0, 17.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.9962158203125, -9.664306640625, -9.3323974609375, -9.00048828125, -8.6685791015625, -8.336669921875, -8.0047607421875, -7.6728515625, -7.3409423828125, -7.009033203125, -6.6771240234375, -6.34521484375, -6.0133056640625, -5.681396484375, -5.3494873046875, -5.017578125, -4.6856689453125, -4.353759765625, -4.0218505859375, -3.68994140625, -3.3580322265625, -3.026123046875, -2.6942138671875, -2.3623046875, -2.0303955078125, -1.698486328125, -1.3665771484375, -1.03466796875, -0.7027587890625, -0.370849609375, -0.0389404296875, 0.29296875, 0.6248779296875, 0.956787109375, 1.2886962890625, 1.62060546875, 1.9525146484375, 2.284423828125, 2.6163330078125, 2.9482421875, 3.2801513671875, 3.612060546875, 3.9439697265625, 4.27587890625, 4.6077880859375, 4.939697265625, 5.2716064453125, 5.603515625, 5.9354248046875, 6.267333984375, 6.5992431640625, 6.93115234375, 7.2630615234375, 7.594970703125, 7.9268798828125, 8.2587890625, 8.5906982421875, 8.922607421875, 9.2545166015625, 9.58642578125, 9.9183349609375, 10.250244140625, 10.5821533203125, 10.9140625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 2.0, 6.0, 6.0, 15.0, 15.0, 7.0, 14.0, 12.0, 19.0, 22.0, 31.0, 30.0, 31.0, 39.0, 38.0, 24.0, 35.0, 36.0, 34.0, 47.0, 42.0, 52.0, 50.0, 42.0, 38.0, 32.0, 28.0, 36.0, 34.0, 27.0, 14.0, 22.0, 30.0, 21.0, 10.0, 7.0, 10.0, 9.0, 11.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.76654052734375, -4.5877685546875, -4.40899658203125, -4.230224609375, -4.05145263671875, -3.8726806640625, -3.69390869140625, -3.51513671875, -3.33636474609375, -3.1575927734375, -2.97882080078125, -2.800048828125, -2.62127685546875, -2.4425048828125, -2.26373291015625, -2.0849609375, -1.90618896484375, -1.7274169921875, -1.54864501953125, -1.369873046875, -1.19110107421875, -1.0123291015625, -0.83355712890625, -0.65478515625, -0.47601318359375, -0.2972412109375, -0.11846923828125, 0.060302734375, 0.23907470703125, 0.4178466796875, 0.59661865234375, 0.775390625, 0.95416259765625, 1.1329345703125, 1.31170654296875, 1.490478515625, 1.66925048828125, 1.8480224609375, 2.02679443359375, 2.20556640625, 2.38433837890625, 2.5631103515625, 2.74188232421875, 2.920654296875, 3.09942626953125, 3.2781982421875, 3.45697021484375, 3.6357421875, 3.81451416015625, 3.9932861328125, 4.17205810546875, 4.350830078125, 4.52960205078125, 4.7083740234375, 4.88714599609375, 5.06591796875, 5.24468994140625, 5.4234619140625, 5.60223388671875, 5.781005859375, 5.95977783203125, 6.1385498046875, 6.31732177734375, 6.49609375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 6.0, 15.0, 35.0, 31.0, 65.0, 80.0, 128.0, 196.0, 321.0, 494.0, 820.0, 1156.0, 1854.0, 2959.0, 4857.0, 8694.0, 14560.0, 25172.0, 42976.0, 71320.0, 110362.0, 152835.0, 172268.0, 152630.0, 110268.0, 71044.0, 42230.0, 24970.0, 14510.0, 8396.0, 4997.0, 3020.0, 1935.0, 1203.0, 719.0, 501.0, 285.0, 217.0, 137.0, 93.0, 61.0, 49.0, 23.0, 20.0, 16.0, 6.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.87109375, -4.7164306640625, -4.561767578125, -4.4071044921875, -4.25244140625, -4.0977783203125, -3.943115234375, -3.7884521484375, -3.6337890625, -3.4791259765625, -3.324462890625, -3.1697998046875, -3.01513671875, -2.8604736328125, -2.705810546875, -2.5511474609375, -2.396484375, -2.2418212890625, -2.087158203125, -1.9324951171875, -1.77783203125, -1.6231689453125, -1.468505859375, -1.3138427734375, -1.1591796875, -1.0045166015625, -0.849853515625, -0.6951904296875, -0.54052734375, -0.3858642578125, -0.231201171875, -0.0765380859375, 0.078125, 0.2327880859375, 0.387451171875, 0.5421142578125, 0.69677734375, 0.8514404296875, 1.006103515625, 1.1607666015625, 1.3154296875, 1.4700927734375, 1.624755859375, 1.7794189453125, 1.93408203125, 2.0887451171875, 2.243408203125, 2.3980712890625, 2.552734375, 2.7073974609375, 2.862060546875, 3.0167236328125, 3.17138671875, 3.3260498046875, 3.480712890625, 3.6353759765625, 3.7900390625, 3.9447021484375, 4.099365234375, 4.2540283203125, 4.40869140625, 4.5633544921875, 4.718017578125, 4.8726806640625, 5.02734375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 7.0, 8.0, 15.0, 13.0, 19.0, 15.0, 28.0, 27.0, 32.0, 58.0, 58.0, 41.0, 51.0, 83.0, 55.0, 56.0, 54.0, 61.0, 32.0, 43.0, 40.0, 33.0, 36.0, 22.0, 16.0, 10.0, 10.0, 16.0, 9.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005822181701660156, -0.0005652531981468201, -0.0005482882261276245, -0.000531323254108429, -0.0005143582820892334, -0.0004973933100700378, -0.0004804283380508423, -0.00046346336603164673, -0.00044649839401245117, -0.0004295334219932556, -0.00041256844997406006, -0.0003956034779548645, -0.00037863850593566895, -0.0003616735339164734, -0.00034470856189727783, -0.0003277435898780823, -0.0003107786178588867, -0.00029381364583969116, -0.0002768486738204956, -0.00025988370180130005, -0.0002429187297821045, -0.00022595375776290894, -0.00020898878574371338, -0.00019202381372451782, -0.00017505884170532227, -0.0001580938696861267, -0.00014112889766693115, -0.0001241639256477356, -0.00010719895362854004, -9.023398160934448e-05, -7.326900959014893e-05, -5.630403757095337e-05, -3.933906555175781e-05, -2.2374093532562256e-05, -5.409121513366699e-06, 1.1555850505828857e-05, 2.8520822525024414e-05, 4.548579454421997e-05, 6.245076656341553e-05, 7.941573858261108e-05, 9.638071060180664e-05, 0.0001133456826210022, 0.00013031065464019775, 0.0001472756266593933, 0.00016424059867858887, 0.00018120557069778442, 0.00019817054271697998, 0.00021513551473617554, 0.0002321004867553711, 0.00024906545877456665, 0.0002660304307937622, 0.00028299540281295776, 0.0002999603748321533, 0.0003169253468513489, 0.00033389031887054443, 0.00035085529088974, 0.00036782026290893555, 0.0003847852349281311, 0.00040175020694732666, 0.0004187151789665222, 0.0004356801509857178, 0.00045264512300491333, 0.0004696100950241089, 0.00048657506704330444, 0.0005035400390625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 14.0, 13.0, 10.0, 25.0, 30.0, 50.0, 81.0, 98.0, 153.0, 244.0, 312.0, 492.0, 786.0, 1106.0, 1841.0, 2763.0, 4324.0, 6721.0, 10682.0, 16942.0, 27009.0, 42369.0, 64631.0, 94083.0, 125514.0, 145516.0, 141430.0, 115895.0, 84974.0, 57735.0, 37662.0, 23999.0, 14980.0, 9402.0, 5797.0, 3761.0, 2443.0, 1569.0, 1041.0, 685.0, 467.0, 285.0, 198.0, 138.0, 89.0, 66.0, 44.0, 37.0, 24.0, 7.0, 10.0, 9.0, 4.0, 4.0, 1.0], "bins": [-4.90625, -4.7655029296875, -4.624755859375, -4.4840087890625, -4.34326171875, -4.2025146484375, -4.061767578125, -3.9210205078125, -3.7802734375, -3.6395263671875, -3.498779296875, -3.3580322265625, -3.21728515625, -3.0765380859375, -2.935791015625, -2.7950439453125, -2.654296875, -2.5135498046875, -2.372802734375, -2.2320556640625, -2.09130859375, -1.9505615234375, -1.809814453125, -1.6690673828125, -1.5283203125, -1.3875732421875, -1.246826171875, -1.1060791015625, -0.96533203125, -0.8245849609375, -0.683837890625, -0.5430908203125, -0.40234375, -0.2615966796875, -0.120849609375, 0.0198974609375, 0.16064453125, 0.3013916015625, 0.442138671875, 0.5828857421875, 0.7236328125, 0.8643798828125, 1.005126953125, 1.1458740234375, 1.28662109375, 1.4273681640625, 1.568115234375, 1.7088623046875, 1.849609375, 1.9903564453125, 2.131103515625, 2.2718505859375, 2.41259765625, 2.5533447265625, 2.694091796875, 2.8348388671875, 2.9755859375, 3.1163330078125, 3.257080078125, 3.3978271484375, 3.53857421875, 3.6793212890625, 3.820068359375, 3.9608154296875, 4.1015625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 13.0, 10.0, 8.0, 12.0, 15.0, 11.0, 23.0, 21.0, 23.0, 22.0, 29.0, 30.0, 30.0, 38.0, 59.0, 48.0, 45.0, 45.0, 48.0, 36.0, 42.0, 43.0, 41.0, 43.0, 43.0, 37.0, 30.0, 24.0, 22.0, 25.0, 11.0, 21.0, 6.0, 11.0, 10.0, 11.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4775390625, -1.4342803955078125, -1.391021728515625, -1.3477630615234375, -1.30450439453125, -1.2612457275390625, -1.217987060546875, -1.1747283935546875, -1.1314697265625, -1.0882110595703125, -1.044952392578125, -1.0016937255859375, -0.95843505859375, -0.9151763916015625, -0.871917724609375, -0.8286590576171875, -0.785400390625, -0.7421417236328125, -0.698883056640625, -0.6556243896484375, -0.61236572265625, -0.5691070556640625, -0.525848388671875, -0.4825897216796875, -0.4393310546875, -0.3960723876953125, -0.352813720703125, -0.3095550537109375, -0.26629638671875, -0.2230377197265625, -0.179779052734375, -0.1365203857421875, -0.09326171875, -0.0500030517578125, -0.006744384765625, 0.0365142822265625, 0.07977294921875, 0.1230316162109375, 0.166290283203125, 0.2095489501953125, 0.2528076171875, 0.2960662841796875, 0.339324951171875, 0.3825836181640625, 0.42584228515625, 0.4691009521484375, 0.512359619140625, 0.5556182861328125, 0.598876953125, 0.6421356201171875, 0.685394287109375, 0.7286529541015625, 0.77191162109375, 0.8151702880859375, 0.858428955078125, 0.9016876220703125, 0.9449462890625, 0.9882049560546875, 1.031463623046875, 1.0747222900390625, 1.11798095703125, 1.1612396240234375, 1.204498291015625, 1.2477569580078125, 1.291015625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 9.0, 13.0, 19.0, 21.0, 19.0, 22.0, 21.0, 29.0, 32.0, 48.0, 58.0, 64.0, 42.0, 57.0, 77.0, 59.0, 52.0, 45.0, 60.0, 44.0, 27.0, 36.0, 23.0, 23.0, 12.0, 14.0, 22.0, 7.0, 6.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-17.58538246154785, -17.135787963867188, -16.686193466186523, -16.23659896850586, -15.787004470825195, -15.337409973144531, -14.887815475463867, -14.438220977783203, -13.988626480102539, -13.539031982421875, -13.089437484741211, -12.639842987060547, -12.190248489379883, -11.740653991699219, -11.291059494018555, -10.84146499633789, -10.391870498657227, -9.942276000976562, -9.492681503295898, -9.043087005615234, -8.59349250793457, -8.143898010253906, -7.694303512573242, -7.244709014892578, -6.795114517211914, -6.34552001953125, -5.895925521850586, -5.446331024169922, -4.996736526489258, -4.547142028808594, -4.09754753112793, -3.6479530334472656, -3.198357582092285, -2.748763084411621, -2.299168586730957, -1.849574089050293, -1.399979591369629, -0.9503850936889648, -0.5007905960083008, -0.05119609832763672, 0.39839839935302734, 0.8479928970336914, 1.2975873947143555, 1.7471818923950195, 2.1967763900756836, 2.6463708877563477, 3.0959653854370117, 3.545559883117676, 3.99515438079834, 4.444748878479004, 4.894343376159668, 5.343937873840332, 5.793532371520996, 6.24312686920166, 6.692721366882324, 7.142315864562988, 7.591910362243652, 8.041504859924316, 8.49109935760498, 8.940693855285645, 9.390288352966309, 9.839882850646973, 10.289477348327637, 10.7390718460083, 11.188666343688965]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 10.0, 13.0, 10.0, 12.0, 12.0, 20.0, 26.0, 18.0, 20.0, 24.0, 27.0, 30.0, 28.0, 38.0, 36.0, 43.0, 36.0, 41.0, 38.0, 42.0, 36.0, 39.0, 40.0, 50.0, 25.0, 29.0, 28.0, 26.0, 23.0, 24.0, 19.0, 16.0, 20.0, 13.0, 13.0, 7.0, 12.0, 7.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.953724384307861, -7.707611560821533, -7.461498737335205, -7.215385913848877, -6.969273090362549, -6.723160266876221, -6.477047443389893, -6.2309346199035645, -5.984821796417236, -5.738708972930908, -5.49259614944458, -5.246483325958252, -5.000370502471924, -4.754257678985596, -4.508144855499268, -4.2620320320129395, -4.015919208526611, -3.769806385040283, -3.523693561553955, -3.277580738067627, -3.031467914581299, -2.7853550910949707, -2.5392422676086426, -2.2931294441223145, -2.0470166206359863, -1.8009037971496582, -1.55479097366333, -1.308678150177002, -1.0625653266906738, -0.8164525032043457, -0.5703396797180176, -0.32422685623168945, -0.07811403274536133, 0.1679987907409668, 0.4141116142272949, 0.660224437713623, 0.9063372611999512, 1.1524500846862793, 1.3985629081726074, 1.6446757316589355, 1.8907885551452637, 2.136901378631592, 2.38301420211792, 2.629127025604248, 2.875239849090576, 3.1213526725769043, 3.3674654960632324, 3.6135783195495605, 3.8596911430358887, 4.105803966522217, 4.351916790008545, 4.598029613494873, 4.844142436981201, 5.090255260467529, 5.336368083953857, 5.5824809074401855, 5.828593730926514, 6.074706554412842, 6.32081937789917, 6.566932201385498, 6.813045024871826, 7.059157848358154, 7.305270671844482, 7.5513834953308105, 7.797496318817139]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 9.0, 15.0, 11.0, 30.0, 30.0, 76.0, 68.0, 104.0, 179.0, 239.0, 333.0, 558.0, 780.0, 1191.0, 1792.0, 2729.0, 4202.0, 6833.0, 11256.0, 19449.0, 34943.0, 66782.0, 137725.0, 299143.0, 635918.0, 1037037.0, 941644.0, 515907.0, 237344.0, 111658.0, 55538.0, 29473.0, 16077.0, 9503.0, 5779.0, 3524.0, 2242.0, 1456.0, 894.0, 614.0, 427.0, 266.0, 164.0, 118.0, 68.0, 48.0, 35.0, 30.0, 12.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0], "bins": [-15.8984375, -15.4422607421875, -14.986083984375, -14.5299072265625, -14.07373046875, -13.6175537109375, -13.161376953125, -12.7052001953125, -12.2490234375, -11.7928466796875, -11.336669921875, -10.8804931640625, -10.42431640625, -9.9681396484375, -9.511962890625, -9.0557861328125, -8.599609375, -8.1434326171875, -7.687255859375, -7.2310791015625, -6.77490234375, -6.3187255859375, -5.862548828125, -5.4063720703125, -4.9501953125, -4.4940185546875, -4.037841796875, -3.5816650390625, -3.12548828125, -2.6693115234375, -2.213134765625, -1.7569580078125, -1.30078125, -0.8446044921875, -0.388427734375, 0.0677490234375, 0.52392578125, 0.9801025390625, 1.436279296875, 1.8924560546875, 2.3486328125, 2.8048095703125, 3.260986328125, 3.7171630859375, 4.17333984375, 4.6295166015625, 5.085693359375, 5.5418701171875, 5.998046875, 6.4542236328125, 6.910400390625, 7.3665771484375, 7.82275390625, 8.2789306640625, 8.735107421875, 9.1912841796875, 9.6474609375, 10.1036376953125, 10.559814453125, 11.0159912109375, 11.47216796875, 11.9283447265625, 12.384521484375, 12.8406982421875, 13.296875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 8.0, 7.0, 12.0, 12.0, 16.0, 13.0, 20.0, 17.0, 10.0, 22.0, 22.0, 36.0, 29.0, 34.0, 47.0, 35.0, 44.0, 40.0, 41.0, 50.0, 48.0, 46.0, 42.0, 41.0, 31.0, 29.0, 38.0, 30.0, 24.0, 23.0, 22.0, 19.0, 8.0, 13.0, 11.0, 8.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.421875, -8.17510986328125, -7.9283447265625, -7.68157958984375, -7.434814453125, -7.18804931640625, -6.9412841796875, -6.69451904296875, -6.44775390625, -6.20098876953125, -5.9542236328125, -5.70745849609375, -5.460693359375, -5.21392822265625, -4.9671630859375, -4.72039794921875, -4.4736328125, -4.22686767578125, -3.9801025390625, -3.73333740234375, -3.486572265625, -3.23980712890625, -2.9930419921875, -2.74627685546875, -2.49951171875, -2.25274658203125, -2.0059814453125, -1.75921630859375, -1.512451171875, -1.26568603515625, -1.0189208984375, -0.77215576171875, -0.525390625, -0.27862548828125, -0.0318603515625, 0.21490478515625, 0.461669921875, 0.70843505859375, 0.9552001953125, 1.20196533203125, 1.44873046875, 1.69549560546875, 1.9422607421875, 2.18902587890625, 2.435791015625, 2.68255615234375, 2.9293212890625, 3.17608642578125, 3.4228515625, 3.66961669921875, 3.9163818359375, 4.16314697265625, 4.409912109375, 4.65667724609375, 4.9034423828125, 5.15020751953125, 5.39697265625, 5.64373779296875, 5.8905029296875, 6.13726806640625, 6.384033203125, 6.63079833984375, 6.8775634765625, 7.12432861328125, 7.37109375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 10.0, 11.0, 11.0, 28.0, 40.0, 70.0, 98.0, 131.0, 155.0, 270.0, 362.0, 565.0, 747.0, 1184.0, 1742.0, 2706.0, 4479.0, 7181.0, 12200.0, 21397.0, 38227.0, 71384.0, 138100.0, 281038.0, 567213.0, 962885.0, 952815.0, 556992.0, 275062.0, 136733.0, 69928.0, 37858.0, 20995.0, 12239.0, 7228.0, 4362.0, 2689.0, 1681.0, 1165.0, 722.0, 502.0, 336.0, 236.0, 159.0, 114.0, 73.0, 46.0, 29.0, 31.0, 21.0, 7.0, 13.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0], "bins": [-18.90625, -18.315185546875, -17.72412109375, -17.133056640625, -16.5419921875, -15.950927734375, -15.35986328125, -14.768798828125, -14.177734375, -13.586669921875, -12.99560546875, -12.404541015625, -11.8134765625, -11.222412109375, -10.63134765625, -10.040283203125, -9.44921875, -8.858154296875, -8.26708984375, -7.676025390625, -7.0849609375, -6.493896484375, -5.90283203125, -5.311767578125, -4.720703125, -4.129638671875, -3.53857421875, -2.947509765625, -2.3564453125, -1.765380859375, -1.17431640625, -0.583251953125, 0.0078125, 0.598876953125, 1.18994140625, 1.781005859375, 2.3720703125, 2.963134765625, 3.55419921875, 4.145263671875, 4.736328125, 5.327392578125, 5.91845703125, 6.509521484375, 7.1005859375, 7.691650390625, 8.28271484375, 8.873779296875, 9.46484375, 10.055908203125, 10.64697265625, 11.238037109375, 11.8291015625, 12.420166015625, 13.01123046875, 13.602294921875, 14.193359375, 14.784423828125, 15.37548828125, 15.966552734375, 16.5576171875, 17.148681640625, 17.73974609375, 18.330810546875, 18.921875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 6.0, 4.0, 3.0, 5.0, 7.0, 13.0, 10.0, 16.0, 29.0, 28.0, 33.0, 55.0, 60.0, 79.0, 107.0, 115.0, 161.0, 188.0, 229.0, 227.0, 280.0, 287.0, 304.0, 251.0, 243.0, 223.0, 214.0, 173.0, 155.0, 112.0, 103.0, 85.0, 70.0, 43.0, 30.0, 29.0, 24.0, 21.0, 12.0, 14.0, 7.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.4921875, -5.31744384765625, -5.1427001953125, -4.96795654296875, -4.793212890625, -4.61846923828125, -4.4437255859375, -4.26898193359375, -4.09423828125, -3.91949462890625, -3.7447509765625, -3.57000732421875, -3.395263671875, -3.22052001953125, -3.0457763671875, -2.87103271484375, -2.6962890625, -2.52154541015625, -2.3468017578125, -2.17205810546875, -1.997314453125, -1.82257080078125, -1.6478271484375, -1.47308349609375, -1.29833984375, -1.12359619140625, -0.9488525390625, -0.77410888671875, -0.599365234375, -0.42462158203125, -0.2498779296875, -0.07513427734375, 0.099609375, 0.27435302734375, 0.4490966796875, 0.62384033203125, 0.798583984375, 0.97332763671875, 1.1480712890625, 1.32281494140625, 1.49755859375, 1.67230224609375, 1.8470458984375, 2.02178955078125, 2.196533203125, 2.37127685546875, 2.5460205078125, 2.72076416015625, 2.8955078125, 3.07025146484375, 3.2449951171875, 3.41973876953125, 3.594482421875, 3.76922607421875, 3.9439697265625, 4.11871337890625, 4.29345703125, 4.46820068359375, 4.6429443359375, 4.81768798828125, 4.992431640625, 5.16717529296875, 5.3419189453125, 5.51666259765625, 5.69140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 3.0, 3.0, 5.0, 11.0, 16.0, 14.0, 20.0, 23.0, 40.0, 39.0, 42.0, 71.0, 64.0, 73.0, 85.0, 58.0, 69.0, 68.0, 47.0, 56.0, 40.0, 35.0, 23.0, 16.0, 16.0, 15.0, 14.0, 14.0, 4.0, 1.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.666440963745117, -22.970821380615234, -22.27520179748535, -21.57958221435547, -20.88396453857422, -20.188344955444336, -19.492725372314453, -18.79710578918457, -18.101486206054688, -17.405866622924805, -16.710247039794922, -16.014629364013672, -15.319009780883789, -14.623390197753906, -13.927770614624023, -13.23215103149414, -12.53653335571289, -11.840913772583008, -11.145295143127441, -10.449675559997559, -9.754056930541992, -9.05843734741211, -8.362817764282227, -7.667198657989502, -6.971579551696777, -6.275960445404053, -5.580341339111328, -4.884721755981445, -4.189102649688721, -3.493483543395996, -2.7978639602661133, -2.1022448539733887, -1.4066276550292969, -0.7110084295272827, -0.015389204025268555, 0.6802301406860352, 1.3758492469787598, 2.0714683532714844, 2.767087936401367, 3.462707042694092, 4.158326148986816, 4.853945255279541, 5.549564361572266, 6.245183944702148, 6.940803050994873, 7.636422157287598, 8.33204174041748, 9.027660369873047, 9.72327995300293, 10.418899536132812, 11.114518165588379, 11.810137748718262, 12.505756378173828, 13.201375961303711, 13.896995544433594, 14.592615127563477, 15.288233757019043, 15.983853340148926, 16.679471969604492, 17.375091552734375, 18.070711135864258, 18.76633071899414, 19.46194839477539, 20.157567977905273, 20.853187561035156]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 10.0, 16.0, 2.0, 8.0, 9.0, 10.0, 19.0, 21.0, 12.0, 19.0, 22.0, 28.0, 32.0, 33.0, 31.0, 39.0, 39.0, 33.0, 47.0, 38.0, 34.0, 36.0, 48.0, 33.0, 46.0, 39.0, 29.0, 27.0, 24.0, 29.0, 33.0, 21.0, 23.0, 18.0, 13.0, 8.0, 11.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-9.95065975189209, -9.642020225524902, -9.333381652832031, -9.024742126464844, -8.716102600097656, -8.407463073730469, -8.098823547363281, -7.79018497467041, -7.481545448303223, -7.172905921936035, -6.864266872406006, -6.555627822875977, -6.246988296508789, -5.938348770141602, -5.629709720611572, -5.321070671081543, -5.0124311447143555, -4.703791618347168, -4.395152568817139, -4.086513519287109, -3.777873992919922, -3.4692347049713135, -3.160595417022705, -2.8519561290740967, -2.5433168411254883, -2.23467755317688, -1.9260382652282715, -1.617398977279663, -1.3087596893310547, -1.0001204013824463, -0.6914811134338379, -0.3828418254852295, -0.0742034912109375, 0.2344357967376709, 0.5430750846862793, 0.8517143726348877, 1.160353660583496, 1.4689929485321045, 1.777632236480713, 2.0862715244293213, 2.3949108123779297, 2.703550100326538, 3.0121893882751465, 3.320828676223755, 3.6294679641723633, 3.9381072521209717, 4.24674654006958, 4.555385589599609, 4.864025115966797, 5.172664642333984, 5.481303691864014, 5.789942741394043, 6.0985822677612305, 6.407221794128418, 6.715860843658447, 7.024499893188477, 7.333139419555664, 7.641778945922852, 7.950417995452881, 8.25905704498291, 8.567696571350098, 8.876336097717285, 9.184974670410156, 9.493614196777344, 9.802253723144531]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 12.0, 17.0, 21.0, 18.0, 31.0, 38.0, 63.0, 85.0, 112.0, 194.0, 248.0, 350.0, 505.0, 777.0, 1111.0, 1745.0, 2516.0, 3873.0, 6105.0, 9765.0, 15929.0, 26572.0, 45568.0, 79688.0, 136007.0, 200244.0, 196743.0, 131516.0, 76686.0, 44003.0, 25536.0, 15416.0, 9493.0, 5883.0, 3840.0, 2512.0, 1681.0, 1128.0, 774.0, 572.0, 359.0, 241.0, 172.0, 126.0, 78.0, 61.0, 48.0, 33.0, 21.0, 13.0, 12.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.4287109375, -1.3840179443359375, -1.339324951171875, -1.2946319580078125, -1.24993896484375, -1.2052459716796875, -1.160552978515625, -1.1158599853515625, -1.0711669921875, -1.0264739990234375, -0.981781005859375, -0.9370880126953125, -0.89239501953125, -0.8477020263671875, -0.803009033203125, -0.7583160400390625, -0.713623046875, -0.6689300537109375, -0.624237060546875, -0.5795440673828125, -0.53485107421875, -0.4901580810546875, -0.445465087890625, -0.4007720947265625, -0.3560791015625, -0.3113861083984375, -0.266693115234375, -0.2220001220703125, -0.17730712890625, -0.1326141357421875, -0.087921142578125, -0.0432281494140625, 0.00146484375, 0.0461578369140625, 0.090850830078125, 0.1355438232421875, 0.18023681640625, 0.2249298095703125, 0.269622802734375, 0.3143157958984375, 0.3590087890625, 0.4037017822265625, 0.448394775390625, 0.4930877685546875, 0.53778076171875, 0.5824737548828125, 0.627166748046875, 0.6718597412109375, 0.716552734375, 0.7612457275390625, 0.805938720703125, 0.8506317138671875, 0.89532470703125, 0.9400177001953125, 0.984710693359375, 1.0294036865234375, 1.0740966796875, 1.1187896728515625, 1.163482666015625, 1.2081756591796875, 1.25286865234375, 1.2975616455078125, 1.342254638671875, 1.3869476318359375, 1.431640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 5.0, 7.0, 6.0, 8.0, 9.0, 12.0, 21.0, 21.0, 21.0, 21.0, 22.0, 36.0, 33.0, 30.0, 38.0, 49.0, 50.0, 48.0, 40.0, 55.0, 47.0, 36.0, 39.0, 38.0, 38.0, 27.0, 36.0, 18.0, 29.0, 25.0, 17.0, 17.0, 14.0, 17.0, 10.0, 5.0, 10.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.162109375, -10.79296875, -10.423828125, -10.0546875, -9.685546875, -9.31640625, -8.947265625, -8.578125, -8.208984375, -7.83984375, -7.470703125, -7.1015625, -6.732421875, -6.36328125, -5.994140625, -5.625, -5.255859375, -4.88671875, -4.517578125, -4.1484375, -3.779296875, -3.41015625, -3.041015625, -2.671875, -2.302734375, -1.93359375, -1.564453125, -1.1953125, -0.826171875, -0.45703125, -0.087890625, 0.28125, 0.650390625, 1.01953125, 1.388671875, 1.7578125, 2.126953125, 2.49609375, 2.865234375, 3.234375, 3.603515625, 3.97265625, 4.341796875, 4.7109375, 5.080078125, 5.44921875, 5.818359375, 6.1875, 6.556640625, 6.92578125, 7.294921875, 7.6640625, 8.033203125, 8.40234375, 8.771484375, 9.140625, 9.509765625, 9.87890625, 10.248046875, 10.6171875, 10.986328125, 11.35546875, 11.724609375, 12.09375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 10.0, 10.0, 14.0, 18.0, 28.0, 51.0, 70.0, 102.0, 138.0, 200.0, 372.0, 594.0, 989.0, 1758.0, 3606.0, 7583.0, 19085.0, 95487.0, 852141.0, 41233.0, 13283.0, 5621.0, 2684.0, 1443.0, 813.0, 479.0, 247.0, 157.0, 130.0, 70.0, 50.0, 36.0, 18.0, 14.0, 9.0, 10.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.91241455078125, -4.7388916015625, -4.56536865234375, -4.391845703125, -4.21832275390625, -4.0447998046875, -3.87127685546875, -3.69775390625, -3.52423095703125, -3.3507080078125, -3.17718505859375, -3.003662109375, -2.83013916015625, -2.6566162109375, -2.48309326171875, -2.3095703125, -2.13604736328125, -1.9625244140625, -1.78900146484375, -1.615478515625, -1.44195556640625, -1.2684326171875, -1.09490966796875, -0.92138671875, -0.74786376953125, -0.5743408203125, -0.40081787109375, -0.227294921875, -0.05377197265625, 0.1197509765625, 0.29327392578125, 0.466796875, 0.64031982421875, 0.8138427734375, 0.98736572265625, 1.160888671875, 1.33441162109375, 1.5079345703125, 1.68145751953125, 1.85498046875, 2.02850341796875, 2.2020263671875, 2.37554931640625, 2.549072265625, 2.72259521484375, 2.8961181640625, 3.06964111328125, 3.2431640625, 3.41668701171875, 3.5902099609375, 3.76373291015625, 3.937255859375, 4.11077880859375, 4.2843017578125, 4.45782470703125, 4.63134765625, 4.80487060546875, 4.9783935546875, 5.15191650390625, 5.325439453125, 5.49896240234375, 5.6724853515625, 5.84600830078125, 6.01953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 8.0, 4.0, 5.0, 18.0, 10.0, 24.0, 15.0, 22.0, 18.0, 26.0, 23.0, 41.0, 30.0, 33.0, 33.0, 34.0, 51.0, 47.0, 53.0, 39.0, 43.0, 47.0, 34.0, 41.0, 36.0, 36.0, 41.0, 12.0, 23.0, 26.0, 18.0, 25.0, 21.0, 9.0, 6.0, 11.0, 11.0, 5.0, 5.0, 6.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.06488037109375, -6.8211669921875, -6.57745361328125, -6.333740234375, -6.09002685546875, -5.8463134765625, -5.60260009765625, -5.35888671875, -5.11517333984375, -4.8714599609375, -4.62774658203125, -4.384033203125, -4.14031982421875, -3.8966064453125, -3.65289306640625, -3.4091796875, -3.16546630859375, -2.9217529296875, -2.67803955078125, -2.434326171875, -2.19061279296875, -1.9468994140625, -1.70318603515625, -1.45947265625, -1.21575927734375, -0.9720458984375, -0.72833251953125, -0.484619140625, -0.24090576171875, 0.0028076171875, 0.24652099609375, 0.490234375, 0.73394775390625, 0.9776611328125, 1.22137451171875, 1.465087890625, 1.70880126953125, 1.9525146484375, 2.19622802734375, 2.43994140625, 2.68365478515625, 2.9273681640625, 3.17108154296875, 3.414794921875, 3.65850830078125, 3.9022216796875, 4.14593505859375, 4.3896484375, 4.63336181640625, 4.8770751953125, 5.12078857421875, 5.364501953125, 5.60821533203125, 5.8519287109375, 6.09564208984375, 6.33935546875, 6.58306884765625, 6.8267822265625, 7.07049560546875, 7.314208984375, 7.55792236328125, 7.8016357421875, 8.04534912109375, 8.2890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 16.0, 13.0, 27.0, 29.0, 60.0, 78.0, 118.0, 186.0, 248.0, 400.0, 615.0, 912.0, 1514.0, 2380.0, 4220.0, 7382.0, 14189.0, 30082.0, 751396.0, 182100.0, 24412.0, 12132.0, 6397.0, 3654.0, 2121.0, 1340.0, 821.0, 531.0, 367.0, 257.0, 168.0, 117.0, 82.0, 52.0, 33.0, 26.0, 16.0, 19.0, 11.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.87255859375, -0.8460235595703125, -0.819488525390625, -0.7929534912109375, -0.76641845703125, -0.7398834228515625, -0.713348388671875, -0.6868133544921875, -0.6602783203125, -0.6337432861328125, -0.607208251953125, -0.5806732177734375, -0.55413818359375, -0.5276031494140625, -0.501068115234375, -0.4745330810546875, -0.447998046875, -0.4214630126953125, -0.394927978515625, -0.3683929443359375, -0.34185791015625, -0.3153228759765625, -0.288787841796875, -0.2622528076171875, -0.2357177734375, -0.2091827392578125, -0.182647705078125, -0.1561126708984375, -0.12957763671875, -0.1030426025390625, -0.076507568359375, -0.0499725341796875, -0.0234375, 0.0030975341796875, 0.029632568359375, 0.0561676025390625, 0.08270263671875, 0.1092376708984375, 0.135772705078125, 0.1623077392578125, 0.1888427734375, 0.2153778076171875, 0.241912841796875, 0.2684478759765625, 0.29498291015625, 0.3215179443359375, 0.348052978515625, 0.3745880126953125, 0.401123046875, 0.4276580810546875, 0.454193115234375, 0.4807281494140625, 0.50726318359375, 0.5337982177734375, 0.560333251953125, 0.5868682861328125, 0.6134033203125, 0.6399383544921875, 0.666473388671875, 0.6930084228515625, 0.71954345703125, 0.7460784912109375, 0.772613525390625, 0.7991485595703125, 0.82568359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 4.0, 3.0, 7.0, 7.0, 12.0, 14.0, 16.0, 15.0, 19.0, 34.0, 24.0, 26.0, 39.0, 45.0, 50.0, 51.0, 54.0, 46.0, 42.0, 54.0, 45.0, 41.0, 45.0, 57.0, 42.0, 35.0, 24.0, 22.0, 16.0, 21.0, 20.0, 11.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1656975150108337e-05, -2.084299921989441e-05, -2.002902328968048e-05, -1.9215047359466553e-05, -1.8401071429252625e-05, -1.7587095499038696e-05, -1.6773119568824768e-05, -1.595914363861084e-05, -1.5145167708396912e-05, -1.4331191778182983e-05, -1.3517215847969055e-05, -1.2703239917755127e-05, -1.1889263987541199e-05, -1.107528805732727e-05, -1.0261312127113342e-05, -9.447336196899414e-06, -8.633360266685486e-06, -7.819384336471558e-06, -7.005408406257629e-06, -6.191432476043701e-06, -5.377456545829773e-06, -4.563480615615845e-06, -3.7495046854019165e-06, -2.9355287551879883e-06, -2.12155282497406e-06, -1.3075768947601318e-06, -4.936009645462036e-07, 3.203749656677246e-07, 1.1343508958816528e-06, 1.948326826095581e-06, 2.7623027563095093e-06, 3.5762786865234375e-06, 4.390254616737366e-06, 5.204230546951294e-06, 6.018206477165222e-06, 6.83218240737915e-06, 7.646158337593079e-06, 8.460134267807007e-06, 9.274110198020935e-06, 1.0088086128234863e-05, 1.0902062058448792e-05, 1.171603798866272e-05, 1.2530013918876648e-05, 1.3343989849090576e-05, 1.4157965779304504e-05, 1.4971941709518433e-05, 1.578591763973236e-05, 1.659989356994629e-05, 1.7413869500160217e-05, 1.8227845430374146e-05, 1.9041821360588074e-05, 1.9855797290802002e-05, 2.066977322101593e-05, 2.148374915122986e-05, 2.2297725081443787e-05, 2.3111701011657715e-05, 2.3925676941871643e-05, 2.473965287208557e-05, 2.55536288022995e-05, 2.6367604732513428e-05, 2.7181580662727356e-05, 2.7995556592941284e-05, 2.8809532523155212e-05, 2.962350845336914e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 4.0, 11.0, 13.0, 7.0, 25.0, 17.0, 37.0, 64.0, 115.0, 211.0, 363.0, 717.0, 1304.0, 2450.0, 4940.0, 9995.0, 21578.0, 47125.0, 102290.0, 205143.0, 281106.0, 193499.0, 94746.0, 43560.0, 20160.0, 9344.0, 4742.0, 2262.0, 1190.0, 647.0, 360.0, 171.0, 108.0, 78.0, 54.0, 31.0, 18.0, 12.0, 12.0, 10.0, 7.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5087890625, -0.4920806884765625, -0.475372314453125, -0.4586639404296875, -0.44195556640625, -0.4252471923828125, -0.408538818359375, -0.3918304443359375, -0.3751220703125, -0.3584136962890625, -0.341705322265625, -0.3249969482421875, -0.30828857421875, -0.2915802001953125, -0.274871826171875, -0.2581634521484375, -0.241455078125, -0.2247467041015625, -0.208038330078125, -0.1913299560546875, -0.17462158203125, -0.1579132080078125, -0.141204833984375, -0.1244964599609375, -0.1077880859375, -0.0910797119140625, -0.074371337890625, -0.0576629638671875, -0.04095458984375, -0.0242462158203125, -0.007537841796875, 0.0091705322265625, 0.02587890625, 0.0425872802734375, 0.059295654296875, 0.0760040283203125, 0.09271240234375, 0.1094207763671875, 0.126129150390625, 0.1428375244140625, 0.1595458984375, 0.1762542724609375, 0.192962646484375, 0.2096710205078125, 0.22637939453125, 0.2430877685546875, 0.259796142578125, 0.2765045166015625, 0.293212890625, 0.3099212646484375, 0.326629638671875, 0.3433380126953125, 0.36004638671875, 0.3767547607421875, 0.393463134765625, 0.4101715087890625, 0.4268798828125, 0.4435882568359375, 0.460296630859375, 0.4770050048828125, 0.49371337890625, 0.5104217529296875, 0.527130126953125, 0.5438385009765625, 0.560546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 9.0, 10.0, 5.0, 15.0, 14.0, 23.0, 35.0, 28.0, 43.0, 64.0, 69.0, 60.0, 71.0, 75.0, 90.0, 69.0, 72.0, 64.0, 39.0, 32.0, 22.0, 24.0, 16.0, 19.0, 10.0, 3.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.186187744140625, -0.18048095703125, -0.174774169921875, -0.1690673828125, -0.163360595703125, -0.15765380859375, -0.151947021484375, -0.146240234375, -0.140533447265625, -0.13482666015625, -0.129119873046875, -0.1234130859375, -0.117706298828125, -0.11199951171875, -0.106292724609375, -0.1005859375, -0.094879150390625, -0.08917236328125, -0.083465576171875, -0.0777587890625, -0.072052001953125, -0.06634521484375, -0.060638427734375, -0.054931640625, -0.049224853515625, -0.04351806640625, -0.037811279296875, -0.0321044921875, -0.026397705078125, -0.02069091796875, -0.014984130859375, -0.00927734375, -0.003570556640625, 0.00213623046875, 0.007843017578125, 0.0135498046875, 0.019256591796875, 0.02496337890625, 0.030670166015625, 0.036376953125, 0.042083740234375, 0.04779052734375, 0.053497314453125, 0.0592041015625, 0.064910888671875, 0.07061767578125, 0.076324462890625, 0.08203125, 0.087738037109375, 0.09344482421875, 0.099151611328125, 0.1048583984375, 0.110565185546875, 0.11627197265625, 0.121978759765625, 0.127685546875, 0.133392333984375, 0.13909912109375, 0.144805908203125, 0.1505126953125, 0.156219482421875, 0.16192626953125, 0.167633056640625, 0.17333984375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 6.0, 13.0, 14.0, 14.0, 18.0, 25.0, 46.0, 36.0, 44.0, 69.0, 67.0, 73.0, 81.0, 64.0, 64.0, 65.0, 47.0, 59.0, 35.0, 37.0, 25.0, 13.0, 18.0, 13.0, 12.0, 14.0, 6.0, 2.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.153614044189453, -23.462472915649414, -22.771333694458008, -22.08019256591797, -21.389053344726562, -20.697912216186523, -20.006771087646484, -19.315631866455078, -18.624492645263672, -17.933351516723633, -17.242212295532227, -16.551071166992188, -15.859931945800781, -15.168790817260742, -14.47765064239502, -13.786510467529297, -13.095369338989258, -12.404229164123535, -11.713088989257812, -11.021947860717773, -10.330808639526367, -9.639667510986328, -8.948527336120605, -8.257387161254883, -7.56624698638916, -6.8751068115234375, -6.183966636657715, -5.492825984954834, -4.801685810089111, -4.110545635223389, -3.419404983520508, -2.728264808654785, -2.0371227264404297, -1.3459824323654175, -0.6548421382904053, 0.036298274993896484, 0.7274384498596191, 1.4185786247253418, 2.1097192764282227, 2.8008594512939453, 3.491999626159668, 4.183139801025391, 4.874279975891113, 5.565420627593994, 6.256560802459717, 6.9477009773254395, 7.63884162902832, 8.329981803894043, 9.021121978759766, 9.712262153625488, 10.403402328491211, 11.09454345703125, 11.785682678222656, 12.476823806762695, 13.167963981628418, 13.85910415649414, 14.550244331359863, 15.241384506225586, 15.932524681091309, 16.62366485595703, 17.31480598449707, 18.005945205688477, 18.697086334228516, 19.388225555419922, 20.07936668395996]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 6.0, 20.0, 3.0, 6.0, 9.0, 13.0, 17.0, 21.0, 12.0, 19.0, 16.0, 33.0, 32.0, 35.0, 29.0, 37.0, 38.0, 38.0, 45.0, 39.0, 35.0, 33.0, 48.0, 36.0, 43.0, 41.0, 30.0, 28.0, 21.0, 35.0, 28.0, 22.0, 22.0, 19.0, 13.0, 9.0, 11.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.05845832824707, -9.748851776123047, -9.439245223999023, -9.129639625549316, -8.820033073425293, -8.51042652130127, -8.200819969177246, -7.891213417053223, -7.581607341766357, -7.272000789642334, -6.962394714355469, -6.652788162231445, -6.343181610107422, -6.033575534820557, -5.723968982696533, -5.414362907409668, -5.1047563552856445, -4.795149803161621, -4.485543727874756, -4.175937175750732, -3.866330862045288, -3.5567245483398438, -3.2471179962158203, -2.937511682510376, -2.6279053688049316, -2.3182990550994873, -2.008692741394043, -1.6990861892700195, -1.3894798755645752, -1.0798735618591309, -0.770267128944397, -0.4606606960296631, -0.15105533599853516, 0.15855103731155396, 0.46815741062164307, 0.7777637839317322, 1.0873701572418213, 1.3969764709472656, 1.7065829038619995, 2.0161893367767334, 2.3257956504821777, 2.635401964187622, 2.9450082778930664, 3.25461483001709, 3.564221143722534, 3.8738274574279785, 4.183434009552002, 4.493040084838867, 4.802646636962891, 5.112253189086914, 5.421859264373779, 5.731465816497803, 6.041071891784668, 6.350678443908691, 6.660284996032715, 6.969891548156738, 7.2794976234436035, 7.589104175567627, 7.898710250854492, 8.208316802978516, 8.517923355102539, 8.827529907226562, 9.13713550567627, 9.446742057800293, 9.756348609924316]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 16.0, 21.0, 22.0, 40.0, 65.0, 82.0, 119.0, 208.0, 311.0, 456.0, 658.0, 1022.0, 1477.0, 2237.0, 3447.0, 5261.0, 7790.0, 12128.0, 18322.0, 28694.0, 43800.0, 67374.0, 98738.0, 133001.0, 152243.0, 141185.0, 109757.0, 76332.0, 50160.0, 32374.0, 21059.0, 13701.0, 8941.0, 5796.0, 3911.0, 2580.0, 1708.0, 1120.0, 791.0, 540.0, 340.0, 224.0, 157.0, 113.0, 79.0, 40.0, 41.0, 20.0, 15.0, 18.0, 10.0, 3.0, 5.0, 1.0, 2.0], "bins": [-11.5390625, -11.1961669921875, -10.853271484375, -10.5103759765625, -10.16748046875, -9.8245849609375, -9.481689453125, -9.1387939453125, -8.7958984375, -8.4530029296875, -8.110107421875, -7.7672119140625, -7.42431640625, -7.0814208984375, -6.738525390625, -6.3956298828125, -6.052734375, -5.7098388671875, -5.366943359375, -5.0240478515625, -4.68115234375, -4.3382568359375, -3.995361328125, -3.6524658203125, -3.3095703125, -2.9666748046875, -2.623779296875, -2.2808837890625, -1.93798828125, -1.5950927734375, -1.252197265625, -0.9093017578125, -0.56640625, -0.2235107421875, 0.119384765625, 0.4622802734375, 0.80517578125, 1.1480712890625, 1.490966796875, 1.8338623046875, 2.1767578125, 2.5196533203125, 2.862548828125, 3.2054443359375, 3.54833984375, 3.8912353515625, 4.234130859375, 4.5770263671875, 4.919921875, 5.2628173828125, 5.605712890625, 5.9486083984375, 6.29150390625, 6.6343994140625, 6.977294921875, 7.3201904296875, 7.6630859375, 8.0059814453125, 8.348876953125, 8.6917724609375, 9.03466796875, 9.3775634765625, 9.720458984375, 10.0633544921875, 10.40625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 12.0, 10.0, 16.0, 10.0, 20.0, 14.0, 18.0, 25.0, 16.0, 36.0, 31.0, 42.0, 54.0, 39.0, 52.0, 38.0, 38.0, 53.0, 39.0, 45.0, 56.0, 44.0, 40.0, 40.0, 28.0, 24.0, 23.0, 28.0, 21.0, 17.0, 12.0, 10.0, 5.0, 6.0, 3.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.5035400390625, -11.108642578125, -10.7137451171875, -10.31884765625, -9.9239501953125, -9.529052734375, -9.1341552734375, -8.7392578125, -8.3443603515625, -7.949462890625, -7.5545654296875, -7.15966796875, -6.7647705078125, -6.369873046875, -5.9749755859375, -5.580078125, -5.1851806640625, -4.790283203125, -4.3953857421875, -4.00048828125, -3.6055908203125, -3.210693359375, -2.8157958984375, -2.4208984375, -2.0260009765625, -1.631103515625, -1.2362060546875, -0.84130859375, -0.4464111328125, -0.051513671875, 0.3433837890625, 0.73828125, 1.1331787109375, 1.528076171875, 1.9229736328125, 2.31787109375, 2.7127685546875, 3.107666015625, 3.5025634765625, 3.8974609375, 4.2923583984375, 4.687255859375, 5.0821533203125, 5.47705078125, 5.8719482421875, 6.266845703125, 6.6617431640625, 7.056640625, 7.4515380859375, 7.846435546875, 8.2413330078125, 8.63623046875, 9.0311279296875, 9.426025390625, 9.8209228515625, 10.2158203125, 10.6107177734375, 11.005615234375, 11.4005126953125, 11.79541015625, 12.1903076171875, 12.585205078125, 12.9801025390625, 13.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 13.0, 15.0, 21.0, 34.0, 51.0, 104.0, 176.0, 253.0, 523.0, 852.0, 1557.0, 2753.0, 4992.0, 9427.0, 18472.0, 36812.0, 74367.0, 144065.0, 225440.0, 227839.0, 146876.0, 76077.0, 37661.0, 18724.0, 9701.0, 5163.0, 2923.0, 1562.0, 857.0, 482.0, 315.0, 162.0, 112.0, 70.0, 45.0, 34.0, 15.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.046875, -18.412353515625, -17.77783203125, -17.143310546875, -16.5087890625, -15.874267578125, -15.23974609375, -14.605224609375, -13.970703125, -13.336181640625, -12.70166015625, -12.067138671875, -11.4326171875, -10.798095703125, -10.16357421875, -9.529052734375, -8.89453125, -8.260009765625, -7.62548828125, -6.990966796875, -6.3564453125, -5.721923828125, -5.08740234375, -4.452880859375, -3.818359375, -3.183837890625, -2.54931640625, -1.914794921875, -1.2802734375, -0.645751953125, -0.01123046875, 0.623291015625, 1.2578125, 1.892333984375, 2.52685546875, 3.161376953125, 3.7958984375, 4.430419921875, 5.06494140625, 5.699462890625, 6.333984375, 6.968505859375, 7.60302734375, 8.237548828125, 8.8720703125, 9.506591796875, 10.14111328125, 10.775634765625, 11.41015625, 12.044677734375, 12.67919921875, 13.313720703125, 13.9482421875, 14.582763671875, 15.21728515625, 15.851806640625, 16.486328125, 17.120849609375, 17.75537109375, 18.389892578125, 19.0244140625, 19.658935546875, 20.29345703125, 20.927978515625, 21.5625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 3.0, 9.0, 8.0, 11.0, 13.0, 12.0, 23.0, 13.0, 20.0, 22.0, 26.0, 32.0, 35.0, 30.0, 33.0, 35.0, 35.0, 36.0, 36.0, 42.0, 56.0, 33.0, 30.0, 38.0, 43.0, 41.0, 25.0, 28.0, 32.0, 23.0, 30.0, 24.0, 14.0, 8.0, 16.0, 24.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.10040283203125, -6.8609619140625, -6.62152099609375, -6.382080078125, -6.14263916015625, -5.9031982421875, -5.66375732421875, -5.42431640625, -5.18487548828125, -4.9454345703125, -4.70599365234375, -4.466552734375, -4.22711181640625, -3.9876708984375, -3.74822998046875, -3.5087890625, -3.26934814453125, -3.0299072265625, -2.79046630859375, -2.551025390625, -2.31158447265625, -2.0721435546875, -1.83270263671875, -1.59326171875, -1.35382080078125, -1.1143798828125, -0.87493896484375, -0.635498046875, -0.39605712890625, -0.1566162109375, 0.08282470703125, 0.322265625, 0.56170654296875, 0.8011474609375, 1.04058837890625, 1.280029296875, 1.51947021484375, 1.7589111328125, 1.99835205078125, 2.23779296875, 2.47723388671875, 2.7166748046875, 2.95611572265625, 3.195556640625, 3.43499755859375, 3.6744384765625, 3.91387939453125, 4.1533203125, 4.39276123046875, 4.6322021484375, 4.87164306640625, 5.111083984375, 5.35052490234375, 5.5899658203125, 5.82940673828125, 6.06884765625, 6.30828857421875, 6.5477294921875, 6.78717041015625, 7.026611328125, 7.26605224609375, 7.5054931640625, 7.74493408203125, 7.984375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 10.0, 13.0, 20.0, 23.0, 49.0, 81.0, 126.0, 170.0, 272.0, 415.0, 690.0, 1066.0, 1779.0, 2999.0, 5096.0, 9468.0, 18204.0, 38130.0, 85346.0, 187133.0, 291096.0, 214732.0, 100859.0, 44598.0, 21216.0, 10671.0, 5730.0, 3342.0, 1991.0, 1182.0, 722.0, 463.0, 313.0, 191.0, 137.0, 74.0, 49.0, 37.0, 21.0, 14.0, 6.0, 11.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.993896484375, -15.48779296875, -14.981689453125, -14.4755859375, -13.969482421875, -13.46337890625, -12.957275390625, -12.451171875, -11.945068359375, -11.43896484375, -10.932861328125, -10.4267578125, -9.920654296875, -9.41455078125, -8.908447265625, -8.40234375, -7.896240234375, -7.39013671875, -6.884033203125, -6.3779296875, -5.871826171875, -5.36572265625, -4.859619140625, -4.353515625, -3.847412109375, -3.34130859375, -2.835205078125, -2.3291015625, -1.822998046875, -1.31689453125, -0.810791015625, -0.3046875, 0.201416015625, 0.70751953125, 1.213623046875, 1.7197265625, 2.225830078125, 2.73193359375, 3.238037109375, 3.744140625, 4.250244140625, 4.75634765625, 5.262451171875, 5.7685546875, 6.274658203125, 6.78076171875, 7.286865234375, 7.79296875, 8.299072265625, 8.80517578125, 9.311279296875, 9.8173828125, 10.323486328125, 10.82958984375, 11.335693359375, 11.841796875, 12.347900390625, 12.85400390625, 13.360107421875, 13.8662109375, 14.372314453125, 14.87841796875, 15.384521484375, 15.890625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 15.0, 24.0, 38.0, 48.0, 66.0, 99.0, 112.0, 130.0, 125.0, 99.0, 67.0, 40.0, 39.0, 18.0, 14.0, 6.0, 5.0, 6.0, 5.0, 8.0, 0.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0021152496337890625, -0.0020520389080047607, -0.001988828182220459, -0.0019256174564361572, -0.0018624067306518555, -0.0017991960048675537, -0.001735985279083252, -0.0016727745532989502, -0.0016095638275146484, -0.0015463531017303467, -0.001483142375946045, -0.0014199316501617432, -0.0013567209243774414, -0.0012935101985931396, -0.0012302994728088379, -0.0011670887470245361, -0.0011038780212402344, -0.0010406672954559326, -0.0009774565696716309, -0.0009142458438873291, -0.0008510351181030273, -0.0007878243923187256, -0.0007246136665344238, -0.0006614029407501221, -0.0005981922149658203, -0.0005349814891815186, -0.0004717707633972168, -0.00040856003761291504, -0.0003453493118286133, -0.0002821385860443115, -0.00021892786026000977, -0.000155717134475708, -9.250640869140625e-05, -2.9295682907104492e-05, 3.3915042877197266e-05, 9.712576866149902e-05, 0.00016033649444580078, 0.00022354722023010254, 0.0002867579460144043, 0.00034996867179870605, 0.0004131793975830078, 0.00047639012336730957, 0.0005396008491516113, 0.0006028115749359131, 0.0006660223007202148, 0.0007292330265045166, 0.0007924437522888184, 0.0008556544780731201, 0.0009188652038574219, 0.0009820759296417236, 0.0010452866554260254, 0.0011084973812103271, 0.001171708106994629, 0.0012349188327789307, 0.0012981295585632324, 0.0013613402843475342, 0.001424551010131836, 0.0014877617359161377, 0.0015509724617004395, 0.0016141831874847412, 0.001677393913269043, 0.0017406046390533447, 0.0018038153648376465, 0.0018670260906219482, 0.00193023681640625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 10.0, 17.0, 28.0, 31.0, 40.0, 67.0, 102.0, 143.0, 213.0, 283.0, 395.0, 727.0, 1108.0, 1657.0, 2590.0, 4259.0, 7306.0, 13148.0, 24474.0, 46591.0, 93395.0, 179572.0, 251538.0, 197615.0, 106089.0, 53910.0, 27542.0, 14651.0, 8161.0, 4736.0, 2878.0, 1766.0, 1152.0, 777.0, 491.0, 329.0, 227.0, 176.0, 104.0, 70.0, 49.0, 30.0, 28.0, 24.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.7421875, -13.3072509765625, -12.872314453125, -12.4373779296875, -12.00244140625, -11.5675048828125, -11.132568359375, -10.6976318359375, -10.2626953125, -9.8277587890625, -9.392822265625, -8.9578857421875, -8.52294921875, -8.0880126953125, -7.653076171875, -7.2181396484375, -6.783203125, -6.3482666015625, -5.913330078125, -5.4783935546875, -5.04345703125, -4.6085205078125, -4.173583984375, -3.7386474609375, -3.3037109375, -2.8687744140625, -2.433837890625, -1.9989013671875, -1.56396484375, -1.1290283203125, -0.694091796875, -0.2591552734375, 0.17578125, 0.6107177734375, 1.045654296875, 1.4805908203125, 1.91552734375, 2.3504638671875, 2.785400390625, 3.2203369140625, 3.6552734375, 4.0902099609375, 4.525146484375, 4.9600830078125, 5.39501953125, 5.8299560546875, 6.264892578125, 6.6998291015625, 7.134765625, 7.5697021484375, 8.004638671875, 8.4395751953125, 8.87451171875, 9.3094482421875, 9.744384765625, 10.1793212890625, 10.6142578125, 11.0491943359375, 11.484130859375, 11.9190673828125, 12.35400390625, 12.7889404296875, 13.223876953125, 13.6588134765625, 14.09375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 11.0, 11.0, 21.0, 22.0, 20.0, 31.0, 36.0, 58.0, 59.0, 68.0, 75.0, 98.0, 81.0, 82.0, 76.0, 52.0, 49.0, 37.0, 26.0, 16.0, 16.0, 11.0, 7.0, 11.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.67388916015625, -5.5274658203125, -5.38104248046875, -5.234619140625, -5.08819580078125, -4.9417724609375, -4.79534912109375, -4.64892578125, -4.50250244140625, -4.3560791015625, -4.20965576171875, -4.063232421875, -3.91680908203125, -3.7703857421875, -3.62396240234375, -3.4775390625, -3.33111572265625, -3.1846923828125, -3.03826904296875, -2.891845703125, -2.74542236328125, -2.5989990234375, -2.45257568359375, -2.30615234375, -2.15972900390625, -2.0133056640625, -1.86688232421875, -1.720458984375, -1.57403564453125, -1.4276123046875, -1.28118896484375, -1.134765625, -0.98834228515625, -0.8419189453125, -0.69549560546875, -0.549072265625, -0.40264892578125, -0.2562255859375, -0.10980224609375, 0.03662109375, 0.18304443359375, 0.3294677734375, 0.47589111328125, 0.622314453125, 0.76873779296875, 0.9151611328125, 1.06158447265625, 1.2080078125, 1.35443115234375, 1.5008544921875, 1.64727783203125, 1.793701171875, 1.94012451171875, 2.0865478515625, 2.23297119140625, 2.37939453125, 2.52581787109375, 2.6722412109375, 2.81866455078125, 2.965087890625, 3.11151123046875, 3.2579345703125, 3.40435791015625, 3.55078125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 1.0, 4.0, 5.0, 16.0, 4.0, 10.0, 13.0, 21.0, 26.0, 33.0, 43.0, 46.0, 62.0, 65.0, 62.0, 82.0, 67.0, 73.0, 49.0, 65.0, 51.0, 45.0, 38.0, 35.0, 18.0, 22.0, 14.0, 7.0, 5.0, 7.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.947654724121094, -24.218374252319336, -23.489093780517578, -22.759815216064453, -22.030534744262695, -21.301254272460938, -20.57197380065918, -19.842693328857422, -19.113414764404297, -18.38413429260254, -17.65485382080078, -16.925575256347656, -16.1962947845459, -15.46701431274414, -14.737733840942383, -14.008454322814941, -13.279173851013184, -12.549893379211426, -11.820613861083984, -11.091333389282227, -10.362053871154785, -9.632773399353027, -8.903493881225586, -8.174213409423828, -7.4449334144592285, -6.715653419494629, -5.986373424530029, -5.25709342956543, -4.527812957763672, -3.7985332012176514, -3.0692529678344727, -2.339972972869873, -1.6106929779052734, -0.881412923336029, -0.15213286876678467, 0.5771472454071045, 1.306427240371704, 2.0357072353363037, 2.7649874687194824, 3.494267463684082, 4.223547458648682, 4.952827453613281, 5.682107448577881, 6.4113874435424805, 7.140667915344238, 7.86994743347168, 8.599227905273438, 9.328508377075195, 10.057787895202637, 10.787068367004395, 11.516347885131836, 12.245628356933594, 12.974907875061035, 13.704188346862793, 14.433467864990234, 15.162748336791992, 15.89202880859375, 16.621309280395508, 17.350589752197266, 18.07986831665039, 18.80914878845215, 19.538429260253906, 20.267709732055664, 20.996990203857422, 21.726268768310547]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 4.0, 13.0, 14.0, 12.0, 14.0, 16.0, 15.0, 17.0, 22.0, 25.0, 27.0, 19.0, 28.0, 38.0, 38.0, 49.0, 46.0, 31.0, 30.0, 52.0, 45.0, 33.0, 33.0, 37.0, 38.0, 33.0, 27.0, 34.0, 20.0, 22.0, 21.0, 19.0, 21.0, 16.0, 12.0, 14.0, 8.0, 5.0, 5.0, 5.0, 7.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.778368949890137, -10.42904281616211, -10.079717636108398, -9.730391502380371, -9.38106632232666, -9.031740188598633, -8.682415008544922, -8.333088874816895, -7.983763217926025, -7.634437561035156, -7.285111904144287, -6.935786247253418, -6.586460113525391, -6.23713493347168, -5.887808799743652, -5.538483142852783, -5.189157485961914, -4.839831829071045, -4.490506172180176, -4.141180038452148, -3.7918546199798584, -3.4425289630889893, -3.093203067779541, -2.743877410888672, -2.3945517539978027, -2.0452260971069336, -1.695900321006775, -1.3465745449066162, -0.9972488880157471, -0.6479232311248779, -0.2985973358154297, 0.05072832107543945, 0.4000539779663086, 0.7493796944618225, 1.0987054109573364, 1.4480311870574951, 1.7973568439483643, 2.1466825008392334, 2.4960083961486816, 2.845334053039551, 3.19465970993042, 3.543985366821289, 3.893311023712158, 4.242636680603027, 4.591962814331055, 4.941287994384766, 5.290614128112793, 5.639939785003662, 5.989265441894531, 6.3385910987854, 6.6879167556762695, 7.037242889404297, 7.386568069458008, 7.735894203186035, 8.085220336914062, 8.434545516967773, 8.783870697021484, 9.133196830749512, 9.482522010803223, 9.83184814453125, 10.181173324584961, 10.530499458312988, 10.879825592041016, 11.229150772094727, 11.578476905822754]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 2.0, 5.0, 8.0, 16.0, 19.0, 31.0, 39.0, 46.0, 68.0, 93.0, 131.0, 192.0, 284.0, 423.0, 622.0, 932.0, 1424.0, 2214.0, 3475.0, 6026.0, 10561.0, 20107.0, 42129.0, 95281.0, 244619.0, 649963.0, 1251706.0, 1068706.0, 477663.0, 178803.0, 71653.0, 31914.0, 15394.0, 8185.0, 4647.0, 2656.0, 1612.0, 987.0, 625.0, 345.0, 242.0, 161.0, 100.0, 57.0, 39.0, 23.0, 20.0, 17.0, 7.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.375, -25.61767578125, -24.8603515625, -24.10302734375, -23.345703125, -22.58837890625, -21.8310546875, -21.07373046875, -20.31640625, -19.55908203125, -18.8017578125, -18.04443359375, -17.287109375, -16.52978515625, -15.7724609375, -15.01513671875, -14.2578125, -13.50048828125, -12.7431640625, -11.98583984375, -11.228515625, -10.47119140625, -9.7138671875, -8.95654296875, -8.19921875, -7.44189453125, -6.6845703125, -5.92724609375, -5.169921875, -4.41259765625, -3.6552734375, -2.89794921875, -2.140625, -1.38330078125, -0.6259765625, 0.13134765625, 0.888671875, 1.64599609375, 2.4033203125, 3.16064453125, 3.91796875, 4.67529296875, 5.4326171875, 6.18994140625, 6.947265625, 7.70458984375, 8.4619140625, 9.21923828125, 9.9765625, 10.73388671875, 11.4912109375, 12.24853515625, 13.005859375, 13.76318359375, 14.5205078125, 15.27783203125, 16.03515625, 16.79248046875, 17.5498046875, 18.30712890625, 19.064453125, 19.82177734375, 20.5791015625, 21.33642578125, 22.09375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 2.0, 6.0, 5.0, 5.0, 4.0, 18.0, 4.0, 16.0, 21.0, 24.0, 20.0, 18.0, 30.0, 28.0, 24.0, 20.0, 33.0, 34.0, 37.0, 48.0, 44.0, 41.0, 46.0, 38.0, 38.0, 37.0, 45.0, 36.0, 38.0, 26.0, 37.0, 34.0, 16.0, 18.0, 20.0, 14.0, 17.0, 14.0, 6.0, 7.0, 7.0, 2.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.6015625, -12.219482421875, -11.83740234375, -11.455322265625, -11.0732421875, -10.691162109375, -10.30908203125, -9.927001953125, -9.544921875, -9.162841796875, -8.78076171875, -8.398681640625, -8.0166015625, -7.634521484375, -7.25244140625, -6.870361328125, -6.48828125, -6.106201171875, -5.72412109375, -5.342041015625, -4.9599609375, -4.577880859375, -4.19580078125, -3.813720703125, -3.431640625, -3.049560546875, -2.66748046875, -2.285400390625, -1.9033203125, -1.521240234375, -1.13916015625, -0.757080078125, -0.375, 0.007080078125, 0.38916015625, 0.771240234375, 1.1533203125, 1.535400390625, 1.91748046875, 2.299560546875, 2.681640625, 3.063720703125, 3.44580078125, 3.827880859375, 4.2099609375, 4.592041015625, 4.97412109375, 5.356201171875, 5.73828125, 6.120361328125, 6.50244140625, 6.884521484375, 7.2666015625, 7.648681640625, 8.03076171875, 8.412841796875, 8.794921875, 9.177001953125, 9.55908203125, 9.941162109375, 10.3232421875, 10.705322265625, 11.08740234375, 11.469482421875, 11.8515625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 19.0, 21.0, 64.0, 84.0, 134.0, 191.0, 305.0, 493.0, 760.0, 1199.0, 2016.0, 3254.0, 5983.0, 11249.0, 21931.0, 47053.0, 111589.0, 293156.0, 805060.0, 1468642.0, 876051.0, 322839.0, 120922.0, 50897.0, 23437.0, 11722.0, 6343.0, 3367.0, 2101.0, 1294.0, 753.0, 471.0, 308.0, 190.0, 123.0, 82.0, 52.0, 38.0, 17.0, 20.0, 14.0, 5.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.78125, -40.57177734375, -39.3623046875, -38.15283203125, -36.943359375, -35.73388671875, -34.5244140625, -33.31494140625, -32.10546875, -30.89599609375, -29.6865234375, -28.47705078125, -27.267578125, -26.05810546875, -24.8486328125, -23.63916015625, -22.4296875, -21.22021484375, -20.0107421875, -18.80126953125, -17.591796875, -16.38232421875, -15.1728515625, -13.96337890625, -12.75390625, -11.54443359375, -10.3349609375, -9.12548828125, -7.916015625, -6.70654296875, -5.4970703125, -4.28759765625, -3.078125, -1.86865234375, -0.6591796875, 0.55029296875, 1.759765625, 2.96923828125, 4.1787109375, 5.38818359375, 6.59765625, 7.80712890625, 9.0166015625, 10.22607421875, 11.435546875, 12.64501953125, 13.8544921875, 15.06396484375, 16.2734375, 17.48291015625, 18.6923828125, 19.90185546875, 21.111328125, 22.32080078125, 23.5302734375, 24.73974609375, 25.94921875, 27.15869140625, 28.3681640625, 29.57763671875, 30.787109375, 31.99658203125, 33.2060546875, 34.41552734375, 35.625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 10.0, 6.0, 4.0, 10.0, 9.0, 21.0, 26.0, 32.0, 34.0, 55.0, 62.0, 69.0, 98.0, 122.0, 158.0, 139.0, 222.0, 254.0, 277.0, 293.0, 300.0, 327.0, 279.0, 270.0, 206.0, 177.0, 147.0, 113.0, 82.0, 54.0, 44.0, 39.0, 28.0, 25.0, 20.0, 18.0, 13.0, 8.0, 6.0, 5.0, 6.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7734375, -8.5018310546875, -8.230224609375, -7.9586181640625, -7.68701171875, -7.4154052734375, -7.143798828125, -6.8721923828125, -6.6005859375, -6.3289794921875, -6.057373046875, -5.7857666015625, -5.51416015625, -5.2425537109375, -4.970947265625, -4.6993408203125, -4.427734375, -4.1561279296875, -3.884521484375, -3.6129150390625, -3.34130859375, -3.0697021484375, -2.798095703125, -2.5264892578125, -2.2548828125, -1.9832763671875, -1.711669921875, -1.4400634765625, -1.16845703125, -0.8968505859375, -0.625244140625, -0.3536376953125, -0.08203125, 0.1895751953125, 0.461181640625, 0.7327880859375, 1.00439453125, 1.2760009765625, 1.547607421875, 1.8192138671875, 2.0908203125, 2.3624267578125, 2.634033203125, 2.9056396484375, 3.17724609375, 3.4488525390625, 3.720458984375, 3.9920654296875, 4.263671875, 4.5352783203125, 4.806884765625, 5.0784912109375, 5.35009765625, 5.6217041015625, 5.893310546875, 6.1649169921875, 6.4365234375, 6.7081298828125, 6.979736328125, 7.2513427734375, 7.52294921875, 7.7945556640625, 8.066162109375, 8.3377685546875, 8.609375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 10.0, 7.0, 14.0, 18.0, 18.0, 23.0, 25.0, 45.0, 55.0, 73.0, 69.0, 86.0, 89.0, 63.0, 84.0, 63.0, 73.0, 38.0, 30.0, 33.0, 27.0, 18.0, 14.0, 9.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.48189926147461, -42.149715423583984, -40.81753158569336, -39.4853515625, -38.153167724609375, -36.82098388671875, -35.488800048828125, -34.1566162109375, -32.824432373046875, -31.49224853515625, -30.160066604614258, -28.827882766723633, -27.49570083618164, -26.163516998291016, -24.83133316040039, -23.499149322509766, -22.166969299316406, -20.83478546142578, -19.50260353088379, -18.170419692993164, -16.838237762451172, -15.506053924560547, -14.173870086669922, -12.841687202453613, -11.509504318237305, -10.177321434020996, -8.845138549804688, -7.5129547119140625, -6.180771827697754, -4.848588943481445, -3.5164055824279785, -2.1842222213745117, -0.8520393371582031, 0.48014378547668457, 1.8123269081115723, 3.14451003074646, 4.476693153381348, 5.808876037597656, 7.141059398651123, 8.47324275970459, 9.805425643920898, 11.137608528137207, 12.469791412353516, 13.80197525024414, 15.13415813446045, 16.466341018676758, 17.798524856567383, 19.130706787109375, 20.462890625, 21.795074462890625, 23.127256393432617, 24.459440231323242, 25.791622161865234, 27.12380599975586, 28.455989837646484, 29.78817367553711, 31.1203556060791, 32.452537536621094, 33.78472137451172, 35.116905212402344, 36.44908905029297, 37.781272888183594, 39.11345291137695, 40.44563674926758, 41.7778205871582]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 10.0, 11.0, 10.0, 10.0, 14.0, 23.0, 26.0, 18.0, 31.0, 34.0, 31.0, 44.0, 35.0, 42.0, 48.0, 45.0, 49.0, 46.0, 48.0, 48.0, 43.0, 40.0, 31.0, 28.0, 33.0, 31.0, 29.0, 20.0, 20.0, 20.0, 13.0, 9.0, 7.0, 9.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.327486038208008, -19.72764778137207, -19.127809524536133, -18.527971267700195, -17.928131103515625, -17.328292846679688, -16.72845458984375, -16.128616333007812, -15.528778076171875, -14.928939819335938, -14.3291015625, -13.729262351989746, -13.129424095153809, -12.529585838317871, -11.929746627807617, -11.32990837097168, -10.730070114135742, -10.130231857299805, -9.530393600463867, -8.930554389953613, -8.330716133117676, -7.730877876281738, -7.131039142608643, -6.531200408935547, -5.931362152099609, -5.331523895263672, -4.731685161590576, -4.1318464279174805, -3.532008171081543, -2.9321696758270264, -2.3323311805725098, -1.732492446899414, -1.1326560974121094, -0.5328176021575928, 0.06702089309692383, 0.6668593883514404, 1.266697883605957, 1.8665363788604736, 2.4663748741149902, 3.066213607788086, 3.6660518646240234, 4.265890121459961, 4.865728855133057, 5.465567588806152, 6.06540584564209, 6.665244102478027, 7.265082836151123, 7.864921569824219, 8.464759826660156, 9.064598083496094, 9.664436340332031, 10.264275550842285, 10.864113807678223, 11.46395206451416, 12.063791275024414, 12.663629531860352, 13.263467788696289, 13.863306045532227, 14.463144302368164, 15.062983512878418, 15.662821769714355, 16.26266098022461, 16.862499237060547, 17.462337493896484, 18.062175750732422]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 14.0, 15.0, 27.0, 34.0, 52.0, 74.0, 93.0, 119.0, 212.0, 353.0, 457.0, 729.0, 1087.0, 1670.0, 2507.0, 3925.0, 6105.0, 9554.0, 15934.0, 26600.0, 46321.0, 81192.0, 144783.0, 221323.0, 200613.0, 119909.0, 67479.0, 38294.0, 22320.0, 13353.0, 8425.0, 5290.0, 3418.0, 2078.0, 1378.0, 948.0, 612.0, 412.0, 260.0, 190.0, 121.0, 72.0, 57.0, 52.0, 31.0, 22.0, 14.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.62890625, -2.54632568359375, -2.4637451171875, -2.38116455078125, -2.298583984375, -2.21600341796875, -2.1334228515625, -2.05084228515625, -1.96826171875, -1.88568115234375, -1.8031005859375, -1.72052001953125, -1.637939453125, -1.55535888671875, -1.4727783203125, -1.39019775390625, -1.3076171875, -1.22503662109375, -1.1424560546875, -1.05987548828125, -0.977294921875, -0.89471435546875, -0.8121337890625, -0.72955322265625, -0.64697265625, -0.56439208984375, -0.4818115234375, -0.39923095703125, -0.316650390625, -0.23406982421875, -0.1514892578125, -0.06890869140625, 0.013671875, 0.09625244140625, 0.1788330078125, 0.26141357421875, 0.343994140625, 0.42657470703125, 0.5091552734375, 0.59173583984375, 0.67431640625, 0.75689697265625, 0.8394775390625, 0.92205810546875, 1.004638671875, 1.08721923828125, 1.1697998046875, 1.25238037109375, 1.3349609375, 1.41754150390625, 1.5001220703125, 1.58270263671875, 1.665283203125, 1.74786376953125, 1.8304443359375, 1.91302490234375, 1.99560546875, 2.07818603515625, 2.1607666015625, 2.24334716796875, 2.325927734375, 2.40850830078125, 2.4910888671875, 2.57366943359375, 2.65625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 11.0, 10.0, 9.0, 12.0, 21.0, 18.0, 22.0, 30.0, 22.0, 24.0, 19.0, 32.0, 42.0, 35.0, 51.0, 27.0, 36.0, 43.0, 50.0, 45.0, 41.0, 38.0, 44.0, 40.0, 29.0, 28.0, 33.0, 27.0, 23.0, 19.0, 16.0, 16.0, 14.0, 5.0, 13.0, 6.0, 7.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.984375, -19.35791015625, -18.7314453125, -18.10498046875, -17.478515625, -16.85205078125, -16.2255859375, -15.59912109375, -14.97265625, -14.34619140625, -13.7197265625, -13.09326171875, -12.466796875, -11.84033203125, -11.2138671875, -10.58740234375, -9.9609375, -9.33447265625, -8.7080078125, -8.08154296875, -7.455078125, -6.82861328125, -6.2021484375, -5.57568359375, -4.94921875, -4.32275390625, -3.6962890625, -3.06982421875, -2.443359375, -1.81689453125, -1.1904296875, -0.56396484375, 0.0625, 0.68896484375, 1.3154296875, 1.94189453125, 2.568359375, 3.19482421875, 3.8212890625, 4.44775390625, 5.07421875, 5.70068359375, 6.3271484375, 6.95361328125, 7.580078125, 8.20654296875, 8.8330078125, 9.45947265625, 10.0859375, 10.71240234375, 11.3388671875, 11.96533203125, 12.591796875, 13.21826171875, 13.8447265625, 14.47119140625, 15.09765625, 15.72412109375, 16.3505859375, 16.97705078125, 17.603515625, 18.22998046875, 18.8564453125, 19.48291015625, 20.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 16.0, 11.0, 16.0, 16.0, 24.0, 40.0, 58.0, 74.0, 113.0, 160.0, 232.0, 380.0, 512.0, 824.0, 1294.0, 2251.0, 4143.0, 7679.0, 17034.0, 53417.0, 838213.0, 81577.0, 20076.0, 9061.0, 4555.0, 2570.0, 1541.0, 882.0, 554.0, 384.0, 243.0, 170.0, 118.0, 101.0, 56.0, 43.0, 35.0, 24.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0], "bins": [-8.5546875, -8.3209228515625, -8.087158203125, -7.8533935546875, -7.61962890625, -7.3858642578125, -7.152099609375, -6.9183349609375, -6.6845703125, -6.4508056640625, -6.217041015625, -5.9832763671875, -5.74951171875, -5.5157470703125, -5.281982421875, -5.0482177734375, -4.814453125, -4.5806884765625, -4.346923828125, -4.1131591796875, -3.87939453125, -3.6456298828125, -3.411865234375, -3.1781005859375, -2.9443359375, -2.7105712890625, -2.476806640625, -2.2430419921875, -2.00927734375, -1.7755126953125, -1.541748046875, -1.3079833984375, -1.07421875, -0.8404541015625, -0.606689453125, -0.3729248046875, -0.13916015625, 0.0946044921875, 0.328369140625, 0.5621337890625, 0.7958984375, 1.0296630859375, 1.263427734375, 1.4971923828125, 1.73095703125, 1.9647216796875, 2.198486328125, 2.4322509765625, 2.666015625, 2.8997802734375, 3.133544921875, 3.3673095703125, 3.60107421875, 3.8348388671875, 4.068603515625, 4.3023681640625, 4.5361328125, 4.7698974609375, 5.003662109375, 5.2374267578125, 5.47119140625, 5.7049560546875, 5.938720703125, 6.1724853515625, 6.40625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 7.0, 12.0, 12.0, 9.0, 14.0, 12.0, 18.0, 19.0, 25.0, 23.0, 32.0, 30.0, 33.0, 39.0, 33.0, 37.0, 44.0, 58.0, 48.0, 40.0, 48.0, 50.0, 40.0, 44.0, 36.0, 39.0, 34.0, 29.0, 17.0, 21.0, 15.0, 17.0, 14.0, 14.0, 7.0, 9.0, 5.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.578125, -13.171875, -12.765625, -12.359375, -11.953125, -11.546875, -11.140625, -10.734375, -10.328125, -9.921875, -9.515625, -9.109375, -8.703125, -8.296875, -7.890625, -7.484375, -7.078125, -6.671875, -6.265625, -5.859375, -5.453125, -5.046875, -4.640625, -4.234375, -3.828125, -3.421875, -3.015625, -2.609375, -2.203125, -1.796875, -1.390625, -0.984375, -0.578125, -0.171875, 0.234375, 0.640625, 1.046875, 1.453125, 1.859375, 2.265625, 2.671875, 3.078125, 3.484375, 3.890625, 4.296875, 4.703125, 5.109375, 5.515625, 5.921875, 6.328125, 6.734375, 7.140625, 7.546875, 7.953125, 8.359375, 8.765625, 9.171875, 9.578125, 9.984375, 10.390625, 10.796875, 11.203125, 11.609375, 12.015625, 12.421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 19.0, 14.0, 30.0, 33.0, 47.0, 69.0, 97.0, 140.0, 196.0, 384.0, 530.0, 837.0, 1356.0, 2229.0, 4160.0, 7858.0, 15736.0, 37813.0, 877374.0, 58803.0, 19653.0, 9415.0, 4925.0, 2670.0, 1615.0, 930.0, 568.0, 333.0, 247.0, 176.0, 93.0, 56.0, 48.0, 22.0, 27.0, 14.0, 14.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6708984375, -1.6240081787109375, -1.577117919921875, -1.5302276611328125, -1.48333740234375, -1.4364471435546875, -1.389556884765625, -1.3426666259765625, -1.2957763671875, -1.2488861083984375, -1.201995849609375, -1.1551055908203125, -1.10821533203125, -1.0613250732421875, -1.014434814453125, -0.9675445556640625, -0.920654296875, -0.8737640380859375, -0.826873779296875, -0.7799835205078125, -0.73309326171875, -0.6862030029296875, -0.639312744140625, -0.5924224853515625, -0.5455322265625, -0.4986419677734375, -0.451751708984375, -0.4048614501953125, -0.35797119140625, -0.3110809326171875, -0.264190673828125, -0.2173004150390625, -0.17041015625, -0.1235198974609375, -0.076629638671875, -0.0297393798828125, 0.01715087890625, 0.0640411376953125, 0.110931396484375, 0.1578216552734375, 0.2047119140625, 0.2516021728515625, 0.298492431640625, 0.3453826904296875, 0.39227294921875, 0.4391632080078125, 0.486053466796875, 0.5329437255859375, 0.579833984375, 0.6267242431640625, 0.673614501953125, 0.7205047607421875, 0.76739501953125, 0.8142852783203125, 0.861175537109375, 0.9080657958984375, 0.9549560546875, 1.0018463134765625, 1.048736572265625, 1.0956268310546875, 1.14251708984375, 1.1894073486328125, 1.236297607421875, 1.2831878662109375, 1.330078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 1.0, 8.0, 2.0, 6.0, 11.0, 7.0, 26.0, 17.0, 27.0, 34.0, 34.0, 30.0, 40.0, 51.0, 48.0, 51.0, 52.0, 57.0, 63.0, 52.0, 50.0, 34.0, 48.0, 30.0, 46.0, 32.0, 21.0, 20.0, 16.0, 16.0, 16.0, 18.0, 7.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.8683414459228516e-05, -3.740284591913223e-05, -3.612227737903595e-05, -3.484170883893967e-05, -3.3561140298843384e-05, -3.22805717587471e-05, -3.100000321865082e-05, -2.9719434678554535e-05, -2.8438866138458252e-05, -2.715829759836197e-05, -2.5877729058265686e-05, -2.4597160518169403e-05, -2.331659197807312e-05, -2.2036023437976837e-05, -2.0755454897880554e-05, -1.947488635778427e-05, -1.8194317817687988e-05, -1.6913749277591705e-05, -1.5633180737495422e-05, -1.435261219739914e-05, -1.3072043657302856e-05, -1.1791475117206573e-05, -1.051090657711029e-05, -9.230338037014008e-06, -7.949769496917725e-06, -6.669200956821442e-06, -5.388632416725159e-06, -4.108063876628876e-06, -2.8274953365325928e-06, -1.5469267964363098e-06, -2.6635825634002686e-07, 1.014210283756256e-06, 2.294778823852539e-06, 3.575347363948822e-06, 4.855915904045105e-06, 6.136484444141388e-06, 7.417052984237671e-06, 8.697621524333954e-06, 9.978190064430237e-06, 1.125875860452652e-05, 1.2539327144622803e-05, 1.3819895684719086e-05, 1.5100464224815369e-05, 1.638103276491165e-05, 1.7661601305007935e-05, 1.8942169845104218e-05, 2.02227383852005e-05, 2.1503306925296783e-05, 2.2783875465393066e-05, 2.406444400548935e-05, 2.5345012545585632e-05, 2.6625581085681915e-05, 2.7906149625778198e-05, 2.918671816587448e-05, 3.0467286705970764e-05, 3.174785524606705e-05, 3.302842378616333e-05, 3.430899232625961e-05, 3.5589560866355896e-05, 3.687012940645218e-05, 3.815069794654846e-05, 3.9431266486644745e-05, 4.071183502674103e-05, 4.199240356683731e-05, 4.3272972106933594e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 12.0, 13.0, 20.0, 37.0, 41.0, 69.0, 109.0, 175.0, 267.0, 415.0, 666.0, 1116.0, 1923.0, 3407.0, 6298.0, 11915.0, 23021.0, 45435.0, 92075.0, 175556.0, 252648.0, 205127.0, 112716.0, 55933.0, 27806.0, 14184.0, 7515.0, 4113.0, 2383.0, 1342.0, 832.0, 487.0, 279.0, 220.0, 114.0, 95.0, 49.0, 46.0, 34.0, 19.0, 10.0, 3.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77490234375, -0.7511672973632812, -0.7274322509765625, -0.7036972045898438, -0.679962158203125, -0.6562271118164062, -0.6324920654296875, -0.6087570190429688, -0.58502197265625, -0.5612869262695312, -0.5375518798828125, -0.5138168334960938, -0.490081787109375, -0.46634674072265625, -0.4426116943359375, -0.41887664794921875, -0.3951416015625, -0.37140655517578125, -0.3476715087890625, -0.32393646240234375, -0.300201416015625, -0.27646636962890625, -0.2527313232421875, -0.22899627685546875, -0.20526123046875, -0.18152618408203125, -0.1577911376953125, -0.13405609130859375, -0.110321044921875, -0.08658599853515625, -0.0628509521484375, -0.03911590576171875, -0.015380859375, 0.00835418701171875, 0.0320892333984375, 0.05582427978515625, 0.079559326171875, 0.10329437255859375, 0.1270294189453125, 0.15076446533203125, 0.17449951171875, 0.19823455810546875, 0.2219696044921875, 0.24570465087890625, 0.269439697265625, 0.29317474365234375, 0.3169097900390625, 0.34064483642578125, 0.3643798828125, 0.38811492919921875, 0.4118499755859375, 0.43558502197265625, 0.459320068359375, 0.48305511474609375, 0.5067901611328125, 0.5305252075195312, 0.55426025390625, 0.5779953002929688, 0.6017303466796875, 0.6254653930664062, 0.649200439453125, 0.6729354858398438, 0.6966705322265625, 0.7204055786132812, 0.744140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 10.0, 5.0, 13.0, 14.0, 23.0, 22.0, 33.0, 52.0, 51.0, 58.0, 83.0, 81.0, 76.0, 61.0, 83.0, 57.0, 57.0, 52.0, 47.0, 33.0, 25.0, 23.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20371627807617188, -0.19551849365234375, -0.18732070922851562, -0.1791229248046875, -0.17092514038085938, -0.16272735595703125, -0.15452957153320312, -0.146331787109375, -0.13813400268554688, -0.12993621826171875, -0.12173843383789062, -0.1135406494140625, -0.10534286499023438, -0.09714508056640625, -0.08894729614257812, -0.08074951171875, -0.07255172729492188, -0.06435394287109375, -0.056156158447265625, -0.0479583740234375, -0.039760589599609375, -0.03156280517578125, -0.023365020751953125, -0.015167236328125, -0.006969451904296875, 0.00122833251953125, 0.009426116943359375, 0.0176239013671875, 0.025821685791015625, 0.03401947021484375, 0.042217254638671875, 0.0504150390625, 0.058612823486328125, 0.06681060791015625, 0.07500839233398438, 0.0832061767578125, 0.09140396118164062, 0.09960174560546875, 0.10779953002929688, 0.115997314453125, 0.12419509887695312, 0.13239288330078125, 0.14059066772460938, 0.1487884521484375, 0.15698623657226562, 0.16518402099609375, 0.17338180541992188, 0.18157958984375, 0.18977737426757812, 0.19797515869140625, 0.20617294311523438, 0.2143707275390625, 0.22256851196289062, 0.23076629638671875, 0.23896408081054688, 0.247161865234375, 0.2553596496582031, 0.26355743408203125, 0.2717552185058594, 0.2799530029296875, 0.2881507873535156, 0.29634857177734375, 0.3045463562011719, 0.312744140625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 17.0, 16.0, 23.0, 21.0, 28.0, 51.0, 52.0, 86.0, 69.0, 88.0, 76.0, 79.0, 72.0, 63.0, 70.0, 31.0, 33.0, 33.0, 20.0, 17.0, 14.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.14012145996094, -41.805110931396484, -40.47010040283203, -39.135093688964844, -37.80008316040039, -36.46507263183594, -35.13006591796875, -33.7950553894043, -32.460044860839844, -31.12503433227539, -29.79002571105957, -28.45501708984375, -27.120006561279297, -25.784996032714844, -24.449987411499023, -23.114978790283203, -21.77996826171875, -20.444957733154297, -19.109949111938477, -17.774940490722656, -16.439929962158203, -15.104920387268066, -13.76991081237793, -12.434901237487793, -11.099891662597656, -9.76488208770752, -8.429872512817383, -7.094862937927246, -5.759853363037109, -4.424843788146973, -3.089834213256836, -1.7548246383666992, -0.4198188781738281, 0.9151906967163086, 2.2502002716064453, 3.585209846496582, 4.920219421386719, 6.2552289962768555, 7.590238571166992, 8.925248146057129, 10.260257720947266, 11.595267295837402, 12.930276870727539, 14.265286445617676, 15.600296020507812, 16.935306549072266, 18.270315170288086, 19.605323791503906, 20.94033432006836, 22.275344848632812, 23.610353469848633, 24.945362091064453, 26.280372619628906, 27.61538314819336, 28.95039176940918, 30.285400390625, 31.620410919189453, 32.955421447753906, 34.290428161621094, 35.62543869018555, 36.96044921875, 38.29545974731445, 39.630470275878906, 40.965476989746094, 42.30048751831055]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 10.0, 13.0, 10.0, 10.0, 11.0, 12.0, 23.0, 25.0, 21.0, 29.0, 33.0, 32.0, 40.0, 38.0, 43.0, 44.0, 47.0, 51.0, 46.0, 48.0, 49.0, 42.0, 36.0, 37.0, 27.0, 28.0, 35.0, 29.0, 21.0, 19.0, 22.0, 10.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.5731201171875, -19.966615676879883, -19.360111236572266, -18.75360679626465, -18.14710235595703, -17.540597915649414, -16.934093475341797, -16.327587127685547, -15.721083641052246, -15.114579200744629, -14.508074760437012, -13.901570320129395, -13.295064926147461, -12.688560485839844, -12.082056045532227, -11.47555160522461, -10.869047164916992, -10.262542724609375, -9.656038284301758, -9.04953384399414, -8.443029403686523, -7.836524486541748, -7.230019569396973, -6.6235151290893555, -6.017010688781738, -5.410506248474121, -4.804001808166504, -4.1974968910217285, -3.5909924507141113, -2.984488010406494, -2.377983331680298, -1.7714786529541016, -1.1649742126464844, -0.5584696531295776, 0.0480349063873291, 0.6545394659042358, 1.2610440254211426, 1.8675484657287598, 2.474053144454956, 3.0805578231811523, 3.6870622634887695, 4.293566703796387, 4.900071144104004, 5.506576061248779, 6.1130805015563965, 6.719584941864014, 7.326089859008789, 7.932594299316406, 8.539098739624023, 9.14560317993164, 9.752107620239258, 10.358612060546875, 10.965116500854492, 11.57162094116211, 12.178126335144043, 12.78463077545166, 13.391135215759277, 13.997639656066895, 14.604144096374512, 15.210648536682129, 15.817153930664062, 16.42365837097168, 17.030162811279297, 17.636667251586914, 18.24317169189453]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 15.0, 17.0, 28.0, 49.0, 67.0, 88.0, 142.0, 188.0, 285.0, 413.0, 566.0, 777.0, 1192.0, 1792.0, 2631.0, 3779.0, 5997.0, 9123.0, 14755.0, 23935.0, 40241.0, 68816.0, 114528.0, 168787.0, 189364.0, 152537.0, 98586.0, 58525.0, 34310.0, 20429.0, 12606.0, 8035.0, 5292.0, 3368.0, 2352.0, 1606.0, 953.0, 770.0, 528.0, 350.0, 234.0, 162.0, 111.0, 80.0, 50.0, 39.0, 16.0, 12.0, 9.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.896484375, -19.26171875, -18.626953125, -17.9921875, -17.357421875, -16.72265625, -16.087890625, -15.453125, -14.818359375, -14.18359375, -13.548828125, -12.9140625, -12.279296875, -11.64453125, -11.009765625, -10.375, -9.740234375, -9.10546875, -8.470703125, -7.8359375, -7.201171875, -6.56640625, -5.931640625, -5.296875, -4.662109375, -4.02734375, -3.392578125, -2.7578125, -2.123046875, -1.48828125, -0.853515625, -0.21875, 0.416015625, 1.05078125, 1.685546875, 2.3203125, 2.955078125, 3.58984375, 4.224609375, 4.859375, 5.494140625, 6.12890625, 6.763671875, 7.3984375, 8.033203125, 8.66796875, 9.302734375, 9.9375, 10.572265625, 11.20703125, 11.841796875, 12.4765625, 13.111328125, 13.74609375, 14.380859375, 15.015625, 15.650390625, 16.28515625, 16.919921875, 17.5546875, 18.189453125, 18.82421875, 19.458984375, 20.09375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 4.0, 5.0, 6.0, 12.0, 11.0, 22.0, 15.0, 21.0, 23.0, 25.0, 25.0, 24.0, 31.0, 39.0, 45.0, 41.0, 38.0, 51.0, 47.0, 62.0, 48.0, 43.0, 36.0, 51.0, 32.0, 29.0, 40.0, 30.0, 23.0, 18.0, 17.0, 18.0, 12.0, 10.0, 12.0, 8.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-23.953125, -23.32421875, -22.6953125, -22.06640625, -21.4375, -20.80859375, -20.1796875, -19.55078125, -18.921875, -18.29296875, -17.6640625, -17.03515625, -16.40625, -15.77734375, -15.1484375, -14.51953125, -13.890625, -13.26171875, -12.6328125, -12.00390625, -11.375, -10.74609375, -10.1171875, -9.48828125, -8.859375, -8.23046875, -7.6015625, -6.97265625, -6.34375, -5.71484375, -5.0859375, -4.45703125, -3.828125, -3.19921875, -2.5703125, -1.94140625, -1.3125, -0.68359375, -0.0546875, 0.57421875, 1.203125, 1.83203125, 2.4609375, 3.08984375, 3.71875, 4.34765625, 4.9765625, 5.60546875, 6.234375, 6.86328125, 7.4921875, 8.12109375, 8.75, 9.37890625, 10.0078125, 10.63671875, 11.265625, 11.89453125, 12.5234375, 13.15234375, 13.78125, 14.41015625, 15.0390625, 15.66796875, 16.296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 8.0, 12.0, 12.0, 19.0, 30.0, 53.0, 70.0, 121.0, 169.0, 236.0, 362.0, 546.0, 814.0, 1245.0, 1936.0, 3051.0, 4913.0, 7861.0, 13112.0, 22049.0, 38202.0, 67804.0, 117949.0, 182642.0, 207099.0, 155486.0, 93811.0, 52769.0, 30238.0, 17677.0, 10581.0, 6392.0, 3951.0, 2550.0, 1662.0, 1108.0, 714.0, 431.0, 309.0, 189.0, 129.0, 79.0, 59.0, 35.0, 34.0, 15.0, 10.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.328125, -27.392822265625, -26.45751953125, -25.522216796875, -24.5869140625, -23.651611328125, -22.71630859375, -21.781005859375, -20.845703125, -19.910400390625, -18.97509765625, -18.039794921875, -17.1044921875, -16.169189453125, -15.23388671875, -14.298583984375, -13.36328125, -12.427978515625, -11.49267578125, -10.557373046875, -9.6220703125, -8.686767578125, -7.75146484375, -6.816162109375, -5.880859375, -4.945556640625, -4.01025390625, -3.074951171875, -2.1396484375, -1.204345703125, -0.26904296875, 0.666259765625, 1.6015625, 2.536865234375, 3.47216796875, 4.407470703125, 5.3427734375, 6.278076171875, 7.21337890625, 8.148681640625, 9.083984375, 10.019287109375, 10.95458984375, 11.889892578125, 12.8251953125, 13.760498046875, 14.69580078125, 15.631103515625, 16.56640625, 17.501708984375, 18.43701171875, 19.372314453125, 20.3076171875, 21.242919921875, 22.17822265625, 23.113525390625, 24.048828125, 24.984130859375, 25.91943359375, 26.854736328125, 27.7900390625, 28.725341796875, 29.66064453125, 30.595947265625, 31.53125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 8.0, 5.0, 10.0, 4.0, 6.0, 8.0, 11.0, 16.0, 17.0, 16.0, 17.0, 23.0, 35.0, 23.0, 50.0, 26.0, 35.0, 47.0, 45.0, 47.0, 40.0, 52.0, 33.0, 42.0, 36.0, 38.0, 35.0, 38.0, 34.0, 23.0, 19.0, 27.0, 27.0, 22.0, 11.0, 13.0, 11.0, 14.0, 12.0, 4.0, 6.0, 4.0, 4.0, 4.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3515625, -10.962158203125, -10.57275390625, -10.183349609375, -9.7939453125, -9.404541015625, -9.01513671875, -8.625732421875, -8.236328125, -7.846923828125, -7.45751953125, -7.068115234375, -6.6787109375, -6.289306640625, -5.89990234375, -5.510498046875, -5.12109375, -4.731689453125, -4.34228515625, -3.952880859375, -3.5634765625, -3.174072265625, -2.78466796875, -2.395263671875, -2.005859375, -1.616455078125, -1.22705078125, -0.837646484375, -0.4482421875, -0.058837890625, 0.33056640625, 0.719970703125, 1.109375, 1.498779296875, 1.88818359375, 2.277587890625, 2.6669921875, 3.056396484375, 3.44580078125, 3.835205078125, 4.224609375, 4.614013671875, 5.00341796875, 5.392822265625, 5.7822265625, 6.171630859375, 6.56103515625, 6.950439453125, 7.33984375, 7.729248046875, 8.11865234375, 8.508056640625, 8.8974609375, 9.286865234375, 9.67626953125, 10.065673828125, 10.455078125, 10.844482421875, 11.23388671875, 11.623291015625, 12.0126953125, 12.402099609375, 12.79150390625, 13.180908203125, 13.5703125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 6.0, 14.0, 11.0, 22.0, 26.0, 46.0, 60.0, 108.0, 141.0, 210.0, 294.0, 428.0, 687.0, 1093.0, 1664.0, 2731.0, 4531.0, 7720.0, 13522.0, 25709.0, 51235.0, 106695.0, 202641.0, 257463.0, 182316.0, 92094.0, 44456.0, 22573.0, 12034.0, 6938.0, 4072.0, 2591.0, 1522.0, 986.0, 633.0, 426.0, 265.0, 186.0, 128.0, 69.0, 65.0, 46.0, 31.0, 23.0, 14.0, 6.0, 6.0, 11.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.4052734375, -17.779296875, -17.1533203125, -16.52734375, -15.9013671875, -15.275390625, -14.6494140625, -14.0234375, -13.3974609375, -12.771484375, -12.1455078125, -11.51953125, -10.8935546875, -10.267578125, -9.6416015625, -9.015625, -8.3896484375, -7.763671875, -7.1376953125, -6.51171875, -5.8857421875, -5.259765625, -4.6337890625, -4.0078125, -3.3818359375, -2.755859375, -2.1298828125, -1.50390625, -0.8779296875, -0.251953125, 0.3740234375, 1.0, 1.6259765625, 2.251953125, 2.8779296875, 3.50390625, 4.1298828125, 4.755859375, 5.3818359375, 6.0078125, 6.6337890625, 7.259765625, 7.8857421875, 8.51171875, 9.1376953125, 9.763671875, 10.3896484375, 11.015625, 11.6416015625, 12.267578125, 12.8935546875, 13.51953125, 14.1455078125, 14.771484375, 15.3974609375, 16.0234375, 16.6494140625, 17.275390625, 17.9013671875, 18.52734375, 19.1533203125, 19.779296875, 20.4052734375, 21.03125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 8.0, 7.0, 9.0, 18.0, 14.0, 19.0, 25.0, 22.0, 33.0, 44.0, 74.0, 92.0, 79.0, 82.0, 81.0, 72.0, 76.0, 57.0, 41.0, 28.0, 19.0, 19.0, 16.0, 10.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.0021779239177703857, -0.0021089911460876465, -0.0020400583744049072, -0.001971125602722168, -0.0019021928310394287, -0.0018332600593566895, -0.0017643272876739502, -0.001695394515991211, -0.0016264617443084717, -0.0015575289726257324, -0.0014885962009429932, -0.001419663429260254, -0.0013507306575775146, -0.0012817978858947754, -0.0012128651142120361, -0.0011439323425292969, -0.0010749995708465576, -0.0010060667991638184, -0.0009371340274810791, -0.0008682012557983398, -0.0007992684841156006, -0.0007303357124328613, -0.0006614029407501221, -0.0005924701690673828, -0.0005235373973846436, -0.0004546046257019043, -0.00038567185401916504, -0.0003167390823364258, -0.0002478063106536865, -0.00017887353897094727, -0.00010994076728820801, -4.100799560546875e-05, 2.7924776077270508e-05, 9.685754776000977e-05, 0.00016579031944274902, 0.00023472309112548828, 0.00030365586280822754, 0.0003725886344909668, 0.00044152140617370605, 0.0005104541778564453, 0.0005793869495391846, 0.0006483197212219238, 0.0007172524929046631, 0.0007861852645874023, 0.0008551180362701416, 0.0009240508079528809, 0.0009929835796356201, 0.0010619163513183594, 0.0011308491230010986, 0.0011997818946838379, 0.0012687146663665771, 0.0013376474380493164, 0.0014065802097320557, 0.001475512981414795, 0.0015444457530975342, 0.0016133785247802734, 0.0016823112964630127, 0.001751244068145752, 0.0018201768398284912, 0.0018891096115112305, 0.0019580423831939697, 0.002026975154876709, 0.0020959079265594482, 0.0021648406982421875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 14.0, 21.0, 36.0, 50.0, 57.0, 99.0, 134.0, 168.0, 241.0, 367.0, 560.0, 803.0, 1291.0, 2093.0, 3475.0, 5592.0, 10330.0, 19105.0, 37284.0, 78492.0, 163228.0, 262228.0, 225455.0, 119018.0, 56119.0, 27500.0, 14619.0, 7982.0, 4504.0, 2762.0, 1691.0, 1088.0, 698.0, 424.0, 299.0, 236.0, 131.0, 99.0, 82.0, 52.0, 40.0, 23.0, 16.0, 14.0, 5.0, 5.0, 4.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.3125, -17.717529296875, -17.12255859375, -16.527587890625, -15.9326171875, -15.337646484375, -14.74267578125, -14.147705078125, -13.552734375, -12.957763671875, -12.36279296875, -11.767822265625, -11.1728515625, -10.577880859375, -9.98291015625, -9.387939453125, -8.79296875, -8.197998046875, -7.60302734375, -7.008056640625, -6.4130859375, -5.818115234375, -5.22314453125, -4.628173828125, -4.033203125, -3.438232421875, -2.84326171875, -2.248291015625, -1.6533203125, -1.058349609375, -0.46337890625, 0.131591796875, 0.7265625, 1.321533203125, 1.91650390625, 2.511474609375, 3.1064453125, 3.701416015625, 4.29638671875, 4.891357421875, 5.486328125, 6.081298828125, 6.67626953125, 7.271240234375, 7.8662109375, 8.461181640625, 9.05615234375, 9.651123046875, 10.24609375, 10.841064453125, 11.43603515625, 12.031005859375, 12.6259765625, 13.220947265625, 13.81591796875, 14.410888671875, 15.005859375, 15.600830078125, 16.19580078125, 16.790771484375, 17.3857421875, 17.980712890625, 18.57568359375, 19.170654296875, 19.765625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 12.0, 8.0, 20.0, 20.0, 25.0, 22.0, 29.0, 31.0, 25.0, 49.0, 47.0, 59.0, 58.0, 56.0, 66.0, 50.0, 40.0, 39.0, 46.0, 38.0, 49.0, 31.0, 22.0, 23.0, 25.0, 11.0, 14.0, 9.0, 8.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.939453125, -3.817626953125, -3.69580078125, -3.573974609375, -3.4521484375, -3.330322265625, -3.20849609375, -3.086669921875, -2.96484375, -2.843017578125, -2.72119140625, -2.599365234375, -2.4775390625, -2.355712890625, -2.23388671875, -2.112060546875, -1.990234375, -1.868408203125, -1.74658203125, -1.624755859375, -1.5029296875, -1.381103515625, -1.25927734375, -1.137451171875, -1.015625, -0.893798828125, -0.77197265625, -0.650146484375, -0.5283203125, -0.406494140625, -0.28466796875, -0.162841796875, -0.041015625, 0.080810546875, 0.20263671875, 0.324462890625, 0.4462890625, 0.568115234375, 0.68994140625, 0.811767578125, 0.93359375, 1.055419921875, 1.17724609375, 1.299072265625, 1.4208984375, 1.542724609375, 1.66455078125, 1.786376953125, 1.908203125, 2.030029296875, 2.15185546875, 2.273681640625, 2.3955078125, 2.517333984375, 2.63916015625, 2.760986328125, 2.8828125, 3.004638671875, 3.12646484375, 3.248291015625, 3.3701171875, 3.491943359375, 3.61376953125, 3.735595703125, 3.857421875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 8.0, 5.0, 4.0, 11.0, 16.0, 20.0, 25.0, 24.0, 29.0, 24.0, 49.0, 67.0, 68.0, 58.0, 69.0, 76.0, 72.0, 59.0, 50.0, 63.0, 43.0, 35.0, 31.0, 23.0, 22.0, 11.0, 11.0, 10.0, 5.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53688430786133, -37.30178451538086, -36.06668472290039, -34.83158493041992, -33.59648513793945, -32.36138153076172, -31.126283645629883, -29.89118194580078, -28.656082153320312, -27.420982360839844, -26.185882568359375, -24.950782775878906, -23.715681076049805, -22.480581283569336, -21.245481491088867, -20.010379791259766, -18.77528190612793, -17.54018211364746, -16.305082321166992, -15.069981575012207, -13.834880828857422, -12.599781036376953, -11.364681243896484, -10.1295804977417, -8.89448070526123, -7.6593804359436035, -6.424280166625977, -5.189180374145508, -3.954080104827881, -2.718979835510254, -1.4838800430297852, -0.248779296875, 0.9863204956054688, 2.2214207649230957, 3.4565207958221436, 4.691620826721191, 5.926721096038818, 7.161821365356445, 8.396921157836914, 9.6320219039917, 10.867121696472168, 12.102221488952637, 13.337322235107422, 14.57242202758789, 15.80752182006836, 17.042621612548828, 18.277721405029297, 19.5128231048584, 20.747922897338867, 21.983022689819336, 23.218122482299805, 24.453224182128906, 25.688323974609375, 26.923423767089844, 28.158523559570312, 29.39362335205078, 30.62872314453125, 31.86382293701172, 33.09892272949219, 34.334022521972656, 35.569122314453125, 36.804222106933594, 38.03932189941406, 39.2744255065918, 40.509525299072266]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 6.0, 5.0, 13.0, 14.0, 10.0, 13.0, 14.0, 18.0, 26.0, 33.0, 25.0, 35.0, 41.0, 51.0, 53.0, 54.0, 51.0, 56.0, 46.0, 51.0, 47.0, 44.0, 41.0, 37.0, 25.0, 22.0, 24.0, 26.0, 17.0, 17.0, 15.0, 13.0, 9.0, 7.0, 5.0, 5.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.1720027923584, -27.324731826782227, -26.477462768554688, -25.630191802978516, -24.782920837402344, -23.935651779174805, -23.088380813598633, -22.241111755371094, -21.393840789794922, -20.54656982421875, -19.69930076599121, -18.85202980041504, -18.0047607421875, -17.157489776611328, -16.310218811035156, -15.4629487991333, -14.615678787231445, -13.76840877532959, -12.921138763427734, -12.073867797851562, -11.226597785949707, -10.379327774047852, -9.53205680847168, -8.684786796569824, -7.837516784667969, -6.990246772766113, -6.1429762840271, -5.295705795288086, -4.4484357833862305, -3.601165771484375, -2.7538952827453613, -1.9066247940063477, -1.0593547821044922, -0.21208453178405762, 0.635185718536377, 1.4824559688568115, 2.329726219177246, 3.1769962310791016, 4.024266719818115, 4.871537208557129, 5.718807220458984, 6.56607723236084, 7.4133477210998535, 8.260618209838867, 9.107888221740723, 9.955158233642578, 10.80242919921875, 11.649699211120605, 12.496969223022461, 13.344239234924316, 14.191509246826172, 15.038780212402344, 15.8860502243042, 16.733320236206055, 17.580591201782227, 18.427860260009766, 19.275131225585938, 20.12240219116211, 20.96967124938965, 21.81694221496582, 22.66421127319336, 23.51148223876953, 24.358753204345703, 25.206024169921875, 26.053293228149414]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 9.0, 11.0, 9.0, 14.0, 16.0, 19.0, 15.0, 24.0, 28.0, 25.0, 33.0, 63.0, 92.0, 184.0, 374.0, 682.0, 1439.0, 3415.0, 507871.0, 5862.0, 1996.0, 917.0, 457.0, 226.0, 115.0, 92.0, 66.0, 31.0, 24.0, 17.0, 20.0, 13.0, 13.0, 12.0, 10.0, 20.0, 6.0, 4.0, 4.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-774.417236328125, -752.728271484375, -731.0392456054688, -709.3502807617188, -687.6612548828125, -665.9722900390625, -644.2833251953125, -622.5942993164062, -600.9053344726562, -579.2163696289062, -557.52734375, -535.83837890625, -514.1493530273438, -492.46038818359375, -470.7713928222656, -449.0823974609375, -427.3934020996094, -405.70440673828125, -384.0154113769531, -362.326416015625, -340.637451171875, -318.9484558105469, -297.25946044921875, -275.57049560546875, -253.88148498535156, -232.19248962402344, -210.50350952148438, -188.81451416015625, -167.12551879882812, -145.43653869628906, -123.74754333496094, -102.05856323242188, -80.36956787109375, -58.680580139160156, -36.9915885925293, -15.302597045898438, 6.386390686035156, 28.07537841796875, 49.764373779296875, 71.45335388183594, 93.14234924316406, 114.83133697509766, 136.52032470703125, 158.20932006835938, 179.8983154296875, 201.58729553222656, 223.2762908935547, 244.96527099609375, 266.6542663574219, 288.34326171875, 310.0322570800781, 331.72125244140625, 353.41021728515625, 375.0992126464844, 396.7882080078125, 418.4771728515625, 440.16619873046875, 461.8551940917969, 483.544189453125, 505.233154296875, 526.9221801757812, 548.6111450195312, 570.3001708984375, 591.9891357421875, 613.6781005859375]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 9.0, 7.0, 6.0, 8.0, 13.0, 13.0, 9.0, 16.0, 16.0, 26.0, 34.0, 24.0, 31.0, 43.0, 43.0, 49.0, 55.0, 51.0, 1080.0, 56.0, 50.0, 43.0, 46.0, 43.0, 40.0, 27.0, 22.0, 25.0, 22.0, 26.0, 13.0, 16.0, 13.0, 12.0, 5.0, 8.0, 2.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-912.578857421875, -885.506103515625, -858.4334106445312, -831.3606567382812, -804.2879638671875, -777.2152099609375, -750.1424560546875, -723.0697021484375, -695.9970092773438, -668.9242553710938, -641.8515625, -614.77880859375, -587.7060546875, -560.6333618164062, -533.5606079101562, -506.4878845214844, -479.4151611328125, -452.3424377441406, -425.26971435546875, -398.19696044921875, -371.1242370605469, -344.051513671875, -316.978759765625, -289.9060363769531, -262.83331298828125, -235.76058959960938, -208.68785095214844, -181.6151123046875, -154.54238891601562, -127.46966552734375, -100.39692687988281, -73.32418823242188, -46.25140380859375, -19.178672790527344, 7.8940582275390625, 34.96678924560547, 62.039520263671875, 89.11224365234375, 116.18498229980469, 143.25772094726562, 170.3304443359375, 197.40316772460938, 224.4759063720703, 251.54864501953125, 278.6213684082031, 305.694091796875, 332.766845703125, 359.8395690917969, 386.91229248046875, 413.9850158691406, 441.0577392578125, 468.1304931640625, 495.2032165527344, 522.2759399414062, 549.3486938476562, 576.42138671875, 603.494140625, 630.56689453125, 657.6395874023438, 684.7123413085938, 711.7850341796875, 738.8577880859375, 765.9305419921875, 793.0032958984375, 820.0759887695312]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 14.0, 14.0, 20.0, 24.0, 32.0, 49.0, 68.0, 68.0, 83.0, 102.0, 143.0, 155.0, 200.0, 235.0, 320.0, 419.0, 521.0, 661.0, 958.0, 1068.0, 1451.0, 2004.0, 4214.0, 19206.0, 31198024.0, 10843.0, 4036.0, 3086.0, 2397.0, 1548.0, 1290.0, 607.0, 229.0, 100.0, 70.0, 56.0, 26.0, 29.0, 20.0, 21.0, 20.0, 15.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-880.484375, -855.5458984375, -830.6073608398438, -805.6688842773438, -780.7304077148438, -755.7919311523438, -730.8533935546875, -705.9149169921875, -680.9764404296875, -656.0379638671875, -631.0994262695312, -606.1609497070312, -581.2224731445312, -556.2839965820312, -531.345458984375, -506.406982421875, -481.4684753417969, -456.52996826171875, -431.59149169921875, -406.6529846191406, -381.7145080566406, -356.7760009765625, -331.8375244140625, -306.8990173339844, -281.96051025390625, -257.0220031738281, -232.08352661132812, -207.14501953125, -182.20654296875, -157.26803588867188, -132.3295440673828, -107.39105224609375, -82.45257568359375, -57.51408386230469, -32.57558822631836, -7.637092590332031, 17.30139923095703, 42.239891052246094, 67.17839050292969, 92.11688232421875, 117.05537414550781, 141.99386596679688, 166.93235778808594, 191.870849609375, 216.80935668945312, 241.74783325195312, 266.68634033203125, 291.62481689453125, 316.5633239746094, 341.5018310546875, 366.4403076171875, 391.3788146972656, 416.3172912597656, 441.25579833984375, 466.19427490234375, 491.1327819824219, 516.0712890625, 541.009765625, 565.9483032226562, 590.8867797851562, 615.8252563476562, 640.7637329101562, 665.7022705078125, 690.6407470703125, 715.5792236328125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 13.0, 9.0, 10.0, 12.0, 15.0, 27.0, 21.0, 40.0, 33.0, 42.0, 51.0, 56.0, 71.0, 91.0, 68.0, 74.0, 58.0, 57.0, 43.0, 30.0, 30.0, 21.0, 18.0, 21.0, 10.0, 8.0, 16.0, 8.0, 10.0, 6.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-515.4827270507812, -501.5868225097656, -487.6909484863281, -473.7950439453125, -459.899169921875, -446.0032653808594, -432.10736083984375, -418.21148681640625, -404.3155822753906, -390.419677734375, -376.5238037109375, -362.6278991699219, -348.7320251464844, -334.83612060546875, -320.94024658203125, -307.0443420410156, -293.1484375, -279.2525329589844, -265.3566589355469, -251.46075439453125, -237.5648651123047, -223.66897583007812, -209.77308654785156, -195.877197265625, -181.9813232421875, -168.08543395996094, -154.18954467773438, -140.29364013671875, -126.39775085449219, -112.50186157226562, -98.60597229003906, -84.71007537841797, -70.81417846679688, -56.91828536987305, -43.02239227294922, -29.126502990722656, -15.230609893798828, -1.334716796875, 12.561172485351562, 26.457069396972656, 40.35295867919922, 54.24885177612305, 68.14474487304688, 82.04063415527344, 95.9365234375, 109.8324203491211, 123.72830963134766, 137.62420654296875, 151.5200958251953, 165.41598510742188, 179.31187438964844, 193.207763671875, 207.10366821289062, 220.9995574951172, 234.89544677734375, 248.79135131835938, 262.6872253417969, 276.5831298828125, 290.47900390625, 304.3749084472656, 318.2707824707031, 332.16668701171875, 346.06256103515625, 359.9584655761719, 373.8543701171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 12.0, 10.0, 16.0, 13.0, 19.0, 12.0, 25.0, 23.0, 24.0, 37.0, 33.0, 34.0, 54.0, 86.0, 75.0, 89.0, 71.0, 57.0, 39.0, 33.0, 33.0, 29.0, 32.0, 19.0, 16.0, 21.0, 7.0, 8.0, 11.0, 10.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-693.020751953125, -669.9324340820312, -646.8441772460938, -623.755859375, -600.6676025390625, -577.5792846679688, -554.490966796875, -531.4027099609375, -508.31439208984375, -485.2261047363281, -462.1378173828125, -439.04949951171875, -415.9612121582031, -392.8729248046875, -369.7846374511719, -346.69635009765625, -323.6080627441406, -300.519775390625, -277.4314880371094, -254.3431854248047, -231.2548828125, -208.16659545898438, -185.07830810546875, -161.99000549316406, -138.90171813964844, -115.81342315673828, -92.72512817382812, -69.6368408203125, -46.548545837402344, -23.460250854492188, -0.3719635009765625, 22.716339111328125, 45.80462646484375, 68.8929214477539, 91.98121643066406, 115.06950378417969, 138.15780639648438, 161.24609375, 184.33438110351562, 207.4226837158203, 230.51097106933594, 253.59925842285156, 276.68756103515625, 299.7758483886719, 322.8641357421875, 345.95245361328125, 369.04071044921875, 392.1290283203125, 415.2173156738281, 438.30560302734375, 461.3938903808594, 484.482177734375, 507.57049560546875, 530.6588134765625, 553.7470703125, 576.8353881835938, 599.9236450195312, 623.011962890625, 646.1002197265625, 669.1885375976562, 692.2767944335938, 715.3651123046875, 738.453369140625, 761.5416870117188, 784.6300048828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 24.0, 22.0, 39.0, 60.0, 98.0, 179.0, 255.0, 418.0, 686.0, 1021.0, 1681.0, 2668.0, 4259.0, 6588.0, 11093.0, 17703.0, 28708.0, 48592.0, 82383.0, 144257.0, 263641.0, 533397.0, 1477572.0, 771378.0, 356542.0, 187770.0, 103516.0, 59946.0, 34925.0, 20818.0, 12610.0, 7751.0, 4897.0, 3123.0, 1940.0, 1291.0, 789.0, 550.0, 353.0, 229.0, 181.0, 103.0, 59.0, 48.0, 35.0, 27.0, 13.0, 9.0, 10.0, 6.0, 9.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.979736328125, -9.65478515625, -9.329833984375, -9.0048828125, -8.679931640625, -8.35498046875, -8.030029296875, -7.705078125, -7.380126953125, -7.05517578125, -6.730224609375, -6.4052734375, -6.080322265625, -5.75537109375, -5.430419921875, -5.10546875, -4.780517578125, -4.45556640625, -4.130615234375, -3.8056640625, -3.480712890625, -3.15576171875, -2.830810546875, -2.505859375, -2.180908203125, -1.85595703125, -1.531005859375, -1.2060546875, -0.881103515625, -0.55615234375, -0.231201171875, 0.09375, 0.418701171875, 0.74365234375, 1.068603515625, 1.3935546875, 1.718505859375, 2.04345703125, 2.368408203125, 2.693359375, 3.018310546875, 3.34326171875, 3.668212890625, 3.9931640625, 4.318115234375, 4.64306640625, 4.968017578125, 5.29296875, 5.617919921875, 5.94287109375, 6.267822265625, 6.5927734375, 6.917724609375, 7.24267578125, 7.567626953125, 7.892578125, 8.217529296875, 8.54248046875, 8.867431640625, 9.1923828125, 9.517333984375, 9.84228515625, 10.167236328125, 10.4921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 3.0, 3.0, 8.0, 14.0, 10.0, 11.0, 14.0, 16.0, 14.0, 19.0, 28.0, 42.0, 34.0, 31.0, 31.0, 53.0, 51.0, 57.0, 54.0, 47.0, 69.0, 35.0, 50.0, 40.0, 35.0, 34.0, 31.0, 32.0, 24.0, 21.0, 21.0, 11.0, 8.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99755859375, -0.9640884399414062, -0.9306182861328125, -0.8971481323242188, -0.863677978515625, -0.8302078247070312, -0.7967376708984375, -0.7632675170898438, -0.72979736328125, -0.6963272094726562, -0.6628570556640625, -0.6293869018554688, -0.595916748046875, -0.5624465942382812, -0.5289764404296875, -0.49550628662109375, -0.4620361328125, -0.42856597900390625, -0.3950958251953125, -0.36162567138671875, -0.328155517578125, -0.29468536376953125, -0.2612152099609375, -0.22774505615234375, -0.19427490234375, -0.16080474853515625, -0.1273345947265625, -0.09386444091796875, -0.060394287109375, -0.02692413330078125, 0.0065460205078125, 0.04001617431640625, 0.073486328125, 0.10695648193359375, 0.1404266357421875, 0.17389678955078125, 0.207366943359375, 0.24083709716796875, 0.2743072509765625, 0.30777740478515625, 0.34124755859375, 0.37471771240234375, 0.4081878662109375, 0.44165802001953125, 0.475128173828125, 0.5085983276367188, 0.5420684814453125, 0.5755386352539062, 0.6090087890625, 0.6424789428710938, 0.6759490966796875, 0.7094192504882812, 0.742889404296875, 0.7763595581054688, 0.8098297119140625, 0.8432998657226562, 0.87677001953125, 0.9102401733398438, 0.9437103271484375, 0.9771804809570312, 1.010650634765625, 1.0441207885742188, 1.0775909423828125, 1.1110610961914062, 1.14453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 9.0, 3.0, 7.0, 11.0, 14.0, 17.0, 18.0, 26.0, 53.0, 68.0, 95.0, 204.0, 369.0, 723.0, 1691.0, 4430.0, 12890.0, 41263.0, 156289.0, 707722.0, 2228516.0, 798413.0, 174907.0, 44778.0, 13638.0, 4714.0, 1823.0, 779.0, 345.0, 175.0, 111.0, 54.0, 34.0, 26.0, 18.0, 17.0, 12.0, 12.0, 3.0, 2.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.1328125, -14.6947021484375, -14.256591796875, -13.8184814453125, -13.38037109375, -12.9422607421875, -12.504150390625, -12.0660400390625, -11.6279296875, -11.1898193359375, -10.751708984375, -10.3135986328125, -9.87548828125, -9.4373779296875, -8.999267578125, -8.5611572265625, -8.123046875, -7.6849365234375, -7.246826171875, -6.8087158203125, -6.37060546875, -5.9324951171875, -5.494384765625, -5.0562744140625, -4.6181640625, -4.1800537109375, -3.741943359375, -3.3038330078125, -2.86572265625, -2.4276123046875, -1.989501953125, -1.5513916015625, -1.11328125, -0.6751708984375, -0.237060546875, 0.2010498046875, 0.63916015625, 1.0772705078125, 1.515380859375, 1.9534912109375, 2.3916015625, 2.8297119140625, 3.267822265625, 3.7059326171875, 4.14404296875, 4.5821533203125, 5.020263671875, 5.4583740234375, 5.896484375, 6.3345947265625, 6.772705078125, 7.2108154296875, 7.64892578125, 8.0870361328125, 8.525146484375, 8.9632568359375, 9.4013671875, 9.8394775390625, 10.277587890625, 10.7156982421875, 11.15380859375, 11.5919189453125, 12.030029296875, 12.4681396484375, 12.90625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 11.0, 14.0, 21.0, 17.0, 32.0, 31.0, 37.0, 46.0, 74.0, 78.0, 116.0, 144.0, 173.0, 214.0, 246.0, 286.0, 387.0, 474.0, 310.0, 281.0, 223.0, 203.0, 130.0, 117.0, 99.0, 71.0, 57.0, 41.0, 40.0, 27.0, 12.0, 16.0, 10.0, 10.0, 12.0, 3.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -4.0042724609375, -3.887451171875, -3.7706298828125, -3.65380859375, -3.5369873046875, -3.420166015625, -3.3033447265625, -3.1865234375, -3.0697021484375, -2.952880859375, -2.8360595703125, -2.71923828125, -2.6024169921875, -2.485595703125, -2.3687744140625, -2.251953125, -2.1351318359375, -2.018310546875, -1.9014892578125, -1.78466796875, -1.6678466796875, -1.551025390625, -1.4342041015625, -1.3173828125, -1.2005615234375, -1.083740234375, -0.9669189453125, -0.85009765625, -0.7332763671875, -0.616455078125, -0.4996337890625, -0.3828125, -0.2659912109375, -0.149169921875, -0.0323486328125, 0.08447265625, 0.2012939453125, 0.318115234375, 0.4349365234375, 0.5517578125, 0.6685791015625, 0.785400390625, 0.9022216796875, 1.01904296875, 1.1358642578125, 1.252685546875, 1.3695068359375, 1.486328125, 1.6031494140625, 1.719970703125, 1.8367919921875, 1.95361328125, 2.0704345703125, 2.187255859375, 2.3040771484375, 2.4208984375, 2.5377197265625, 2.654541015625, 2.7713623046875, 2.88818359375, 3.0050048828125, 3.121826171875, 3.2386474609375, 3.35546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 11.0, 5.0, 5.0, 11.0, 18.0, 24.0, 23.0, 31.0, 38.0, 53.0, 61.0, 80.0, 82.0, 92.0, 73.0, 76.0, 55.0, 68.0, 51.0, 27.0, 26.0, 21.0, 20.0, 8.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.129074096679688, -26.11540412902832, -25.101736068725586, -24.08806610107422, -23.074398040771484, -22.060728073120117, -21.04705810546875, -20.033390045166016, -19.01972198486328, -18.006052017211914, -16.99238395690918, -15.978713989257812, -14.965045928955078, -13.951375961303711, -12.93770694732666, -11.92403793334961, -10.910367965698242, -9.896698951721191, -8.88302993774414, -7.869360446929932, -6.855691432952881, -5.84202241897583, -4.828352928161621, -3.8146839141845703, -2.8010149002075195, -1.7873457670211792, -0.7736766338348389, 0.23999261856079102, 1.2536616325378418, 2.2673306465148926, 3.2810001373291016, 4.294669151306152, 5.308338165283203, 6.322007179260254, 7.335676193237305, 8.349346160888672, 9.363014221191406, 10.376684188842773, 11.390353202819824, 12.404022216796875, 13.417691230773926, 14.431360244750977, 15.445029258728027, 16.458698272705078, 17.472368240356445, 18.48603630065918, 19.499706268310547, 20.51337432861328, 21.52704429626465, 22.540714263916016, 23.55438232421875, 24.568052291870117, 25.58172035217285, 26.59539031982422, 27.609058380126953, 28.62272834777832, 29.636398315429688, 30.650068283081055, 31.66373634338379, 32.677406311035156, 33.69107437133789, 34.704742431640625, 35.718414306640625, 36.73208236694336, 37.745750427246094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 1.0, 5.0, 5.0, 11.0, 8.0, 9.0, 16.0, 13.0, 20.0, 22.0, 34.0, 34.0, 40.0, 37.0, 35.0, 38.0, 48.0, 56.0, 47.0, 50.0, 50.0, 45.0, 30.0, 44.0, 43.0, 31.0, 32.0, 42.0, 35.0, 18.0, 18.0, 23.0, 10.0, 13.0, 10.0, 8.0, 6.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.053157806396484, -28.218116760253906, -27.383075714111328, -26.54803466796875, -25.712993621826172, -24.877952575683594, -24.042911529541016, -23.207868576049805, -22.372827529907227, -21.53778648376465, -20.70274543762207, -19.867704391479492, -19.032663345336914, -18.197620391845703, -17.362579345703125, -16.527538299560547, -15.692498207092285, -14.857457160949707, -14.022416114807129, -13.187374114990234, -12.352333068847656, -11.517292022705078, -10.6822509765625, -9.847209930419922, -9.012168884277344, -8.177127838134766, -7.342086315155029, -6.507045269012451, -5.672003746032715, -4.836962699890137, -4.001921653747559, -3.1668801307678223, -2.331838607788086, -1.4967973232269287, -0.661756157875061, 0.17328500747680664, 1.0083262920379639, 1.843367576599121, 2.678408622741699, 3.5134501457214355, 4.348491191864014, 5.183532238006592, 6.018573760986328, 6.853614807128906, 7.688655853271484, 8.523696899414062, 9.35873794555664, 10.193779945373535, 11.028820991516113, 11.863862037658691, 12.69890308380127, 13.533945083618164, 14.368986129760742, 15.20402717590332, 16.0390682220459, 16.874109268188477, 17.709150314331055, 18.544191360473633, 19.37923240661621, 20.21427345275879, 21.049314498901367, 21.884357452392578, 22.719398498535156, 23.554439544677734, 24.389480590820312]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 11.0, 10.0, 15.0, 30.0, 31.0, 34.0, 65.0, 85.0, 147.0, 275.0, 448.0, 625.0, 1055.0, 1832.0, 3102.0, 5030.0, 8501.0, 14493.0, 25984.0, 48620.0, 102034.0, 232388.0, 306626.0, 149003.0, 67990.0, 34549.0, 18778.0, 10663.0, 6320.0, 3752.0, 2350.0, 1418.0, 860.0, 544.0, 316.0, 213.0, 131.0, 78.0, 40.0, 31.0, 38.0, 14.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-8.1953125, -7.9691162109375, -7.742919921875, -7.5167236328125, -7.29052734375, -7.0643310546875, -6.838134765625, -6.6119384765625, -6.3857421875, -6.1595458984375, -5.933349609375, -5.7071533203125, -5.48095703125, -5.2547607421875, -5.028564453125, -4.8023681640625, -4.576171875, -4.3499755859375, -4.123779296875, -3.8975830078125, -3.67138671875, -3.4451904296875, -3.218994140625, -2.9927978515625, -2.7666015625, -2.5404052734375, -2.314208984375, -2.0880126953125, -1.86181640625, -1.6356201171875, -1.409423828125, -1.1832275390625, -0.95703125, -0.7308349609375, -0.504638671875, -0.2784423828125, -0.05224609375, 0.1739501953125, 0.400146484375, 0.6263427734375, 0.8525390625, 1.0787353515625, 1.304931640625, 1.5311279296875, 1.75732421875, 1.9835205078125, 2.209716796875, 2.4359130859375, 2.662109375, 2.8883056640625, 3.114501953125, 3.3406982421875, 3.56689453125, 3.7930908203125, 4.019287109375, 4.2454833984375, 4.4716796875, 4.6978759765625, 4.924072265625, 5.1502685546875, 5.37646484375, 5.6026611328125, 5.828857421875, 6.0550537109375, 6.28125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 3.0, 8.0, 13.0, 21.0, 20.0, 11.0, 20.0, 25.0, 29.0, 28.0, 32.0, 45.0, 55.0, 59.0, 60.0, 50.0, 44.0, 57.0, 47.0, 44.0, 75.0, 40.0, 37.0, 32.0, 21.0, 28.0, 23.0, 13.0, 15.0, 11.0, 12.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.348419189453125, -1.30230712890625, -1.256195068359375, -1.2100830078125, -1.163970947265625, -1.11785888671875, -1.071746826171875, -1.025634765625, -0.979522705078125, -0.93341064453125, -0.887298583984375, -0.8411865234375, -0.795074462890625, -0.74896240234375, -0.702850341796875, -0.65673828125, -0.610626220703125, -0.56451416015625, -0.518402099609375, -0.4722900390625, -0.426177978515625, -0.38006591796875, -0.333953857421875, -0.287841796875, -0.241729736328125, -0.19561767578125, -0.149505615234375, -0.1033935546875, -0.057281494140625, -0.01116943359375, 0.034942626953125, 0.0810546875, 0.127166748046875, 0.17327880859375, 0.219390869140625, 0.2655029296875, 0.311614990234375, 0.35772705078125, 0.403839111328125, 0.449951171875, 0.496063232421875, 0.54217529296875, 0.588287353515625, 0.6343994140625, 0.680511474609375, 0.72662353515625, 0.772735595703125, 0.81884765625, 0.864959716796875, 0.91107177734375, 0.957183837890625, 1.0032958984375, 1.049407958984375, 1.09552001953125, 1.141632080078125, 1.187744140625, 1.233856201171875, 1.27996826171875, 1.326080322265625, 1.3721923828125, 1.418304443359375, 1.46441650390625, 1.510528564453125, 1.556640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 3.0, 8.0, 6.0, 13.0, 19.0, 15.0, 28.0, 46.0, 66.0, 90.0, 145.0, 239.0, 414.0, 726.0, 1380.0, 2804.0, 6278.0, 15182.0, 42691.0, 152937.0, 536633.0, 203307.0, 53112.0, 18230.0, 7182.0, 3348.0, 1573.0, 825.0, 473.0, 276.0, 167.0, 108.0, 71.0, 46.0, 34.0, 24.0, 16.0, 12.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.25933837890625, -6.9757080078125, -6.69207763671875, -6.408447265625, -6.12481689453125, -5.8411865234375, -5.55755615234375, -5.27392578125, -4.99029541015625, -4.7066650390625, -4.42303466796875, -4.139404296875, -3.85577392578125, -3.5721435546875, -3.28851318359375, -3.0048828125, -2.72125244140625, -2.4376220703125, -2.15399169921875, -1.870361328125, -1.58673095703125, -1.3031005859375, -1.01947021484375, -0.73583984375, -0.45220947265625, -0.1685791015625, 0.11505126953125, 0.398681640625, 0.68231201171875, 0.9659423828125, 1.24957275390625, 1.533203125, 1.81683349609375, 2.1004638671875, 2.38409423828125, 2.667724609375, 2.95135498046875, 3.2349853515625, 3.51861572265625, 3.80224609375, 4.08587646484375, 4.3695068359375, 4.65313720703125, 4.936767578125, 5.22039794921875, 5.5040283203125, 5.78765869140625, 6.0712890625, 6.35491943359375, 6.6385498046875, 6.92218017578125, 7.205810546875, 7.48944091796875, 7.7730712890625, 8.05670166015625, 8.34033203125, 8.62396240234375, 8.9075927734375, 9.19122314453125, 9.474853515625, 9.75848388671875, 10.0421142578125, 10.32574462890625, 10.609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 6.0, 6.0, 6.0, 9.0, 10.0, 12.0, 10.0, 19.0, 23.0, 16.0, 27.0, 28.0, 26.0, 42.0, 34.0, 33.0, 34.0, 42.0, 32.0, 34.0, 42.0, 42.0, 24.0, 40.0, 41.0, 34.0, 43.0, 32.0, 23.0, 36.0, 28.0, 24.0, 12.0, 18.0, 19.0, 11.0, 14.0, 15.0, 5.0, 7.0, 4.0, 11.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.93359375, -5.74249267578125, -5.5513916015625, -5.36029052734375, -5.169189453125, -4.97808837890625, -4.7869873046875, -4.59588623046875, -4.40478515625, -4.21368408203125, -4.0225830078125, -3.83148193359375, -3.640380859375, -3.44927978515625, -3.2581787109375, -3.06707763671875, -2.8759765625, -2.68487548828125, -2.4937744140625, -2.30267333984375, -2.111572265625, -1.92047119140625, -1.7293701171875, -1.53826904296875, -1.34716796875, -1.15606689453125, -0.9649658203125, -0.77386474609375, -0.582763671875, -0.39166259765625, -0.2005615234375, -0.00946044921875, 0.181640625, 0.37274169921875, 0.5638427734375, 0.75494384765625, 0.946044921875, 1.13714599609375, 1.3282470703125, 1.51934814453125, 1.71044921875, 1.90155029296875, 2.0926513671875, 2.28375244140625, 2.474853515625, 2.66595458984375, 2.8570556640625, 3.04815673828125, 3.2392578125, 3.43035888671875, 3.6214599609375, 3.81256103515625, 4.003662109375, 4.19476318359375, 4.3858642578125, 4.57696533203125, 4.76806640625, 4.95916748046875, 5.1502685546875, 5.34136962890625, 5.532470703125, 5.72357177734375, 5.9146728515625, 6.10577392578125, 6.296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 6.0, 6.0, 12.0, 23.0, 32.0, 57.0, 78.0, 118.0, 228.0, 405.0, 797.0, 1804.0, 5222.0, 21943.0, 342291.0, 632683.0, 32172.0, 6457.0, 2125.0, 971.0, 449.0, 260.0, 141.0, 73.0, 55.0, 34.0, 31.0, 17.0, 14.0, 4.0, 12.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.296875, -15.73681640625, -15.1767578125, -14.61669921875, -14.056640625, -13.49658203125, -12.9365234375, -12.37646484375, -11.81640625, -11.25634765625, -10.6962890625, -10.13623046875, -9.576171875, -9.01611328125, -8.4560546875, -7.89599609375, -7.3359375, -6.77587890625, -6.2158203125, -5.65576171875, -5.095703125, -4.53564453125, -3.9755859375, -3.41552734375, -2.85546875, -2.29541015625, -1.7353515625, -1.17529296875, -0.615234375, -0.05517578125, 0.5048828125, 1.06494140625, 1.625, 2.18505859375, 2.7451171875, 3.30517578125, 3.865234375, 4.42529296875, 4.9853515625, 5.54541015625, 6.10546875, 6.66552734375, 7.2255859375, 7.78564453125, 8.345703125, 8.90576171875, 9.4658203125, 10.02587890625, 10.5859375, 11.14599609375, 11.7060546875, 12.26611328125, 12.826171875, 13.38623046875, 13.9462890625, 14.50634765625, 15.06640625, 15.62646484375, 16.1865234375, 16.74658203125, 17.306640625, 17.86669921875, 18.4267578125, 18.98681640625, 19.546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 8.0, 7.0, 17.0, 32.0, 42.0, 61.0, 87.0, 143.0, 144.0, 128.0, 107.0, 72.0, 45.0, 36.0, 23.0, 20.0, 7.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007219314575195312, -0.0007022097706794739, -0.0006824880838394165, -0.0006627663969993591, -0.0006430447101593018, -0.0006233230233192444, -0.000603601336479187, -0.0005838796496391296, -0.0005641579627990723, -0.0005444362759590149, -0.0005247145891189575, -0.0005049929022789001, -0.0004852712154388428, -0.0004655495285987854, -0.00044582784175872803, -0.00042610615491867065, -0.0004063844680786133, -0.0003866627812385559, -0.00036694109439849854, -0.00034721940755844116, -0.0003274977207183838, -0.0003077760338783264, -0.00028805434703826904, -0.00026833266019821167, -0.0002486109733581543, -0.00022888928651809692, -0.00020916759967803955, -0.00018944591283798218, -0.0001697242259979248, -0.00015000253915786743, -0.00013028085231781006, -0.00011055916547775269, -9.083747863769531e-05, -7.111579179763794e-05, -5.1394104957580566e-05, -3.167241811752319e-05, -1.195073127746582e-05, 7.770955562591553e-06, 2.7492642402648926e-05, 4.72143292427063e-05, 6.693601608276367e-05, 8.665770292282104e-05, 0.00010637938976287842, 0.0001261010766029358, 0.00014582276344299316, 0.00016554445028305054, 0.0001852661371231079, 0.00020498782396316528, 0.00022470951080322266, 0.00024443119764328003, 0.0002641528844833374, 0.0002838745713233948, 0.00030359625816345215, 0.0003233179450035095, 0.0003430396318435669, 0.00036276131868362427, 0.00038248300552368164, 0.000402204692363739, 0.0004219263792037964, 0.00044164806604385376, 0.00046136975288391113, 0.0004810914397239685, 0.0005008131265640259, 0.0005205348134040833, 0.0005402565002441406]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 8.0, 11.0, 17.0, 20.0, 46.0, 70.0, 105.0, 156.0, 292.0, 544.0, 1010.0, 2167.0, 4860.0, 12847.0, 43382.0, 217307.0, 573739.0, 142609.0, 31684.0, 10003.0, 3897.0, 1797.0, 858.0, 501.0, 254.0, 141.0, 76.0, 48.0, 34.0, 31.0, 17.0, 12.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.1339111328125, -9.830322265625, -9.5267333984375, -9.22314453125, -8.9195556640625, -8.615966796875, -8.3123779296875, -8.0087890625, -7.7052001953125, -7.401611328125, -7.0980224609375, -6.79443359375, -6.4908447265625, -6.187255859375, -5.8836669921875, -5.580078125, -5.2764892578125, -4.972900390625, -4.6693115234375, -4.36572265625, -4.0621337890625, -3.758544921875, -3.4549560546875, -3.1513671875, -2.8477783203125, -2.544189453125, -2.2406005859375, -1.93701171875, -1.6334228515625, -1.329833984375, -1.0262451171875, -0.72265625, -0.4190673828125, -0.115478515625, 0.1881103515625, 0.49169921875, 0.7952880859375, 1.098876953125, 1.4024658203125, 1.7060546875, 2.0096435546875, 2.313232421875, 2.6168212890625, 2.92041015625, 3.2239990234375, 3.527587890625, 3.8311767578125, 4.134765625, 4.4383544921875, 4.741943359375, 5.0455322265625, 5.34912109375, 5.6527099609375, 5.956298828125, 6.2598876953125, 6.5634765625, 6.8670654296875, 7.170654296875, 7.4742431640625, 7.77783203125, 8.0814208984375, 8.385009765625, 8.6885986328125, 8.9921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 11.0, 10.0, 22.0, 11.0, 31.0, 29.0, 39.0, 38.0, 49.0, 43.0, 72.0, 75.0, 82.0, 68.0, 71.0, 66.0, 55.0, 48.0, 32.0, 31.0, 15.0, 22.0, 16.0, 8.0, 8.0, 9.0, 8.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.24725341796875, -4.0804443359375, -3.91363525390625, -3.746826171875, -3.58001708984375, -3.4132080078125, -3.24639892578125, -3.07958984375, -2.91278076171875, -2.7459716796875, -2.57916259765625, -2.412353515625, -2.24554443359375, -2.0787353515625, -1.91192626953125, -1.7451171875, -1.57830810546875, -1.4114990234375, -1.24468994140625, -1.077880859375, -0.91107177734375, -0.7442626953125, -0.57745361328125, -0.41064453125, -0.24383544921875, -0.0770263671875, 0.08978271484375, 0.256591796875, 0.42340087890625, 0.5902099609375, 0.75701904296875, 0.923828125, 1.09063720703125, 1.2574462890625, 1.42425537109375, 1.591064453125, 1.75787353515625, 1.9246826171875, 2.09149169921875, 2.25830078125, 2.42510986328125, 2.5919189453125, 2.75872802734375, 2.925537109375, 3.09234619140625, 3.2591552734375, 3.42596435546875, 3.5927734375, 3.75958251953125, 3.9263916015625, 4.09320068359375, 4.260009765625, 4.42681884765625, 4.5936279296875, 4.76043701171875, 4.92724609375, 5.09405517578125, 5.2608642578125, 5.42767333984375, 5.594482421875, 5.76129150390625, 5.9281005859375, 6.09490966796875, 6.26171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 12.0, 15.0, 13.0, 34.0, 54.0, 113.0, 203.0, 228.0, 143.0, 65.0, 48.0, 22.0, 16.0, 6.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.15704345703125, -149.9176025390625, -146.67816162109375, -143.438720703125, -140.19927978515625, -136.9598388671875, -133.7203826904297, -130.48094177246094, -127.24150085449219, -124.00205993652344, -120.76261901855469, -117.5231704711914, -114.28372955322266, -111.0442886352539, -107.80484771728516, -104.56539916992188, -101.32595825195312, -98.08651733398438, -94.84707641601562, -91.60762786865234, -88.3681869506836, -85.12874603271484, -81.8893051147461, -78.64985656738281, -75.4104232788086, -72.17098236083984, -68.9315414428711, -65.69209289550781, -62.45265197753906, -59.21321105957031, -55.97377014160156, -52.73432540893555, -49.4948844909668, -46.25544357299805, -43.01599884033203, -39.77655792236328, -36.537113189697266, -33.297672271728516, -30.058229446411133, -26.81878662109375, -23.579343795776367, -20.339900970458984, -17.1004581451416, -13.861016273498535, -10.621573448181152, -7.382131576538086, -4.142688751220703, -0.9032459259033203, 2.3361968994140625, 5.575639724731445, 8.815082550048828, 12.054524421691895, 15.293967247009277, 18.533409118652344, 21.772851943969727, 25.01229476928711, 28.251737594604492, 31.491180419921875, 34.730621337890625, 37.97006607055664, 41.20950698852539, 44.448951721191406, 47.688392639160156, 50.927833557128906, 54.16727828979492]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 10.0, 8.0, 13.0, 43.0, 86.0, 90.0, 128.0, 167.0, 136.0, 109.0, 67.0, 44.0, 27.0, 17.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-193.52972412109375, -188.77713012695312, -184.0245361328125, -179.27194213867188, -174.51934814453125, -169.76675415039062, -165.01416015625, -160.26156616210938, -155.50897216796875, -150.75637817382812, -146.0037841796875, -141.25119018554688, -136.49859619140625, -131.74600219726562, -126.99340057373047, -122.24080657958984, -117.48820495605469, -112.73561096191406, -107.98301696777344, -103.23042297363281, -98.47782897949219, -93.72523498535156, -88.9726333618164, -84.22003936767578, -79.46744537353516, -74.71485137939453, -69.9622573852539, -65.20966339111328, -60.45706558227539, -55.704471588134766, -50.951873779296875, -46.19927978515625, -41.446693420410156, -36.69409942626953, -31.941503524780273, -27.188907623291016, -22.43631362915039, -17.683719635009766, -12.931123733520508, -8.17852783203125, -3.425933837890625, 1.3266611099243164, 6.079256057739258, 10.8318510055542, 15.58444595336914, 20.337039947509766, 25.089635848999023, 29.84223175048828, 34.594825744628906, 39.34741973876953, 44.100013732910156, 48.85261154174805, 53.60520553588867, 58.3577995300293, 63.11039733886719, 67.86299133300781, 72.61558532714844, 77.36817932128906, 82.12077331542969, 86.87336730957031, 91.62596130371094, 96.37855529785156, 101.13115692138672, 105.88375091552734, 110.63634490966797]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 2.0, 7.0, 3.0, 9.0, 13.0, 18.0, 28.0, 35.0, 49.0, 70.0, 115.0, 172.0, 363.0, 758.0, 1585.0, 3460.0, 7893.0, 19224.0, 56255.0, 227910.0, 3425098.0, 337482.0, 72969.0, 24202.0, 9249.0, 3960.0, 1755.0, 797.0, 381.0, 180.0, 101.0, 56.0, 34.0, 10.0, 14.0, 10.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.625, -42.5234375, -41.421875, -40.3203125, -39.21875, -38.1171875, -37.015625, -35.9140625, -34.8125, -33.7109375, -32.609375, -31.5078125, -30.40625, -29.3046875, -28.203125, -27.1015625, -26.0, -24.8984375, -23.796875, -22.6953125, -21.59375, -20.4921875, -19.390625, -18.2890625, -17.1875, -16.0859375, -14.984375, -13.8828125, -12.78125, -11.6796875, -10.578125, -9.4765625, -8.375, -7.2734375, -6.171875, -5.0703125, -3.96875, -2.8671875, -1.765625, -0.6640625, 0.4375, 1.5390625, 2.640625, 3.7421875, 4.84375, 5.9453125, 7.046875, 8.1484375, 9.25, 10.3515625, 11.453125, 12.5546875, 13.65625, 14.7578125, 15.859375, 16.9609375, 18.0625, 19.1640625, 20.265625, 21.3671875, 22.46875, 23.5703125, 24.671875, 25.7734375, 26.875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 9.0, 15.0, 18.0, 23.0, 30.0, 30.0, 37.0, 56.0, 74.0, 80.0, 74.0, 67.0, 67.0, 69.0, 68.0, 54.0, 55.0, 36.0, 35.0, 21.0, 14.0, 19.0, 6.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.708984375, -2.6436767578125, -2.578369140625, -2.5130615234375, -2.44775390625, -2.3824462890625, -2.317138671875, -2.2518310546875, -2.1865234375, -2.1212158203125, -2.055908203125, -1.9906005859375, -1.92529296875, -1.8599853515625, -1.794677734375, -1.7293701171875, -1.6640625, -1.5987548828125, -1.533447265625, -1.4681396484375, -1.40283203125, -1.3375244140625, -1.272216796875, -1.2069091796875, -1.1416015625, -1.0762939453125, -1.010986328125, -0.9456787109375, -0.88037109375, -0.8150634765625, -0.749755859375, -0.6844482421875, -0.619140625, -0.5538330078125, -0.488525390625, -0.4232177734375, -0.35791015625, -0.2926025390625, -0.227294921875, -0.1619873046875, -0.0966796875, -0.0313720703125, 0.033935546875, 0.0992431640625, 0.16455078125, 0.2298583984375, 0.295166015625, 0.3604736328125, 0.42578125, 0.4910888671875, 0.556396484375, 0.6217041015625, 0.68701171875, 0.7523193359375, 0.817626953125, 0.8829345703125, 0.9482421875, 1.0135498046875, 1.078857421875, 1.1441650390625, 1.20947265625, 1.2747802734375, 1.340087890625, 1.4053955078125, 1.470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 13.0, 17.0, 28.0, 54.0, 51.0, 80.0, 144.0, 193.0, 338.0, 506.0, 852.0, 1231.0, 2178.0, 3849.0, 7004.0, 14045.0, 29196.0, 67946.0, 186606.0, 732713.0, 2670402.0, 298521.0, 99016.0, 40082.0, 18553.0, 9098.0, 4830.0, 2529.0, 1564.0, 977.0, 607.0, 350.0, 259.0, 151.0, 81.0, 64.0, 49.0, 25.0, 21.0, 17.0, 12.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.6875, -20.044921875, -19.40234375, -18.759765625, -18.1171875, -17.474609375, -16.83203125, -16.189453125, -15.546875, -14.904296875, -14.26171875, -13.619140625, -12.9765625, -12.333984375, -11.69140625, -11.048828125, -10.40625, -9.763671875, -9.12109375, -8.478515625, -7.8359375, -7.193359375, -6.55078125, -5.908203125, -5.265625, -4.623046875, -3.98046875, -3.337890625, -2.6953125, -2.052734375, -1.41015625, -0.767578125, -0.125, 0.517578125, 1.16015625, 1.802734375, 2.4453125, 3.087890625, 3.73046875, 4.373046875, 5.015625, 5.658203125, 6.30078125, 6.943359375, 7.5859375, 8.228515625, 8.87109375, 9.513671875, 10.15625, 10.798828125, 11.44140625, 12.083984375, 12.7265625, 13.369140625, 14.01171875, 14.654296875, 15.296875, 15.939453125, 16.58203125, 17.224609375, 17.8671875, 18.509765625, 19.15234375, 19.794921875, 20.4375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 15.0, 11.0, 14.0, 16.0, 24.0, 34.0, 28.0, 54.0, 60.0, 78.0, 126.0, 175.0, 286.0, 1156.0, 1001.0, 279.0, 206.0, 113.0, 86.0, 59.0, 54.0, 43.0, 32.0, 35.0, 24.0, 16.0, 3.0, 9.0, 3.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.68609619140625, -4.5440673828125, -4.40203857421875, -4.260009765625, -4.11798095703125, -3.9759521484375, -3.83392333984375, -3.69189453125, -3.54986572265625, -3.4078369140625, -3.26580810546875, -3.123779296875, -2.98175048828125, -2.8397216796875, -2.69769287109375, -2.5556640625, -2.41363525390625, -2.2716064453125, -2.12957763671875, -1.987548828125, -1.84552001953125, -1.7034912109375, -1.56146240234375, -1.41943359375, -1.27740478515625, -1.1353759765625, -0.99334716796875, -0.851318359375, -0.70928955078125, -0.5672607421875, -0.42523193359375, -0.283203125, -0.14117431640625, 0.0008544921875, 0.14288330078125, 0.284912109375, 0.42694091796875, 0.5689697265625, 0.71099853515625, 0.85302734375, 0.99505615234375, 1.1370849609375, 1.27911376953125, 1.421142578125, 1.56317138671875, 1.7052001953125, 1.84722900390625, 1.9892578125, 2.13128662109375, 2.2733154296875, 2.41534423828125, 2.557373046875, 2.69940185546875, 2.8414306640625, 2.98345947265625, 3.12548828125, 3.26751708984375, 3.4095458984375, 3.55157470703125, 3.693603515625, 3.83563232421875, 3.9776611328125, 4.11968994140625, 4.26171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 16.0, 37.0, 125.0, 273.0, 250.0, 169.0, 67.0, 33.0, 12.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.41628646850586, -23.110261917114258, -20.804237365722656, -18.498210906982422, -16.192188262939453, -13.886162757873535, -11.580137252807617, -9.274112701416016, -6.968088150024414, -4.6620635986328125, -2.3560385704040527, -0.05001354217529297, 2.2560110092163086, 4.56203556060791, 6.868061065673828, 9.17408561706543, 11.480110168457031, 13.786134719848633, 16.092159271240234, 18.39818572998047, 20.704208374023438, 23.010234832763672, 25.316259384155273, 27.622283935546875, 29.928308486938477, 32.23433303833008, 34.54035949707031, 36.84638214111328, 39.152408599853516, 41.458431243896484, 43.76445770263672, 46.07048034667969, 48.376502990722656, 50.68252944946289, 52.98855209350586, 55.294578552246094, 57.60060119628906, 59.9066276550293, 62.21265411376953, 64.5186767578125, 66.82469940185547, 69.13072204589844, 71.43675231933594, 73.7427749633789, 76.04879760742188, 78.35482025146484, 80.66085052490234, 82.96687316894531, 85.27290344238281, 87.57892608642578, 89.88495635986328, 92.19097900390625, 94.49700164794922, 96.80302429199219, 99.10905456542969, 101.41507720947266, 103.72109985351562, 106.0271224975586, 108.3331527709961, 110.63917541503906, 112.94519805908203, 115.251220703125, 117.5572509765625, 119.86327362060547, 122.16929626464844]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 11.0, 6.0, 7.0, 11.0, 20.0, 10.0, 25.0, 20.0, 27.0, 27.0, 27.0, 43.0, 28.0, 41.0, 46.0, 55.0, 52.0, 57.0, 44.0, 44.0, 51.0, 54.0, 51.0, 30.0, 34.0, 33.0, 34.0, 25.0, 13.0, 14.0, 12.0, 14.0, 8.0, 2.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.712379455566406, -21.021015167236328, -20.329652786254883, -19.638288497924805, -18.94692611694336, -18.25556182861328, -17.564197540283203, -16.872833251953125, -16.18147087097168, -15.490107536315918, -14.798744201660156, -14.107379913330078, -13.416016578674316, -12.724653244018555, -12.033288955688477, -11.341925621032715, -10.650562286376953, -9.959198951721191, -9.26783561706543, -8.576471328735352, -7.88510799407959, -7.193744659423828, -6.502380847930908, -5.811017036437988, -5.119653701782227, -4.428290367126465, -3.736926555633545, -3.045562982559204, -2.3541994094848633, -1.6628358364105225, -0.9714722633361816, -0.2801084518432617, 0.4112548828125, 1.1026184558868408, 1.7939820289611816, 2.4853456020355225, 3.1767091751098633, 3.868072748184204, 4.559436321258545, 5.250800132751465, 5.942163467407227, 6.633526802062988, 7.324890613555908, 8.016254425048828, 8.70761775970459, 9.398981094360352, 10.09034538269043, 10.781708717346191, 11.473072052001953, 12.164435386657715, 12.855798721313477, 13.547163009643555, 14.238526344299316, 14.929889678955078, 15.621253967285156, 16.312618255615234, 17.00398063659668, 17.695344924926758, 18.386707305908203, 19.07807159423828, 19.76943588256836, 20.460798263549805, 21.152162551879883, 21.843524932861328, 22.534889221191406]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 6.0, 16.0, 26.0, 27.0, 38.0, 72.0, 120.0, 179.0, 290.0, 400.0, 605.0, 992.0, 1531.0, 2453.0, 4067.0, 7288.0, 14040.0, 30030.0, 76133.0, 286752.0, 441064.0, 105337.0, 38389.0, 17233.0, 8677.0, 4931.0, 2865.0, 1729.0, 1162.0, 737.0, 464.0, 328.0, 182.0, 135.0, 82.0, 60.0, 28.0, 20.0, 15.0, 11.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0], "bins": [-23.25, -22.6405029296875, -22.031005859375, -21.4215087890625, -20.81201171875, -20.2025146484375, -19.593017578125, -18.9835205078125, -18.3740234375, -17.7645263671875, -17.155029296875, -16.5455322265625, -15.93603515625, -15.3265380859375, -14.717041015625, -14.1075439453125, -13.498046875, -12.8885498046875, -12.279052734375, -11.6695556640625, -11.06005859375, -10.4505615234375, -9.841064453125, -9.2315673828125, -8.6220703125, -8.0125732421875, -7.403076171875, -6.7935791015625, -6.18408203125, -5.5745849609375, -4.965087890625, -4.3555908203125, -3.74609375, -3.1365966796875, -2.527099609375, -1.9176025390625, -1.30810546875, -0.6986083984375, -0.089111328125, 0.5203857421875, 1.1298828125, 1.7393798828125, 2.348876953125, 2.9583740234375, 3.56787109375, 4.1773681640625, 4.786865234375, 5.3963623046875, 6.005859375, 6.6153564453125, 7.224853515625, 7.8343505859375, 8.44384765625, 9.0533447265625, 9.662841796875, 10.2723388671875, 10.8818359375, 11.4913330078125, 12.100830078125, 12.7103271484375, 13.31982421875, 13.9293212890625, 14.538818359375, 15.1483154296875, 15.7578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 3.0, 5.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 10.0, 21.0, 20.0, 15.0, 16.0, 27.0, 23.0, 34.0, 39.0, 38.0, 47.0, 48.0, 49.0, 53.0, 46.0, 35.0, 37.0, 43.0, 37.0, 46.0, 37.0, 25.0, 30.0, 32.0, 23.0, 14.0, 19.0, 11.0, 6.0, 13.0, 7.0, 13.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.296875, -1.254852294921875, -1.21282958984375, -1.170806884765625, -1.1287841796875, -1.086761474609375, -1.04473876953125, -1.002716064453125, -0.960693359375, -0.918670654296875, -0.87664794921875, -0.834625244140625, -0.7926025390625, -0.750579833984375, -0.70855712890625, -0.666534423828125, -0.62451171875, -0.582489013671875, -0.54046630859375, -0.498443603515625, -0.4564208984375, -0.414398193359375, -0.37237548828125, -0.330352783203125, -0.288330078125, -0.246307373046875, -0.20428466796875, -0.162261962890625, -0.1202392578125, -0.078216552734375, -0.03619384765625, 0.005828857421875, 0.0478515625, 0.089874267578125, 0.13189697265625, 0.173919677734375, 0.2159423828125, 0.257965087890625, 0.29998779296875, 0.342010498046875, 0.384033203125, 0.426055908203125, 0.46807861328125, 0.510101318359375, 0.5521240234375, 0.594146728515625, 0.63616943359375, 0.678192138671875, 0.72021484375, 0.762237548828125, 0.80426025390625, 0.846282958984375, 0.8883056640625, 0.930328369140625, 0.97235107421875, 1.014373779296875, 1.056396484375, 1.098419189453125, 1.14044189453125, 1.182464599609375, 1.2244873046875, 1.266510009765625, 1.30853271484375, 1.350555419921875, 1.392578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 6.0, 1.0, 4.0, 5.0, 1.0, 12.0, 9.0, 9.0, 13.0, 16.0, 94.0, 523.0, 16315.0, 1022282.0, 8688.0, 396.0, 74.0, 25.0, 15.0, 10.0, 15.0, 4.0, 6.0, 5.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.3125, -101.6083984375, -97.904296875, -94.2001953125, -90.49609375, -86.7919921875, -83.087890625, -79.3837890625, -75.6796875, -71.9755859375, -68.271484375, -64.5673828125, -60.86328125, -57.1591796875, -53.455078125, -49.7509765625, -46.046875, -42.3427734375, -38.638671875, -34.9345703125, -31.23046875, -27.5263671875, -23.822265625, -20.1181640625, -16.4140625, -12.7099609375, -9.005859375, -5.3017578125, -1.59765625, 2.1064453125, 5.810546875, 9.5146484375, 13.21875, 16.9228515625, 20.626953125, 24.3310546875, 28.03515625, 31.7392578125, 35.443359375, 39.1474609375, 42.8515625, 46.5556640625, 50.259765625, 53.9638671875, 57.66796875, 61.3720703125, 65.076171875, 68.7802734375, 72.484375, 76.1884765625, 79.892578125, 83.5966796875, 87.30078125, 91.0048828125, 94.708984375, 98.4130859375, 102.1171875, 105.8212890625, 109.525390625, 113.2294921875, 116.93359375, 120.6376953125, 124.341796875, 128.0458984375, 131.75]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 10.0, 10.0, 18.0, 16.0, 22.0, 15.0, 26.0, 26.0, 32.0, 43.0, 32.0, 42.0, 49.0, 47.0, 48.0, 53.0, 51.0, 42.0, 60.0, 36.0, 35.0, 43.0, 32.0, 29.0, 26.0, 28.0, 18.0, 17.0, 18.0, 10.0, 14.0, 3.0, 6.0, 1.0, 5.0, 3.0, 1.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.84375, -6.606689453125, -6.36962890625, -6.132568359375, -5.8955078125, -5.658447265625, -5.42138671875, -5.184326171875, -4.947265625, -4.710205078125, -4.47314453125, -4.236083984375, -3.9990234375, -3.761962890625, -3.52490234375, -3.287841796875, -3.05078125, -2.813720703125, -2.57666015625, -2.339599609375, -2.1025390625, -1.865478515625, -1.62841796875, -1.391357421875, -1.154296875, -0.917236328125, -0.68017578125, -0.443115234375, -0.2060546875, 0.031005859375, 0.26806640625, 0.505126953125, 0.7421875, 0.979248046875, 1.21630859375, 1.453369140625, 1.6904296875, 1.927490234375, 2.16455078125, 2.401611328125, 2.638671875, 2.875732421875, 3.11279296875, 3.349853515625, 3.5869140625, 3.823974609375, 4.06103515625, 4.298095703125, 4.53515625, 4.772216796875, 5.00927734375, 5.246337890625, 5.4833984375, 5.720458984375, 5.95751953125, 6.194580078125, 6.431640625, 6.668701171875, 6.90576171875, 7.142822265625, 7.3798828125, 7.616943359375, 7.85400390625, 8.091064453125, 8.328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 8.0, 14.0, 10.0, 22.0, 51.0, 236.0, 4229.0, 1040773.0, 2883.0, 200.0, 43.0, 14.0, 15.0, 7.0, 14.0, 3.0, 4.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.375, -170.583984375, -164.79296875, -159.001953125, -153.2109375, -147.419921875, -141.62890625, -135.837890625, -130.046875, -124.255859375, -118.46484375, -112.673828125, -106.8828125, -101.091796875, -95.30078125, -89.509765625, -83.71875, -77.927734375, -72.13671875, -66.345703125, -60.5546875, -54.763671875, -48.97265625, -43.181640625, -37.390625, -31.599609375, -25.80859375, -20.017578125, -14.2265625, -8.435546875, -2.64453125, 3.146484375, 8.9375, 14.728515625, 20.51953125, 26.310546875, 32.1015625, 37.892578125, 43.68359375, 49.474609375, 55.265625, 61.056640625, 66.84765625, 72.638671875, 78.4296875, 84.220703125, 90.01171875, 95.802734375, 101.59375, 107.384765625, 113.17578125, 118.966796875, 124.7578125, 130.548828125, 136.33984375, 142.130859375, 147.921875, 153.712890625, 159.50390625, 165.294921875, 171.0859375, 176.876953125, 182.66796875, 188.458984375, 194.25]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 10.0, 12.0, 16.0, 13.0, 26.0, 38.0, 61.0, 77.0, 124.0, 169.0, 122.0, 99.0, 75.0, 54.0, 34.0, 12.0, 7.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007829666137695312, -0.0007590055465698242, -0.0007350444793701172, -0.0007110834121704102, -0.0006871223449707031, -0.0006631612777709961, -0.0006392002105712891, -0.000615239143371582, -0.000591278076171875, -0.000567317008972168, -0.0005433559417724609, -0.0005193948745727539, -0.0004954338073730469, -0.00047147274017333984, -0.0004475116729736328, -0.0004235506057739258, -0.00039958953857421875, -0.0003756284713745117, -0.0003516674041748047, -0.00032770633697509766, -0.0003037452697753906, -0.0002797842025756836, -0.00025582313537597656, -0.00023186206817626953, -0.0002079010009765625, -0.00018393993377685547, -0.00015997886657714844, -0.0001360177993774414, -0.00011205673217773438, -8.809566497802734e-05, -6.413459777832031e-05, -4.017353057861328e-05, -1.621246337890625e-05, 7.748603820800781e-06, 3.170967102050781e-05, 5.5670738220214844e-05, 7.963180541992188e-05, 0.0001035928726196289, 0.00012755393981933594, 0.00015151500701904297, 0.00017547607421875, 0.00019943714141845703, 0.00022339820861816406, 0.0002473592758178711, 0.0002713203430175781, 0.00029528141021728516, 0.0003192424774169922, 0.0003432035446166992, 0.00036716461181640625, 0.0003911256790161133, 0.0004150867462158203, 0.00043904781341552734, 0.0004630088806152344, 0.0004869699478149414, 0.0005109310150146484, 0.0005348920822143555, 0.0005588531494140625, 0.0005828142166137695, 0.0006067752838134766, 0.0006307363510131836, 0.0006546974182128906, 0.0006786584854125977, 0.0007026195526123047, 0.0007265806198120117, 0.0007505416870117188]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 18.0, 6.0, 14.0, 27.0, 42.0, 54.0, 94.0, 117.0, 159.0, 240.0, 372.0, 540.0, 909.0, 1358.0, 2384.0, 4282.0, 8294.0, 20655.0, 87557.0, 688707.0, 179668.0, 30434.0, 10604.0, 5017.0, 2764.0, 1551.0, 931.0, 615.0, 356.0, 242.0, 167.0, 107.0, 77.0, 66.0, 35.0, 21.0, 14.0, 18.0, 5.0, 8.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-27.21875, -26.41015625, -25.6015625, -24.79296875, -23.984375, -23.17578125, -22.3671875, -21.55859375, -20.75, -19.94140625, -19.1328125, -18.32421875, -17.515625, -16.70703125, -15.8984375, -15.08984375, -14.28125, -13.47265625, -12.6640625, -11.85546875, -11.046875, -10.23828125, -9.4296875, -8.62109375, -7.8125, -7.00390625, -6.1953125, -5.38671875, -4.578125, -3.76953125, -2.9609375, -2.15234375, -1.34375, -0.53515625, 0.2734375, 1.08203125, 1.890625, 2.69921875, 3.5078125, 4.31640625, 5.125, 5.93359375, 6.7421875, 7.55078125, 8.359375, 9.16796875, 9.9765625, 10.78515625, 11.59375, 12.40234375, 13.2109375, 14.01953125, 14.828125, 15.63671875, 16.4453125, 17.25390625, 18.0625, 18.87109375, 19.6796875, 20.48828125, 21.296875, 22.10546875, 22.9140625, 23.72265625, 24.53125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 6.0, 6.0, 9.0, 5.0, 17.0, 16.0, 21.0, 48.0, 46.0, 89.0, 119.0, 237.0, 119.0, 92.0, 48.0, 38.0, 16.0, 21.0, 13.0, 5.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.578125, -17.0819091796875, -16.585693359375, -16.0894775390625, -15.59326171875, -15.0970458984375, -14.600830078125, -14.1046142578125, -13.6083984375, -13.1121826171875, -12.615966796875, -12.1197509765625, -11.62353515625, -11.1273193359375, -10.631103515625, -10.1348876953125, -9.638671875, -9.1424560546875, -8.646240234375, -8.1500244140625, -7.65380859375, -7.1575927734375, -6.661376953125, -6.1651611328125, -5.6689453125, -5.1727294921875, -4.676513671875, -4.1802978515625, -3.68408203125, -3.1878662109375, -2.691650390625, -2.1954345703125, -1.69921875, -1.2030029296875, -0.706787109375, -0.2105712890625, 0.28564453125, 0.7818603515625, 1.278076171875, 1.7742919921875, 2.2705078125, 2.7667236328125, 3.262939453125, 3.7591552734375, 4.25537109375, 4.7515869140625, 5.247802734375, 5.7440185546875, 6.240234375, 6.7364501953125, 7.232666015625, 7.7288818359375, 8.22509765625, 8.7213134765625, 9.217529296875, 9.7137451171875, 10.2099609375, 10.7061767578125, 11.202392578125, 11.6986083984375, 12.19482421875, 12.6910400390625, 13.187255859375, 13.6834716796875, 14.1796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 11.0, 10.0, 16.0, 25.0, 48.0, 59.0, 73.0, 109.0, 123.0, 130.0, 116.0, 78.0, 74.0, 39.0, 26.0, 18.0, 13.0, 13.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.41889953613281, -85.94677734375, -83.47464752197266, -81.00252532958984, -78.53040313720703, -76.05827331542969, -73.58615112304688, -71.11402893066406, -68.64190673828125, -66.16978454589844, -63.69765853881836, -61.22553253173828, -58.75341033935547, -56.28128433227539, -53.80915832519531, -51.3370361328125, -48.864906311035156, -46.39278030395508, -43.920658111572266, -41.44853210449219, -38.976409912109375, -36.5042839050293, -34.03215789794922, -31.560033798217773, -29.087909698486328, -26.615785598754883, -24.143661499023438, -21.67153549194336, -19.199411392211914, -16.72728729248047, -14.255162239074707, -11.783037185668945, -9.3109130859375, -6.8387885093688965, -4.366663932800293, -1.8945393562316895, 0.5775852203369141, 3.0497093200683594, 5.521834373474121, 7.993959426879883, 10.466083526611328, 12.938207626342773, 15.410332679748535, 17.882457733154297, 20.354581832885742, 22.826705932617188, 25.298831939697266, 27.77095603942871, 30.243080139160156, 32.715206146240234, 35.18732833862305, 37.659454345703125, 40.13157653808594, 42.603702545166016, 45.075828552246094, 47.547950744628906, 50.020076751708984, 52.49220275878906, 54.964324951171875, 57.43645095825195, 59.90857696533203, 62.380699157714844, 64.85282135009766, 67.324951171875, 69.79707336425781]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 6.0, 9.0, 5.0, 16.0, 14.0, 20.0, 21.0, 24.0, 27.0, 40.0, 44.0, 34.0, 57.0, 60.0, 57.0, 46.0, 56.0, 63.0, 48.0, 61.0, 39.0, 40.0, 34.0, 28.0, 25.0, 23.0, 16.0, 14.0, 9.0, 14.0, 3.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.00212097167969, -47.37638473510742, -45.750648498535156, -44.124916076660156, -42.49917984008789, -40.873443603515625, -39.24770736694336, -37.621971130371094, -35.996238708496094, -34.37050247192383, -32.74476623535156, -31.11903190612793, -29.493297576904297, -27.86756134033203, -26.241825103759766, -24.616090774536133, -22.990354537963867, -21.3646183013916, -19.73888397216797, -18.113147735595703, -16.48741340637207, -14.861677169799805, -13.235941886901855, -11.610206604003906, -9.984471321105957, -8.358736038208008, -6.733000755310059, -5.107264995574951, -3.481529712677002, -1.8557939529418945, -0.2300586700439453, 1.395676612854004, 3.021411895751953, 4.647147178649902, 6.272882461547852, 7.898618221282959, 9.52435302734375, 11.150089263916016, 12.775824546813965, 14.401559829711914, 16.027294158935547, 17.653030395507812, 19.278764724731445, 20.90450096130371, 22.530235290527344, 24.15597152709961, 25.781707763671875, 27.407442092895508, 29.033178329467773, 30.65891456604004, 32.28464889526367, 33.91038513183594, 35.5361213684082, 37.16185760498047, 38.78759002685547, 40.413326263427734, 42.0390625, 43.664798736572266, 45.29053497314453, 46.91626739501953, 48.5420036315918, 50.16773986816406, 51.79347610473633, 53.419212341308594, 55.044944763183594]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 15.0, 16.0, 29.0, 33.0, 58.0, 96.0, 158.0, 182.0, 298.0, 486.0, 728.0, 1147.0, 1939.0, 3298.0, 5962.0, 11832.0, 27691.0, 85336.0, 1535081.0, 2377271.0, 87939.0, 28811.0, 12182.0, 5869.0, 3117.0, 1798.0, 1067.0, 669.0, 416.0, 215.0, 179.0, 111.0, 68.0, 63.0, 36.0, 19.0, 15.0, 10.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-44.15625, -42.962890625, -41.76953125, -40.576171875, -39.3828125, -38.189453125, -36.99609375, -35.802734375, -34.609375, -33.416015625, -32.22265625, -31.029296875, -29.8359375, -28.642578125, -27.44921875, -26.255859375, -25.0625, -23.869140625, -22.67578125, -21.482421875, -20.2890625, -19.095703125, -17.90234375, -16.708984375, -15.515625, -14.322265625, -13.12890625, -11.935546875, -10.7421875, -9.548828125, -8.35546875, -7.162109375, -5.96875, -4.775390625, -3.58203125, -2.388671875, -1.1953125, -0.001953125, 1.19140625, 2.384765625, 3.578125, 4.771484375, 5.96484375, 7.158203125, 8.3515625, 9.544921875, 10.73828125, 11.931640625, 13.125, 14.318359375, 15.51171875, 16.705078125, 17.8984375, 19.091796875, 20.28515625, 21.478515625, 22.671875, 23.865234375, 25.05859375, 26.251953125, 27.4453125, 28.638671875, 29.83203125, 31.025390625, 32.21875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 4.0, 13.0, 11.0, 5.0, 15.0, 10.0, 16.0, 17.0, 21.0, 23.0, 18.0, 17.0, 36.0, 37.0, 38.0, 42.0, 43.0, 45.0, 35.0, 42.0, 35.0, 43.0, 38.0, 43.0, 43.0, 36.0, 39.0, 32.0, 27.0, 21.0, 20.0, 23.0, 21.0, 9.0, 11.0, 8.0, 10.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2844696044921875, -1.243743896484375, -1.2030181884765625, -1.16229248046875, -1.1215667724609375, -1.080841064453125, -1.0401153564453125, -0.9993896484375, -0.9586639404296875, -0.917938232421875, -0.8772125244140625, -0.83648681640625, -0.7957611083984375, -0.755035400390625, -0.7143096923828125, -0.673583984375, -0.6328582763671875, -0.592132568359375, -0.5514068603515625, -0.51068115234375, -0.4699554443359375, -0.429229736328125, -0.3885040283203125, -0.3477783203125, -0.3070526123046875, -0.266326904296875, -0.2256011962890625, -0.18487548828125, -0.1441497802734375, -0.103424072265625, -0.0626983642578125, -0.02197265625, 0.0187530517578125, 0.059478759765625, 0.1002044677734375, 0.14093017578125, 0.1816558837890625, 0.222381591796875, 0.2631072998046875, 0.3038330078125, 0.3445587158203125, 0.385284423828125, 0.4260101318359375, 0.46673583984375, 0.5074615478515625, 0.548187255859375, 0.5889129638671875, 0.629638671875, 0.6703643798828125, 0.711090087890625, 0.7518157958984375, 0.79254150390625, 0.8332672119140625, 0.873992919921875, 0.9147186279296875, 0.9554443359375, 0.9961700439453125, 1.036895751953125, 1.0776214599609375, 1.11834716796875, 1.1590728759765625, 1.199798583984375, 1.2405242919921875, 1.28125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 2.0, 8.0, 12.0, 16.0, 24.0, 31.0, 34.0, 56.0, 106.0, 267.0, 1297.0, 17173.0, 3504416.0, 658125.0, 11186.0, 996.0, 234.0, 95.0, 42.0, 34.0, 32.0, 27.0, 11.0, 11.0, 9.0, 10.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-94.875, -90.91015625, -86.9453125, -82.98046875, -79.015625, -75.05078125, -71.0859375, -67.12109375, -63.15625, -59.19140625, -55.2265625, -51.26171875, -47.296875, -43.33203125, -39.3671875, -35.40234375, -31.4375, -27.47265625, -23.5078125, -19.54296875, -15.578125, -11.61328125, -7.6484375, -3.68359375, 0.28125, 4.24609375, 8.2109375, 12.17578125, 16.140625, 20.10546875, 24.0703125, 28.03515625, 32.0, 35.96484375, 39.9296875, 43.89453125, 47.859375, 51.82421875, 55.7890625, 59.75390625, 63.71875, 67.68359375, 71.6484375, 75.61328125, 79.578125, 83.54296875, 87.5078125, 91.47265625, 95.4375, 99.40234375, 103.3671875, 107.33203125, 111.296875, 115.26171875, 119.2265625, 123.19140625, 127.15625, 131.12109375, 135.0859375, 139.05078125, 143.015625, 146.98046875, 150.9453125, 154.91015625, 158.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 12.0, 10.0, 10.0, 11.0, 16.0, 36.0, 22.0, 29.0, 50.0, 59.0, 95.0, 133.0, 171.0, 365.0, 1962.0, 398.0, 203.0, 140.0, 95.0, 46.0, 49.0, 34.0, 21.0, 16.0, 12.0, 24.0, 8.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.41015625, -5.2579345703125, -5.105712890625, -4.9534912109375, -4.80126953125, -4.6490478515625, -4.496826171875, -4.3446044921875, -4.1923828125, -4.0401611328125, -3.887939453125, -3.7357177734375, -3.58349609375, -3.4312744140625, -3.279052734375, -3.1268310546875, -2.974609375, -2.8223876953125, -2.670166015625, -2.5179443359375, -2.36572265625, -2.2135009765625, -2.061279296875, -1.9090576171875, -1.7568359375, -1.6046142578125, -1.452392578125, -1.3001708984375, -1.14794921875, -0.9957275390625, -0.843505859375, -0.6912841796875, -0.5390625, -0.3868408203125, -0.234619140625, -0.0823974609375, 0.06982421875, 0.2220458984375, 0.374267578125, 0.5264892578125, 0.6787109375, 0.8309326171875, 0.983154296875, 1.1353759765625, 1.28759765625, 1.4398193359375, 1.592041015625, 1.7442626953125, 1.896484375, 2.0487060546875, 2.200927734375, 2.3531494140625, 2.50537109375, 2.6575927734375, 2.809814453125, 2.9620361328125, 3.1142578125, 3.2664794921875, 3.418701171875, 3.5709228515625, 3.72314453125, 3.8753662109375, 4.027587890625, 4.1798095703125, 4.33203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 8.0, 14.0, 31.0, 47.0, 111.0, 184.0, 215.0, 187.0, 110.0, 45.0, 26.0, 16.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.04010009765625, -37.99589920043945, -35.951698303222656, -33.907493591308594, -31.863292694091797, -29.819091796875, -27.77488899230957, -25.73068618774414, -23.686485290527344, -21.642284393310547, -19.598081588745117, -17.553878784179688, -15.50967788696289, -13.465476036071777, -11.421274185180664, -9.37707233428955, -7.3328704833984375, -5.288668632507324, -3.244466781616211, -1.2002649307250977, 0.8439369201660156, 2.888138771057129, 4.932340621948242, 6.9765424728393555, 9.020744323730469, 11.064946174621582, 13.109148025512695, 15.153349876403809, 17.197551727294922, 19.24175262451172, 21.28595542907715, 23.330158233642578, 25.374359130859375, 27.418560028076172, 29.4627628326416, 31.50696563720703, 33.55116653442383, 35.595367431640625, 37.63957214355469, 39.683773040771484, 41.72797393798828, 43.77217483520508, 45.816375732421875, 47.86058044433594, 49.904781341552734, 51.94898223876953, 53.993186950683594, 56.03738784790039, 58.08158874511719, 60.125789642333984, 62.16999053955078, 64.21419525146484, 66.25839233398438, 68.30259704589844, 70.3468017578125, 72.39099884033203, 74.4352035522461, 76.47940826416016, 78.52360534667969, 80.56781005859375, 82.61201477050781, 84.65621185302734, 86.7004165649414, 88.74461364746094, 90.788818359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 10.0, 9.0, 11.0, 17.0, 24.0, 38.0, 41.0, 44.0, 58.0, 56.0, 55.0, 67.0, 52.0, 68.0, 62.0, 50.0, 59.0, 40.0, 42.0, 37.0, 27.0, 28.0, 23.0, 15.0, 19.0, 10.0, 8.0, 1.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.928178787231445, -21.188501358032227, -20.448823928833008, -19.70914649963379, -18.96946907043457, -18.22979164123535, -17.490114212036133, -16.750436782836914, -16.010759353637695, -15.271081924438477, -14.531404495239258, -13.791727066040039, -13.05204963684082, -12.312372207641602, -11.572694778442383, -10.833017349243164, -10.093339920043945, -9.353662490844727, -8.613985061645508, -7.874307632446289, -7.13463020324707, -6.394952774047852, -5.655275344848633, -4.915597915649414, -4.175920486450195, -3.4362430572509766, -2.696565628051758, -1.956888198852539, -1.2172107696533203, -0.47753334045410156, 0.2621440887451172, 1.001821517944336, 1.7414970397949219, 2.4811744689941406, 3.2208518981933594, 3.960529327392578, 4.700206756591797, 5.439884185791016, 6.179561614990234, 6.919239044189453, 7.658916473388672, 8.39859390258789, 9.13827133178711, 9.877948760986328, 10.617626190185547, 11.357303619384766, 12.096981048583984, 12.836658477783203, 13.576335906982422, 14.31601333618164, 15.05569076538086, 15.795368194580078, 16.535045623779297, 17.274723052978516, 18.014400482177734, 18.754077911376953, 19.493755340576172, 20.23343276977539, 20.97311019897461, 21.712787628173828, 22.452465057373047, 23.192142486572266, 23.931819915771484, 24.671497344970703, 25.411174774169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 11.0, 6.0, 6.0, 11.0, 14.0, 8.0, 24.0, 22.0, 23.0, 20.0, 18.0, 37.0, 26.0, 36.0, 41.0, 63.0, 244.0, 2123.0, 22033.0, 367558.0, 608510.0, 43181.0, 3700.0, 444.0, 77.0, 35.0, 44.0, 34.0, 30.0, 31.0, 24.0, 18.0, 15.0, 13.0, 22.0, 11.0, 10.0, 3.0, 1.0, 9.0, 9.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-70.1875, -68.296875, -66.40625, -64.515625, -62.625, -60.734375, -58.84375, -56.953125, -55.0625, -53.171875, -51.28125, -49.390625, -47.5, -45.609375, -43.71875, -41.828125, -39.9375, -38.046875, -36.15625, -34.265625, -32.375, -30.484375, -28.59375, -26.703125, -24.8125, -22.921875, -21.03125, -19.140625, -17.25, -15.359375, -13.46875, -11.578125, -9.6875, -7.796875, -5.90625, -4.015625, -2.125, -0.234375, 1.65625, 3.546875, 5.4375, 7.328125, 9.21875, 11.109375, 13.0, 14.890625, 16.78125, 18.671875, 20.5625, 22.453125, 24.34375, 26.234375, 28.125, 30.015625, 31.90625, 33.796875, 35.6875, 37.578125, 39.46875, 41.359375, 43.25, 45.140625, 47.03125, 48.921875, 50.8125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 14.0, 25.0, 35.0, 69.0, 86.0, 109.0, 152.0, 146.0, 134.0, 110.0, 57.0, 34.0, 21.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.292327880859375, -1.14910888671875, -1.005889892578125, -0.8626708984375, -0.719451904296875, -0.57623291015625, -0.433013916015625, -0.289794921875, -0.146575927734375, -0.00335693359375, 0.139862060546875, 0.2830810546875, 0.426300048828125, 0.56951904296875, 0.712738037109375, 0.85595703125, 0.999176025390625, 1.14239501953125, 1.285614013671875, 1.4288330078125, 1.572052001953125, 1.71527099609375, 1.858489990234375, 2.001708984375, 2.144927978515625, 2.28814697265625, 2.431365966796875, 2.5745849609375, 2.717803955078125, 2.86102294921875, 3.004241943359375, 3.1474609375, 3.290679931640625, 3.43389892578125, 3.577117919921875, 3.7203369140625, 3.863555908203125, 4.00677490234375, 4.149993896484375, 4.293212890625, 4.436431884765625, 4.57965087890625, 4.722869873046875, 4.8660888671875, 5.009307861328125, 5.15252685546875, 5.295745849609375, 5.43896484375, 5.582183837890625, 5.72540283203125, 5.868621826171875, 6.0118408203125, 6.155059814453125, 6.29827880859375, 6.441497802734375, 6.584716796875, 6.727935791015625, 6.87115478515625, 7.014373779296875, 7.1575927734375, 7.300811767578125, 7.44403076171875, 7.587249755859375, 7.73046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 6.0, 10.0, 13.0, 12.0, 15.0, 43.0, 54.0, 60.0, 103.0, 140.0, 161.0, 262.0, 394.0, 606.0, 904.0, 1463.0, 2569.0, 4270.0, 7750.0, 14447.0, 27949.0, 55181.0, 106608.0, 187590.0, 241053.0, 181821.0, 102935.0, 53010.0, 26877.0, 13895.0, 7456.0, 4226.0, 2444.0, 1470.0, 905.0, 556.0, 382.0, 272.0, 182.0, 155.0, 80.0, 64.0, 50.0, 23.0, 34.0, 18.0, 13.0, 10.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.3203125, -13.850341796875, -13.38037109375, -12.910400390625, -12.4404296875, -11.970458984375, -11.50048828125, -11.030517578125, -10.560546875, -10.090576171875, -9.62060546875, -9.150634765625, -8.6806640625, -8.210693359375, -7.74072265625, -7.270751953125, -6.80078125, -6.330810546875, -5.86083984375, -5.390869140625, -4.9208984375, -4.450927734375, -3.98095703125, -3.510986328125, -3.041015625, -2.571044921875, -2.10107421875, -1.631103515625, -1.1611328125, -0.691162109375, -0.22119140625, 0.248779296875, 0.71875, 1.188720703125, 1.65869140625, 2.128662109375, 2.5986328125, 3.068603515625, 3.53857421875, 4.008544921875, 4.478515625, 4.948486328125, 5.41845703125, 5.888427734375, 6.3583984375, 6.828369140625, 7.29833984375, 7.768310546875, 8.23828125, 8.708251953125, 9.17822265625, 9.648193359375, 10.1181640625, 10.588134765625, 11.05810546875, 11.528076171875, 11.998046875, 12.468017578125, 12.93798828125, 13.407958984375, 13.8779296875, 14.347900390625, 14.81787109375, 15.287841796875, 15.7578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 9.0, 6.0, 11.0, 15.0, 19.0, 11.0, 14.0, 27.0, 18.0, 21.0, 28.0, 31.0, 34.0, 43.0, 44.0, 32.0, 30.0, 43.0, 45.0, 34.0, 38.0, 46.0, 29.0, 45.0, 29.0, 44.0, 28.0, 35.0, 33.0, 27.0, 24.0, 22.0, 9.0, 14.0, 7.0, 10.0, 6.0, 1.0, 6.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5089111328125, -8.205322265625, -7.9017333984375, -7.59814453125, -7.2945556640625, -6.990966796875, -6.6873779296875, -6.3837890625, -6.0802001953125, -5.776611328125, -5.4730224609375, -5.16943359375, -4.8658447265625, -4.562255859375, -4.2586669921875, -3.955078125, -3.6514892578125, -3.347900390625, -3.0443115234375, -2.74072265625, -2.4371337890625, -2.133544921875, -1.8299560546875, -1.5263671875, -1.2227783203125, -0.919189453125, -0.6156005859375, -0.31201171875, -0.0084228515625, 0.295166015625, 0.5987548828125, 0.90234375, 1.2059326171875, 1.509521484375, 1.8131103515625, 2.11669921875, 2.4202880859375, 2.723876953125, 3.0274658203125, 3.3310546875, 3.6346435546875, 3.938232421875, 4.2418212890625, 4.54541015625, 4.8489990234375, 5.152587890625, 5.4561767578125, 5.759765625, 6.0633544921875, 6.366943359375, 6.6705322265625, 6.97412109375, 7.2777099609375, 7.581298828125, 7.8848876953125, 8.1884765625, 8.4920654296875, 8.795654296875, 9.0992431640625, 9.40283203125, 9.7064208984375, 10.010009765625, 10.3135986328125, 10.6171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 17.0, 18.0, 21.0, 41.0, 42.0, 77.0, 104.0, 158.0, 255.0, 411.0, 662.0, 1251.0, 2291.0, 4532.0, 10023.0, 25797.0, 71400.0, 206698.0, 375768.0, 222574.0, 77899.0, 27547.0, 10705.0, 4753.0, 2337.0, 1217.0, 705.0, 449.0, 263.0, 171.0, 116.0, 74.0, 44.0, 36.0, 25.0, 13.0, 12.0, 9.0, 5.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0], "bins": [-15.5390625, -15.101806640625, -14.66455078125, -14.227294921875, -13.7900390625, -13.352783203125, -12.91552734375, -12.478271484375, -12.041015625, -11.603759765625, -11.16650390625, -10.729248046875, -10.2919921875, -9.854736328125, -9.41748046875, -8.980224609375, -8.54296875, -8.105712890625, -7.66845703125, -7.231201171875, -6.7939453125, -6.356689453125, -5.91943359375, -5.482177734375, -5.044921875, -4.607666015625, -4.17041015625, -3.733154296875, -3.2958984375, -2.858642578125, -2.42138671875, -1.984130859375, -1.546875, -1.109619140625, -0.67236328125, -0.235107421875, 0.2021484375, 0.639404296875, 1.07666015625, 1.513916015625, 1.951171875, 2.388427734375, 2.82568359375, 3.262939453125, 3.7001953125, 4.137451171875, 4.57470703125, 5.011962890625, 5.44921875, 5.886474609375, 6.32373046875, 6.760986328125, 7.1982421875, 7.635498046875, 8.07275390625, 8.510009765625, 8.947265625, 9.384521484375, 9.82177734375, 10.259033203125, 10.6962890625, 11.133544921875, 11.57080078125, 12.008056640625, 12.4453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 8.0, 4.0, 2.0, 5.0, 11.0, 16.0, 17.0, 28.0, 32.0, 42.0, 64.0, 80.0, 93.0, 114.0, 117.0, 102.0, 66.0, 53.0, 34.0, 37.0, 19.0, 17.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020732879638671875, -0.0019927024841308594, -0.0019121170043945312, -0.0018315315246582031, -0.001750946044921875, -0.0016703605651855469, -0.0015897750854492188, -0.0015091896057128906, -0.0014286041259765625, -0.0013480186462402344, -0.0012674331665039062, -0.0011868476867675781, -0.00110626220703125, -0.0010256767272949219, -0.0009450912475585938, -0.0008645057678222656, -0.0007839202880859375, -0.0007033348083496094, -0.0006227493286132812, -0.0005421638488769531, -0.000461578369140625, -0.0003809928894042969, -0.00030040740966796875, -0.00021982192993164062, -0.0001392364501953125, -5.8650970458984375e-05, 2.193450927734375e-05, 0.00010251998901367188, 0.00018310546875, 0.0002636909484863281, 0.00034427642822265625, 0.0004248619079589844, 0.0005054473876953125, 0.0005860328674316406, 0.0006666183471679688, 0.0007472038269042969, 0.000827789306640625, 0.0009083747863769531, 0.0009889602661132812, 0.0010695457458496094, 0.0011501312255859375, 0.0012307167053222656, 0.0013113021850585938, 0.0013918876647949219, 0.00147247314453125, 0.0015530586242675781, 0.0016336441040039062, 0.0017142295837402344, 0.0017948150634765625, 0.0018754005432128906, 0.0019559860229492188, 0.002036571502685547, 0.002117156982421875, 0.002197742462158203, 0.0022783279418945312, 0.0023589134216308594, 0.0024394989013671875, 0.0025200843811035156, 0.0026006698608398438, 0.002681255340576172, 0.0027618408203125, 0.002842426300048828, 0.0029230117797851562, 0.0030035972595214844, 0.0030841827392578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 10.0, 9.0, 14.0, 31.0, 34.0, 50.0, 67.0, 127.0, 177.0, 305.0, 484.0, 851.0, 1506.0, 2955.0, 6069.0, 14789.0, 40602.0, 134706.0, 398756.0, 306603.0, 90785.0, 28476.0, 10663.0, 4861.0, 2340.0, 1318.0, 775.0, 418.0, 245.0, 167.0, 119.0, 61.0, 54.0, 27.0, 25.0, 15.0, 19.0, 7.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.1943359375, -16.654296875, -16.1142578125, -15.57421875, -15.0341796875, -14.494140625, -13.9541015625, -13.4140625, -12.8740234375, -12.333984375, -11.7939453125, -11.25390625, -10.7138671875, -10.173828125, -9.6337890625, -9.09375, -8.5537109375, -8.013671875, -7.4736328125, -6.93359375, -6.3935546875, -5.853515625, -5.3134765625, -4.7734375, -4.2333984375, -3.693359375, -3.1533203125, -2.61328125, -2.0732421875, -1.533203125, -0.9931640625, -0.453125, 0.0869140625, 0.626953125, 1.1669921875, 1.70703125, 2.2470703125, 2.787109375, 3.3271484375, 3.8671875, 4.4072265625, 4.947265625, 5.4873046875, 6.02734375, 6.5673828125, 7.107421875, 7.6474609375, 8.1875, 8.7275390625, 9.267578125, 9.8076171875, 10.34765625, 10.8876953125, 11.427734375, 11.9677734375, 12.5078125, 13.0478515625, 13.587890625, 14.1279296875, 14.66796875, 15.2080078125, 15.748046875, 16.2880859375, 16.828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 9.0, 17.0, 18.0, 12.0, 36.0, 41.0, 45.0, 64.0, 68.0, 77.0, 67.0, 68.0, 94.0, 73.0, 46.0, 52.0, 46.0, 28.0, 26.0, 15.0, 22.0, 16.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.914306640625, -7.63330078125, -7.352294921875, -7.0712890625, -6.790283203125, -6.50927734375, -6.228271484375, -5.947265625, -5.666259765625, -5.38525390625, -5.104248046875, -4.8232421875, -4.542236328125, -4.26123046875, -3.980224609375, -3.69921875, -3.418212890625, -3.13720703125, -2.856201171875, -2.5751953125, -2.294189453125, -2.01318359375, -1.732177734375, -1.451171875, -1.170166015625, -0.88916015625, -0.608154296875, -0.3271484375, -0.046142578125, 0.23486328125, 0.515869140625, 0.796875, 1.077880859375, 1.35888671875, 1.639892578125, 1.9208984375, 2.201904296875, 2.48291015625, 2.763916015625, 3.044921875, 3.325927734375, 3.60693359375, 3.887939453125, 4.1689453125, 4.449951171875, 4.73095703125, 5.011962890625, 5.29296875, 5.573974609375, 5.85498046875, 6.135986328125, 6.4169921875, 6.697998046875, 6.97900390625, 7.260009765625, 7.541015625, 7.822021484375, 8.10302734375, 8.384033203125, 8.6650390625, 8.946044921875, 9.22705078125, 9.508056640625, 9.7890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 12.0, 33.0, 43.0, 82.0, 107.0, 153.0, 168.0, 153.0, 93.0, 62.0, 30.0, 23.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.18307495117188, -162.0477294921875, -155.91236877441406, -149.7770233154297, -143.64166259765625, -137.50631713867188, -131.3709716796875, -125.2356185913086, -119.10026550292969, -112.96491241455078, -106.82955932617188, -100.6942138671875, -94.5588607788086, -88.42350769042969, -82.28816223144531, -76.1528091430664, -70.0174560546875, -63.882102966308594, -57.74675369262695, -51.61140441894531, -45.476051330566406, -39.3406982421875, -33.20534896850586, -27.06999969482422, -20.934646606445312, -14.799295425415039, -8.663944244384766, -2.528593063354492, 3.6067581176757812, 9.742109298706055, 15.877460479736328, 22.01280975341797, 28.148178100585938, 34.283531188964844, 40.418880462646484, 46.554229736328125, 52.68958282470703, 58.82493591308594, 64.96028137207031, 71.09563446044922, 77.23098754882812, 83.36634063720703, 89.50169372558594, 95.63703918457031, 101.77239227294922, 107.90774536132812, 114.0430908203125, 120.1784439086914, 126.31379699707031, 132.4491424560547, 138.58450317382812, 144.7198486328125, 150.85519409179688, 156.9905548095703, 163.1259002685547, 169.26126098632812, 175.3966064453125, 181.53195190429688, 187.6673126220703, 193.8026580810547, 199.93801879882812, 206.0733642578125, 212.20870971679688, 218.34405517578125, 224.4794158935547]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 12.0, 17.0, 22.0, 28.0, 28.0, 42.0, 46.0, 54.0, 43.0, 50.0, 63.0, 63.0, 70.0, 47.0, 57.0, 55.0, 47.0, 46.0, 35.0, 34.0, 21.0, 26.0, 24.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.76068115234375, -89.60670471191406, -86.4527359008789, -83.29875946044922, -80.14479064941406, -76.99081420898438, -73.83683776855469, -70.68286895751953, -67.52890014648438, -64.37492370605469, -61.22095489501953, -58.066978454589844, -54.91300964355469, -51.759033203125, -48.60506057739258, -45.451087951660156, -42.29711151123047, -39.14313888549805, -35.989166259765625, -32.83518981933594, -29.68121910095215, -26.527246475219727, -23.373271942138672, -20.21929931640625, -17.065326690673828, -13.911354064941406, -10.757380485534668, -7.60340690612793, -4.449434280395508, -1.295461654663086, 1.8585128784179688, 5.012485504150391, 8.166458129882812, 11.320430755615234, 14.474404335021973, 17.62837791442871, 20.782350540161133, 23.936323165893555, 27.09029769897461, 30.24427032470703, 33.39824295043945, 36.552215576171875, 39.7061882019043, 42.86016082763672, 46.014137268066406, 49.16810607910156, 52.32208251953125, 55.47605514526367, 58.630027770996094, 61.784000396728516, 64.93797302246094, 68.09194946289062, 71.24591827392578, 74.39989471435547, 77.55386352539062, 80.70783996582031, 83.86181640625, 87.01579284667969, 90.16976165771484, 93.32373809814453, 96.47770690917969, 99.63168334960938, 102.78565979003906, 105.93962860107422, 109.09359741210938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 14.0, 28.0, 59.0, 123.0, 449.0, 3360.0, 98816.0, 4068077.0, 20883.0, 1638.0, 414.0, 152.0, 84.0, 54.0, 27.0, 29.0, 22.0, 9.0, 11.0, 6.0, 7.0, 9.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.1875, -120.2431640625, -113.298828125, -106.3544921875, -99.41015625, -92.4658203125, -85.521484375, -78.5771484375, -71.6328125, -64.6884765625, -57.744140625, -50.7998046875, -43.85546875, -36.9111328125, -29.966796875, -23.0224609375, -16.078125, -9.1337890625, -2.189453125, 4.7548828125, 11.69921875, 18.6435546875, 25.587890625, 32.5322265625, 39.4765625, 46.4208984375, 53.365234375, 60.3095703125, 67.25390625, 74.1982421875, 81.142578125, 88.0869140625, 95.03125, 101.9755859375, 108.919921875, 115.8642578125, 122.80859375, 129.7529296875, 136.697265625, 143.6416015625, 150.5859375, 157.5302734375, 164.474609375, 171.4189453125, 178.36328125, 185.3076171875, 192.251953125, 199.1962890625, 206.140625, 213.0849609375, 220.029296875, 226.9736328125, 233.91796875, 240.8623046875, 247.806640625, 254.7509765625, 261.6953125, 268.6396484375, 275.583984375, 282.5283203125, 289.47265625, 296.4169921875, 303.361328125, 310.3056640625, 317.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 15.0, 30.0, 49.0, 68.0, 101.0, 127.0, 128.0, 122.0, 109.0, 101.0, 64.0, 40.0, 18.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3828125, -3.203125, -3.0234375, -2.84375, -2.6640625, -2.484375, -2.3046875, -2.125, -1.9453125, -1.765625, -1.5859375, -1.40625, -1.2265625, -1.046875, -0.8671875, -0.6875, -0.5078125, -0.328125, -0.1484375, 0.03125, 0.2109375, 0.390625, 0.5703125, 0.75, 0.9296875, 1.109375, 1.2890625, 1.46875, 1.6484375, 1.828125, 2.0078125, 2.1875, 2.3671875, 2.546875, 2.7265625, 2.90625, 3.0859375, 3.265625, 3.4453125, 3.625, 3.8046875, 3.984375, 4.1640625, 4.34375, 4.5234375, 4.703125, 4.8828125, 5.0625, 5.2421875, 5.421875, 5.6015625, 5.78125, 5.9609375, 6.140625, 6.3203125, 6.5, 6.6796875, 6.859375, 7.0390625, 7.21875, 7.3984375, 7.578125, 7.7578125, 7.9375, 8.1171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 10.0, 4.0, 13.0, 32.0, 33.0, 56.0, 93.0, 209.0, 375.0, 593.0, 1277.0, 2629.0, 6459.0, 17289.0, 50495.0, 194083.0, 3083280.0, 672751.0, 112789.0, 32400.0, 11250.0, 4374.0, 1940.0, 900.0, 423.0, 220.0, 111.0, 62.0, 40.0, 28.0, 19.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.56689453125, -48.0087890625, -46.45068359375, -44.892578125, -43.33447265625, -41.7763671875, -40.21826171875, -38.66015625, -37.10205078125, -35.5439453125, -33.98583984375, -32.427734375, -30.86962890625, -29.3115234375, -27.75341796875, -26.1953125, -24.63720703125, -23.0791015625, -21.52099609375, -19.962890625, -18.40478515625, -16.8466796875, -15.28857421875, -13.73046875, -12.17236328125, -10.6142578125, -9.05615234375, -7.498046875, -5.93994140625, -4.3818359375, -2.82373046875, -1.265625, 0.29248046875, 1.8505859375, 3.40869140625, 4.966796875, 6.52490234375, 8.0830078125, 9.64111328125, 11.19921875, 12.75732421875, 14.3154296875, 15.87353515625, 17.431640625, 18.98974609375, 20.5478515625, 22.10595703125, 23.6640625, 25.22216796875, 26.7802734375, 28.33837890625, 29.896484375, 31.45458984375, 33.0126953125, 34.57080078125, 36.12890625, 37.68701171875, 39.2451171875, 40.80322265625, 42.361328125, 43.91943359375, 45.4775390625, 47.03564453125, 48.59375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 8.0, 9.0, 18.0, 21.0, 21.0, 32.0, 34.0, 35.0, 39.0, 60.0, 70.0, 88.0, 162.0, 310.0, 1434.0, 815.0, 263.0, 177.0, 114.0, 89.0, 55.0, 52.0, 36.0, 20.0, 17.0, 16.0, 17.0, 9.0, 7.0, 7.0, 4.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.8046875, -8.5662841796875, -8.327880859375, -8.0894775390625, -7.85107421875, -7.6126708984375, -7.374267578125, -7.1358642578125, -6.8974609375, -6.6590576171875, -6.420654296875, -6.1822509765625, -5.94384765625, -5.7054443359375, -5.467041015625, -5.2286376953125, -4.990234375, -4.7518310546875, -4.513427734375, -4.2750244140625, -4.03662109375, -3.7982177734375, -3.559814453125, -3.3214111328125, -3.0830078125, -2.8446044921875, -2.606201171875, -2.3677978515625, -2.12939453125, -1.8909912109375, -1.652587890625, -1.4141845703125, -1.17578125, -0.9373779296875, -0.698974609375, -0.4605712890625, -0.22216796875, 0.0162353515625, 0.254638671875, 0.4930419921875, 0.7314453125, 0.9698486328125, 1.208251953125, 1.4466552734375, 1.68505859375, 1.9234619140625, 2.161865234375, 2.4002685546875, 2.638671875, 2.8770751953125, 3.115478515625, 3.3538818359375, 3.59228515625, 3.8306884765625, 4.069091796875, 4.3074951171875, 4.5458984375, 4.7843017578125, 5.022705078125, 5.2611083984375, 5.49951171875, 5.7379150390625, 5.976318359375, 6.2147216796875, 6.453125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 14.0, 22.0, 44.0, 113.0, 209.0, 251.0, 178.0, 108.0, 26.0, 21.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.11924743652344, -76.93621826171875, -72.75318145751953, -68.57014465332031, -64.38711547851562, -60.20408248901367, -56.02104949951172, -51.838016510009766, -47.65498352050781, -43.47195053100586, -39.288917541503906, -35.10588455200195, -30.9228515625, -26.739818572998047, -22.556785583496094, -18.37375259399414, -14.190719604492188, -10.007686614990234, -5.824653625488281, -1.6416206359863281, 2.541412353515625, 6.724445343017578, 10.907478332519531, 15.090511322021484, 19.273544311523438, 23.45657730102539, 27.639610290527344, 31.822643280029297, 36.00567626953125, 40.1887092590332, 44.371742248535156, 48.55477523803711, 52.737823486328125, 56.92085647583008, 61.10388946533203, 65.28692626953125, 69.46995544433594, 73.65298461914062, 77.83602142333984, 82.01905822753906, 86.20208740234375, 90.38511657714844, 94.56815338134766, 98.75119018554688, 102.93421936035156, 107.11724853515625, 111.30028533935547, 115.48332214355469, 119.66635131835938, 123.84938049316406, 128.03240966796875, 132.2154541015625, 136.3984832763672, 140.58151245117188, 144.76455688476562, 148.9475860595703, 153.130615234375, 157.3136444091797, 161.49667358398438, 165.67971801757812, 169.8627471923828, 174.0457763671875, 178.22882080078125, 182.41184997558594, 186.59487915039062]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 22.0, 16.0, 11.0, 28.0, 29.0, 35.0, 39.0, 29.0, 31.0, 45.0, 39.0, 51.0, 74.0, 68.0, 63.0, 46.0, 52.0, 48.0, 39.0, 46.0, 29.0, 33.0, 30.0, 18.0, 16.0, 14.0, 4.0, 10.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.939788818359375, -51.66326904296875, -50.38675308227539, -49.110233306884766, -47.833717346191406, -46.55719757080078, -45.28068161010742, -44.0041618347168, -42.72764587402344, -41.45112609863281, -40.17461013793945, -38.89809036254883, -37.62157440185547, -36.345054626464844, -35.068538665771484, -33.79201889038086, -32.515499114990234, -31.238981246948242, -29.96246337890625, -28.685945510864258, -27.409427642822266, -26.13290786743164, -24.85638999938965, -23.579872131347656, -22.303354263305664, -21.026836395263672, -19.75031852722168, -18.473800659179688, -17.197280883789062, -15.920763969421387, -14.644245147705078, -13.367727279663086, -12.09121322631836, -10.814695358276367, -9.538177490234375, -8.261658668518066, -6.985140800476074, -5.708622932434082, -4.432104587554932, -3.1555862426757812, -1.879068374633789, -0.6025502681732178, 0.6739678382873535, 1.9504859447479248, 3.227004051208496, 4.503521919250488, 5.780040264129639, 7.056558609008789, 8.333076477050781, 9.609594345092773, 10.886112213134766, 12.162631034851074, 13.439148902893066, 14.715666770935059, 15.992185592651367, 17.26870346069336, 18.54522132873535, 19.821739196777344, 21.098257064819336, 22.374774932861328, 23.651294708251953, 24.927810668945312, 26.204330444335938, 27.48084831237793, 28.757366180419922]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 10.0, 14.0, 11.0, 13.0, 13.0, 20.0, 23.0, 29.0, 40.0, 39.0, 72.0, 86.0, 157.0, 241.0, 399.0, 870.0, 2517.0, 11406.0, 79577.0, 533715.0, 361882.0, 46411.0, 7351.0, 1833.0, 690.0, 372.0, 230.0, 128.0, 96.0, 55.0, 42.0, 35.0, 33.0, 31.0, 23.0, 16.0, 8.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-44.71875, -43.2216796875, -41.724609375, -40.2275390625, -38.73046875, -37.2333984375, -35.736328125, -34.2392578125, -32.7421875, -31.2451171875, -29.748046875, -28.2509765625, -26.75390625, -25.2568359375, -23.759765625, -22.2626953125, -20.765625, -19.2685546875, -17.771484375, -16.2744140625, -14.77734375, -13.2802734375, -11.783203125, -10.2861328125, -8.7890625, -7.2919921875, -5.794921875, -4.2978515625, -2.80078125, -1.3037109375, 0.193359375, 1.6904296875, 3.1875, 4.6845703125, 6.181640625, 7.6787109375, 9.17578125, 10.6728515625, 12.169921875, 13.6669921875, 15.1640625, 16.6611328125, 18.158203125, 19.6552734375, 21.15234375, 22.6494140625, 24.146484375, 25.6435546875, 27.140625, 28.6376953125, 30.134765625, 31.6318359375, 33.12890625, 34.6259765625, 36.123046875, 37.6201171875, 39.1171875, 40.6142578125, 42.111328125, 43.6083984375, 45.10546875, 46.6025390625, 48.099609375, 49.5966796875, 51.09375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 13.0, 28.0, 55.0, 74.0, 117.0, 155.0, 140.0, 149.0, 110.0, 65.0, 47.0, 23.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.0828857421875, -5.868896484375, -5.6549072265625, -5.44091796875, -5.2269287109375, -5.012939453125, -4.7989501953125, -4.5849609375, -4.3709716796875, -4.156982421875, -3.9429931640625, -3.72900390625, -3.5150146484375, -3.301025390625, -3.0870361328125, -2.873046875, -2.6590576171875, -2.445068359375, -2.2310791015625, -2.01708984375, -1.8031005859375, -1.589111328125, -1.3751220703125, -1.1611328125, -0.9471435546875, -0.733154296875, -0.5191650390625, -0.30517578125, -0.0911865234375, 0.122802734375, 0.3367919921875, 0.55078125, 0.7647705078125, 0.978759765625, 1.1927490234375, 1.40673828125, 1.6207275390625, 1.834716796875, 2.0487060546875, 2.2626953125, 2.4766845703125, 2.690673828125, 2.9046630859375, 3.11865234375, 3.3326416015625, 3.546630859375, 3.7606201171875, 3.974609375, 4.1885986328125, 4.402587890625, 4.6165771484375, 4.83056640625, 5.0445556640625, 5.258544921875, 5.4725341796875, 5.6865234375, 5.9005126953125, 6.114501953125, 6.3284912109375, 6.54248046875, 6.7564697265625, 6.970458984375, 7.1844482421875, 7.3984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 7.0, 8.0, 7.0, 15.0, 19.0, 27.0, 38.0, 63.0, 81.0, 169.0, 247.0, 335.0, 547.0, 997.0, 1795.0, 3481.0, 7535.0, 18106.0, 47233.0, 131751.0, 336893.0, 308139.0, 117440.0, 42658.0, 16484.0, 6965.0, 3253.0, 1669.0, 924.0, 562.0, 368.0, 233.0, 151.0, 116.0, 67.0, 46.0, 37.0, 23.0, 22.0, 16.0, 9.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-23.4375, -22.72607421875, -22.0146484375, -21.30322265625, -20.591796875, -19.88037109375, -19.1689453125, -18.45751953125, -17.74609375, -17.03466796875, -16.3232421875, -15.61181640625, -14.900390625, -14.18896484375, -13.4775390625, -12.76611328125, -12.0546875, -11.34326171875, -10.6318359375, -9.92041015625, -9.208984375, -8.49755859375, -7.7861328125, -7.07470703125, -6.36328125, -5.65185546875, -4.9404296875, -4.22900390625, -3.517578125, -2.80615234375, -2.0947265625, -1.38330078125, -0.671875, 0.03955078125, 0.7509765625, 1.46240234375, 2.173828125, 2.88525390625, 3.5966796875, 4.30810546875, 5.01953125, 5.73095703125, 6.4423828125, 7.15380859375, 7.865234375, 8.57666015625, 9.2880859375, 9.99951171875, 10.7109375, 11.42236328125, 12.1337890625, 12.84521484375, 13.556640625, 14.26806640625, 14.9794921875, 15.69091796875, 16.40234375, 17.11376953125, 17.8251953125, 18.53662109375, 19.248046875, 19.95947265625, 20.6708984375, 21.38232421875, 22.09375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 14.0, 13.0, 25.0, 21.0, 19.0, 20.0, 30.0, 23.0, 36.0, 40.0, 34.0, 41.0, 61.0, 43.0, 39.0, 44.0, 47.0, 52.0, 40.0, 33.0, 43.0, 30.0, 34.0, 31.0, 26.0, 23.0, 24.0, 15.0, 12.0, 12.0, 11.0, 8.0, 14.0, 4.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.3214111328125, -10.892822265625, -10.4642333984375, -10.03564453125, -9.6070556640625, -9.178466796875, -8.7498779296875, -8.3212890625, -7.8927001953125, -7.464111328125, -7.0355224609375, -6.60693359375, -6.1783447265625, -5.749755859375, -5.3211669921875, -4.892578125, -4.4639892578125, -4.035400390625, -3.6068115234375, -3.17822265625, -2.7496337890625, -2.321044921875, -1.8924560546875, -1.4638671875, -1.0352783203125, -0.606689453125, -0.1781005859375, 0.25048828125, 0.6790771484375, 1.107666015625, 1.5362548828125, 1.96484375, 2.3934326171875, 2.822021484375, 3.2506103515625, 3.67919921875, 4.1077880859375, 4.536376953125, 4.9649658203125, 5.3935546875, 5.8221435546875, 6.250732421875, 6.6793212890625, 7.10791015625, 7.5364990234375, 7.965087890625, 8.3936767578125, 8.822265625, 9.2508544921875, 9.679443359375, 10.1080322265625, 10.53662109375, 10.9652099609375, 11.393798828125, 11.8223876953125, 12.2509765625, 12.6795654296875, 13.108154296875, 13.5367431640625, 13.96533203125, 14.3939208984375, 14.822509765625, 15.2510986328125, 15.6796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 5.0, 10.0, 21.0, 13.0, 15.0, 37.0, 65.0, 79.0, 109.0, 159.0, 293.0, 591.0, 1170.0, 2746.0, 7550.0, 28130.0, 140546.0, 539039.0, 260361.0, 48638.0, 11981.0, 3838.0, 1525.0, 690.0, 363.0, 214.0, 119.0, 78.0, 62.0, 25.0, 16.0, 17.0, 13.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.53125, -20.910400390625, -20.28955078125, -19.668701171875, -19.0478515625, -18.427001953125, -17.80615234375, -17.185302734375, -16.564453125, -15.943603515625, -15.32275390625, -14.701904296875, -14.0810546875, -13.460205078125, -12.83935546875, -12.218505859375, -11.59765625, -10.976806640625, -10.35595703125, -9.735107421875, -9.1142578125, -8.493408203125, -7.87255859375, -7.251708984375, -6.630859375, -6.010009765625, -5.38916015625, -4.768310546875, -4.1474609375, -3.526611328125, -2.90576171875, -2.284912109375, -1.6640625, -1.043212890625, -0.42236328125, 0.198486328125, 0.8193359375, 1.440185546875, 2.06103515625, 2.681884765625, 3.302734375, 3.923583984375, 4.54443359375, 5.165283203125, 5.7861328125, 6.406982421875, 7.02783203125, 7.648681640625, 8.26953125, 8.890380859375, 9.51123046875, 10.132080078125, 10.7529296875, 11.373779296875, 11.99462890625, 12.615478515625, 13.236328125, 13.857177734375, 14.47802734375, 15.098876953125, 15.7197265625, 16.340576171875, 16.96142578125, 17.582275390625, 18.203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 4.0, 9.0, 14.0, 11.0, 13.0, 18.0, 19.0, 30.0, 29.0, 37.0, 35.0, 37.0, 55.0, 57.0, 74.0, 95.0, 73.0, 61.0, 57.0, 49.0, 35.0, 30.0, 29.0, 19.0, 24.0, 27.0, 10.0, 9.0, 10.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001495361328125, -0.0014433115720748901, -0.0013912618160247803, -0.0013392120599746704, -0.0012871623039245605, -0.0012351125478744507, -0.0011830627918243408, -0.001131013035774231, -0.001078963279724121, -0.0010269135236740112, -0.0009748637676239014, -0.0009228140115737915, -0.0008707642555236816, -0.0008187144994735718, -0.0007666647434234619, -0.000714614987373352, -0.0006625652313232422, -0.0006105154752731323, -0.0005584657192230225, -0.0005064159631729126, -0.00045436620712280273, -0.00040231645107269287, -0.000350266695022583, -0.00029821693897247314, -0.0002461671829223633, -0.00019411742687225342, -0.00014206767082214355, -9.001791477203369e-05, -3.796815872192383e-05, 1.4081597328186035e-05, 6.61313533782959e-05, 0.00011818110942840576, 0.00017023086547851562, 0.0002222806215286255, 0.00027433037757873535, 0.0003263801336288452, 0.0003784298896789551, 0.00043047964572906494, 0.0004825294017791748, 0.0005345791578292847, 0.0005866289138793945, 0.0006386786699295044, 0.0006907284259796143, 0.0007427781820297241, 0.000794827938079834, 0.0008468776941299438, 0.0008989274501800537, 0.0009509772062301636, 0.0010030269622802734, 0.0010550767183303833, 0.0011071264743804932, 0.001159176230430603, 0.0012112259864807129, 0.0012632757425308228, 0.0013153254985809326, 0.0013673752546310425, 0.0014194250106811523, 0.0014714747667312622, 0.001523524522781372, 0.001575574278831482, 0.0016276240348815918, 0.0016796737909317017, 0.0017317235469818115, 0.0017837733030319214, 0.0018358230590820312]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 5.0, 7.0, 9.0, 25.0, 36.0, 71.0, 82.0, 203.0, 415.0, 955.0, 2558.0, 8391.0, 46375.0, 541848.0, 402948.0, 34355.0, 6693.0, 2103.0, 699.0, 355.0, 166.0, 89.0, 63.0, 39.0, 24.0, 9.0, 10.0, 4.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.66162109375, -32.5732421875, -31.48486328125, -30.396484375, -29.30810546875, -28.2197265625, -27.13134765625, -26.04296875, -24.95458984375, -23.8662109375, -22.77783203125, -21.689453125, -20.60107421875, -19.5126953125, -18.42431640625, -17.3359375, -16.24755859375, -15.1591796875, -14.07080078125, -12.982421875, -11.89404296875, -10.8056640625, -9.71728515625, -8.62890625, -7.54052734375, -6.4521484375, -5.36376953125, -4.275390625, -3.18701171875, -2.0986328125, -1.01025390625, 0.078125, 1.16650390625, 2.2548828125, 3.34326171875, 4.431640625, 5.52001953125, 6.6083984375, 7.69677734375, 8.78515625, 9.87353515625, 10.9619140625, 12.05029296875, 13.138671875, 14.22705078125, 15.3154296875, 16.40380859375, 17.4921875, 18.58056640625, 19.6689453125, 20.75732421875, 21.845703125, 22.93408203125, 24.0224609375, 25.11083984375, 26.19921875, 27.28759765625, 28.3759765625, 29.46435546875, 30.552734375, 31.64111328125, 32.7294921875, 33.81787109375, 34.90625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 9.0, 4.0, 6.0, 11.0, 15.0, 18.0, 20.0, 23.0, 34.0, 35.0, 45.0, 65.0, 68.0, 82.0, 71.0, 85.0, 82.0, 61.0, 46.0, 36.0, 42.0, 27.0, 20.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 0.0, 6.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.484375, -9.21697998046875, -8.9495849609375, -8.68218994140625, -8.414794921875, -8.14739990234375, -7.8800048828125, -7.61260986328125, -7.34521484375, -7.07781982421875, -6.8104248046875, -6.54302978515625, -6.275634765625, -6.00823974609375, -5.7408447265625, -5.47344970703125, -5.2060546875, -4.93865966796875, -4.6712646484375, -4.40386962890625, -4.136474609375, -3.86907958984375, -3.6016845703125, -3.33428955078125, -3.06689453125, -2.79949951171875, -2.5321044921875, -2.26470947265625, -1.997314453125, -1.72991943359375, -1.4625244140625, -1.19512939453125, -0.927734375, -0.66033935546875, -0.3929443359375, -0.12554931640625, 0.141845703125, 0.40924072265625, 0.6766357421875, 0.94403076171875, 1.21142578125, 1.47882080078125, 1.7462158203125, 2.01361083984375, 2.281005859375, 2.54840087890625, 2.8157958984375, 3.08319091796875, 3.3505859375, 3.61798095703125, 3.8853759765625, 4.15277099609375, 4.420166015625, 4.68756103515625, 4.9549560546875, 5.22235107421875, 5.48974609375, 5.75714111328125, 6.0245361328125, 6.29193115234375, 6.559326171875, 6.82672119140625, 7.0941162109375, 7.36151123046875, 7.62890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 14.0, 15.0, 29.0, 43.0, 68.0, 121.0, 148.0, 154.0, 173.0, 92.0, 60.0, 31.0, 19.0, 13.0, 11.0, 6.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.89096069335938, -206.52386474609375, -200.15676879882812, -193.7896728515625, -187.42257690429688, -181.0554656982422, -174.68836975097656, -168.32127380371094, -161.9541778564453, -155.5870819091797, -149.21998596191406, -142.85289001464844, -136.48577880859375, -130.11868286132812, -123.7515869140625, -117.38449096679688, -111.01739501953125, -104.65029907226562, -98.283203125, -91.91609954833984, -85.54900360107422, -79.1819076538086, -72.81480407714844, -66.44770812988281, -60.08061218261719, -53.71351623535156, -47.34641647338867, -40.97931671142578, -34.612220764160156, -28.2451229095459, -21.87802505493164, -15.51092529296875, -9.143844604492188, -2.7767467498779297, 3.590351104736328, 9.957448959350586, 16.324546813964844, 22.6916446685791, 29.05874252319336, 35.42584228515625, 41.792938232421875, 48.1600341796875, 54.52713394165039, 60.89423370361328, 67.2613296508789, 73.62842559814453, 79.99552917480469, 86.36262512207031, 92.72972106933594, 99.09681701660156, 105.46391296386719, 111.83101654052734, 118.19811248779297, 124.5652084350586, 130.93231201171875, 137.29940795898438, 143.66650390625, 150.03359985351562, 156.40069580078125, 162.76779174804688, 169.1348876953125, 175.5019989013672, 181.8690948486328, 188.23619079589844, 194.60328674316406]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 7.0, 13.0, 19.0, 19.0, 22.0, 24.0, 38.0, 38.0, 45.0, 55.0, 53.0, 66.0, 66.0, 62.0, 50.0, 54.0, 48.0, 41.0, 49.0, 37.0, 40.0, 24.0, 34.0, 13.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.28388977050781, -119.3560562133789, -115.42822265625, -111.50039672851562, -107.57256317138672, -103.64472961425781, -99.7168960571289, -95.7890625, -91.86123657226562, -87.93340301513672, -84.00556945800781, -80.07774353027344, -76.14990997314453, -72.22207641601562, -68.29424285888672, -64.36640930175781, -60.43857955932617, -56.510746002197266, -52.582916259765625, -48.65508270263672, -44.72725296020508, -40.79941940307617, -36.87158966064453, -32.943756103515625, -29.01592445373535, -25.088092803955078, -21.160261154174805, -17.23242950439453, -13.304596900939941, -9.376764297485352, -5.448932647705078, -1.5211009979248047, 2.4067306518554688, 6.334562301635742, 10.262393951416016, 14.190226554870605, 18.118057250976562, 22.04589080810547, 25.973722457885742, 29.901554107666016, 33.829383850097656, 37.75721740722656, 41.6850471496582, 45.61288070678711, 49.54071044921875, 53.468544006347656, 57.39637756347656, 61.3242073059082, 65.25204467773438, 69.17987823486328, 73.10771179199219, 77.03553771972656, 80.96337127685547, 84.89120483398438, 88.81903839111328, 92.74687194824219, 96.67469787597656, 100.60253143310547, 104.53036499023438, 108.45819091796875, 112.38602447509766, 116.31385803222656, 120.24169158935547, 124.16952514648438, 128.09735107421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 12.0, 17.0, 22.0, 37.0, 69.0, 98.0, 186.0, 339.0, 808.0, 2366.0, 10029.0, 69226.0, 3847943.0, 235919.0, 20484.0, 4198.0, 1260.0, 521.0, 245.0, 166.0, 101.0, 74.0, 39.0, 29.0, 26.0, 13.0, 15.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.25, -88.54296875, -85.8359375, -83.12890625, -80.421875, -77.71484375, -75.0078125, -72.30078125, -69.59375, -66.88671875, -64.1796875, -61.47265625, -58.765625, -56.05859375, -53.3515625, -50.64453125, -47.9375, -45.23046875, -42.5234375, -39.81640625, -37.109375, -34.40234375, -31.6953125, -28.98828125, -26.28125, -23.57421875, -20.8671875, -18.16015625, -15.453125, -12.74609375, -10.0390625, -7.33203125, -4.625, -1.91796875, 0.7890625, 3.49609375, 6.203125, 8.91015625, 11.6171875, 14.32421875, 17.03125, 19.73828125, 22.4453125, 25.15234375, 27.859375, 30.56640625, 33.2734375, 35.98046875, 38.6875, 41.39453125, 44.1015625, 46.80859375, 49.515625, 52.22265625, 54.9296875, 57.63671875, 60.34375, 63.05078125, 65.7578125, 68.46484375, 71.171875, 73.87890625, 76.5859375, 79.29296875, 82.0]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 15.0, 16.0, 39.0, 47.0, 48.0, 60.0, 84.0, 91.0, 105.0, 91.0, 83.0, 70.0, 69.0, 55.0, 30.0, 33.0, 20.0, 9.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.58984375, -3.42578125, -3.26171875, -3.09765625, -2.93359375, -2.76953125, -2.60546875, -2.44140625, -2.27734375, -2.11328125, -1.94921875, -1.78515625, -1.62109375, -1.45703125, -1.29296875, -1.12890625, -0.96484375, -0.80078125, -0.63671875, -0.47265625, -0.30859375, -0.14453125, 0.01953125, 0.18359375, 0.34765625, 0.51171875, 0.67578125, 0.83984375, 1.00390625, 1.16796875, 1.33203125, 1.49609375, 1.66015625, 1.82421875, 1.98828125, 2.15234375, 2.31640625, 2.48046875, 2.64453125, 2.80859375, 2.97265625, 3.13671875, 3.30078125, 3.46484375, 3.62890625, 3.79296875, 3.95703125, 4.12109375, 4.28515625, 4.44921875, 4.61328125, 4.77734375, 4.94140625, 5.10546875, 5.26953125, 5.43359375, 5.59765625, 5.76171875, 5.92578125, 6.08984375, 6.25390625, 6.41796875, 6.58203125, 6.74609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 1.0, 15.0, 22.0, 20.0, 37.0, 45.0, 65.0, 157.0, 573.0, 3845.0, 137995.0, 4027512.0, 21783.0, 1494.0, 325.0, 138.0, 64.0, 40.0, 50.0, 28.0, 23.0, 11.0, 15.0, 11.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.875, -142.828125, -137.78125, -132.734375, -127.6875, -122.640625, -117.59375, -112.546875, -107.5, -102.453125, -97.40625, -92.359375, -87.3125, -82.265625, -77.21875, -72.171875, -67.125, -62.078125, -57.03125, -51.984375, -46.9375, -41.890625, -36.84375, -31.796875, -26.75, -21.703125, -16.65625, -11.609375, -6.5625, -1.515625, 3.53125, 8.578125, 13.625, 18.671875, 23.71875, 28.765625, 33.8125, 38.859375, 43.90625, 48.953125, 54.0, 59.046875, 64.09375, 69.140625, 74.1875, 79.234375, 84.28125, 89.328125, 94.375, 99.421875, 104.46875, 109.515625, 114.5625, 119.609375, 124.65625, 129.703125, 134.75, 139.796875, 144.84375, 149.890625, 154.9375, 159.984375, 165.03125, 170.078125, 175.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 7.0, 6.0, 11.0, 24.0, 52.0, 110.0, 283.0, 1353.0, 1748.0, 276.0, 102.0, 59.0, 23.0, 14.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -12.825927734375, -12.15185546875, -11.477783203125, -10.8037109375, -10.129638671875, -9.45556640625, -8.781494140625, -8.107421875, -7.433349609375, -6.75927734375, -6.085205078125, -5.4111328125, -4.737060546875, -4.06298828125, -3.388916015625, -2.71484375, -2.040771484375, -1.36669921875, -0.692626953125, -0.0185546875, 0.655517578125, 1.32958984375, 2.003662109375, 2.677734375, 3.351806640625, 4.02587890625, 4.699951171875, 5.3740234375, 6.048095703125, 6.72216796875, 7.396240234375, 8.0703125, 8.744384765625, 9.41845703125, 10.092529296875, 10.7666015625, 11.440673828125, 12.11474609375, 12.788818359375, 13.462890625, 14.136962890625, 14.81103515625, 15.485107421875, 16.1591796875, 16.833251953125, 17.50732421875, 18.181396484375, 18.85546875, 19.529541015625, 20.20361328125, 20.877685546875, 21.5517578125, 22.225830078125, 22.89990234375, 23.573974609375, 24.248046875, 24.922119140625, 25.59619140625, 26.270263671875, 26.9443359375, 27.618408203125, 28.29248046875, 28.966552734375, 29.640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 11.0, 13.0, 26.0, 58.0, 87.0, 157.0, 197.0, 193.0, 117.0, 63.0, 44.0, 23.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.9610595703125, -169.48158264160156, -166.00210571289062, -162.52261352539062, -159.0431365966797, -155.56365966796875, -152.0841827392578, -148.60470581054688, -145.12522888183594, -141.645751953125, -138.16627502441406, -134.68679809570312, -131.20730590820312, -127.72782897949219, -124.24835205078125, -120.76887512207031, -117.28938293457031, -113.80990600585938, -110.3304214477539, -106.85094451904297, -103.37146759033203, -99.89198303222656, -96.41250610351562, -92.93302917480469, -89.45355224609375, -85.97407531738281, -82.49459075927734, -79.0151138305664, -75.53563690185547, -72.05615234375, -68.57667541503906, -65.09719848632812, -61.617713928222656, -58.13823318481445, -54.658756256103516, -51.17927551269531, -47.69979476928711, -44.220314025878906, -40.74083709716797, -37.261356353759766, -33.78187561035156, -30.302396774291992, -26.82291603088379, -23.34343719482422, -19.863956451416016, -16.384477615356445, -12.904998779296875, -9.425518035888672, -5.946041107177734, -2.4665615558624268, 1.0129179954528809, 4.492397308349609, 7.971877098083496, 11.451356887817383, 14.930835723876953, 18.410316467285156, 21.889795303344727, 25.369274139404297, 28.8487548828125, 32.32823181152344, 35.80771255493164, 39.287193298339844, 42.76667022705078, 46.24615478515625, 49.72563171386719]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 9.0, 5.0, 15.0, 18.0, 15.0, 20.0, 33.0, 32.0, 45.0, 45.0, 55.0, 54.0, 41.0, 57.0, 69.0, 74.0, 52.0, 50.0, 52.0, 37.0, 32.0, 23.0, 24.0, 21.0, 27.0, 26.0, 11.0, 8.0, 8.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.37733840942383, -44.99847412109375, -43.619606018066406, -42.24074172973633, -40.86187744140625, -39.483009338378906, -38.10414505004883, -36.72528076171875, -35.346412658691406, -33.96754837036133, -32.588680267333984, -31.209815979003906, -29.830949783325195, -28.452083587646484, -27.073219299316406, -25.694353103637695, -24.315486907958984, -22.936620712280273, -21.557754516601562, -20.178890228271484, -18.800024032592773, -17.421157836914062, -16.042293548583984, -14.663427352905273, -13.284561157226562, -11.905694961547852, -10.526829719543457, -9.147964477539062, -7.769098281860352, -6.390232563018799, -5.011366844177246, -3.6325016021728516, -2.2536354064941406, -0.8747696876525879, 0.5040960311889648, 1.8829617500305176, 3.2618274688720703, 4.640693187713623, 6.019558906555176, 7.39842414855957, 8.777290344238281, 10.156156539916992, 11.535021781921387, 12.913887023925781, 14.292753219604492, 15.671619415283203, 17.05048370361328, 18.429349899291992, 19.808216094970703, 21.187082290649414, 22.565948486328125, 23.944812774658203, 25.323678970336914, 26.702545166015625, 28.081409454345703, 29.460275650024414, 30.839141845703125, 32.2180061340332, 33.59687423706055, 34.975738525390625, 36.35460662841797, 37.73347091674805, 39.112335205078125, 40.49120330810547, 41.87006759643555]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 6.0, 12.0, 17.0, 13.0, 31.0, 38.0, 49.0, 75.0, 112.0, 239.0, 396.0, 782.0, 1829.0, 5157.0, 21559.0, 123663.0, 539650.0, 290565.0, 49073.0, 9979.0, 2841.0, 1144.0, 508.0, 283.0, 165.0, 129.0, 62.0, 52.0, 38.0, 15.0, 11.0, 16.0, 8.0, 8.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -33.67822265625, -32.4189453125, -31.15966796875, -29.900390625, -28.64111328125, -27.3818359375, -26.12255859375, -24.86328125, -23.60400390625, -22.3447265625, -21.08544921875, -19.826171875, -18.56689453125, -17.3076171875, -16.04833984375, -14.7890625, -13.52978515625, -12.2705078125, -11.01123046875, -9.751953125, -8.49267578125, -7.2333984375, -5.97412109375, -4.71484375, -3.45556640625, -2.1962890625, -0.93701171875, 0.322265625, 1.58154296875, 2.8408203125, 4.10009765625, 5.359375, 6.61865234375, 7.8779296875, 9.13720703125, 10.396484375, 11.65576171875, 12.9150390625, 14.17431640625, 15.43359375, 16.69287109375, 17.9521484375, 19.21142578125, 20.470703125, 21.72998046875, 22.9892578125, 24.24853515625, 25.5078125, 26.76708984375, 28.0263671875, 29.28564453125, 30.544921875, 31.80419921875, 33.0634765625, 34.32275390625, 35.58203125, 36.84130859375, 38.1005859375, 39.35986328125, 40.619140625, 41.87841796875, 43.1376953125, 44.39697265625, 45.65625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 11.0, 6.0, 24.0, 30.0, 53.0, 62.0, 89.0, 87.0, 115.0, 117.0, 111.0, 78.0, 74.0, 52.0, 36.0, 17.0, 10.0, 12.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.662353515625, -5.45361328125, -5.244873046875, -5.0361328125, -4.827392578125, -4.61865234375, -4.409912109375, -4.201171875, -3.992431640625, -3.78369140625, -3.574951171875, -3.3662109375, -3.157470703125, -2.94873046875, -2.739990234375, -2.53125, -2.322509765625, -2.11376953125, -1.905029296875, -1.6962890625, -1.487548828125, -1.27880859375, -1.070068359375, -0.861328125, -0.652587890625, -0.44384765625, -0.235107421875, -0.0263671875, 0.182373046875, 0.39111328125, 0.599853515625, 0.80859375, 1.017333984375, 1.22607421875, 1.434814453125, 1.6435546875, 1.852294921875, 2.06103515625, 2.269775390625, 2.478515625, 2.687255859375, 2.89599609375, 3.104736328125, 3.3134765625, 3.522216796875, 3.73095703125, 3.939697265625, 4.1484375, 4.357177734375, 4.56591796875, 4.774658203125, 4.9833984375, 5.192138671875, 5.40087890625, 5.609619140625, 5.818359375, 6.027099609375, 6.23583984375, 6.444580078125, 6.6533203125, 6.862060546875, 7.07080078125, 7.279541015625, 7.48828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 9.0, 14.0, 18.0, 20.0, 25.0, 31.0, 36.0, 49.0, 81.0, 100.0, 174.0, 226.0, 379.0, 594.0, 952.0, 1730.0, 3053.0, 6309.0, 13794.0, 32718.0, 83322.0, 203381.0, 332941.0, 215034.0, 89196.0, 35165.0, 14637.0, 6654.0, 3395.0, 1717.0, 982.0, 591.0, 377.0, 246.0, 167.0, 125.0, 80.0, 63.0, 45.0, 32.0, 15.0, 24.0, 9.0, 11.0, 10.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-18.0625, -17.48974609375, -16.9169921875, -16.34423828125, -15.771484375, -15.19873046875, -14.6259765625, -14.05322265625, -13.48046875, -12.90771484375, -12.3349609375, -11.76220703125, -11.189453125, -10.61669921875, -10.0439453125, -9.47119140625, -8.8984375, -8.32568359375, -7.7529296875, -7.18017578125, -6.607421875, -6.03466796875, -5.4619140625, -4.88916015625, -4.31640625, -3.74365234375, -3.1708984375, -2.59814453125, -2.025390625, -1.45263671875, -0.8798828125, -0.30712890625, 0.265625, 0.83837890625, 1.4111328125, 1.98388671875, 2.556640625, 3.12939453125, 3.7021484375, 4.27490234375, 4.84765625, 5.42041015625, 5.9931640625, 6.56591796875, 7.138671875, 7.71142578125, 8.2841796875, 8.85693359375, 9.4296875, 10.00244140625, 10.5751953125, 11.14794921875, 11.720703125, 12.29345703125, 12.8662109375, 13.43896484375, 14.01171875, 14.58447265625, 15.1572265625, 15.72998046875, 16.302734375, 16.87548828125, 17.4482421875, 18.02099609375, 18.59375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 9.0, 5.0, 6.0, 8.0, 11.0, 10.0, 24.0, 20.0, 31.0, 28.0, 30.0, 31.0, 32.0, 38.0, 38.0, 47.0, 50.0, 49.0, 49.0, 38.0, 39.0, 51.0, 51.0, 37.0, 36.0, 31.0, 31.0, 28.0, 20.0, 20.0, 10.0, 19.0, 13.0, 10.0, 10.0, 5.0, 1.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.9375, -14.44677734375, -13.9560546875, -13.46533203125, -12.974609375, -12.48388671875, -11.9931640625, -11.50244140625, -11.01171875, -10.52099609375, -10.0302734375, -9.53955078125, -9.048828125, -8.55810546875, -8.0673828125, -7.57666015625, -7.0859375, -6.59521484375, -6.1044921875, -5.61376953125, -5.123046875, -4.63232421875, -4.1416015625, -3.65087890625, -3.16015625, -2.66943359375, -2.1787109375, -1.68798828125, -1.197265625, -0.70654296875, -0.2158203125, 0.27490234375, 0.765625, 1.25634765625, 1.7470703125, 2.23779296875, 2.728515625, 3.21923828125, 3.7099609375, 4.20068359375, 4.69140625, 5.18212890625, 5.6728515625, 6.16357421875, 6.654296875, 7.14501953125, 7.6357421875, 8.12646484375, 8.6171875, 9.10791015625, 9.5986328125, 10.08935546875, 10.580078125, 11.07080078125, 11.5615234375, 12.05224609375, 12.54296875, 13.03369140625, 13.5244140625, 14.01513671875, 14.505859375, 14.99658203125, 15.4873046875, 15.97802734375, 16.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 9.0, 13.0, 13.0, 29.0, 27.0, 41.0, 66.0, 114.0, 166.0, 306.0, 620.0, 1131.0, 2731.0, 7388.0, 24498.0, 97795.0, 365961.0, 394590.0, 111668.0, 27325.0, 8317.0, 3041.0, 1244.0, 614.0, 332.0, 185.0, 124.0, 70.0, 42.0, 22.0, 26.0, 18.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.6171875, -12.24658203125, -11.8759765625, -11.50537109375, -11.134765625, -10.76416015625, -10.3935546875, -10.02294921875, -9.65234375, -9.28173828125, -8.9111328125, -8.54052734375, -8.169921875, -7.79931640625, -7.4287109375, -7.05810546875, -6.6875, -6.31689453125, -5.9462890625, -5.57568359375, -5.205078125, -4.83447265625, -4.4638671875, -4.09326171875, -3.72265625, -3.35205078125, -2.9814453125, -2.61083984375, -2.240234375, -1.86962890625, -1.4990234375, -1.12841796875, -0.7578125, -0.38720703125, -0.0166015625, 0.35400390625, 0.724609375, 1.09521484375, 1.4658203125, 1.83642578125, 2.20703125, 2.57763671875, 2.9482421875, 3.31884765625, 3.689453125, 4.06005859375, 4.4306640625, 4.80126953125, 5.171875, 5.54248046875, 5.9130859375, 6.28369140625, 6.654296875, 7.02490234375, 7.3955078125, 7.76611328125, 8.13671875, 8.50732421875, 8.8779296875, 9.24853515625, 9.619140625, 9.98974609375, 10.3603515625, 10.73095703125, 11.1015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 6.0, 13.0, 18.0, 22.0, 53.0, 42.0, 57.0, 85.0, 96.0, 84.0, 128.0, 97.0, 64.0, 52.0, 46.0, 38.0, 16.0, 18.0, 17.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00231170654296875, -0.00224873423576355, -0.0021857619285583496, -0.0021227896213531494, -0.0020598173141479492, -0.001996845006942749, -0.0019338726997375488, -0.0018709003925323486, -0.0018079280853271484, -0.0017449557781219482, -0.001681983470916748, -0.0016190111637115479, -0.0015560388565063477, -0.0014930665493011475, -0.0014300942420959473, -0.001367121934890747, -0.0013041496276855469, -0.0012411773204803467, -0.0011782050132751465, -0.0011152327060699463, -0.001052260398864746, -0.000989288091659546, -0.0009263157844543457, -0.0008633434772491455, -0.0008003711700439453, -0.0007373988628387451, -0.0006744265556335449, -0.0006114542484283447, -0.0005484819412231445, -0.00048550963401794434, -0.00042253732681274414, -0.00035956501960754395, -0.00029659271240234375, -0.00023362040519714355, -0.00017064809799194336, -0.00010767579078674316, -4.470348358154297e-05, 1.8268823623657227e-05, 8.124113082885742e-05, 0.00014421343803405762, 0.0002071857452392578, 0.000270158052444458, 0.0003331303596496582, 0.0003961026668548584, 0.0004590749740600586, 0.0005220472812652588, 0.000585019588470459, 0.0006479918956756592, 0.0007109642028808594, 0.0007739365100860596, 0.0008369088172912598, 0.00089988112449646, 0.0009628534317016602, 0.0010258257389068604, 0.0010887980461120605, 0.0011517703533172607, 0.001214742660522461, 0.0012777149677276611, 0.0013406872749328613, 0.0014036595821380615, 0.0014666318893432617, 0.001529604196548462, 0.0015925765037536621, 0.0016555488109588623, 0.0017185211181640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 12.0, 18.0, 22.0, 37.0, 62.0, 79.0, 125.0, 246.0, 443.0, 880.0, 1727.0, 4279.0, 11922.0, 38277.0, 157413.0, 473758.0, 267175.0, 63416.0, 17569.0, 6216.0, 2487.0, 1107.0, 558.0, 256.0, 178.0, 98.0, 57.0, 44.0, 25.0, 19.0, 12.0, 11.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.015625, -15.612060546875, -15.20849609375, -14.804931640625, -14.4013671875, -13.997802734375, -13.59423828125, -13.190673828125, -12.787109375, -12.383544921875, -11.97998046875, -11.576416015625, -11.1728515625, -10.769287109375, -10.36572265625, -9.962158203125, -9.55859375, -9.155029296875, -8.75146484375, -8.347900390625, -7.9443359375, -7.540771484375, -7.13720703125, -6.733642578125, -6.330078125, -5.926513671875, -5.52294921875, -5.119384765625, -4.7158203125, -4.312255859375, -3.90869140625, -3.505126953125, -3.1015625, -2.697998046875, -2.29443359375, -1.890869140625, -1.4873046875, -1.083740234375, -0.68017578125, -0.276611328125, 0.126953125, 0.530517578125, 0.93408203125, 1.337646484375, 1.7412109375, 2.144775390625, 2.54833984375, 2.951904296875, 3.35546875, 3.759033203125, 4.16259765625, 4.566162109375, 4.9697265625, 5.373291015625, 5.77685546875, 6.180419921875, 6.583984375, 6.987548828125, 7.39111328125, 7.794677734375, 8.1982421875, 8.601806640625, 9.00537109375, 9.408935546875, 9.8125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 7.0, 8.0, 6.0, 11.0, 19.0, 18.0, 20.0, 13.0, 26.0, 39.0, 46.0, 67.0, 59.0, 54.0, 60.0, 70.0, 59.0, 59.0, 41.0, 54.0, 40.0, 37.0, 38.0, 26.0, 21.0, 17.0, 10.0, 14.0, 7.0, 8.0, 10.0, 3.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.0323486328125, -5.842041015625, -5.6517333984375, -5.46142578125, -5.2711181640625, -5.080810546875, -4.8905029296875, -4.7001953125, -4.5098876953125, -4.319580078125, -4.1292724609375, -3.93896484375, -3.7486572265625, -3.558349609375, -3.3680419921875, -3.177734375, -2.9874267578125, -2.797119140625, -2.6068115234375, -2.41650390625, -2.2261962890625, -2.035888671875, -1.8455810546875, -1.6552734375, -1.4649658203125, -1.274658203125, -1.0843505859375, -0.89404296875, -0.7037353515625, -0.513427734375, -0.3231201171875, -0.1328125, 0.0574951171875, 0.247802734375, 0.4381103515625, 0.62841796875, 0.8187255859375, 1.009033203125, 1.1993408203125, 1.3896484375, 1.5799560546875, 1.770263671875, 1.9605712890625, 2.15087890625, 2.3411865234375, 2.531494140625, 2.7218017578125, 2.912109375, 3.1024169921875, 3.292724609375, 3.4830322265625, 3.67333984375, 3.8636474609375, 4.053955078125, 4.2442626953125, 4.4345703125, 4.6248779296875, 4.815185546875, 5.0054931640625, 5.19580078125, 5.3861083984375, 5.576416015625, 5.7667236328125, 5.95703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 11.0, 27.0, 48.0, 68.0, 97.0, 147.0, 145.0, 157.0, 114.0, 67.0, 53.0, 26.0, 10.0, 10.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.79756164550781, -117.58443450927734, -112.37130737304688, -107.1581802368164, -101.94505310058594, -96.73193359375, -91.51880645751953, -86.30567932128906, -81.0925521850586, -75.87942504882812, -70.66629791259766, -65.45317077636719, -60.240047454833984, -55.026920318603516, -49.81379699707031, -44.600669860839844, -39.387542724609375, -34.174415588378906, -28.96129035949707, -23.748165130615234, -18.535037994384766, -13.321910858154297, -8.108785629272461, -2.895660400390625, 2.3174667358398438, 7.530592918395996, 12.743719100952148, 17.956844329833984, 23.169971466064453, 28.383098602294922, 33.596221923828125, 38.809349060058594, 44.0224609375, 49.23558807373047, 54.44871520996094, 59.66183853149414, 64.87496948242188, 70.08808898925781, 75.30121612548828, 80.51434326171875, 85.72747039794922, 90.94059753417969, 96.15372467041016, 101.36685180664062, 106.57997131347656, 111.79310607910156, 117.0062255859375, 122.21935272216797, 127.43247985839844, 132.64559936523438, 137.85873413085938, 143.0718536376953, 148.2849884033203, 153.49810791015625, 158.71124267578125, 163.9243621826172, 169.13748168945312, 174.35060119628906, 179.56373596191406, 184.77685546875, 189.989990234375, 195.20310974121094, 200.41624450683594, 205.62936401367188, 210.84249877929688]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 5.0, 18.0, 11.0, 25.0, 28.0, 34.0, 35.0, 42.0, 44.0, 47.0, 50.0, 71.0, 69.0, 48.0, 50.0, 60.0, 54.0, 50.0, 43.0, 34.0, 29.0, 29.0, 18.0, 18.0, 16.0, 12.0, 10.0, 5.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.1722412109375, -100.70118713378906, -97.23013305664062, -93.75908660888672, -90.28803253173828, -86.81697845458984, -83.34593200683594, -79.8748779296875, -76.40382385253906, -72.93276977539062, -69.46171569824219, -65.99066925048828, -62.519615173339844, -59.048561096191406, -55.577510833740234, -52.10646057128906, -48.635406494140625, -45.16435241699219, -41.693302154541016, -38.222251892089844, -34.751197814941406, -31.2801456451416, -27.809093475341797, -24.338041305541992, -20.866989135742188, -17.395936965942383, -13.924884796142578, -10.453832626342773, -6.982780456542969, -3.511728286743164, -0.040676116943359375, 3.4303760528564453, 6.90142822265625, 10.372480392456055, 13.84353256225586, 17.314584732055664, 20.78563690185547, 24.256689071655273, 27.727741241455078, 31.198793411254883, 34.66984558105469, 38.140899658203125, 41.6119499206543, 45.08300018310547, 48.554054260253906, 52.025108337402344, 55.496158599853516, 58.96720886230469, 62.438262939453125, 65.90931701660156, 69.38037109375, 72.8514175415039, 76.32247161865234, 79.79352569580078, 83.26457214355469, 86.73562622070312, 90.20668029785156, 93.677734375, 97.14878845214844, 100.61983489990234, 104.09088897705078, 107.56194305419922, 111.03298950195312, 114.50404357910156, 117.97509765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 15.0, 13.0, 23.0, 29.0, 33.0, 53.0, 82.0, 171.0, 291.0, 706.0, 2048.0, 7909.0, 49407.0, 3824029.0, 281664.0, 20788.0, 4437.0, 1406.0, 519.0, 269.0, 132.0, 84.0, 43.0, 33.0, 21.0, 13.0, 12.0, 10.0, 4.0, 5.0, 3.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -49.48486328125, -47.3134765625, -45.14208984375, -42.970703125, -40.79931640625, -38.6279296875, -36.45654296875, -34.28515625, -32.11376953125, -29.9423828125, -27.77099609375, -25.599609375, -23.42822265625, -21.2568359375, -19.08544921875, -16.9140625, -14.74267578125, -12.5712890625, -10.39990234375, -8.228515625, -6.05712890625, -3.8857421875, -1.71435546875, 0.45703125, 2.62841796875, 4.7998046875, 6.97119140625, 9.142578125, 11.31396484375, 13.4853515625, 15.65673828125, 17.828125, 19.99951171875, 22.1708984375, 24.34228515625, 26.513671875, 28.68505859375, 30.8564453125, 33.02783203125, 35.19921875, 37.37060546875, 39.5419921875, 41.71337890625, 43.884765625, 46.05615234375, 48.2275390625, 50.39892578125, 52.5703125, 54.74169921875, 56.9130859375, 59.08447265625, 61.255859375, 63.42724609375, 65.5986328125, 67.77001953125, 69.94140625, 72.11279296875, 74.2841796875, 76.45556640625, 78.626953125, 80.79833984375, 82.9697265625, 85.14111328125, 87.3125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 23.0, 43.0, 65.0, 69.0, 101.0, 114.0, 113.0, 132.0, 107.0, 84.0, 57.0, 33.0, 17.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.35546875, -7.11444091796875, -6.8734130859375, -6.63238525390625, -6.391357421875, -6.15032958984375, -5.9093017578125, -5.66827392578125, -5.42724609375, -5.18621826171875, -4.9451904296875, -4.70416259765625, -4.463134765625, -4.22210693359375, -3.9810791015625, -3.74005126953125, -3.4990234375, -3.25799560546875, -3.0169677734375, -2.77593994140625, -2.534912109375, -2.29388427734375, -2.0528564453125, -1.81182861328125, -1.57080078125, -1.32977294921875, -1.0887451171875, -0.84771728515625, -0.606689453125, -0.36566162109375, -0.1246337890625, 0.11639404296875, 0.357421875, 0.59844970703125, 0.8394775390625, 1.08050537109375, 1.321533203125, 1.56256103515625, 1.8035888671875, 2.04461669921875, 2.28564453125, 2.52667236328125, 2.7677001953125, 3.00872802734375, 3.249755859375, 3.49078369140625, 3.7318115234375, 3.97283935546875, 4.2138671875, 4.45489501953125, 4.6959228515625, 4.93695068359375, 5.177978515625, 5.41900634765625, 5.6600341796875, 5.90106201171875, 6.14208984375, 6.38311767578125, 6.6241455078125, 6.86517333984375, 7.106201171875, 7.34722900390625, 7.5882568359375, 7.82928466796875, 8.0703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 5.0, 10.0, 24.0, 30.0, 28.0, 68.0, 82.0, 144.0, 220.0, 446.0, 871.0, 2105.0, 6579.0, 31736.0, 362594.0, 3661634.0, 105379.0, 15636.0, 3960.0, 1348.0, 588.0, 263.0, 162.0, 104.0, 65.0, 61.0, 29.0, 29.0, 17.0, 16.0, 16.0, 11.0, 9.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.625, -48.89599609375, -47.1669921875, -45.43798828125, -43.708984375, -41.97998046875, -40.2509765625, -38.52197265625, -36.79296875, -35.06396484375, -33.3349609375, -31.60595703125, -29.876953125, -28.14794921875, -26.4189453125, -24.68994140625, -22.9609375, -21.23193359375, -19.5029296875, -17.77392578125, -16.044921875, -14.31591796875, -12.5869140625, -10.85791015625, -9.12890625, -7.39990234375, -5.6708984375, -3.94189453125, -2.212890625, -0.48388671875, 1.2451171875, 2.97412109375, 4.703125, 6.43212890625, 8.1611328125, 9.89013671875, 11.619140625, 13.34814453125, 15.0771484375, 16.80615234375, 18.53515625, 20.26416015625, 21.9931640625, 23.72216796875, 25.451171875, 27.18017578125, 28.9091796875, 30.63818359375, 32.3671875, 34.09619140625, 35.8251953125, 37.55419921875, 39.283203125, 41.01220703125, 42.7412109375, 44.47021484375, 46.19921875, 47.92822265625, 49.6572265625, 51.38623046875, 53.115234375, 54.84423828125, 56.5732421875, 58.30224609375, 60.03125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 11.0, 11.0, 13.0, 26.0, 55.0, 79.0, 140.0, 340.0, 1772.0, 1001.0, 274.0, 128.0, 74.0, 40.0, 32.0, 19.0, 20.0, 11.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6328125, -9.2607421875, -8.888671875, -8.5166015625, -8.14453125, -7.7724609375, -7.400390625, -7.0283203125, -6.65625, -6.2841796875, -5.912109375, -5.5400390625, -5.16796875, -4.7958984375, -4.423828125, -4.0517578125, -3.6796875, -3.3076171875, -2.935546875, -2.5634765625, -2.19140625, -1.8193359375, -1.447265625, -1.0751953125, -0.703125, -0.3310546875, 0.041015625, 0.4130859375, 0.78515625, 1.1572265625, 1.529296875, 1.9013671875, 2.2734375, 2.6455078125, 3.017578125, 3.3896484375, 3.76171875, 4.1337890625, 4.505859375, 4.8779296875, 5.25, 5.6220703125, 5.994140625, 6.3662109375, 6.73828125, 7.1103515625, 7.482421875, 7.8544921875, 8.2265625, 8.5986328125, 8.970703125, 9.3427734375, 9.71484375, 10.0869140625, 10.458984375, 10.8310546875, 11.203125, 11.5751953125, 11.947265625, 12.3193359375, 12.69140625, 13.0634765625, 13.435546875, 13.8076171875, 14.1796875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 7.0, 24.0, 81.0, 226.0, 368.0, 200.0, 64.0, 28.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.130615234375, -159.07444763183594, -154.0182647705078, -148.96209716796875, -143.9059295654297, -138.84976196289062, -133.7935791015625, -128.73741149902344, -123.68123626708984, -118.62506103515625, -113.56889343261719, -108.5127182006836, -103.45654296875, -98.40037536621094, -93.34420013427734, -88.28802490234375, -83.23185729980469, -78.1756820678711, -73.11951446533203, -68.06333923339844, -63.00716781616211, -57.95099639892578, -52.89482116699219, -47.83864974975586, -42.78247833251953, -37.7263069152832, -32.670135498046875, -27.61396026611328, -22.557788848876953, -17.501617431640625, -12.445444107055664, -7.389270782470703, -2.3331146240234375, 2.723057746887207, 7.779230117797852, 12.835402488708496, 17.89157485961914, 22.94774627685547, 28.00391960144043, 33.06009292602539, 38.11626434326172, 43.17243576049805, 48.228607177734375, 53.28478240966797, 58.3409538269043, 63.397125244140625, 68.45330047607422, 73.50947570800781, 78.56564331054688, 83.62181854248047, 88.67798614501953, 93.73416137695312, 98.79032897949219, 103.84650421142578, 108.90267944335938, 113.95884704589844, 119.01502227783203, 124.07119750976562, 129.1273651123047, 134.18353271484375, 139.23971557617188, 144.29588317871094, 149.35205078125, 154.40823364257812, 159.4644012451172]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 13.0, 16.0, 17.0, 24.0, 23.0, 31.0, 27.0, 35.0, 46.0, 48.0, 52.0, 59.0, 56.0, 48.0, 43.0, 60.0, 56.0, 48.0, 49.0, 33.0, 30.0, 25.0, 24.0, 26.0, 20.0, 22.0, 9.0, 9.0, 9.0, 8.0, 3.0, 4.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.57499313354492, -33.52218246459961, -32.4693717956543, -31.416561126708984, -30.363750457763672, -29.31093978881836, -28.258127212524414, -27.2053165435791, -26.15250587463379, -25.099695205688477, -24.046884536743164, -22.99407386779785, -21.941261291503906, -20.888450622558594, -19.83563995361328, -18.78282928466797, -17.730018615722656, -16.677207946777344, -15.624397277832031, -14.571585655212402, -13.51877498626709, -12.465964317321777, -11.413152694702148, -10.360342025756836, -9.307531356811523, -8.254720687866211, -7.20190954208374, -6.1490983963012695, -5.096287727355957, -4.0434770584106445, -2.990665912628174, -1.9378547668457031, -0.8850479125976562, 0.16776299476623535, 1.220573902130127, 2.2733848094940186, 3.32619571685791, 4.379006385803223, 5.431817531585693, 6.484628677368164, 7.537439346313477, 8.590250015258789, 9.643060684204102, 10.69587230682373, 11.748682975769043, 12.801493644714355, 13.854305267333984, 14.907115936279297, 15.95992660522461, 17.012737274169922, 18.065547943115234, 19.118358612060547, 20.17116928100586, 21.223979949951172, 22.276792526245117, 23.32960319519043, 24.382413864135742, 25.435224533081055, 26.488035202026367, 27.54084587097168, 28.593658447265625, 29.646469116210938, 30.69927978515625, 31.752090454101562, 32.804901123046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 8.0, 14.0, 22.0, 27.0, 36.0, 66.0, 120.0, 181.0, 321.0, 661.0, 1298.0, 3242.0, 10603.0, 47955.0, 276624.0, 547801.0, 125986.0, 23313.0, 6091.0, 2102.0, 926.0, 456.0, 234.0, 157.0, 94.0, 60.0, 45.0, 27.0, 19.0, 11.0, 8.0, 7.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84375, -31.6396484375, -30.435546875, -29.2314453125, -28.02734375, -26.8232421875, -25.619140625, -24.4150390625, -23.2109375, -22.0068359375, -20.802734375, -19.5986328125, -18.39453125, -17.1904296875, -15.986328125, -14.7822265625, -13.578125, -12.3740234375, -11.169921875, -9.9658203125, -8.76171875, -7.5576171875, -6.353515625, -5.1494140625, -3.9453125, -2.7412109375, -1.537109375, -0.3330078125, 0.87109375, 2.0751953125, 3.279296875, 4.4833984375, 5.6875, 6.8916015625, 8.095703125, 9.2998046875, 10.50390625, 11.7080078125, 12.912109375, 14.1162109375, 15.3203125, 16.5244140625, 17.728515625, 18.9326171875, 20.13671875, 21.3408203125, 22.544921875, 23.7490234375, 24.953125, 26.1572265625, 27.361328125, 28.5654296875, 29.76953125, 30.9736328125, 32.177734375, 33.3818359375, 34.5859375, 35.7900390625, 36.994140625, 38.1982421875, 39.40234375, 40.6064453125, 41.810546875, 43.0146484375, 44.21875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 18.0, 31.0, 45.0, 56.0, 82.0, 109.0, 111.0, 117.0, 110.0, 87.0, 75.0, 54.0, 40.0, 18.0, 12.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28125, -6.0513916015625, -5.821533203125, -5.5916748046875, -5.36181640625, -5.1319580078125, -4.902099609375, -4.6722412109375, -4.4423828125, -4.2125244140625, -3.982666015625, -3.7528076171875, -3.52294921875, -3.2930908203125, -3.063232421875, -2.8333740234375, -2.603515625, -2.3736572265625, -2.143798828125, -1.9139404296875, -1.68408203125, -1.4542236328125, -1.224365234375, -0.9945068359375, -0.7646484375, -0.5347900390625, -0.304931640625, -0.0750732421875, 0.15478515625, 0.3846435546875, 0.614501953125, 0.8443603515625, 1.07421875, 1.3040771484375, 1.533935546875, 1.7637939453125, 1.99365234375, 2.2235107421875, 2.453369140625, 2.6832275390625, 2.9130859375, 3.1429443359375, 3.372802734375, 3.6026611328125, 3.83251953125, 4.0623779296875, 4.292236328125, 4.5220947265625, 4.751953125, 4.9818115234375, 5.211669921875, 5.4415283203125, 5.67138671875, 5.9012451171875, 6.131103515625, 6.3609619140625, 6.5908203125, 6.8206787109375, 7.050537109375, 7.2803955078125, 7.51025390625, 7.7401123046875, 7.969970703125, 8.1998291015625, 8.4296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 15.0, 22.0, 22.0, 31.0, 35.0, 59.0, 78.0, 116.0, 175.0, 242.0, 408.0, 708.0, 1224.0, 2340.0, 4933.0, 11159.0, 28581.0, 77736.0, 209624.0, 370461.0, 211554.0, 78651.0, 28607.0, 11182.0, 4968.0, 2341.0, 1245.0, 684.0, 459.0, 279.0, 194.0, 129.0, 92.0, 47.0, 36.0, 25.0, 20.0, 15.0, 9.0, 8.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.74072265625, -14.1845703125, -13.62841796875, -13.072265625, -12.51611328125, -11.9599609375, -11.40380859375, -10.84765625, -10.29150390625, -9.7353515625, -9.17919921875, -8.623046875, -8.06689453125, -7.5107421875, -6.95458984375, -6.3984375, -5.84228515625, -5.2861328125, -4.72998046875, -4.173828125, -3.61767578125, -3.0615234375, -2.50537109375, -1.94921875, -1.39306640625, -0.8369140625, -0.28076171875, 0.275390625, 0.83154296875, 1.3876953125, 1.94384765625, 2.5, 3.05615234375, 3.6123046875, 4.16845703125, 4.724609375, 5.28076171875, 5.8369140625, 6.39306640625, 6.94921875, 7.50537109375, 8.0615234375, 8.61767578125, 9.173828125, 9.72998046875, 10.2861328125, 10.84228515625, 11.3984375, 11.95458984375, 12.5107421875, 13.06689453125, 13.623046875, 14.17919921875, 14.7353515625, 15.29150390625, 15.84765625, 16.40380859375, 16.9599609375, 17.51611328125, 18.072265625, 18.62841796875, 19.1845703125, 19.74072265625, 20.296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 6.0, 11.0, 14.0, 9.0, 12.0, 18.0, 21.0, 17.0, 24.0, 39.0, 39.0, 29.0, 46.0, 35.0, 49.0, 62.0, 41.0, 57.0, 56.0, 43.0, 34.0, 45.0, 39.0, 36.0, 25.0, 17.0, 35.0, 28.0, 27.0, 8.0, 19.0, 14.0, 14.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3046875, -13.833984375, -13.36328125, -12.892578125, -12.421875, -11.951171875, -11.48046875, -11.009765625, -10.5390625, -10.068359375, -9.59765625, -9.126953125, -8.65625, -8.185546875, -7.71484375, -7.244140625, -6.7734375, -6.302734375, -5.83203125, -5.361328125, -4.890625, -4.419921875, -3.94921875, -3.478515625, -3.0078125, -2.537109375, -2.06640625, -1.595703125, -1.125, -0.654296875, -0.18359375, 0.287109375, 0.7578125, 1.228515625, 1.69921875, 2.169921875, 2.640625, 3.111328125, 3.58203125, 4.052734375, 4.5234375, 4.994140625, 5.46484375, 5.935546875, 6.40625, 6.876953125, 7.34765625, 7.818359375, 8.2890625, 8.759765625, 9.23046875, 9.701171875, 10.171875, 10.642578125, 11.11328125, 11.583984375, 12.0546875, 12.525390625, 12.99609375, 13.466796875, 13.9375, 14.408203125, 14.87890625, 15.349609375, 15.8203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 2.0, 5.0, 7.0, 5.0, 4.0, 16.0, 26.0, 23.0, 36.0, 51.0, 62.0, 121.0, 223.0, 347.0, 611.0, 1265.0, 3037.0, 8332.0, 29202.0, 123858.0, 439001.0, 332363.0, 79479.0, 19811.0, 6095.0, 2232.0, 1040.0, 470.0, 276.0, 167.0, 106.0, 68.0, 57.0, 31.0, 23.0, 24.0, 12.0, 12.0, 6.0, 6.0, 6.0, 9.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-10.546875, -10.225830078125, -9.90478515625, -9.583740234375, -9.2626953125, -8.941650390625, -8.62060546875, -8.299560546875, -7.978515625, -7.657470703125, -7.33642578125, -7.015380859375, -6.6943359375, -6.373291015625, -6.05224609375, -5.731201171875, -5.41015625, -5.089111328125, -4.76806640625, -4.447021484375, -4.1259765625, -3.804931640625, -3.48388671875, -3.162841796875, -2.841796875, -2.520751953125, -2.19970703125, -1.878662109375, -1.5576171875, -1.236572265625, -0.91552734375, -0.594482421875, -0.2734375, 0.047607421875, 0.36865234375, 0.689697265625, 1.0107421875, 1.331787109375, 1.65283203125, 1.973876953125, 2.294921875, 2.615966796875, 2.93701171875, 3.258056640625, 3.5791015625, 3.900146484375, 4.22119140625, 4.542236328125, 4.86328125, 5.184326171875, 5.50537109375, 5.826416015625, 6.1474609375, 6.468505859375, 6.78955078125, 7.110595703125, 7.431640625, 7.752685546875, 8.07373046875, 8.394775390625, 8.7158203125, 9.036865234375, 9.35791015625, 9.678955078125, 10.0]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 10.0, 15.0, 14.0, 10.0, 22.0, 33.0, 40.0, 53.0, 59.0, 60.0, 70.0, 78.0, 91.0, 71.0, 81.0, 50.0, 42.0, 39.0, 31.0, 23.0, 13.0, 18.0, 12.0, 8.0, 8.0, 6.0, 2.0, 7.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014743804931640625, -0.0014344602823257446, -0.0013945400714874268, -0.0013546198606491089, -0.001314699649810791, -0.0012747794389724731, -0.0012348592281341553, -0.0011949390172958374, -0.0011550188064575195, -0.0011150985956192017, -0.0010751783847808838, -0.001035258173942566, -0.000995337963104248, -0.0009554177522659302, -0.0009154975414276123, -0.0008755773305892944, -0.0008356571197509766, -0.0007957369089126587, -0.0007558166980743408, -0.000715896487236023, -0.0006759762763977051, -0.0006360560655593872, -0.0005961358547210693, -0.0005562156438827515, -0.0005162954330444336, -0.0004763752222061157, -0.00043645501136779785, -0.00039653480052948, -0.0003566145896911621, -0.00031669437885284424, -0.00027677416801452637, -0.0002368539571762085, -0.00019693374633789062, -0.00015701353549957275, -0.00011709332466125488, -7.717311382293701e-05, -3.725290298461914e-05, 2.6673078536987305e-06, 4.25875186920166e-05, 8.250772953033447e-05, 0.00012242794036865234, 0.00016234815120697021, 0.00020226836204528809, 0.00024218857288360596, 0.00028210878372192383, 0.0003220289945602417, 0.00036194920539855957, 0.00040186941623687744, 0.0004417896270751953, 0.0004817098379135132, 0.0005216300487518311, 0.0005615502595901489, 0.0006014704704284668, 0.0006413906812667847, 0.0006813108921051025, 0.0007212311029434204, 0.0007611513137817383, 0.0008010715246200562, 0.000840991735458374, 0.0008809119462966919, 0.0009208321571350098, 0.0009607523679733276, 0.0010006725788116455, 0.0010405927896499634, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 19.0, 23.0, 27.0, 26.0, 79.0, 111.0, 173.0, 342.0, 592.0, 1171.0, 2240.0, 5011.0, 12955.0, 41201.0, 166137.0, 483733.0, 245848.0, 58999.0, 17626.0, 6381.0, 2796.0, 1407.0, 669.0, 400.0, 208.0, 128.0, 88.0, 53.0, 20.0, 23.0, 19.0, 13.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-12.53125, -12.189208984375, -11.84716796875, -11.505126953125, -11.1630859375, -10.821044921875, -10.47900390625, -10.136962890625, -9.794921875, -9.452880859375, -9.11083984375, -8.768798828125, -8.4267578125, -8.084716796875, -7.74267578125, -7.400634765625, -7.05859375, -6.716552734375, -6.37451171875, -6.032470703125, -5.6904296875, -5.348388671875, -5.00634765625, -4.664306640625, -4.322265625, -3.980224609375, -3.63818359375, -3.296142578125, -2.9541015625, -2.612060546875, -2.27001953125, -1.927978515625, -1.5859375, -1.243896484375, -0.90185546875, -0.559814453125, -0.2177734375, 0.124267578125, 0.46630859375, 0.808349609375, 1.150390625, 1.492431640625, 1.83447265625, 2.176513671875, 2.5185546875, 2.860595703125, 3.20263671875, 3.544677734375, 3.88671875, 4.228759765625, 4.57080078125, 4.912841796875, 5.2548828125, 5.596923828125, 5.93896484375, 6.281005859375, 6.623046875, 6.965087890625, 7.30712890625, 7.649169921875, 7.9912109375, 8.333251953125, 8.67529296875, 9.017333984375, 9.359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 9.0, 12.0, 19.0, 24.0, 33.0, 33.0, 42.0, 61.0, 56.0, 71.0, 85.0, 80.0, 72.0, 74.0, 60.0, 53.0, 36.0, 36.0, 22.0, 12.0, 16.0, 15.0, 10.0, 8.0, 10.0, 3.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.92279052734375, -5.7205810546875, -5.51837158203125, -5.316162109375, -5.11395263671875, -4.9117431640625, -4.70953369140625, -4.50732421875, -4.30511474609375, -4.1029052734375, -3.90069580078125, -3.698486328125, -3.49627685546875, -3.2940673828125, -3.09185791015625, -2.8896484375, -2.68743896484375, -2.4852294921875, -2.28302001953125, -2.080810546875, -1.87860107421875, -1.6763916015625, -1.47418212890625, -1.27197265625, -1.06976318359375, -0.8675537109375, -0.66534423828125, -0.463134765625, -0.26092529296875, -0.0587158203125, 0.14349365234375, 0.345703125, 0.54791259765625, 0.7501220703125, 0.95233154296875, 1.154541015625, 1.35675048828125, 1.5589599609375, 1.76116943359375, 1.96337890625, 2.16558837890625, 2.3677978515625, 2.57000732421875, 2.772216796875, 2.97442626953125, 3.1766357421875, 3.37884521484375, 3.5810546875, 3.78326416015625, 3.9854736328125, 4.18768310546875, 4.389892578125, 4.59210205078125, 4.7943115234375, 4.99652099609375, 5.19873046875, 5.40093994140625, 5.6031494140625, 5.80535888671875, 6.007568359375, 6.20977783203125, 6.4119873046875, 6.61419677734375, 6.81640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 14.0, 21.0, 58.0, 137.0, 237.0, 273.0, 159.0, 75.0, 22.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.6604919433594, -280.36700439453125, -271.0735168457031, -261.780029296875, -252.48654174804688, -243.19305419921875, -233.89956665039062, -224.6060791015625, -215.31259155273438, -206.01910400390625, -196.72561645507812, -187.43212890625, -178.13864135742188, -168.84515380859375, -159.55166625976562, -150.2581787109375, -140.96469116210938, -131.67120361328125, -122.37771606445312, -113.084228515625, -103.79074096679688, -94.49725341796875, -85.20376586914062, -75.9102783203125, -66.61679077148438, -57.32330322265625, -48.029815673828125, -38.736328125, -29.442840576171875, -20.14935302734375, -10.855865478515625, -1.5623779296875, 7.73114013671875, 17.024627685546875, 26.318115234375, 35.611602783203125, 44.90509033203125, 54.198577880859375, 63.4920654296875, 72.78555297851562, 82.07904052734375, 91.37252807617188, 100.666015625, 109.95950317382812, 119.25299072265625, 128.54647827148438, 137.8399658203125, 147.13345336914062, 156.42694091796875, 165.72042846679688, 175.013916015625, 184.30740356445312, 193.60089111328125, 202.89437866210938, 212.1878662109375, 221.48135375976562, 230.77484130859375, 240.06832885742188, 249.36181640625, 258.6553039550781, 267.94879150390625, 277.2422790527344, 286.5357666015625, 295.8292541503906, 305.12274169921875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 3.0, 10.0, 14.0, 11.0, 24.0, 22.0, 18.0, 14.0, 36.0, 27.0, 36.0, 40.0, 43.0, 56.0, 51.0, 62.0, 53.0, 48.0, 33.0, 57.0, 47.0, 49.0, 46.0, 32.0, 24.0, 17.0, 25.0, 20.0, 14.0, 23.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.94471740722656, -86.02000427246094, -83.09529876708984, -80.17058563232422, -77.2458724975586, -74.32115936279297, -71.39645385742188, -68.47174072265625, -65.54702758789062, -62.622318267822266, -59.69760513305664, -56.77289581298828, -53.848182678222656, -50.9234733581543, -47.99876403808594, -45.07405090332031, -42.14934158325195, -39.224632263183594, -36.29991912841797, -33.37520980834961, -30.450496673583984, -27.525787353515625, -24.601076126098633, -21.67636489868164, -18.75165367126465, -15.826942443847656, -12.902231216430664, -9.977520942687988, -7.052809715270996, -4.128098487854004, -1.2033882141113281, 1.721323013305664, 4.646034240722656, 7.570745468139648, 10.49545669555664, 13.420166969299316, 16.344879150390625, 19.269588470458984, 22.194299697875977, 25.11901092529297, 28.04372215270996, 30.968433380126953, 33.89314270019531, 36.81785583496094, 39.7425651550293, 42.66727828979492, 45.59198760986328, 48.516700744628906, 51.441410064697266, 54.366119384765625, 57.29083251953125, 60.21554183959961, 63.140254974365234, 66.0649642944336, 68.98967742919922, 71.91438293457031, 74.83909606933594, 77.76380920410156, 80.68851470947266, 83.61322784423828, 86.5379409790039, 89.46265411376953, 92.38735961914062, 95.31207275390625, 98.23678588867188]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 14.0, 16.0, 14.0, 14.0, 32.0, 63.0, 63.0, 118.0, 228.0, 412.0, 975.0, 2533.0, 8095.0, 36898.0, 504503.0, 3555053.0, 66350.0, 12475.0, 3636.0, 1377.0, 617.0, 295.0, 168.0, 94.0, 60.0, 42.0, 24.0, 20.0, 17.0, 20.0, 7.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.6875, -56.91748046875, -55.1474609375, -53.37744140625, -51.607421875, -49.83740234375, -48.0673828125, -46.29736328125, -44.52734375, -42.75732421875, -40.9873046875, -39.21728515625, -37.447265625, -35.67724609375, -33.9072265625, -32.13720703125, -30.3671875, -28.59716796875, -26.8271484375, -25.05712890625, -23.287109375, -21.51708984375, -19.7470703125, -17.97705078125, -16.20703125, -14.43701171875, -12.6669921875, -10.89697265625, -9.126953125, -7.35693359375, -5.5869140625, -3.81689453125, -2.046875, -0.27685546875, 1.4931640625, 3.26318359375, 5.033203125, 6.80322265625, 8.5732421875, 10.34326171875, 12.11328125, 13.88330078125, 15.6533203125, 17.42333984375, 19.193359375, 20.96337890625, 22.7333984375, 24.50341796875, 26.2734375, 28.04345703125, 29.8134765625, 31.58349609375, 33.353515625, 35.12353515625, 36.8935546875, 38.66357421875, 40.43359375, 42.20361328125, 43.9736328125, 45.74365234375, 47.513671875, 49.28369140625, 51.0537109375, 52.82373046875, 54.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 12.0, 31.0, 48.0, 56.0, 69.0, 82.0, 107.0, 139.0, 115.0, 107.0, 76.0, 53.0, 43.0, 21.0, 15.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.581298828125, -6.34228515625, -6.103271484375, -5.8642578125, -5.625244140625, -5.38623046875, -5.147216796875, -4.908203125, -4.669189453125, -4.43017578125, -4.191162109375, -3.9521484375, -3.713134765625, -3.47412109375, -3.235107421875, -2.99609375, -2.757080078125, -2.51806640625, -2.279052734375, -2.0400390625, -1.801025390625, -1.56201171875, -1.322998046875, -1.083984375, -0.844970703125, -0.60595703125, -0.366943359375, -0.1279296875, 0.111083984375, 0.35009765625, 0.589111328125, 0.828125, 1.067138671875, 1.30615234375, 1.545166015625, 1.7841796875, 2.023193359375, 2.26220703125, 2.501220703125, 2.740234375, 2.979248046875, 3.21826171875, 3.457275390625, 3.6962890625, 3.935302734375, 4.17431640625, 4.413330078125, 4.65234375, 4.891357421875, 5.13037109375, 5.369384765625, 5.6083984375, 5.847412109375, 6.08642578125, 6.325439453125, 6.564453125, 6.803466796875, 7.04248046875, 7.281494140625, 7.5205078125, 7.759521484375, 7.99853515625, 8.237548828125, 8.4765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 9.0, 21.0, 34.0, 44.0, 68.0, 158.0, 383.0, 929.0, 3324.0, 28035.0, 3989637.0, 161786.0, 6876.0, 1664.0, 691.0, 265.0, 142.0, 63.0, 42.0, 22.0, 20.0, 26.0, 19.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.125, -86.7509765625, -83.376953125, -80.0029296875, -76.62890625, -73.2548828125, -69.880859375, -66.5068359375, -63.1328125, -59.7587890625, -56.384765625, -53.0107421875, -49.63671875, -46.2626953125, -42.888671875, -39.5146484375, -36.140625, -32.7666015625, -29.392578125, -26.0185546875, -22.64453125, -19.2705078125, -15.896484375, -12.5224609375, -9.1484375, -5.7744140625, -2.400390625, 0.9736328125, 4.34765625, 7.7216796875, 11.095703125, 14.4697265625, 17.84375, 21.2177734375, 24.591796875, 27.9658203125, 31.33984375, 34.7138671875, 38.087890625, 41.4619140625, 44.8359375, 48.2099609375, 51.583984375, 54.9580078125, 58.33203125, 61.7060546875, 65.080078125, 68.4541015625, 71.828125, 75.2021484375, 78.576171875, 81.9501953125, 85.32421875, 88.6982421875, 92.072265625, 95.4462890625, 98.8203125, 102.1943359375, 105.568359375, 108.9423828125, 112.31640625, 115.6904296875, 119.064453125, 122.4384765625, 125.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 21.0, 61.0, 106.0, 300.0, 1576.0, 1503.0, 282.0, 115.0, 35.0, 26.0, 15.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.6875, -17.875, -17.0625, -16.25, -15.4375, -14.625, -13.8125, -13.0, -12.1875, -11.375, -10.5625, -9.75, -8.9375, -8.125, -7.3125, -6.5, -5.6875, -4.875, -4.0625, -3.25, -2.4375, -1.625, -0.8125, 0.0, 0.8125, 1.625, 2.4375, 3.25, 4.0625, 4.875, 5.6875, 6.5, 7.3125, 8.125, 8.9375, 9.75, 10.5625, 11.375, 12.1875, 13.0, 13.8125, 14.625, 15.4375, 16.25, 17.0625, 17.875, 18.6875, 19.5, 20.3125, 21.125, 21.9375, 22.75, 23.5625, 24.375, 25.1875, 26.0, 26.8125, 27.625, 28.4375, 29.25, 30.0625, 30.875, 31.6875, 32.5]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 16.0, 39.0, 111.0, 235.0, 289.0, 188.0, 75.0, 21.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-321.3175048828125, -314.67431640625, -308.0311584472656, -301.3879699707031, -294.7447814941406, -288.10162353515625, -281.45843505859375, -274.81524658203125, -268.17205810546875, -261.52886962890625, -254.8856964111328, -248.24252319335938, -241.59933471679688, -234.95616149902344, -228.31298828125, -221.6697998046875, -215.02664184570312, -208.3834686279297, -201.7402801513672, -195.09710693359375, -188.45391845703125, -181.8107452392578, -175.16757202148438, -168.52438354492188, -161.88119506835938, -155.23802185058594, -148.59483337402344, -141.95166015625, -135.3084716796875, -128.66529846191406, -122.0221176147461, -115.37893676757812, -108.73575592041016, -102.09257507324219, -95.44939422607422, -88.80621337890625, -82.16304016113281, -75.51985931396484, -68.87667846679688, -62.23350143432617, -55.5903205871582, -48.947139739990234, -42.30396270751953, -35.66078186035156, -29.017602920532227, -22.37442398071289, -15.731243133544922, -9.088066101074219, -2.44488525390625, 4.198294162750244, 10.841473579406738, 17.48465347290039, 24.127832412719727, 30.771011352539062, 37.41419219970703, 44.057369232177734, 50.7005500793457, 57.34373092651367, 63.986907958984375, 70.63008880615234, 77.27326965332031, 83.91644287109375, 90.55963134765625, 97.20280456542969, 103.84598541259766]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 16.0, 25.0, 37.0, 42.0, 59.0, 74.0, 75.0, 88.0, 94.0, 106.0, 97.0, 84.0, 61.0, 40.0, 34.0, 23.0, 14.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-92.70051574707031, -89.85249328613281, -87.00447845458984, -84.15645599365234, -81.30844116210938, -78.46041870117188, -75.61239624023438, -72.76437377929688, -69.9163589477539, -67.0683364868164, -64.22032165527344, -61.37229919433594, -58.5242805480957, -55.67626190185547, -52.82823944091797, -49.980220794677734, -47.1322021484375, -44.284183502197266, -41.43616485595703, -38.58814239501953, -35.7401237487793, -32.89210510253906, -30.044084548950195, -27.196063995361328, -24.348045349121094, -21.50002670288086, -18.652006149291992, -15.803986549377441, -12.95596694946289, -10.10794734954834, -7.259927749633789, -4.411907196044922, -1.5638885498046875, 1.2841310501098633, 4.132150650024414, 6.980170249938965, 9.828189849853516, 12.676209449768066, 15.524229049682617, 18.372249603271484, 21.22026824951172, 24.068286895751953, 26.91630744934082, 29.764328002929688, 32.61234664916992, 35.460365295410156, 38.308387756347656, 41.15640640258789, 44.004425048828125, 46.85244369506836, 49.700462341308594, 52.548484802246094, 55.39650344848633, 58.24452209472656, 61.09254455566406, 63.9405632019043, 66.78858184814453, 69.63660430908203, 72.484619140625, 75.3326416015625, 78.1806640625, 81.02867889404297, 83.87670135498047, 86.72471618652344, 89.57273864746094]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 16.0, 26.0, 15.0, 25.0, 42.0, 69.0, 114.0, 143.0, 233.0, 411.0, 711.0, 1427.0, 3321.0, 11921.0, 66978.0, 540631.0, 361288.0, 46671.0, 8861.0, 2816.0, 1196.0, 614.0, 349.0, 223.0, 137.0, 107.0, 66.0, 40.0, 26.0, 15.0, 14.0, 15.0, 10.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.53125, -45.9931640625, -44.455078125, -42.9169921875, -41.37890625, -39.8408203125, -38.302734375, -36.7646484375, -35.2265625, -33.6884765625, -32.150390625, -30.6123046875, -29.07421875, -27.5361328125, -25.998046875, -24.4599609375, -22.921875, -21.3837890625, -19.845703125, -18.3076171875, -16.76953125, -15.2314453125, -13.693359375, -12.1552734375, -10.6171875, -9.0791015625, -7.541015625, -6.0029296875, -4.46484375, -2.9267578125, -1.388671875, 0.1494140625, 1.6875, 3.2255859375, 4.763671875, 6.3017578125, 7.83984375, 9.3779296875, 10.916015625, 12.4541015625, 13.9921875, 15.5302734375, 17.068359375, 18.6064453125, 20.14453125, 21.6826171875, 23.220703125, 24.7587890625, 26.296875, 27.8349609375, 29.373046875, 30.9111328125, 32.44921875, 33.9873046875, 35.525390625, 37.0634765625, 38.6015625, 40.1396484375, 41.677734375, 43.2158203125, 44.75390625, 46.2919921875, 47.830078125, 49.3681640625, 50.90625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 14.0, 27.0, 51.0, 53.0, 72.0, 100.0, 113.0, 113.0, 124.0, 95.0, 68.0, 63.0, 43.0, 13.0, 15.0, 11.0, 6.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.481201171875, -8.22802734375, -7.974853515625, -7.7216796875, -7.468505859375, -7.21533203125, -6.962158203125, -6.708984375, -6.455810546875, -6.20263671875, -5.949462890625, -5.6962890625, -5.443115234375, -5.18994140625, -4.936767578125, -4.68359375, -4.430419921875, -4.17724609375, -3.924072265625, -3.6708984375, -3.417724609375, -3.16455078125, -2.911376953125, -2.658203125, -2.405029296875, -2.15185546875, -1.898681640625, -1.6455078125, -1.392333984375, -1.13916015625, -0.885986328125, -0.6328125, -0.379638671875, -0.12646484375, 0.126708984375, 0.3798828125, 0.633056640625, 0.88623046875, 1.139404296875, 1.392578125, 1.645751953125, 1.89892578125, 2.152099609375, 2.4052734375, 2.658447265625, 2.91162109375, 3.164794921875, 3.41796875, 3.671142578125, 3.92431640625, 4.177490234375, 4.4306640625, 4.683837890625, 4.93701171875, 5.190185546875, 5.443359375, 5.696533203125, 5.94970703125, 6.202880859375, 6.4560546875, 6.709228515625, 6.96240234375, 7.215576171875, 7.46875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 13.0, 14.0, 12.0, 19.0, 40.0, 45.0, 56.0, 90.0, 130.0, 176.0, 269.0, 425.0, 616.0, 1107.0, 1995.0, 3765.0, 7498.0, 15630.0, 34122.0, 76985.0, 173919.0, 337401.0, 217274.0, 95672.0, 42288.0, 19216.0, 9193.0, 4633.0, 2471.0, 1267.0, 797.0, 476.0, 296.0, 180.0, 121.0, 93.0, 68.0, 53.0, 37.0, 22.0, 18.0, 12.0, 10.0, 12.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.546875, -11.1290283203125, -10.711181640625, -10.2933349609375, -9.87548828125, -9.4576416015625, -9.039794921875, -8.6219482421875, -8.2041015625, -7.7862548828125, -7.368408203125, -6.9505615234375, -6.53271484375, -6.1148681640625, -5.697021484375, -5.2791748046875, -4.861328125, -4.4434814453125, -4.025634765625, -3.6077880859375, -3.18994140625, -2.7720947265625, -2.354248046875, -1.9364013671875, -1.5185546875, -1.1007080078125, -0.682861328125, -0.2650146484375, 0.15283203125, 0.5706787109375, 0.988525390625, 1.4063720703125, 1.82421875, 2.2420654296875, 2.659912109375, 3.0777587890625, 3.49560546875, 3.9134521484375, 4.331298828125, 4.7491455078125, 5.1669921875, 5.5848388671875, 6.002685546875, 6.4205322265625, 6.83837890625, 7.2562255859375, 7.674072265625, 8.0919189453125, 8.509765625, 8.9276123046875, 9.345458984375, 9.7633056640625, 10.18115234375, 10.5989990234375, 11.016845703125, 11.4346923828125, 11.8525390625, 12.2703857421875, 12.688232421875, 13.1060791015625, 13.52392578125, 13.9417724609375, 14.359619140625, 14.7774658203125, 15.1953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 8.0, 10.0, 17.0, 16.0, 23.0, 33.0, 33.0, 35.0, 49.0, 53.0, 42.0, 57.0, 43.0, 64.0, 68.0, 60.0, 46.0, 51.0, 43.0, 42.0, 38.0, 34.0, 20.0, 21.0, 29.0, 17.0, 12.0, 7.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15625, -19.597412109375, -19.03857421875, -18.479736328125, -17.9208984375, -17.362060546875, -16.80322265625, -16.244384765625, -15.685546875, -15.126708984375, -14.56787109375, -14.009033203125, -13.4501953125, -12.891357421875, -12.33251953125, -11.773681640625, -11.21484375, -10.656005859375, -10.09716796875, -9.538330078125, -8.9794921875, -8.420654296875, -7.86181640625, -7.302978515625, -6.744140625, -6.185302734375, -5.62646484375, -5.067626953125, -4.5087890625, -3.949951171875, -3.39111328125, -2.832275390625, -2.2734375, -1.714599609375, -1.15576171875, -0.596923828125, -0.0380859375, 0.520751953125, 1.07958984375, 1.638427734375, 2.197265625, 2.756103515625, 3.31494140625, 3.873779296875, 4.4326171875, 4.991455078125, 5.55029296875, 6.109130859375, 6.66796875, 7.226806640625, 7.78564453125, 8.344482421875, 8.9033203125, 9.462158203125, 10.02099609375, 10.579833984375, 11.138671875, 11.697509765625, 12.25634765625, 12.815185546875, 13.3740234375, 13.932861328125, 14.49169921875, 15.050537109375, 15.609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 22.0, 17.0, 41.0, 59.0, 97.0, 129.0, 265.0, 425.0, 811.0, 1499.0, 3185.0, 7813.0, 26848.0, 152060.0, 641025.0, 169938.0, 29199.0, 8310.0, 3300.0, 1603.0, 783.0, 443.0, 247.0, 145.0, 98.0, 67.0, 33.0, 25.0, 19.0, 9.0, 8.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.7398681640625, -13.221923828125, -12.7039794921875, -12.18603515625, -11.6680908203125, -11.150146484375, -10.6322021484375, -10.1142578125, -9.5963134765625, -9.078369140625, -8.5604248046875, -8.04248046875, -7.5245361328125, -7.006591796875, -6.4886474609375, -5.970703125, -5.4527587890625, -4.934814453125, -4.4168701171875, -3.89892578125, -3.3809814453125, -2.863037109375, -2.3450927734375, -1.8271484375, -1.3092041015625, -0.791259765625, -0.2733154296875, 0.24462890625, 0.7625732421875, 1.280517578125, 1.7984619140625, 2.31640625, 2.8343505859375, 3.352294921875, 3.8702392578125, 4.38818359375, 4.9061279296875, 5.424072265625, 5.9420166015625, 6.4599609375, 6.9779052734375, 7.495849609375, 8.0137939453125, 8.53173828125, 9.0496826171875, 9.567626953125, 10.0855712890625, 10.603515625, 11.1214599609375, 11.639404296875, 12.1573486328125, 12.67529296875, 13.1932373046875, 13.711181640625, 14.2291259765625, 14.7470703125, 15.2650146484375, 15.782958984375, 16.3009033203125, 16.81884765625, 17.3367919921875, 17.854736328125, 18.3726806640625, 18.890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 12.0, 29.0, 26.0, 40.0, 84.0, 94.0, 163.0, 165.0, 114.0, 74.0, 45.0, 31.0, 11.0, 21.0, 17.0, 7.0, 8.0, 4.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018243789672851562, -0.0017514973878860474, -0.0016786158084869385, -0.0016057342290878296, -0.0015328526496887207, -0.0014599710702896118, -0.001387089490890503, -0.001314207911491394, -0.0012413263320922852, -0.0011684447526931763, -0.0010955631732940674, -0.0010226815938949585, -0.0009498000144958496, -0.0008769184350967407, -0.0008040368556976318, -0.000731155276298523, -0.0006582736968994141, -0.0005853921175003052, -0.0005125105381011963, -0.0004396289587020874, -0.0003667473793029785, -0.00029386579990386963, -0.00022098422050476074, -0.00014810264110565186, -7.522106170654297e-05, -2.339482307434082e-06, 7.05420970916748e-05, 0.0001434236764907837, 0.00021630525588989258, 0.00028918683528900146, 0.00036206841468811035, 0.00043494999408721924, 0.0005078315734863281, 0.000580713152885437, 0.0006535947322845459, 0.0007264763116836548, 0.0007993578910827637, 0.0008722394704818726, 0.0009451210498809814, 0.0010180026292800903, 0.0010908842086791992, 0.001163765788078308, 0.001236647367477417, 0.0013095289468765259, 0.0013824105262756348, 0.0014552921056747437, 0.0015281736850738525, 0.0016010552644729614, 0.0016739368438720703, 0.0017468184232711792, 0.001819700002670288, 0.001892581582069397, 0.001965463161468506, 0.0020383447408676147, 0.0021112263202667236, 0.0021841078996658325, 0.0022569894790649414, 0.0023298710584640503, 0.002402752637863159, 0.002475634217262268, 0.002548515796661377, 0.002621397376060486, 0.0026942789554595947, 0.0027671605348587036, 0.0028400421142578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 9.0, 3.0, 10.0, 10.0, 22.0, 32.0, 39.0, 51.0, 86.0, 107.0, 173.0, 287.0, 410.0, 639.0, 1058.0, 1906.0, 3415.0, 6842.0, 15192.0, 41149.0, 156332.0, 500134.0, 228968.0, 54656.0, 18891.0, 8325.0, 4188.0, 2200.0, 1288.0, 728.0, 436.0, 325.0, 190.0, 144.0, 89.0, 56.0, 39.0, 33.0, 22.0, 11.0, 8.0, 8.0, 13.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-11.65625, -11.275634765625, -10.89501953125, -10.514404296875, -10.1337890625, -9.753173828125, -9.37255859375, -8.991943359375, -8.611328125, -8.230712890625, -7.85009765625, -7.469482421875, -7.0888671875, -6.708251953125, -6.32763671875, -5.947021484375, -5.56640625, -5.185791015625, -4.80517578125, -4.424560546875, -4.0439453125, -3.663330078125, -3.28271484375, -2.902099609375, -2.521484375, -2.140869140625, -1.76025390625, -1.379638671875, -0.9990234375, -0.618408203125, -0.23779296875, 0.142822265625, 0.5234375, 0.904052734375, 1.28466796875, 1.665283203125, 2.0458984375, 2.426513671875, 2.80712890625, 3.187744140625, 3.568359375, 3.948974609375, 4.32958984375, 4.710205078125, 5.0908203125, 5.471435546875, 5.85205078125, 6.232666015625, 6.61328125, 6.993896484375, 7.37451171875, 7.755126953125, 8.1357421875, 8.516357421875, 8.89697265625, 9.277587890625, 9.658203125, 10.038818359375, 10.41943359375, 10.800048828125, 11.1806640625, 11.561279296875, 11.94189453125, 12.322509765625, 12.703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 4.0, 7.0, 3.0, 9.0, 11.0, 16.0, 17.0, 25.0, 30.0, 48.0, 62.0, 85.0, 85.0, 96.0, 103.0, 77.0, 76.0, 58.0, 49.0, 32.0, 26.0, 17.0, 7.0, 12.0, 10.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6875, -11.3697509765625, -11.052001953125, -10.7342529296875, -10.41650390625, -10.0987548828125, -9.781005859375, -9.4632568359375, -9.1455078125, -8.8277587890625, -8.510009765625, -8.1922607421875, -7.87451171875, -7.5567626953125, -7.239013671875, -6.9212646484375, -6.603515625, -6.2857666015625, -5.968017578125, -5.6502685546875, -5.33251953125, -5.0147705078125, -4.697021484375, -4.3792724609375, -4.0615234375, -3.7437744140625, -3.426025390625, -3.1082763671875, -2.79052734375, -2.4727783203125, -2.155029296875, -1.8372802734375, -1.51953125, -1.2017822265625, -0.884033203125, -0.5662841796875, -0.24853515625, 0.0692138671875, 0.386962890625, 0.7047119140625, 1.0224609375, 1.3402099609375, 1.657958984375, 1.9757080078125, 2.29345703125, 2.6112060546875, 2.928955078125, 3.2467041015625, 3.564453125, 3.8822021484375, 4.199951171875, 4.5177001953125, 4.83544921875, 5.1531982421875, 5.470947265625, 5.7886962890625, 6.1064453125, 6.4241943359375, 6.741943359375, 7.0596923828125, 7.37744140625, 7.6951904296875, 8.012939453125, 8.3306884765625, 8.6484375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 8.0, 9.0, 6.0, 10.0, 33.0, 45.0, 78.0, 94.0, 125.0, 153.0, 136.0, 123.0, 75.0, 45.0, 30.0, 18.0, 9.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-258.61578369140625, -253.43629455566406, -248.2567901611328, -243.07730102539062, -237.89781188964844, -232.71832275390625, -227.538818359375, -222.3593292236328, -217.17984008789062, -212.00035095214844, -206.8208465576172, -201.641357421875, -196.4618682861328, -191.28237915039062, -186.10287475585938, -180.9233856201172, -175.74388122558594, -170.56439208984375, -165.3848876953125, -160.2053985595703, -155.02590942382812, -149.84640502929688, -144.6669158935547, -139.4874267578125, -134.30792236328125, -129.12843322753906, -123.94893646240234, -118.76943969726562, -113.58995056152344, -108.41045379638672, -103.23095703125, -98.05146789550781, -92.87199401855469, -87.69249725341797, -82.51300811767578, -77.33351135253906, -72.15402221679688, -66.97452545166016, -61.79502868652344, -56.615535736083984, -51.43604278564453, -46.25654983520508, -41.077056884765625, -35.897560119628906, -30.718067169189453, -25.53857421875, -20.359079360961914, -15.179584503173828, -10.000091552734375, -4.8205976486206055, 0.35889625549316406, 5.538390159606934, 10.717884063720703, 15.897377014160156, 21.076871871948242, 26.256366729736328, 31.43585968017578, 36.615352630615234, 41.79484558105469, 46.974342346191406, 52.15383529663086, 57.33332824707031, 62.51282501220703, 67.69232177734375, 72.87181091308594]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 6.0, 10.0, 15.0, 16.0, 20.0, 24.0, 17.0, 27.0, 23.0, 25.0, 28.0, 31.0, 29.0, 46.0, 52.0, 51.0, 37.0, 39.0, 53.0, 45.0, 64.0, 42.0, 33.0, 33.0, 35.0, 37.0, 23.0, 21.0, 22.0, 16.0, 17.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.3358154296875, -87.82262420654297, -85.30943298339844, -82.79623413085938, -80.28304290771484, -77.76985168457031, -75.25666046142578, -72.74346923828125, -70.23027038574219, -67.71707916259766, -65.20388793945312, -62.69069290161133, -60.17749786376953, -57.664306640625, -55.15111541748047, -52.63792037963867, -50.12472915649414, -47.61153793334961, -45.09834289550781, -42.58515167236328, -40.071956634521484, -37.55876541137695, -35.045570373535156, -32.532379150390625, -30.01918601989746, -27.505992889404297, -24.992799758911133, -22.47960662841797, -19.966415405273438, -17.45322036743164, -14.94002914428711, -12.426836013793945, -9.913642883300781, -7.400449752807617, -4.887257099151611, -2.3740644454956055, 0.1391286849975586, 2.6523218154907227, 5.16551399230957, 7.678707122802734, 10.191900253295898, 12.705093383789062, 15.218286514282227, 17.73147964477539, 20.244670867919922, 22.75786590576172, 25.27105712890625, 27.784250259399414, 30.297443389892578, 32.81063461303711, 35.323829650878906, 37.83702087402344, 40.350215911865234, 42.863407135009766, 45.37660217285156, 47.889793395996094, 50.402984619140625, 52.916175842285156, 55.42937088012695, 57.942562103271484, 60.45575714111328, 62.96894836425781, 65.48213958740234, 67.99533081054688, 70.50852966308594]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 11.0, 10.0, 9.0, 19.0, 39.0, 54.0, 84.0, 151.0, 317.0, 616.0, 1587.0, 5467.0, 31768.0, 3581675.0, 544553.0, 21214.0, 4078.0, 1277.0, 550.0, 319.0, 162.0, 120.0, 70.0, 35.0, 24.0, 14.0, 16.0, 14.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.75, -72.4072265625, -70.064453125, -67.7216796875, -65.37890625, -63.0361328125, -60.693359375, -58.3505859375, -56.0078125, -53.6650390625, -51.322265625, -48.9794921875, -46.63671875, -44.2939453125, -41.951171875, -39.6083984375, -37.265625, -34.9228515625, -32.580078125, -30.2373046875, -27.89453125, -25.5517578125, -23.208984375, -20.8662109375, -18.5234375, -16.1806640625, -13.837890625, -11.4951171875, -9.15234375, -6.8095703125, -4.466796875, -2.1240234375, 0.21875, 2.5615234375, 4.904296875, 7.2470703125, 9.58984375, 11.9326171875, 14.275390625, 16.6181640625, 18.9609375, 21.3037109375, 23.646484375, 25.9892578125, 28.33203125, 30.6748046875, 33.017578125, 35.3603515625, 37.703125, 40.0458984375, 42.388671875, 44.7314453125, 47.07421875, 49.4169921875, 51.759765625, 54.1025390625, 56.4453125, 58.7880859375, 61.130859375, 63.4736328125, 65.81640625, 68.1591796875, 70.501953125, 72.8447265625, 75.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 18.0, 42.0, 62.0, 72.0, 79.0, 101.0, 99.0, 119.0, 91.0, 88.0, 84.0, 40.0, 24.0, 20.0, 16.0, 10.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.4012451171875, -8.154052734375, -7.9068603515625, -7.65966796875, -7.4124755859375, -7.165283203125, -6.9180908203125, -6.6708984375, -6.4237060546875, -6.176513671875, -5.9293212890625, -5.68212890625, -5.4349365234375, -5.187744140625, -4.9405517578125, -4.693359375, -4.4461669921875, -4.198974609375, -3.9517822265625, -3.70458984375, -3.4573974609375, -3.210205078125, -2.9630126953125, -2.7158203125, -2.4686279296875, -2.221435546875, -1.9742431640625, -1.72705078125, -1.4798583984375, -1.232666015625, -0.9854736328125, -0.73828125, -0.4910888671875, -0.243896484375, 0.0032958984375, 0.25048828125, 0.4976806640625, 0.744873046875, 0.9920654296875, 1.2392578125, 1.4864501953125, 1.733642578125, 1.9808349609375, 2.22802734375, 2.4752197265625, 2.722412109375, 2.9696044921875, 3.216796875, 3.4639892578125, 3.711181640625, 3.9583740234375, 4.20556640625, 4.4527587890625, 4.699951171875, 4.9471435546875, 5.1943359375, 5.4415283203125, 5.688720703125, 5.9359130859375, 6.18310546875, 6.4302978515625, 6.677490234375, 6.9246826171875, 7.171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 11.0, 16.0, 41.0, 57.0, 94.0, 204.0, 460.0, 1042.0, 2694.0, 7414.0, 25019.0, 121618.0, 2937773.0, 982376.0, 86625.0, 19214.0, 5863.0, 2122.0, 868.0, 360.0, 185.0, 93.0, 48.0, 34.0, 12.0, 13.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.96337890625, -28.9267578125, -27.89013671875, -26.853515625, -25.81689453125, -24.7802734375, -23.74365234375, -22.70703125, -21.67041015625, -20.6337890625, -19.59716796875, -18.560546875, -17.52392578125, -16.4873046875, -15.45068359375, -14.4140625, -13.37744140625, -12.3408203125, -11.30419921875, -10.267578125, -9.23095703125, -8.1943359375, -7.15771484375, -6.12109375, -5.08447265625, -4.0478515625, -3.01123046875, -1.974609375, -0.93798828125, 0.0986328125, 1.13525390625, 2.171875, 3.20849609375, 4.2451171875, 5.28173828125, 6.318359375, 7.35498046875, 8.3916015625, 9.42822265625, 10.46484375, 11.50146484375, 12.5380859375, 13.57470703125, 14.611328125, 15.64794921875, 16.6845703125, 17.72119140625, 18.7578125, 19.79443359375, 20.8310546875, 21.86767578125, 22.904296875, 23.94091796875, 24.9775390625, 26.01416015625, 27.05078125, 28.08740234375, 29.1240234375, 30.16064453125, 31.197265625, 32.23388671875, 33.2705078125, 34.30712890625, 35.34375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 2.0, 6.0, 4.0, 13.0, 12.0, 10.0, 24.0, 32.0, 34.0, 55.0, 69.0, 100.0, 145.0, 285.0, 502.0, 1554.0, 444.0, 254.0, 151.0, 108.0, 59.0, 61.0, 39.0, 18.0, 20.0, 11.0, 6.0, 7.0, 12.0, 4.0, 7.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.96514892578125, -7.7193603515625, -7.47357177734375, -7.227783203125, -6.98199462890625, -6.7362060546875, -6.49041748046875, -6.24462890625, -5.99884033203125, -5.7530517578125, -5.50726318359375, -5.261474609375, -5.01568603515625, -4.7698974609375, -4.52410888671875, -4.2783203125, -4.03253173828125, -3.7867431640625, -3.54095458984375, -3.295166015625, -3.04937744140625, -2.8035888671875, -2.55780029296875, -2.31201171875, -2.06622314453125, -1.8204345703125, -1.57464599609375, -1.328857421875, -1.08306884765625, -0.8372802734375, -0.59149169921875, -0.345703125, -0.09991455078125, 0.1458740234375, 0.39166259765625, 0.637451171875, 0.88323974609375, 1.1290283203125, 1.37481689453125, 1.62060546875, 1.86639404296875, 2.1121826171875, 2.35797119140625, 2.603759765625, 2.84954833984375, 3.0953369140625, 3.34112548828125, 3.5869140625, 3.83270263671875, 4.0784912109375, 4.32427978515625, 4.570068359375, 4.81585693359375, 5.0616455078125, 5.30743408203125, 5.55322265625, 5.79901123046875, 6.0447998046875, 6.29058837890625, 6.536376953125, 6.78216552734375, 7.0279541015625, 7.27374267578125, 7.51953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 12.0, 12.0, 12.0, 16.0, 33.0, 40.0, 51.0, 72.0, 100.0, 92.0, 110.0, 93.0, 104.0, 87.0, 58.0, 32.0, 27.0, 13.0, 14.0, 5.0, 9.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.348411560058594, -57.58020782470703, -55.8120002746582, -54.04379653930664, -52.27558898925781, -50.50738525390625, -48.73918151855469, -46.97097396850586, -45.20276641845703, -43.43456268310547, -41.66635513305664, -39.89815139770508, -38.12994384765625, -36.36174011230469, -34.593536376953125, -32.8253288269043, -31.057125091552734, -29.28891944885254, -27.520713806152344, -25.75251007080078, -23.984302520751953, -22.21609878540039, -20.447893142700195, -18.6796875, -16.911481857299805, -15.14327621459961, -13.375070571899414, -11.606865882873535, -9.83866024017334, -8.070454597473145, -6.302249908447266, -4.53404426574707, -2.7658348083496094, -0.9976294040679932, 0.770576000213623, 2.53878116607666, 4.3069868087768555, 6.075192451477051, 7.84339714050293, 9.611602783203125, 11.37980842590332, 13.148014068603516, 14.916219711303711, 16.684425354003906, 18.45262908935547, 20.220836639404297, 21.98904037475586, 23.757246017456055, 25.52545166015625, 27.293657302856445, 29.06186294555664, 30.830066680908203, 32.59827423095703, 34.366477966308594, 36.134681701660156, 37.902889251708984, 39.67109680175781, 41.439300537109375, 43.2075080871582, 44.975711822509766, 46.743919372558594, 48.512123107910156, 50.28032684326172, 52.04853439331055, 53.81673812866211]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 7.0, 8.0, 7.0, 15.0, 14.0, 18.0, 18.0, 20.0, 25.0, 19.0, 26.0, 20.0, 24.0, 31.0, 34.0, 34.0, 42.0, 37.0, 42.0, 35.0, 43.0, 53.0, 32.0, 34.0, 36.0, 21.0, 32.0, 24.0, 24.0, 31.0, 28.0, 13.0, 15.0, 18.0, 15.0, 19.0, 10.0, 5.0, 11.0, 7.0, 7.0, 5.0, 5.0, 11.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-23.49685287475586, -22.735055923461914, -21.97325897216797, -21.211462020874023, -20.449665069580078, -19.6878662109375, -18.926069259643555, -18.16427230834961, -17.402475357055664, -16.64067840576172, -15.878881454467773, -15.117083549499512, -14.355286598205566, -13.593489646911621, -12.83169174194336, -12.069894790649414, -11.308097839355469, -10.546300888061523, -9.784503936767578, -9.022706031799316, -8.260909080505371, -7.499112129211426, -6.737314701080322, -5.975517272949219, -5.213720321655273, -4.451923370361328, -3.6901259422302246, -2.9283287525177, -2.166531562805176, -1.4047343730926514, -0.642937183380127, 0.11886024475097656, 0.8806591033935547, 1.642456293106079, 2.4042534828186035, 3.166050672531128, 3.9278478622436523, 4.689644813537598, 5.451442241668701, 6.213239669799805, 6.97503662109375, 7.736833572387695, 8.49863052368164, 9.260428428649902, 10.022225379943848, 10.784022331237793, 11.545820236206055, 12.3076171875, 13.069414138793945, 13.83121109008789, 14.593008041381836, 15.354805946350098, 16.11660385131836, 16.878400802612305, 17.64019775390625, 18.401994705200195, 19.16379165649414, 19.925588607788086, 20.68738555908203, 21.449182510375977, 22.210979461669922, 22.9727783203125, 23.734575271606445, 24.49637222290039, 25.258169174194336]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 9.0, 12.0, 11.0, 16.0, 34.0, 39.0, 67.0, 80.0, 145.0, 215.0, 340.0, 569.0, 1048.0, 2212.0, 5554.0, 19142.0, 91290.0, 526224.0, 325827.0, 54819.0, 12848.0, 4115.0, 1741.0, 851.0, 474.0, 279.0, 206.0, 114.0, 79.0, 55.0, 37.0, 26.0, 17.0, 16.0, 9.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-43.09375, -41.74072265625, -40.3876953125, -39.03466796875, -37.681640625, -36.32861328125, -34.9755859375, -33.62255859375, -32.26953125, -30.91650390625, -29.5634765625, -28.21044921875, -26.857421875, -25.50439453125, -24.1513671875, -22.79833984375, -21.4453125, -20.09228515625, -18.7392578125, -17.38623046875, -16.033203125, -14.68017578125, -13.3271484375, -11.97412109375, -10.62109375, -9.26806640625, -7.9150390625, -6.56201171875, -5.208984375, -3.85595703125, -2.5029296875, -1.14990234375, 0.203125, 1.55615234375, 2.9091796875, 4.26220703125, 5.615234375, 6.96826171875, 8.3212890625, 9.67431640625, 11.02734375, 12.38037109375, 13.7333984375, 15.08642578125, 16.439453125, 17.79248046875, 19.1455078125, 20.49853515625, 21.8515625, 23.20458984375, 24.5576171875, 25.91064453125, 27.263671875, 28.61669921875, 29.9697265625, 31.32275390625, 32.67578125, 34.02880859375, 35.3818359375, 36.73486328125, 38.087890625, 39.44091796875, 40.7939453125, 42.14697265625, 43.5]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 12.0, 14.0, 30.0, 65.0, 64.0, 101.0, 106.0, 104.0, 88.0, 96.0, 99.0, 61.0, 57.0, 29.0, 19.0, 18.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.56097412109375, -8.3094482421875, -8.05792236328125, -7.806396484375, -7.55487060546875, -7.3033447265625, -7.05181884765625, -6.80029296875, -6.54876708984375, -6.2972412109375, -6.04571533203125, -5.794189453125, -5.54266357421875, -5.2911376953125, -5.03961181640625, -4.7880859375, -4.53656005859375, -4.2850341796875, -4.03350830078125, -3.781982421875, -3.53045654296875, -3.2789306640625, -3.02740478515625, -2.77587890625, -2.52435302734375, -2.2728271484375, -2.02130126953125, -1.769775390625, -1.51824951171875, -1.2667236328125, -1.01519775390625, -0.763671875, -0.51214599609375, -0.2606201171875, -0.00909423828125, 0.242431640625, 0.49395751953125, 0.7454833984375, 0.99700927734375, 1.24853515625, 1.50006103515625, 1.7515869140625, 2.00311279296875, 2.254638671875, 2.50616455078125, 2.7576904296875, 3.00921630859375, 3.2607421875, 3.51226806640625, 3.7637939453125, 4.01531982421875, 4.266845703125, 4.51837158203125, 4.7698974609375, 5.02142333984375, 5.27294921875, 5.52447509765625, 5.7760009765625, 6.02752685546875, 6.279052734375, 6.53057861328125, 6.7821044921875, 7.03363037109375, 7.28515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 12.0, 16.0, 30.0, 47.0, 52.0, 73.0, 103.0, 169.0, 252.0, 460.0, 837.0, 1605.0, 3725.0, 9857.0, 30276.0, 103072.0, 387839.0, 367200.0, 97359.0, 28865.0, 9535.0, 3696.0, 1604.0, 730.0, 406.0, 247.0, 163.0, 97.0, 70.0, 52.0, 38.0, 24.0, 11.0, 5.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.8125, -22.14111328125, -21.4697265625, -20.79833984375, -20.126953125, -19.45556640625, -18.7841796875, -18.11279296875, -17.44140625, -16.77001953125, -16.0986328125, -15.42724609375, -14.755859375, -14.08447265625, -13.4130859375, -12.74169921875, -12.0703125, -11.39892578125, -10.7275390625, -10.05615234375, -9.384765625, -8.71337890625, -8.0419921875, -7.37060546875, -6.69921875, -6.02783203125, -5.3564453125, -4.68505859375, -4.013671875, -3.34228515625, -2.6708984375, -1.99951171875, -1.328125, -0.65673828125, 0.0146484375, 0.68603515625, 1.357421875, 2.02880859375, 2.7001953125, 3.37158203125, 4.04296875, 4.71435546875, 5.3857421875, 6.05712890625, 6.728515625, 7.39990234375, 8.0712890625, 8.74267578125, 9.4140625, 10.08544921875, 10.7568359375, 11.42822265625, 12.099609375, 12.77099609375, 13.4423828125, 14.11376953125, 14.78515625, 15.45654296875, 16.1279296875, 16.79931640625, 17.470703125, 18.14208984375, 18.8134765625, 19.48486328125, 20.15625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 8.0, 5.0, 7.0, 7.0, 12.0, 14.0, 10.0, 10.0, 20.0, 22.0, 32.0, 21.0, 33.0, 22.0, 40.0, 33.0, 45.0, 43.0, 45.0, 34.0, 44.0, 44.0, 50.0, 44.0, 46.0, 43.0, 31.0, 35.0, 29.0, 19.0, 24.0, 27.0, 14.0, 13.0, 9.0, 18.0, 11.0, 10.0, 6.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.316650390625, -11.88330078125, -11.449951171875, -11.0166015625, -10.583251953125, -10.14990234375, -9.716552734375, -9.283203125, -8.849853515625, -8.41650390625, -7.983154296875, -7.5498046875, -7.116455078125, -6.68310546875, -6.249755859375, -5.81640625, -5.383056640625, -4.94970703125, -4.516357421875, -4.0830078125, -3.649658203125, -3.21630859375, -2.782958984375, -2.349609375, -1.916259765625, -1.48291015625, -1.049560546875, -0.6162109375, -0.182861328125, 0.25048828125, 0.683837890625, 1.1171875, 1.550537109375, 1.98388671875, 2.417236328125, 2.8505859375, 3.283935546875, 3.71728515625, 4.150634765625, 4.583984375, 5.017333984375, 5.45068359375, 5.884033203125, 6.3173828125, 6.750732421875, 7.18408203125, 7.617431640625, 8.05078125, 8.484130859375, 8.91748046875, 9.350830078125, 9.7841796875, 10.217529296875, 10.65087890625, 11.084228515625, 11.517578125, 11.950927734375, 12.38427734375, 12.817626953125, 13.2509765625, 13.684326171875, 14.11767578125, 14.551025390625, 14.984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 10.0, 3.0, 8.0, 9.0, 15.0, 17.0, 21.0, 39.0, 34.0, 73.0, 101.0, 141.0, 253.0, 368.0, 588.0, 928.0, 1662.0, 3097.0, 6418.0, 17790.0, 87146.0, 657879.0, 222345.0, 30985.0, 9262.0, 4080.0, 2095.0, 1207.0, 705.0, 446.0, 270.0, 194.0, 107.0, 80.0, 49.0, 27.0, 30.0, 31.0, 14.0, 12.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-21.765625, -21.156005859375, -20.54638671875, -19.936767578125, -19.3271484375, -18.717529296875, -18.10791015625, -17.498291015625, -16.888671875, -16.279052734375, -15.66943359375, -15.059814453125, -14.4501953125, -13.840576171875, -13.23095703125, -12.621337890625, -12.01171875, -11.402099609375, -10.79248046875, -10.182861328125, -9.5732421875, -8.963623046875, -8.35400390625, -7.744384765625, -7.134765625, -6.525146484375, -5.91552734375, -5.305908203125, -4.6962890625, -4.086669921875, -3.47705078125, -2.867431640625, -2.2578125, -1.648193359375, -1.03857421875, -0.428955078125, 0.1806640625, 0.790283203125, 1.39990234375, 2.009521484375, 2.619140625, 3.228759765625, 3.83837890625, 4.447998046875, 5.0576171875, 5.667236328125, 6.27685546875, 6.886474609375, 7.49609375, 8.105712890625, 8.71533203125, 9.324951171875, 9.9345703125, 10.544189453125, 11.15380859375, 11.763427734375, 12.373046875, 12.982666015625, 13.59228515625, 14.201904296875, 14.8115234375, 15.421142578125, 16.03076171875, 16.640380859375, 17.25]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 20.0, 21.0, 38.0, 61.0, 84.0, 207.0, 232.0, 114.0, 80.0, 38.0, 20.0, 17.0, 11.0, 10.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027179718017578125, -0.0026006996631622314, -0.0024834275245666504, -0.0023661553859710693, -0.0022488832473754883, -0.0021316111087799072, -0.002014338970184326, -0.0018970668315887451, -0.001779794692993164, -0.001662522554397583, -0.001545250415802002, -0.001427978277206421, -0.0013107061386108398, -0.0011934340000152588, -0.0010761618614196777, -0.0009588897228240967, -0.0008416175842285156, -0.0007243454456329346, -0.0006070733070373535, -0.0004898011684417725, -0.0003725290298461914, -0.00025525689125061035, -0.0001379847526550293, -2.0712614059448242e-05, 9.655952453613281e-05, 0.00021383166313171387, 0.0003311038017272949, 0.000448375940322876, 0.000565648078918457, 0.0006829202175140381, 0.0008001923561096191, 0.0009174644947052002, 0.0010347366333007812, 0.0011520087718963623, 0.0012692809104919434, 0.0013865530490875244, 0.0015038251876831055, 0.0016210973262786865, 0.0017383694648742676, 0.0018556416034698486, 0.0019729137420654297, 0.0020901858806610107, 0.002207458019256592, 0.002324730157852173, 0.002442002296447754, 0.002559274435043335, 0.002676546573638916, 0.002793818712234497, 0.002911090850830078, 0.003028362989425659, 0.0031456351280212402, 0.0032629072666168213, 0.0033801794052124023, 0.0034974515438079834, 0.0036147236824035645, 0.0037319958209991455, 0.0038492679595947266, 0.003966540098190308, 0.004083812236785889, 0.00420108437538147, 0.004318356513977051, 0.004435628652572632, 0.004552900791168213, 0.004670172929763794, 0.004787445068359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 5.0, 6.0, 11.0, 9.0, 20.0, 17.0, 25.0, 24.0, 50.0, 68.0, 80.0, 126.0, 221.0, 364.0, 622.0, 1189.0, 2419.0, 5486.0, 15530.0, 65190.0, 549790.0, 342135.0, 44544.0, 11655.0, 4416.0, 2059.0, 1041.0, 527.0, 345.0, 173.0, 127.0, 70.0, 64.0, 29.0, 33.0, 16.0, 23.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.372314453125, -17.71337890625, -17.054443359375, -16.3955078125, -15.736572265625, -15.07763671875, -14.418701171875, -13.759765625, -13.100830078125, -12.44189453125, -11.782958984375, -11.1240234375, -10.465087890625, -9.80615234375, -9.147216796875, -8.48828125, -7.829345703125, -7.17041015625, -6.511474609375, -5.8525390625, -5.193603515625, -4.53466796875, -3.875732421875, -3.216796875, -2.557861328125, -1.89892578125, -1.239990234375, -0.5810546875, 0.077880859375, 0.73681640625, 1.395751953125, 2.0546875, 2.713623046875, 3.37255859375, 4.031494140625, 4.6904296875, 5.349365234375, 6.00830078125, 6.667236328125, 7.326171875, 7.985107421875, 8.64404296875, 9.302978515625, 9.9619140625, 10.620849609375, 11.27978515625, 11.938720703125, 12.59765625, 13.256591796875, 13.91552734375, 14.574462890625, 15.2333984375, 15.892333984375, 16.55126953125, 17.210205078125, 17.869140625, 18.528076171875, 19.18701171875, 19.845947265625, 20.5048828125, 21.163818359375, 21.82275390625, 22.481689453125, 23.140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 4.0, 6.0, 11.0, 13.0, 21.0, 31.0, 51.0, 70.0, 136.0, 161.0, 159.0, 129.0, 61.0, 36.0, 26.0, 21.0, 11.0, 11.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.015625, -17.4844970703125, -16.953369140625, -16.4222412109375, -15.89111328125, -15.3599853515625, -14.828857421875, -14.2977294921875, -13.7666015625, -13.2354736328125, -12.704345703125, -12.1732177734375, -11.64208984375, -11.1109619140625, -10.579833984375, -10.0487060546875, -9.517578125, -8.9864501953125, -8.455322265625, -7.9241943359375, -7.39306640625, -6.8619384765625, -6.330810546875, -5.7996826171875, -5.2685546875, -4.7374267578125, -4.206298828125, -3.6751708984375, -3.14404296875, -2.6129150390625, -2.081787109375, -1.5506591796875, -1.01953125, -0.4884033203125, 0.042724609375, 0.5738525390625, 1.10498046875, 1.6361083984375, 2.167236328125, 2.6983642578125, 3.2294921875, 3.7606201171875, 4.291748046875, 4.8228759765625, 5.35400390625, 5.8851318359375, 6.416259765625, 6.9473876953125, 7.478515625, 8.0096435546875, 8.540771484375, 9.0718994140625, 9.60302734375, 10.1341552734375, 10.665283203125, 11.1964111328125, 11.7275390625, 12.2586669921875, 12.789794921875, 13.3209228515625, 13.85205078125, 14.3831787109375, 14.914306640625, 15.4454345703125, 15.9765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 13.0, 30.0, 57.0, 144.0, 209.0, 239.0, 163.0, 96.0, 31.0, 12.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-385.89764404296875, -376.5121765136719, -367.126708984375, -357.7412109375, -348.3557434082031, -338.97027587890625, -329.5848083496094, -320.1993408203125, -310.8138427734375, -301.4283752441406, -292.04290771484375, -282.65740966796875, -273.2719421386719, -263.886474609375, -254.50100708007812, -245.11553955078125, -235.73007202148438, -226.3446044921875, -216.95912170410156, -207.5736541748047, -198.18817138671875, -188.80270385742188, -179.417236328125, -170.03176879882812, -160.6462860107422, -151.2608184814453, -141.87533569335938, -132.4898681640625, -123.1043930053711, -113.71891784667969, -104.33345031738281, -94.9479751586914, -85.56248474121094, -76.17700958251953, -66.79153442382812, -57.40606689453125, -48.020591735839844, -38.63511657714844, -29.249645233154297, -19.864173889160156, -10.47869873046875, -1.0932254791259766, 8.292247772216797, 17.67772102355957, 27.063194274902344, 36.44866943359375, 45.83414077758789, 55.21961212158203, 64.60508728027344, 73.99056243896484, 83.37603759765625, 92.76150512695312, 102.14698028564453, 111.53245544433594, 120.91792297363281, 130.30340576171875, 139.68887329101562, 149.0743408203125, 158.45982360839844, 167.8452911376953, 177.23077392578125, 186.61624145507812, 196.001708984375, 205.38717651367188, 214.7726593017578]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 8.0, 15.0, 16.0, 17.0, 21.0, 22.0, 33.0, 30.0, 34.0, 34.0, 44.0, 42.0, 55.0, 42.0, 52.0, 42.0, 50.0, 56.0, 38.0, 44.0, 39.0, 27.0, 32.0, 26.0, 22.0, 25.0, 20.0, 24.0, 13.0, 14.0, 11.0, 7.0, 12.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.11214447021484, -90.23584747314453, -87.35955047607422, -84.4832534790039, -81.60696411132812, -78.73066711425781, -75.8543701171875, -72.97807312011719, -70.10177612304688, -67.22547912597656, -64.34918212890625, -61.4728889465332, -58.59659194946289, -55.72029495239258, -52.84400177001953, -49.96770477294922, -47.091407775878906, -44.215110778808594, -41.33881378173828, -38.462520599365234, -35.58622360229492, -32.70992660522461, -29.83363151550293, -26.95733642578125, -24.081039428710938, -21.204742431640625, -18.328447341918945, -15.45215129852295, -12.575855255126953, -9.699559211730957, -6.823263168334961, -3.9469680786132812, -1.0706634521484375, 1.8056325912475586, 4.681928634643555, 7.558224678039551, 10.434520721435547, 13.310816764831543, 16.18711280822754, 19.06340789794922, 21.93970489501953, 24.816001892089844, 27.692296981811523, 30.568592071533203, 33.444889068603516, 36.32118606567383, 39.197479248046875, 42.07377624511719, 44.9500732421875, 47.82637023925781, 50.702667236328125, 53.57896041870117, 56.455257415771484, 59.3315544128418, 62.207847595214844, 65.08414459228516, 67.96044158935547, 70.83673858642578, 73.7130355834961, 76.5893325805664, 79.46562194824219, 82.3419189453125, 85.21821594238281, 88.09451293945312, 90.97080993652344]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 0.0, 5.0, 3.0, 4.0, 11.0, 11.0, 18.0, 29.0, 25.0, 18.0, 42.0, 54.0, 82.0, 118.0, 166.0, 292.0, 433.0, 771.0, 1602.0, 3775.0, 12105.0, 51836.0, 579497.0, 3409775.0, 103703.0, 19389.0, 5698.0, 2231.0, 1000.0, 582.0, 315.0, 223.0, 152.0, 99.0, 65.0, 53.0, 25.0, 25.0, 15.0, 11.0, 4.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.6875, -56.09326171875, -54.4990234375, -52.90478515625, -51.310546875, -49.71630859375, -48.1220703125, -46.52783203125, -44.93359375, -43.33935546875, -41.7451171875, -40.15087890625, -38.556640625, -36.96240234375, -35.3681640625, -33.77392578125, -32.1796875, -30.58544921875, -28.9912109375, -27.39697265625, -25.802734375, -24.20849609375, -22.6142578125, -21.02001953125, -19.42578125, -17.83154296875, -16.2373046875, -14.64306640625, -13.048828125, -11.45458984375, -9.8603515625, -8.26611328125, -6.671875, -5.07763671875, -3.4833984375, -1.88916015625, -0.294921875, 1.29931640625, 2.8935546875, 4.48779296875, 6.08203125, 7.67626953125, 9.2705078125, 10.86474609375, 12.458984375, 14.05322265625, 15.6474609375, 17.24169921875, 18.8359375, 20.43017578125, 22.0244140625, 23.61865234375, 25.212890625, 26.80712890625, 28.4013671875, 29.99560546875, 31.58984375, 33.18408203125, 34.7783203125, 36.37255859375, 37.966796875, 39.56103515625, 41.1552734375, 42.74951171875, 44.34375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 18.0, 30.0, 49.0, 65.0, 84.0, 89.0, 94.0, 94.0, 100.0, 86.0, 71.0, 66.0, 47.0, 28.0, 23.0, 16.0, 9.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.23895263671875, -7.9935302734375, -7.74810791015625, -7.502685546875, -7.25726318359375, -7.0118408203125, -6.76641845703125, -6.52099609375, -6.27557373046875, -6.0301513671875, -5.78472900390625, -5.539306640625, -5.29388427734375, -5.0484619140625, -4.80303955078125, -4.5576171875, -4.31219482421875, -4.0667724609375, -3.82135009765625, -3.575927734375, -3.33050537109375, -3.0850830078125, -2.83966064453125, -2.59423828125, -2.34881591796875, -2.1033935546875, -1.85797119140625, -1.612548828125, -1.36712646484375, -1.1217041015625, -0.87628173828125, -0.630859375, -0.38543701171875, -0.1400146484375, 0.10540771484375, 0.350830078125, 0.59625244140625, 0.8416748046875, 1.08709716796875, 1.33251953125, 1.57794189453125, 1.8233642578125, 2.06878662109375, 2.314208984375, 2.55963134765625, 2.8050537109375, 3.05047607421875, 3.2958984375, 3.54132080078125, 3.7867431640625, 4.03216552734375, 4.277587890625, 4.52301025390625, 4.7684326171875, 5.01385498046875, 5.25927734375, 5.50469970703125, 5.7501220703125, 5.99554443359375, 6.240966796875, 6.48638916015625, 6.7318115234375, 6.97723388671875, 7.22265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 14.0, 19.0, 29.0, 48.0, 52.0, 98.0, 223.0, 391.0, 833.0, 1762.0, 4516.0, 13715.0, 48536.0, 242711.0, 3092431.0, 657969.0, 94691.0, 23589.0, 7471.0, 2705.0, 1193.0, 539.0, 307.0, 184.0, 115.0, 47.0, 33.0, 17.0, 15.0, 11.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.625, -35.627685546875, -34.63037109375, -33.633056640625, -32.6357421875, -31.638427734375, -30.64111328125, -29.643798828125, -28.646484375, -27.649169921875, -26.65185546875, -25.654541015625, -24.6572265625, -23.659912109375, -22.66259765625, -21.665283203125, -20.66796875, -19.670654296875, -18.67333984375, -17.676025390625, -16.6787109375, -15.681396484375, -14.68408203125, -13.686767578125, -12.689453125, -11.692138671875, -10.69482421875, -9.697509765625, -8.7001953125, -7.702880859375, -6.70556640625, -5.708251953125, -4.7109375, -3.713623046875, -2.71630859375, -1.718994140625, -0.7216796875, 0.275634765625, 1.27294921875, 2.270263671875, 3.267578125, 4.264892578125, 5.26220703125, 6.259521484375, 7.2568359375, 8.254150390625, 9.25146484375, 10.248779296875, 11.24609375, 12.243408203125, 13.24072265625, 14.238037109375, 15.2353515625, 16.232666015625, 17.22998046875, 18.227294921875, 19.224609375, 20.221923828125, 21.21923828125, 22.216552734375, 23.2138671875, 24.211181640625, 25.20849609375, 26.205810546875, 27.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 11.0, 20.0, 20.0, 26.0, 46.0, 58.0, 85.0, 126.0, 215.0, 361.0, 897.0, 1071.0, 394.0, 241.0, 142.0, 89.0, 79.0, 50.0, 34.0, 28.0, 18.0, 14.0, 6.0, 8.0, 2.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1171875, -9.743408203125, -9.36962890625, -8.995849609375, -8.6220703125, -8.248291015625, -7.87451171875, -7.500732421875, -7.126953125, -6.753173828125, -6.37939453125, -6.005615234375, -5.6318359375, -5.258056640625, -4.88427734375, -4.510498046875, -4.13671875, -3.762939453125, -3.38916015625, -3.015380859375, -2.6416015625, -2.267822265625, -1.89404296875, -1.520263671875, -1.146484375, -0.772705078125, -0.39892578125, -0.025146484375, 0.3486328125, 0.722412109375, 1.09619140625, 1.469970703125, 1.84375, 2.217529296875, 2.59130859375, 2.965087890625, 3.3388671875, 3.712646484375, 4.08642578125, 4.460205078125, 4.833984375, 5.207763671875, 5.58154296875, 5.955322265625, 6.3291015625, 6.702880859375, 7.07666015625, 7.450439453125, 7.82421875, 8.197998046875, 8.57177734375, 8.945556640625, 9.3193359375, 9.693115234375, 10.06689453125, 10.440673828125, 10.814453125, 11.188232421875, 11.56201171875, 11.935791015625, 12.3095703125, 12.683349609375, 13.05712890625, 13.430908203125, 13.8046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 11.0, 18.0, 16.0, 29.0, 41.0, 60.0, 90.0, 100.0, 97.0, 99.0, 105.0, 84.0, 65.0, 46.0, 35.0, 36.0, 18.0, 16.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.03144836425781, -64.53826141357422, -62.04507827758789, -59.5518913269043, -57.05870819091797, -54.565521240234375, -52.07233428955078, -49.57915115356445, -47.085968017578125, -44.59278106689453, -42.0995979309082, -39.60641098022461, -37.11322784423828, -34.62004089355469, -32.126853942871094, -29.633670806884766, -27.140483856201172, -24.64729881286621, -22.15411376953125, -19.660926818847656, -17.167743682861328, -14.67455768585205, -12.181371688842773, -9.688186645507812, -7.195001602172852, -4.701816558837891, -2.2086310386657715, 0.28455448150634766, 2.7777395248413086, 5.2709245681762695, 7.764110565185547, 10.257295608520508, 12.750480651855469, 15.24366569519043, 17.73685073852539, 20.230037689208984, 22.723220825195312, 25.216407775878906, 27.709592819213867, 30.202777862548828, 32.695960998535156, 35.18914794921875, 37.68233108520508, 40.17551803588867, 42.668701171875, 45.161888122558594, 47.65507507324219, 50.148258209228516, 52.64144515991211, 55.1346321105957, 57.62781524658203, 60.121002197265625, 62.61418533325195, 65.10736846923828, 67.60055541992188, 70.09374237060547, 72.58692932128906, 75.08011627197266, 77.57330322265625, 80.06648254394531, 82.5596694946289, 85.0528564453125, 87.5460433959961, 90.03923034667969, 92.53240966796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 12.0, 18.0, 17.0, 9.0, 18.0, 21.0, 26.0, 37.0, 29.0, 36.0, 39.0, 33.0, 44.0, 35.0, 36.0, 39.0, 35.0, 40.0, 46.0, 51.0, 43.0, 41.0, 35.0, 31.0, 21.0, 26.0, 15.0, 21.0, 25.0, 24.0, 11.0, 19.0, 19.0, 10.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-51.178184509277344, -49.73715591430664, -48.29612731933594, -46.8551025390625, -45.4140739440918, -43.973045349121094, -42.532020568847656, -41.09099197387695, -39.64996337890625, -38.20893478393555, -36.767906188964844, -35.326881408691406, -33.8858528137207, -32.44482421875, -31.00379753112793, -29.56277084350586, -28.121742248535156, -26.680713653564453, -25.239686965942383, -23.798660278320312, -22.35763168334961, -20.916603088378906, -19.475576400756836, -18.034549713134766, -16.593521118164062, -15.152493476867676, -13.711465835571289, -12.270438194274902, -10.829410552978516, -9.388382911682129, -7.947355270385742, -6.5063276290893555, -5.065299987792969, -3.624272346496582, -2.1832447052001953, -0.7422170639038086, 0.6988105773925781, 2.139838218688965, 3.5808658599853516, 5.021893501281738, 6.462921142578125, 7.903948783874512, 9.344976425170898, 10.786004066467285, 12.227031707763672, 13.668059349060059, 15.109086990356445, 16.550113677978516, 17.99114227294922, 19.432170867919922, 20.873197555541992, 22.314224243164062, 23.755252838134766, 25.19628143310547, 26.63730812072754, 28.07833480834961, 29.519363403320312, 30.960391998291016, 32.40142059326172, 33.842445373535156, 35.28347396850586, 36.72450256347656, 38.16552734375, 39.6065559387207, 41.047584533691406]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 7.0, 19.0, 28.0, 26.0, 54.0, 81.0, 122.0, 205.0, 332.0, 571.0, 1203.0, 2812.0, 8558.0, 32531.0, 171510.0, 676842.0, 117682.0, 24541.0, 6738.0, 2328.0, 981.0, 517.0, 285.0, 188.0, 131.0, 75.0, 43.0, 25.0, 32.0, 13.0, 8.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-42.375, -41.025390625, -39.67578125, -38.326171875, -36.9765625, -35.626953125, -34.27734375, -32.927734375, -31.578125, -30.228515625, -28.87890625, -27.529296875, -26.1796875, -24.830078125, -23.48046875, -22.130859375, -20.78125, -19.431640625, -18.08203125, -16.732421875, -15.3828125, -14.033203125, -12.68359375, -11.333984375, -9.984375, -8.634765625, -7.28515625, -5.935546875, -4.5859375, -3.236328125, -1.88671875, -0.537109375, 0.8125, 2.162109375, 3.51171875, 4.861328125, 6.2109375, 7.560546875, 8.91015625, 10.259765625, 11.609375, 12.958984375, 14.30859375, 15.658203125, 17.0078125, 18.357421875, 19.70703125, 21.056640625, 22.40625, 23.755859375, 25.10546875, 26.455078125, 27.8046875, 29.154296875, 30.50390625, 31.853515625, 33.203125, 34.552734375, 35.90234375, 37.251953125, 38.6015625, 39.951171875, 41.30078125, 42.650390625, 44.0]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 15.0, 18.0, 36.0, 43.0, 59.0, 67.0, 77.0, 114.0, 90.0, 92.0, 79.0, 66.0, 77.0, 44.0, 30.0, 27.0, 23.0, 12.0, 7.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -8.01318359375, -7.7685546875, -7.52392578125, -7.279296875, -7.03466796875, -6.7900390625, -6.54541015625, -6.30078125, -6.05615234375, -5.8115234375, -5.56689453125, -5.322265625, -5.07763671875, -4.8330078125, -4.58837890625, -4.34375, -4.09912109375, -3.8544921875, -3.60986328125, -3.365234375, -3.12060546875, -2.8759765625, -2.63134765625, -2.38671875, -2.14208984375, -1.8974609375, -1.65283203125, -1.408203125, -1.16357421875, -0.9189453125, -0.67431640625, -0.4296875, -0.18505859375, 0.0595703125, 0.30419921875, 0.548828125, 0.79345703125, 1.0380859375, 1.28271484375, 1.52734375, 1.77197265625, 2.0166015625, 2.26123046875, 2.505859375, 2.75048828125, 2.9951171875, 3.23974609375, 3.484375, 3.72900390625, 3.9736328125, 4.21826171875, 4.462890625, 4.70751953125, 4.9521484375, 5.19677734375, 5.44140625, 5.68603515625, 5.9306640625, 6.17529296875, 6.419921875, 6.66455078125, 6.9091796875, 7.15380859375, 7.3984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 1.0, 18.0, 6.0, 19.0, 23.0, 34.0, 50.0, 66.0, 94.0, 126.0, 200.0, 315.0, 463.0, 783.0, 1577.0, 3669.0, 8698.0, 24456.0, 72787.0, 279463.0, 485428.0, 111993.0, 35941.0, 12896.0, 4759.0, 2025.0, 988.0, 550.0, 351.0, 244.0, 148.0, 108.0, 80.0, 54.0, 42.0, 28.0, 23.0, 14.0, 7.0, 12.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -18.967529296875, -18.29443359375, -17.621337890625, -16.9482421875, -16.275146484375, -15.60205078125, -14.928955078125, -14.255859375, -13.582763671875, -12.90966796875, -12.236572265625, -11.5634765625, -10.890380859375, -10.21728515625, -9.544189453125, -8.87109375, -8.197998046875, -7.52490234375, -6.851806640625, -6.1787109375, -5.505615234375, -4.83251953125, -4.159423828125, -3.486328125, -2.813232421875, -2.14013671875, -1.467041015625, -0.7939453125, -0.120849609375, 0.55224609375, 1.225341796875, 1.8984375, 2.571533203125, 3.24462890625, 3.917724609375, 4.5908203125, 5.263916015625, 5.93701171875, 6.610107421875, 7.283203125, 7.956298828125, 8.62939453125, 9.302490234375, 9.9755859375, 10.648681640625, 11.32177734375, 11.994873046875, 12.66796875, 13.341064453125, 14.01416015625, 14.687255859375, 15.3603515625, 16.033447265625, 16.70654296875, 17.379638671875, 18.052734375, 18.725830078125, 19.39892578125, 20.072021484375, 20.7451171875, 21.418212890625, 22.09130859375, 22.764404296875, 23.4375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 7.0, 9.0, 7.0, 12.0, 9.0, 7.0, 20.0, 16.0, 21.0, 24.0, 25.0, 30.0, 35.0, 27.0, 40.0, 37.0, 40.0, 44.0, 49.0, 54.0, 38.0, 39.0, 39.0, 41.0, 39.0, 32.0, 42.0, 40.0, 29.0, 20.0, 29.0, 14.0, 17.0, 7.0, 15.0, 5.0, 9.0, 6.0, 3.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.234375, -15.7479248046875, -15.261474609375, -14.7750244140625, -14.28857421875, -13.8021240234375, -13.315673828125, -12.8292236328125, -12.3427734375, -11.8563232421875, -11.369873046875, -10.8834228515625, -10.39697265625, -9.9105224609375, -9.424072265625, -8.9376220703125, -8.451171875, -7.9647216796875, -7.478271484375, -6.9918212890625, -6.50537109375, -6.0189208984375, -5.532470703125, -5.0460205078125, -4.5595703125, -4.0731201171875, -3.586669921875, -3.1002197265625, -2.61376953125, -2.1273193359375, -1.640869140625, -1.1544189453125, -0.66796875, -0.1815185546875, 0.304931640625, 0.7913818359375, 1.27783203125, 1.7642822265625, 2.250732421875, 2.7371826171875, 3.2236328125, 3.7100830078125, 4.196533203125, 4.6829833984375, 5.16943359375, 5.6558837890625, 6.142333984375, 6.6287841796875, 7.115234375, 7.6016845703125, 8.088134765625, 8.5745849609375, 9.06103515625, 9.5474853515625, 10.033935546875, 10.5203857421875, 11.0068359375, 11.4932861328125, 11.979736328125, 12.4661865234375, 12.95263671875, 13.4390869140625, 13.925537109375, 14.4119873046875, 14.8984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 11.0, 16.0, 19.0, 22.0, 20.0, 40.0, 49.0, 75.0, 113.0, 149.0, 216.0, 409.0, 698.0, 1211.0, 2459.0, 5584.0, 15012.0, 61619.0, 664549.0, 246342.0, 32006.0, 9514.0, 3950.0, 1971.0, 985.0, 528.0, 313.0, 175.0, 153.0, 88.0, 62.0, 40.0, 32.0, 29.0, 24.0, 9.0, 10.0, 5.0, 6.0, 5.0, 3.0, 8.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.671875, -18.119384765625, -17.56689453125, -17.014404296875, -16.4619140625, -15.909423828125, -15.35693359375, -14.804443359375, -14.251953125, -13.699462890625, -13.14697265625, -12.594482421875, -12.0419921875, -11.489501953125, -10.93701171875, -10.384521484375, -9.83203125, -9.279541015625, -8.72705078125, -8.174560546875, -7.6220703125, -7.069580078125, -6.51708984375, -5.964599609375, -5.412109375, -4.859619140625, -4.30712890625, -3.754638671875, -3.2021484375, -2.649658203125, -2.09716796875, -1.544677734375, -0.9921875, -0.439697265625, 0.11279296875, 0.665283203125, 1.2177734375, 1.770263671875, 2.32275390625, 2.875244140625, 3.427734375, 3.980224609375, 4.53271484375, 5.085205078125, 5.6376953125, 6.190185546875, 6.74267578125, 7.295166015625, 7.84765625, 8.400146484375, 8.95263671875, 9.505126953125, 10.0576171875, 10.610107421875, 11.16259765625, 11.715087890625, 12.267578125, 12.820068359375, 13.37255859375, 13.925048828125, 14.4775390625, 15.030029296875, 15.58251953125, 16.135009765625, 16.6875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 7.0, 10.0, 15.0, 15.0, 20.0, 32.0, 49.0, 75.0, 185.0, 205.0, 143.0, 67.0, 25.0, 35.0, 21.0, 18.0, 8.0, 9.0, 8.0, 4.0, 5.0, 1.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023212432861328125, -0.0022393763065338135, -0.0021575093269348145, -0.0020756423473358154, -0.0019937753677368164, -0.0019119083881378174, -0.0018300414085388184, -0.0017481744289398193, -0.0016663074493408203, -0.0015844404697418213, -0.0015025734901428223, -0.0014207065105438232, -0.0013388395309448242, -0.0012569725513458252, -0.0011751055717468262, -0.0010932385921478271, -0.0010113716125488281, -0.0009295046329498291, -0.0008476376533508301, -0.0007657706737518311, -0.000683903694152832, -0.000602036714553833, -0.000520169734954834, -0.00043830275535583496, -0.00035643577575683594, -0.0002745687961578369, -0.0001927018165588379, -0.00011083483695983887, -2.8967857360839844e-05, 5.289912223815918e-05, 0.0001347661018371582, 0.00021663308143615723, 0.00029850006103515625, 0.0003803670406341553, 0.0004622340202331543, 0.0005441009998321533, 0.0006259679794311523, 0.0007078349590301514, 0.0007897019386291504, 0.0008715689182281494, 0.0009534358978271484, 0.0010353028774261475, 0.0011171698570251465, 0.0011990368366241455, 0.0012809038162231445, 0.0013627707958221436, 0.0014446377754211426, 0.0015265047550201416, 0.0016083717346191406, 0.0016902387142181396, 0.0017721056938171387, 0.0018539726734161377, 0.0019358396530151367, 0.0020177066326141357, 0.0020995736122131348, 0.002181440591812134, 0.002263307571411133, 0.002345174551010132, 0.002427041530609131, 0.00250890851020813, 0.002590775489807129, 0.002672642469406128, 0.002754509449005127, 0.002836376428604126, 0.002918243408203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 20.0, 24.0, 31.0, 42.0, 75.0, 117.0, 217.0, 391.0, 768.0, 1859.0, 5424.0, 22067.0, 621258.0, 369634.0, 18495.0, 4807.0, 1679.0, 722.0, 383.0, 175.0, 98.0, 90.0, 54.0, 37.0, 18.0, 18.0, 10.0, 10.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.5, -33.38525390625, -32.2705078125, -31.15576171875, -30.041015625, -28.92626953125, -27.8115234375, -26.69677734375, -25.58203125, -24.46728515625, -23.3525390625, -22.23779296875, -21.123046875, -20.00830078125, -18.8935546875, -17.77880859375, -16.6640625, -15.54931640625, -14.4345703125, -13.31982421875, -12.205078125, -11.09033203125, -9.9755859375, -8.86083984375, -7.74609375, -6.63134765625, -5.5166015625, -4.40185546875, -3.287109375, -2.17236328125, -1.0576171875, 0.05712890625, 1.171875, 2.28662109375, 3.4013671875, 4.51611328125, 5.630859375, 6.74560546875, 7.8603515625, 8.97509765625, 10.08984375, 11.20458984375, 12.3193359375, 13.43408203125, 14.548828125, 15.66357421875, 16.7783203125, 17.89306640625, 19.0078125, 20.12255859375, 21.2373046875, 22.35205078125, 23.466796875, 24.58154296875, 25.6962890625, 26.81103515625, 27.92578125, 29.04052734375, 30.1552734375, 31.27001953125, 32.384765625, 33.49951171875, 34.6142578125, 35.72900390625, 36.84375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 11.0, 8.0, 9.0, 20.0, 27.0, 59.0, 152.0, 310.0, 198.0, 86.0, 36.0, 25.0, 15.0, 5.0, 3.0, 9.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.08447265625, -17.4033203125, -16.72216796875, -16.041015625, -15.35986328125, -14.6787109375, -13.99755859375, -13.31640625, -12.63525390625, -11.9541015625, -11.27294921875, -10.591796875, -9.91064453125, -9.2294921875, -8.54833984375, -7.8671875, -7.18603515625, -6.5048828125, -5.82373046875, -5.142578125, -4.46142578125, -3.7802734375, -3.09912109375, -2.41796875, -1.73681640625, -1.0556640625, -0.37451171875, 0.306640625, 0.98779296875, 1.6689453125, 2.35009765625, 3.03125, 3.71240234375, 4.3935546875, 5.07470703125, 5.755859375, 6.43701171875, 7.1181640625, 7.79931640625, 8.48046875, 9.16162109375, 9.8427734375, 10.52392578125, 11.205078125, 11.88623046875, 12.5673828125, 13.24853515625, 13.9296875, 14.61083984375, 15.2919921875, 15.97314453125, 16.654296875, 17.33544921875, 18.0166015625, 18.69775390625, 19.37890625, 20.06005859375, 20.7412109375, 21.42236328125, 22.103515625, 22.78466796875, 23.4658203125, 24.14697265625, 24.828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 30.0, 120.0, 283.0, 380.0, 130.0, 35.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-687.7215576171875, -672.133056640625, -656.5445556640625, -640.9560546875, -625.3675537109375, -609.779052734375, -594.1905517578125, -578.60205078125, -563.0135498046875, -547.425048828125, -531.8365478515625, -516.248046875, -500.6595458984375, -485.071044921875, -469.4825439453125, -453.89404296875, -438.3055725097656, -422.7170715332031, -407.1285705566406, -391.5400695800781, -375.9515686035156, -360.3630676269531, -344.77459716796875, -329.18609619140625, -313.59759521484375, -298.00909423828125, -282.42059326171875, -266.83209228515625, -251.24359130859375, -235.65509033203125, -220.0666046142578, -204.4781036376953, -188.88958740234375, -173.30108642578125, -157.71258544921875, -142.12408447265625, -126.53559112548828, -110.94709014892578, -95.35859680175781, -79.77009582519531, -64.18159484863281, -48.59309387207031, -33.00459671020508, -17.416099548339844, -1.8275985717773438, 13.760902404785156, 29.349395751953125, 44.937896728515625, 60.526397705078125, 76.11489868164062, 91.70339965820312, 107.2918930053711, 122.8803939819336, 138.46890258789062, 154.05738830566406, 169.64588928222656, 185.23439025878906, 200.82289123535156, 216.41139221191406, 231.9998779296875, 247.58837890625, 263.1768798828125, 278.765380859375, 294.3538818359375, 309.9423828125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 10.0, 12.0, 16.0, 13.0, 17.0, 19.0, 20.0, 18.0, 41.0, 34.0, 30.0, 45.0, 36.0, 57.0, 43.0, 40.0, 35.0, 44.0, 43.0, 30.0, 44.0, 40.0, 32.0, 34.0, 35.0, 31.0, 26.0, 20.0, 20.0, 16.0, 12.0, 16.0, 10.0, 12.0, 7.0, 4.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.71067810058594, -90.0806655883789, -87.45065307617188, -84.82064819335938, -82.19063568115234, -79.56062316894531, -76.93061065673828, -74.30059814453125, -71.67059326171875, -69.04058074951172, -66.41056823730469, -63.78055953979492, -61.150550842285156, -58.520538330078125, -55.890525817871094, -53.26051330566406, -50.63050079345703, -48.00048828125, -45.370479583740234, -42.7404670715332, -40.11045837402344, -37.480445861816406, -34.850433349609375, -32.220420837402344, -29.590412139892578, -26.96040153503418, -24.33039093017578, -21.70037841796875, -19.07036781311035, -16.440357208251953, -13.810345649719238, -11.180334091186523, -8.550331115722656, -5.9203200340271, -3.290308952331543, -0.6602978706359863, 1.9697132110595703, 4.599723815917969, 7.229735374450684, 9.859746932983398, 12.489757537841797, 15.119768142700195, 17.749778747558594, 20.379791259765625, 23.009801864624023, 25.639812469482422, 28.269824981689453, 30.89983558654785, 33.52984619140625, 36.15985870361328, 38.78986740112305, 41.41987991333008, 44.049888610839844, 46.679901123046875, 49.309913635253906, 51.93992614746094, 54.5699348449707, 57.199947357177734, 59.8299560546875, 62.45996856689453, 65.08998107910156, 67.71998596191406, 70.3499984741211, 72.98001098632812, 75.61002349853516]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 8.0, 11.0, 14.0, 19.0, 43.0, 46.0, 53.0, 84.0, 141.0, 221.0, 352.0, 671.0, 1344.0, 3196.0, 9718.0, 41597.0, 541936.0, 3494185.0, 77796.0, 14698.0, 4453.0, 1717.0, 818.0, 416.0, 258.0, 158.0, 97.0, 68.0, 39.0, 32.0, 26.0, 13.0, 12.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.0625, -51.30322265625, -49.5439453125, -47.78466796875, -46.025390625, -44.26611328125, -42.5068359375, -40.74755859375, -38.98828125, -37.22900390625, -35.4697265625, -33.71044921875, -31.951171875, -30.19189453125, -28.4326171875, -26.67333984375, -24.9140625, -23.15478515625, -21.3955078125, -19.63623046875, -17.876953125, -16.11767578125, -14.3583984375, -12.59912109375, -10.83984375, -9.08056640625, -7.3212890625, -5.56201171875, -3.802734375, -2.04345703125, -0.2841796875, 1.47509765625, 3.234375, 4.99365234375, 6.7529296875, 8.51220703125, 10.271484375, 12.03076171875, 13.7900390625, 15.54931640625, 17.30859375, 19.06787109375, 20.8271484375, 22.58642578125, 24.345703125, 26.10498046875, 27.8642578125, 29.62353515625, 31.3828125, 33.14208984375, 34.9013671875, 36.66064453125, 38.419921875, 40.17919921875, 41.9384765625, 43.69775390625, 45.45703125, 47.21630859375, 48.9755859375, 50.73486328125, 52.494140625, 54.25341796875, 56.0126953125, 57.77197265625, 59.53125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 17.0, 24.0, 37.0, 41.0, 59.0, 64.0, 74.0, 83.0, 86.0, 98.0, 67.0, 82.0, 63.0, 47.0, 41.0, 27.0, 23.0, 12.0, 16.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.92333984375, -7.6826171875, -7.44189453125, -7.201171875, -6.96044921875, -6.7197265625, -6.47900390625, -6.23828125, -5.99755859375, -5.7568359375, -5.51611328125, -5.275390625, -5.03466796875, -4.7939453125, -4.55322265625, -4.3125, -4.07177734375, -3.8310546875, -3.59033203125, -3.349609375, -3.10888671875, -2.8681640625, -2.62744140625, -2.38671875, -2.14599609375, -1.9052734375, -1.66455078125, -1.423828125, -1.18310546875, -0.9423828125, -0.70166015625, -0.4609375, -0.22021484375, 0.0205078125, 0.26123046875, 0.501953125, 0.74267578125, 0.9833984375, 1.22412109375, 1.46484375, 1.70556640625, 1.9462890625, 2.18701171875, 2.427734375, 2.66845703125, 2.9091796875, 3.14990234375, 3.390625, 3.63134765625, 3.8720703125, 4.11279296875, 4.353515625, 4.59423828125, 4.8349609375, 5.07568359375, 5.31640625, 5.55712890625, 5.7978515625, 6.03857421875, 6.279296875, 6.52001953125, 6.7607421875, 7.00146484375, 7.2421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 10.0, 24.0, 30.0, 38.0, 49.0, 79.0, 116.0, 209.0, 344.0, 625.0, 1123.0, 2382.0, 5011.0, 12235.0, 35010.0, 138693.0, 2363664.0, 1455838.0, 125210.0, 32279.0, 11618.0, 4760.0, 2257.0, 1134.0, 606.0, 311.0, 197.0, 121.0, 70.0, 51.0, 39.0, 33.0, 20.0, 13.0, 12.0, 12.0, 7.0, 3.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-35.46875, -34.482666015625, -33.49658203125, -32.510498046875, -31.5244140625, -30.538330078125, -29.55224609375, -28.566162109375, -27.580078125, -26.593994140625, -25.60791015625, -24.621826171875, -23.6357421875, -22.649658203125, -21.66357421875, -20.677490234375, -19.69140625, -18.705322265625, -17.71923828125, -16.733154296875, -15.7470703125, -14.760986328125, -13.77490234375, -12.788818359375, -11.802734375, -10.816650390625, -9.83056640625, -8.844482421875, -7.8583984375, -6.872314453125, -5.88623046875, -4.900146484375, -3.9140625, -2.927978515625, -1.94189453125, -0.955810546875, 0.0302734375, 1.016357421875, 2.00244140625, 2.988525390625, 3.974609375, 4.960693359375, 5.94677734375, 6.932861328125, 7.9189453125, 8.905029296875, 9.89111328125, 10.877197265625, 11.86328125, 12.849365234375, 13.83544921875, 14.821533203125, 15.8076171875, 16.793701171875, 17.77978515625, 18.765869140625, 19.751953125, 20.738037109375, 21.72412109375, 22.710205078125, 23.6962890625, 24.682373046875, 25.66845703125, 26.654541015625, 27.640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 13.0, 4.0, 11.0, 13.0, 35.0, 47.0, 82.0, 109.0, 220.0, 472.0, 1842.0, 588.0, 269.0, 132.0, 76.0, 47.0, 26.0, 22.0, 17.0, 10.0, 5.0, 9.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.1650390625, -12.705078125, -12.2451171875, -11.78515625, -11.3251953125, -10.865234375, -10.4052734375, -9.9453125, -9.4853515625, -9.025390625, -8.5654296875, -8.10546875, -7.6455078125, -7.185546875, -6.7255859375, -6.265625, -5.8056640625, -5.345703125, -4.8857421875, -4.42578125, -3.9658203125, -3.505859375, -3.0458984375, -2.5859375, -2.1259765625, -1.666015625, -1.2060546875, -0.74609375, -0.2861328125, 0.173828125, 0.6337890625, 1.09375, 1.5537109375, 2.013671875, 2.4736328125, 2.93359375, 3.3935546875, 3.853515625, 4.3134765625, 4.7734375, 5.2333984375, 5.693359375, 6.1533203125, 6.61328125, 7.0732421875, 7.533203125, 7.9931640625, 8.453125, 8.9130859375, 9.373046875, 9.8330078125, 10.29296875, 10.7529296875, 11.212890625, 11.6728515625, 12.1328125, 12.5927734375, 13.052734375, 13.5126953125, 13.97265625, 14.4326171875, 14.892578125, 15.3525390625, 15.8125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 11.0, 13.0, 37.0, 56.0, 76.0, 112.0, 143.0, 156.0, 131.0, 93.0, 66.0, 41.0, 21.0, 17.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.44892883300781, -102.56626892089844, -99.68360137939453, -96.80094146728516, -93.91827392578125, -91.03561401367188, -88.1529541015625, -85.2702865600586, -82.38761901855469, -79.50495910644531, -76.6222915649414, -73.73963165283203, -70.85696411132812, -67.97430419921875, -65.09164428710938, -62.20897674560547, -59.326316833496094, -56.44365310668945, -53.56098937988281, -50.67832946777344, -47.79566192626953, -44.913002014160156, -42.030338287353516, -39.147674560546875, -36.265010833740234, -33.382347106933594, -30.499683380126953, -27.617021560668945, -24.734357833862305, -21.851694107055664, -18.969032287597656, -16.086368560791016, -13.203704833984375, -10.321041107177734, -7.43837833404541, -4.555715560913086, -1.6730518341064453, 1.2096118927001953, 4.092273712158203, 6.974937438964844, 9.857601165771484, 12.740264892578125, 15.62292766571045, 18.505590438842773, 21.388254165649414, 24.270917892456055, 27.153579711914062, 30.036243438720703, 32.918907165527344, 35.801570892333984, 38.684234619140625, 41.56689453125, 44.449562072753906, 47.33222198486328, 50.21488571166992, 53.09754943847656, 55.9802131652832, 58.862876892089844, 61.745540618896484, 64.62820434570312, 67.5108642578125, 70.3935317993164, 73.27619171142578, 76.15885925292969, 79.04151916503906]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 13.0, 13.0, 21.0, 16.0, 25.0, 25.0, 29.0, 28.0, 29.0, 46.0, 47.0, 51.0, 50.0, 44.0, 58.0, 55.0, 51.0, 49.0, 52.0, 39.0, 39.0, 38.0, 36.0, 17.0, 22.0, 19.0, 18.0, 11.0, 10.0, 6.0, 7.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.01183319091797, -39.669464111328125, -38.32709503173828, -36.98472213745117, -35.64235305786133, -34.299983978271484, -32.95761489868164, -31.615243911743164, -30.272872924804688, -28.930503845214844, -27.588132858276367, -26.245763778686523, -24.903392791748047, -23.561023712158203, -22.21865463256836, -20.876283645629883, -19.53391456604004, -18.191545486450195, -16.84917449951172, -15.506805419921875, -14.164434432983398, -12.822065353393555, -11.479695320129395, -10.137325286865234, -8.794955253601074, -7.452585220336914, -6.110215187072754, -4.767845630645752, -3.425475597381592, -2.0831055641174316, -0.7407360076904297, 0.6016340255737305, 1.9440040588378906, 3.286374092102051, 4.628744125366211, 5.971113681793213, 7.313483715057373, 8.655853271484375, 9.998223304748535, 11.340593338012695, 12.682963371276855, 14.025333404541016, 15.367703437805176, 16.710073471069336, 18.05244255065918, 19.394813537597656, 20.7371826171875, 22.079551696777344, 23.42192268371582, 24.764291763305664, 26.10666275024414, 27.449031829833984, 28.79140281677246, 30.133771896362305, 31.47614288330078, 32.818511962890625, 34.16088104248047, 35.50325012207031, 36.845619201660156, 38.187992095947266, 39.53036117553711, 40.87273025512695, 42.2150993347168, 43.557472229003906, 44.89984130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 19.0, 18.0, 45.0, 51.0, 77.0, 123.0, 231.0, 388.0, 731.0, 1613.0, 4305.0, 14736.0, 61184.0, 412706.0, 462922.0, 65612.0, 15775.0, 4443.0, 1724.0, 810.0, 408.0, 239.0, 125.0, 76.0, 60.0, 36.0, 18.0, 7.0, 12.0, 8.0, 3.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-49.6875, -48.446044921875, -47.20458984375, -45.963134765625, -44.7216796875, -43.480224609375, -42.23876953125, -40.997314453125, -39.755859375, -38.514404296875, -37.27294921875, -36.031494140625, -34.7900390625, -33.548583984375, -32.30712890625, -31.065673828125, -29.82421875, -28.582763671875, -27.34130859375, -26.099853515625, -24.8583984375, -23.616943359375, -22.37548828125, -21.134033203125, -19.892578125, -18.651123046875, -17.40966796875, -16.168212890625, -14.9267578125, -13.685302734375, -12.44384765625, -11.202392578125, -9.9609375, -8.719482421875, -7.47802734375, -6.236572265625, -4.9951171875, -3.753662109375, -2.51220703125, -1.270751953125, -0.029296875, 1.212158203125, 2.45361328125, 3.695068359375, 4.9365234375, 6.177978515625, 7.41943359375, 8.660888671875, 9.90234375, 11.143798828125, 12.38525390625, 13.626708984375, 14.8681640625, 16.109619140625, 17.35107421875, 18.592529296875, 19.833984375, 21.075439453125, 22.31689453125, 23.558349609375, 24.7998046875, 26.041259765625, 27.28271484375, 28.524169921875, 29.765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 12.0, 19.0, 31.0, 39.0, 50.0, 70.0, 70.0, 82.0, 93.0, 96.0, 80.0, 66.0, 81.0, 59.0, 38.0, 31.0, 20.0, 9.0, 16.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4942626953125, -8.238525390625, -7.9827880859375, -7.72705078125, -7.4713134765625, -7.215576171875, -6.9598388671875, -6.7041015625, -6.4483642578125, -6.192626953125, -5.9368896484375, -5.68115234375, -5.4254150390625, -5.169677734375, -4.9139404296875, -4.658203125, -4.4024658203125, -4.146728515625, -3.8909912109375, -3.63525390625, -3.3795166015625, -3.123779296875, -2.8680419921875, -2.6123046875, -2.3565673828125, -2.100830078125, -1.8450927734375, -1.58935546875, -1.3336181640625, -1.077880859375, -0.8221435546875, -0.56640625, -0.3106689453125, -0.054931640625, 0.2008056640625, 0.45654296875, 0.7122802734375, 0.968017578125, 1.2237548828125, 1.4794921875, 1.7352294921875, 1.990966796875, 2.2467041015625, 2.50244140625, 2.7581787109375, 3.013916015625, 3.2696533203125, 3.525390625, 3.7811279296875, 4.036865234375, 4.2926025390625, 4.54833984375, 4.8040771484375, 5.059814453125, 5.3155517578125, 5.5712890625, 5.8270263671875, 6.082763671875, 6.3385009765625, 6.59423828125, 6.8499755859375, 7.105712890625, 7.3614501953125, 7.6171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 10.0, 11.0, 25.0, 32.0, 48.0, 60.0, 89.0, 161.0, 309.0, 596.0, 1283.0, 3222.0, 9058.0, 27549.0, 93078.0, 527697.0, 292420.0, 62444.0, 19331.0, 6467.0, 2536.0, 953.0, 530.0, 242.0, 126.0, 80.0, 57.0, 33.0, 27.0, 19.0, 15.0, 7.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.078125, -21.33837890625, -20.5986328125, -19.85888671875, -19.119140625, -18.37939453125, -17.6396484375, -16.89990234375, -16.16015625, -15.42041015625, -14.6806640625, -13.94091796875, -13.201171875, -12.46142578125, -11.7216796875, -10.98193359375, -10.2421875, -9.50244140625, -8.7626953125, -8.02294921875, -7.283203125, -6.54345703125, -5.8037109375, -5.06396484375, -4.32421875, -3.58447265625, -2.8447265625, -2.10498046875, -1.365234375, -0.62548828125, 0.1142578125, 0.85400390625, 1.59375, 2.33349609375, 3.0732421875, 3.81298828125, 4.552734375, 5.29248046875, 6.0322265625, 6.77197265625, 7.51171875, 8.25146484375, 8.9912109375, 9.73095703125, 10.470703125, 11.21044921875, 11.9501953125, 12.68994140625, 13.4296875, 14.16943359375, 14.9091796875, 15.64892578125, 16.388671875, 17.12841796875, 17.8681640625, 18.60791015625, 19.34765625, 20.08740234375, 20.8271484375, 21.56689453125, 22.306640625, 23.04638671875, 23.7861328125, 24.52587890625, 25.265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 7.0, 12.0, 13.0, 15.0, 26.0, 28.0, 21.0, 23.0, 42.0, 35.0, 52.0, 52.0, 53.0, 59.0, 52.0, 62.0, 60.0, 72.0, 46.0, 33.0, 37.0, 37.0, 27.0, 24.0, 28.0, 18.0, 17.0, 5.0, 10.0, 9.0, 9.0, 2.0, 3.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-26.140625, -25.466796875, -24.79296875, -24.119140625, -23.4453125, -22.771484375, -22.09765625, -21.423828125, -20.75, -20.076171875, -19.40234375, -18.728515625, -18.0546875, -17.380859375, -16.70703125, -16.033203125, -15.359375, -14.685546875, -14.01171875, -13.337890625, -12.6640625, -11.990234375, -11.31640625, -10.642578125, -9.96875, -9.294921875, -8.62109375, -7.947265625, -7.2734375, -6.599609375, -5.92578125, -5.251953125, -4.578125, -3.904296875, -3.23046875, -2.556640625, -1.8828125, -1.208984375, -0.53515625, 0.138671875, 0.8125, 1.486328125, 2.16015625, 2.833984375, 3.5078125, 4.181640625, 4.85546875, 5.529296875, 6.203125, 6.876953125, 7.55078125, 8.224609375, 8.8984375, 9.572265625, 10.24609375, 10.919921875, 11.59375, 12.267578125, 12.94140625, 13.615234375, 14.2890625, 14.962890625, 15.63671875, 16.310546875, 16.984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 11.0, 5.0, 9.0, 11.0, 21.0, 26.0, 41.0, 53.0, 68.0, 106.0, 148.0, 297.0, 464.0, 709.0, 1345.0, 2637.0, 5824.0, 16686.0, 102670.0, 782923.0, 105533.0, 17053.0, 5851.0, 2632.0, 1373.0, 763.0, 479.0, 255.0, 168.0, 117.0, 65.0, 43.0, 37.0, 29.0, 22.0, 13.0, 12.0, 10.0, 10.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.421875, -15.883544921875, -15.34521484375, -14.806884765625, -14.2685546875, -13.730224609375, -13.19189453125, -12.653564453125, -12.115234375, -11.576904296875, -11.03857421875, -10.500244140625, -9.9619140625, -9.423583984375, -8.88525390625, -8.346923828125, -7.80859375, -7.270263671875, -6.73193359375, -6.193603515625, -5.6552734375, -5.116943359375, -4.57861328125, -4.040283203125, -3.501953125, -2.963623046875, -2.42529296875, -1.886962890625, -1.3486328125, -0.810302734375, -0.27197265625, 0.266357421875, 0.8046875, 1.343017578125, 1.88134765625, 2.419677734375, 2.9580078125, 3.496337890625, 4.03466796875, 4.572998046875, 5.111328125, 5.649658203125, 6.18798828125, 6.726318359375, 7.2646484375, 7.802978515625, 8.34130859375, 8.879638671875, 9.41796875, 9.956298828125, 10.49462890625, 11.032958984375, 11.5712890625, 12.109619140625, 12.64794921875, 13.186279296875, 13.724609375, 14.262939453125, 14.80126953125, 15.339599609375, 15.8779296875, 16.416259765625, 16.95458984375, 17.492919921875, 18.03125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 9.0, 17.0, 21.0, 26.0, 52.0, 121.0, 269.0, 229.0, 114.0, 35.0, 27.0, 17.0, 12.0, 11.0, 2.0, 1.0, 8.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031414031982421875, -0.0030396878719329834, -0.0029379725456237793, -0.002836257219314575, -0.002734541893005371, -0.002632826566696167, -0.002531111240386963, -0.002429395914077759, -0.0023276805877685547, -0.0022259652614593506, -0.0021242499351501465, -0.0020225346088409424, -0.0019208192825317383, -0.0018191039562225342, -0.00171738862991333, -0.001615673303604126, -0.0015139579772949219, -0.0014122426509857178, -0.0013105273246765137, -0.0012088119983673096, -0.0011070966720581055, -0.0010053813457489014, -0.0009036660194396973, -0.0008019506931304932, -0.0007002353668212891, -0.000598520040512085, -0.0004968047142028809, -0.00039508938789367676, -0.00029337406158447266, -0.00019165873527526855, -8.994340896606445e-05, 1.1771917343139648e-05, 0.00011348724365234375, 0.00021520256996154785, 0.00031691789627075195, 0.00041863322257995605, 0.0005203485488891602, 0.0006220638751983643, 0.0007237792015075684, 0.0008254945278167725, 0.0009272098541259766, 0.0010289251804351807, 0.0011306405067443848, 0.0012323558330535889, 0.001334071159362793, 0.001435786485671997, 0.0015375018119812012, 0.0016392171382904053, 0.0017409324645996094, 0.0018426477909088135, 0.0019443631172180176, 0.0020460784435272217, 0.0021477937698364258, 0.00224950909614563, 0.002351224422454834, 0.002452939748764038, 0.002554655075073242, 0.0026563704013824463, 0.0027580857276916504, 0.0028598010540008545, 0.0029615163803100586, 0.0030632317066192627, 0.003164947032928467, 0.003266662359237671, 0.003368377685546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 12.0, 26.0, 18.0, 46.0, 59.0, 143.0, 228.0, 461.0, 1010.0, 2657.0, 10429.0, 661161.0, 358731.0, 9186.0, 2460.0, 969.0, 424.0, 226.0, 125.0, 67.0, 38.0, 28.0, 15.0, 10.0, 9.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.21875, -57.47509765625, -55.7314453125, -53.98779296875, -52.244140625, -50.50048828125, -48.7568359375, -47.01318359375, -45.26953125, -43.52587890625, -41.7822265625, -40.03857421875, -38.294921875, -36.55126953125, -34.8076171875, -33.06396484375, -31.3203125, -29.57666015625, -27.8330078125, -26.08935546875, -24.345703125, -22.60205078125, -20.8583984375, -19.11474609375, -17.37109375, -15.62744140625, -13.8837890625, -12.14013671875, -10.396484375, -8.65283203125, -6.9091796875, -5.16552734375, -3.421875, -1.67822265625, 0.0654296875, 1.80908203125, 3.552734375, 5.29638671875, 7.0400390625, 8.78369140625, 10.52734375, 12.27099609375, 14.0146484375, 15.75830078125, 17.501953125, 19.24560546875, 20.9892578125, 22.73291015625, 24.4765625, 26.22021484375, 27.9638671875, 29.70751953125, 31.451171875, 33.19482421875, 34.9384765625, 36.68212890625, 38.42578125, 40.16943359375, 41.9130859375, 43.65673828125, 45.400390625, 47.14404296875, 48.8876953125, 50.63134765625, 52.375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 15.0, 52.0, 143.0, 497.0, 161.0, 54.0, 14.0, 10.0, 10.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.443359375, -35.35546875, -34.267578125, -33.1796875, -32.091796875, -31.00390625, -29.916015625, -28.828125, -27.740234375, -26.65234375, -25.564453125, -24.4765625, -23.388671875, -22.30078125, -21.212890625, -20.125, -19.037109375, -17.94921875, -16.861328125, -15.7734375, -14.685546875, -13.59765625, -12.509765625, -11.421875, -10.333984375, -9.24609375, -8.158203125, -7.0703125, -5.982421875, -4.89453125, -3.806640625, -2.71875, -1.630859375, -0.54296875, 0.544921875, 1.6328125, 2.720703125, 3.80859375, 4.896484375, 5.984375, 7.072265625, 8.16015625, 9.248046875, 10.3359375, 11.423828125, 12.51171875, 13.599609375, 14.6875, 15.775390625, 16.86328125, 17.951171875, 19.0390625, 20.126953125, 21.21484375, 22.302734375, 23.390625, 24.478515625, 25.56640625, 26.654296875, 27.7421875, 28.830078125, 29.91796875, 31.005859375, 32.09375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 18.0, 60.0, 145.0, 254.0, 278.0, 157.0, 50.0, 24.0, 13.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-408.7998352050781, -395.65716552734375, -382.5145263671875, -369.37188720703125, -356.2292175292969, -343.0865478515625, -329.94390869140625, -316.80126953125, -303.6585998535156, -290.51593017578125, -277.373291015625, -264.23065185546875, -251.08798217773438, -237.94532775878906, -224.80267333984375, -211.66001892089844, -198.51736450195312, -185.3747100830078, -172.2320556640625, -159.0894012451172, -145.94674682617188, -132.80409240722656, -119.66143798828125, -106.51878356933594, -93.37612915039062, -80.23347473144531, -67.0908203125, -53.94816589355469, -40.805511474609375, -27.662857055664062, -14.52020263671875, -1.3775482177734375, 11.765106201171875, 24.907760620117188, 38.0504150390625, 51.19306945800781, 64.33572387695312, 77.47837829589844, 90.62103271484375, 103.76368713378906, 116.90634155273438, 130.0489959716797, 143.191650390625, 156.3343048095703, 169.47695922851562, 182.61961364746094, 195.76226806640625, 208.90492248535156, 222.04757690429688, 235.1902313232422, 248.3328857421875, 261.47552490234375, 274.6181945800781, 287.7608642578125, 300.90350341796875, 314.046142578125, 327.1888122558594, 340.33148193359375, 353.47412109375, 366.61676025390625, 379.7594299316406, 392.902099609375, 406.04473876953125, 419.1873779296875, 432.3300476074219]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 5.0, 3.0, 12.0, 9.0, 8.0, 12.0, 16.0, 16.0, 21.0, 27.0, 19.0, 15.0, 34.0, 28.0, 35.0, 36.0, 36.0, 29.0, 36.0, 40.0, 49.0, 50.0, 39.0, 41.0, 37.0, 53.0, 39.0, 28.0, 37.0, 26.0, 29.0, 19.0, 21.0, 17.0, 17.0, 14.0, 6.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-107.05431365966797, -103.92790222167969, -100.80148315429688, -97.6750717163086, -94.54866027832031, -91.4222412109375, -88.29582977294922, -85.16941833496094, -82.04299926757812, -78.91658782958984, -75.79016876220703, -72.66375732421875, -69.53734588623047, -66.41093444824219, -63.284515380859375, -60.158103942871094, -57.03169250488281, -53.905277252197266, -50.778865814208984, -47.65245056152344, -44.526039123535156, -41.39962387084961, -38.27320861816406, -35.14679718017578, -32.020381927490234, -28.89396858215332, -25.767555236816406, -22.64113998413086, -19.514726638793945, -16.38831329345703, -13.261898040771484, -10.13548469543457, -7.009063720703125, -3.8826498985290527, -0.7562360763549805, 2.37017822265625, 5.496591567993164, 8.623004913330078, 11.749420166015625, 14.875833511352539, 18.002246856689453, 21.128660202026367, 24.25507354736328, 27.381488800048828, 30.507902145385742, 33.634315490722656, 36.7607307434082, 39.88714599609375, 43.01355743408203, 46.13997268676758, 49.26638412475586, 52.392799377441406, 55.51921081542969, 58.645626068115234, 61.77204132080078, 64.89845275878906, 68.02487182617188, 71.15128326416016, 74.27770233154297, 77.40411376953125, 80.53052520751953, 83.65693664550781, 86.78335571289062, 89.9097671508789, 93.03617858886719]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 4.0, 13.0, 14.0, 18.0, 14.0, 41.0, 60.0, 80.0, 106.0, 203.0, 350.0, 595.0, 1158.0, 2346.0, 6224.0, 21169.0, 130928.0, 3822143.0, 171650.0, 25043.0, 6735.0, 2659.0, 1152.0, 628.0, 351.0, 219.0, 129.0, 82.0, 53.0, 41.0, 20.0, 15.0, 9.0, 4.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.189453125, -61.94140625, -59.693359375, -57.4453125, -55.197265625, -52.94921875, -50.701171875, -48.453125, -46.205078125, -43.95703125, -41.708984375, -39.4609375, -37.212890625, -34.96484375, -32.716796875, -30.46875, -28.220703125, -25.97265625, -23.724609375, -21.4765625, -19.228515625, -16.98046875, -14.732421875, -12.484375, -10.236328125, -7.98828125, -5.740234375, -3.4921875, -1.244140625, 1.00390625, 3.251953125, 5.5, 7.748046875, 9.99609375, 12.244140625, 14.4921875, 16.740234375, 18.98828125, 21.236328125, 23.484375, 25.732421875, 27.98046875, 30.228515625, 32.4765625, 34.724609375, 36.97265625, 39.220703125, 41.46875, 43.716796875, 45.96484375, 48.212890625, 50.4609375, 52.708984375, 54.95703125, 57.205078125, 59.453125, 61.701171875, 63.94921875, 66.197265625, 68.4453125, 70.693359375, 72.94140625, 75.189453125, 77.4375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 10.0, 13.0, 25.0, 23.0, 47.0, 41.0, 53.0, 68.0, 82.0, 79.0, 83.0, 93.0, 70.0, 67.0, 63.0, 47.0, 34.0, 29.0, 18.0, 12.0, 18.0, 8.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6488037109375, -8.391357421875, -8.1339111328125, -7.87646484375, -7.6190185546875, -7.361572265625, -7.1041259765625, -6.8466796875, -6.5892333984375, -6.331787109375, -6.0743408203125, -5.81689453125, -5.5594482421875, -5.302001953125, -5.0445556640625, -4.787109375, -4.5296630859375, -4.272216796875, -4.0147705078125, -3.75732421875, -3.4998779296875, -3.242431640625, -2.9849853515625, -2.7275390625, -2.4700927734375, -2.212646484375, -1.9552001953125, -1.69775390625, -1.4403076171875, -1.182861328125, -0.9254150390625, -0.66796875, -0.4105224609375, -0.153076171875, 0.1043701171875, 0.36181640625, 0.6192626953125, 0.876708984375, 1.1341552734375, 1.3916015625, 1.6490478515625, 1.906494140625, 2.1639404296875, 2.42138671875, 2.6788330078125, 2.936279296875, 3.1937255859375, 3.451171875, 3.7086181640625, 3.966064453125, 4.2235107421875, 4.48095703125, 4.7384033203125, 4.995849609375, 5.2532958984375, 5.5107421875, 5.7681884765625, 6.025634765625, 6.2830810546875, 6.54052734375, 6.7979736328125, 7.055419921875, 7.3128662109375, 7.5703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 9.0, 21.0, 31.0, 59.0, 91.0, 152.0, 263.0, 590.0, 1180.0, 2379.0, 5224.0, 13927.0, 47488.0, 286974.0, 3563903.0, 210999.0, 39622.0, 12100.0, 4712.0, 2171.0, 1089.0, 540.0, 323.0, 158.0, 105.0, 65.0, 31.0, 29.0, 11.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.578125, -40.0625, -38.546875, -37.03125, -35.515625, -34.0, -32.484375, -30.96875, -29.453125, -27.9375, -26.421875, -24.90625, -23.390625, -21.875, -20.359375, -18.84375, -17.328125, -15.8125, -14.296875, -12.78125, -11.265625, -9.75, -8.234375, -6.71875, -5.203125, -3.6875, -2.171875, -0.65625, 0.859375, 2.375, 3.890625, 5.40625, 6.921875, 8.4375, 9.953125, 11.46875, 12.984375, 14.5, 16.015625, 17.53125, 19.046875, 20.5625, 22.078125, 23.59375, 25.109375, 26.625, 28.140625, 29.65625, 31.171875, 32.6875, 34.203125, 35.71875, 37.234375, 38.75, 40.265625, 41.78125, 43.296875, 44.8125, 46.328125, 47.84375, 49.359375, 50.875, 52.390625, 53.90625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 5.0, 5.0, 3.0, 2.0, 11.0, 8.0, 11.0, 24.0, 34.0, 38.0, 60.0, 77.0, 139.0, 247.0, 593.0, 1873.0, 380.0, 192.0, 96.0, 66.0, 47.0, 35.0, 25.0, 16.0, 19.0, 8.0, 10.0, 11.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5859375, -12.140625, -11.6953125, -11.25, -10.8046875, -10.359375, -9.9140625, -9.46875, -9.0234375, -8.578125, -8.1328125, -7.6875, -7.2421875, -6.796875, -6.3515625, -5.90625, -5.4609375, -5.015625, -4.5703125, -4.125, -3.6796875, -3.234375, -2.7890625, -2.34375, -1.8984375, -1.453125, -1.0078125, -0.5625, -0.1171875, 0.328125, 0.7734375, 1.21875, 1.6640625, 2.109375, 2.5546875, 3.0, 3.4453125, 3.890625, 4.3359375, 4.78125, 5.2265625, 5.671875, 6.1171875, 6.5625, 7.0078125, 7.453125, 7.8984375, 8.34375, 8.7890625, 9.234375, 9.6796875, 10.125, 10.5703125, 11.015625, 11.4609375, 11.90625, 12.3515625, 12.796875, 13.2421875, 13.6875, 14.1328125, 14.578125, 15.0234375, 15.46875, 15.9140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 16.0, 68.0, 204.0, 317.0, 229.0, 97.0, 36.0, 23.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.7562255859375, -106.1827163696289, -97.60920715332031, -89.03569030761719, -80.4621810913086, -71.888671875, -63.31515884399414, -54.74164581298828, -46.16813659667969, -37.594627380371094, -29.021114349365234, -20.447603225708008, -11.874092102050781, -3.3005828857421875, 5.272930145263672, 13.846443176269531, 22.419952392578125, 30.99346351623535, 39.56697463989258, 48.14048767089844, 56.71399688720703, 65.28750610351562, 73.86102294921875, 82.43453216552734, 91.00804138183594, 99.58155059814453, 108.15505981445312, 116.72857666015625, 125.30208587646484, 133.87559509277344, 142.44911193847656, 151.02261352539062, 159.59609985351562, 168.16961669921875, 176.7431182861328, 185.31663513183594, 193.89013671875, 202.46365356445312, 211.03717041015625, 219.61068725585938, 228.18418884277344, 236.75770568847656, 245.33120727539062, 253.90472412109375, 262.4782409667969, 271.0517578125, 279.625244140625, 288.1987609863281, 296.77227783203125, 305.3457946777344, 313.9193115234375, 322.4927978515625, 331.0663146972656, 339.63983154296875, 348.2133483886719, 356.786865234375, 365.3603515625, 373.9338684082031, 382.50738525390625, 391.08087158203125, 399.6543884277344, 408.2279052734375, 416.8014221191406, 425.37493896484375, 433.9484558105469]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 10.0, 10.0, 18.0, 14.0, 25.0, 19.0, 15.0, 19.0, 31.0, 30.0, 32.0, 33.0, 47.0, 45.0, 41.0, 34.0, 45.0, 49.0, 47.0, 46.0, 34.0, 46.0, 41.0, 42.0, 35.0, 29.0, 18.0, 24.0, 21.0, 12.0, 13.0, 12.0, 13.0, 9.0, 10.0, 4.0, 3.0, 6.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-66.1232681274414, -64.26688385009766, -62.410499572753906, -60.554115295410156, -58.697731018066406, -56.841346740722656, -54.98496627807617, -53.12858200073242, -51.27219772338867, -49.41581344604492, -47.55942916870117, -45.70304489135742, -43.84666442871094, -41.99028015136719, -40.13389587402344, -38.27751159667969, -36.42112731933594, -34.56474304199219, -32.70835876464844, -30.85197639465332, -28.99559211730957, -27.13920783996582, -25.282825469970703, -23.426441192626953, -21.570056915283203, -19.713672637939453, -17.857288360595703, -16.000905990600586, -14.144521713256836, -12.288137435913086, -10.431754112243652, -8.575370788574219, -6.718990325927734, -4.862606525421143, -3.006222724914551, -1.149838924407959, 0.7065448760986328, 2.562929153442383, 4.419312477111816, 6.27569580078125, 8.132080078125, 9.98846435546875, 11.844847679138184, 13.701231002807617, 15.557615280151367, 17.413999557495117, 19.270381927490234, 21.126766204833984, 22.983150482177734, 24.839534759521484, 26.695919036865234, 28.55230140686035, 30.4086856842041, 32.26506805419922, 34.12145233154297, 35.97783660888672, 37.83422088623047, 39.69060516357422, 41.54698944091797, 43.40337371826172, 45.25975799560547, 47.11614227294922, 48.9725227355957, 50.82890701293945, 52.6852912902832]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 15.0, 15.0, 24.0, 27.0, 53.0, 68.0, 100.0, 163.0, 307.0, 560.0, 1081.0, 2371.0, 5565.0, 15427.0, 49516.0, 173591.0, 494142.0, 215012.0, 59854.0, 18568.0, 6616.0, 2756.0, 1265.0, 600.0, 329.0, 189.0, 129.0, 72.0, 30.0, 24.0, 23.0, 17.0, 12.0, 10.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.578125, -29.469482421875, -28.36083984375, -27.252197265625, -26.1435546875, -25.034912109375, -23.92626953125, -22.817626953125, -21.708984375, -20.600341796875, -19.49169921875, -18.383056640625, -17.2744140625, -16.165771484375, -15.05712890625, -13.948486328125, -12.83984375, -11.731201171875, -10.62255859375, -9.513916015625, -8.4052734375, -7.296630859375, -6.18798828125, -5.079345703125, -3.970703125, -2.862060546875, -1.75341796875, -0.644775390625, 0.4638671875, 1.572509765625, 2.68115234375, 3.789794921875, 4.8984375, 6.007080078125, 7.11572265625, 8.224365234375, 9.3330078125, 10.441650390625, 11.55029296875, 12.658935546875, 13.767578125, 14.876220703125, 15.98486328125, 17.093505859375, 18.2021484375, 19.310791015625, 20.41943359375, 21.528076171875, 22.63671875, 23.745361328125, 24.85400390625, 25.962646484375, 27.0712890625, 28.179931640625, 29.28857421875, 30.397216796875, 31.505859375, 32.614501953125, 33.72314453125, 34.831787109375, 35.9404296875, 37.049072265625, 38.15771484375, 39.266357421875, 40.375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 11.0, 17.0, 28.0, 28.0, 41.0, 44.0, 60.0, 52.0, 55.0, 61.0, 65.0, 67.0, 60.0, 53.0, 58.0, 56.0, 53.0, 32.0, 28.0, 32.0, 19.0, 14.0, 14.0, 9.0, 11.0, 3.0, 3.0, 2.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.484375, -8.23760986328125, -7.9908447265625, -7.74407958984375, -7.497314453125, -7.25054931640625, -7.0037841796875, -6.75701904296875, -6.51025390625, -6.26348876953125, -6.0167236328125, -5.76995849609375, -5.523193359375, -5.27642822265625, -5.0296630859375, -4.78289794921875, -4.5361328125, -4.28936767578125, -4.0426025390625, -3.79583740234375, -3.549072265625, -3.30230712890625, -3.0555419921875, -2.80877685546875, -2.56201171875, -2.31524658203125, -2.0684814453125, -1.82171630859375, -1.574951171875, -1.32818603515625, -1.0814208984375, -0.83465576171875, -0.587890625, -0.34112548828125, -0.0943603515625, 0.15240478515625, 0.399169921875, 0.64593505859375, 0.8927001953125, 1.13946533203125, 1.38623046875, 1.63299560546875, 1.8797607421875, 2.12652587890625, 2.373291015625, 2.62005615234375, 2.8668212890625, 3.11358642578125, 3.3603515625, 3.60711669921875, 3.8538818359375, 4.10064697265625, 4.347412109375, 4.59417724609375, 4.8409423828125, 5.08770751953125, 5.33447265625, 5.58123779296875, 5.8280029296875, 6.07476806640625, 6.321533203125, 6.56829833984375, 6.8150634765625, 7.06182861328125, 7.30859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 6.0, 11.0, 7.0, 14.0, 15.0, 22.0, 38.0, 48.0, 71.0, 114.0, 184.0, 269.0, 406.0, 620.0, 1295.0, 2847.0, 8200.0, 31941.0, 159111.0, 624255.0, 170469.0, 34006.0, 8609.0, 2875.0, 1283.0, 680.0, 385.0, 242.0, 160.0, 91.0, 79.0, 49.0, 29.0, 29.0, 28.0, 17.0, 13.0, 6.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -30.98779296875, -29.8193359375, -28.65087890625, -27.482421875, -26.31396484375, -25.1455078125, -23.97705078125, -22.80859375, -21.64013671875, -20.4716796875, -19.30322265625, -18.134765625, -16.96630859375, -15.7978515625, -14.62939453125, -13.4609375, -12.29248046875, -11.1240234375, -9.95556640625, -8.787109375, -7.61865234375, -6.4501953125, -5.28173828125, -4.11328125, -2.94482421875, -1.7763671875, -0.60791015625, 0.560546875, 1.72900390625, 2.8974609375, 4.06591796875, 5.234375, 6.40283203125, 7.5712890625, 8.73974609375, 9.908203125, 11.07666015625, 12.2451171875, 13.41357421875, 14.58203125, 15.75048828125, 16.9189453125, 18.08740234375, 19.255859375, 20.42431640625, 21.5927734375, 22.76123046875, 23.9296875, 25.09814453125, 26.2666015625, 27.43505859375, 28.603515625, 29.77197265625, 30.9404296875, 32.10888671875, 33.27734375, 34.44580078125, 35.6142578125, 36.78271484375, 37.951171875, 39.11962890625, 40.2880859375, 41.45654296875, 42.625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 18.0, 19.0, 10.0, 15.0, 24.0, 22.0, 33.0, 19.0, 29.0, 36.0, 36.0, 29.0, 45.0, 40.0, 43.0, 44.0, 44.0, 54.0, 35.0, 34.0, 38.0, 54.0, 34.0, 28.0, 25.0, 26.0, 24.0, 23.0, 16.0, 23.0, 10.0, 5.0, 7.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5, -24.715087890625, -23.93017578125, -23.145263671875, -22.3603515625, -21.575439453125, -20.79052734375, -20.005615234375, -19.220703125, -18.435791015625, -17.65087890625, -16.865966796875, -16.0810546875, -15.296142578125, -14.51123046875, -13.726318359375, -12.94140625, -12.156494140625, -11.37158203125, -10.586669921875, -9.8017578125, -9.016845703125, -8.23193359375, -7.447021484375, -6.662109375, -5.877197265625, -5.09228515625, -4.307373046875, -3.5224609375, -2.737548828125, -1.95263671875, -1.167724609375, -0.3828125, 0.402099609375, 1.18701171875, 1.971923828125, 2.7568359375, 3.541748046875, 4.32666015625, 5.111572265625, 5.896484375, 6.681396484375, 7.46630859375, 8.251220703125, 9.0361328125, 9.821044921875, 10.60595703125, 11.390869140625, 12.17578125, 12.960693359375, 13.74560546875, 14.530517578125, 15.3154296875, 16.100341796875, 16.88525390625, 17.670166015625, 18.455078125, 19.239990234375, 20.02490234375, 20.809814453125, 21.5947265625, 22.379638671875, 23.16455078125, 23.949462890625, 24.734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 6.0, 13.0, 16.0, 14.0, 26.0, 28.0, 66.0, 82.0, 133.0, 230.0, 428.0, 929.0, 1857.0, 4280.0, 12472.0, 56295.0, 519265.0, 387779.0, 46253.0, 11022.0, 3874.0, 1706.0, 800.0, 410.0, 188.0, 138.0, 78.0, 51.0, 26.0, 23.0, 14.0, 15.0, 9.0, 10.0, 3.0, 8.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.452880859375, -18.78076171875, -18.108642578125, -17.4365234375, -16.764404296875, -16.09228515625, -15.420166015625, -14.748046875, -14.075927734375, -13.40380859375, -12.731689453125, -12.0595703125, -11.387451171875, -10.71533203125, -10.043212890625, -9.37109375, -8.698974609375, -8.02685546875, -7.354736328125, -6.6826171875, -6.010498046875, -5.33837890625, -4.666259765625, -3.994140625, -3.322021484375, -2.64990234375, -1.977783203125, -1.3056640625, -0.633544921875, 0.03857421875, 0.710693359375, 1.3828125, 2.054931640625, 2.72705078125, 3.399169921875, 4.0712890625, 4.743408203125, 5.41552734375, 6.087646484375, 6.759765625, 7.431884765625, 8.10400390625, 8.776123046875, 9.4482421875, 10.120361328125, 10.79248046875, 11.464599609375, 12.13671875, 12.808837890625, 13.48095703125, 14.153076171875, 14.8251953125, 15.497314453125, 16.16943359375, 16.841552734375, 17.513671875, 18.185791015625, 18.85791015625, 19.530029296875, 20.2021484375, 20.874267578125, 21.54638671875, 22.218505859375, 22.890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 8.0, 6.0, 12.0, 21.0, 32.0, 45.0, 71.0, 141.0, 245.0, 167.0, 77.0, 54.0, 39.0, 21.0, 17.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0052337646484375, -0.005094558000564575, -0.00495535135269165, -0.004816144704818726, -0.004676938056945801, -0.004537731409072876, -0.004398524761199951, -0.004259318113327026, -0.0041201114654541016, -0.003980904817581177, -0.003841698169708252, -0.003702491521835327, -0.0035632848739624023, -0.0034240782260894775, -0.0032848715782165527, -0.003145664930343628, -0.003006458282470703, -0.0028672516345977783, -0.0027280449867248535, -0.0025888383388519287, -0.002449631690979004, -0.002310425043106079, -0.0021712183952331543, -0.0020320117473602295, -0.0018928050994873047, -0.0017535984516143799, -0.001614391803741455, -0.0014751851558685303, -0.0013359785079956055, -0.0011967718601226807, -0.0010575652122497559, -0.0009183585643768311, -0.0007791519165039062, -0.0006399452686309814, -0.0005007386207580566, -0.00036153197288513184, -0.00022232532501220703, -8.311867713928223e-05, 5.608797073364258e-05, 0.00019529461860656738, 0.0003345012664794922, 0.000473707914352417, 0.0006129145622253418, 0.0007521212100982666, 0.0008913278579711914, 0.0010305345058441162, 0.001169741153717041, 0.0013089478015899658, 0.0014481544494628906, 0.0015873610973358154, 0.0017265677452087402, 0.001865774393081665, 0.00200498104095459, 0.0021441876888275146, 0.0022833943367004395, 0.0024226009845733643, 0.002561807632446289, 0.002701014280319214, 0.0028402209281921387, 0.0029794275760650635, 0.0031186342239379883, 0.003257840871810913, 0.003397047519683838, 0.0035362541675567627, 0.0036754608154296875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 13.0, 15.0, 11.0, 20.0, 18.0, 53.0, 55.0, 91.0, 134.0, 207.0, 306.0, 530.0, 1026.0, 2079.0, 4348.0, 11545.0, 42186.0, 347430.0, 552125.0, 61033.0, 14597.0, 5410.0, 2421.0, 1162.0, 665.0, 384.0, 237.0, 140.0, 68.0, 66.0, 42.0, 25.0, 18.0, 14.0, 12.0, 13.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.890625, -22.15478515625, -21.4189453125, -20.68310546875, -19.947265625, -19.21142578125, -18.4755859375, -17.73974609375, -17.00390625, -16.26806640625, -15.5322265625, -14.79638671875, -14.060546875, -13.32470703125, -12.5888671875, -11.85302734375, -11.1171875, -10.38134765625, -9.6455078125, -8.90966796875, -8.173828125, -7.43798828125, -6.7021484375, -5.96630859375, -5.23046875, -4.49462890625, -3.7587890625, -3.02294921875, -2.287109375, -1.55126953125, -0.8154296875, -0.07958984375, 0.65625, 1.39208984375, 2.1279296875, 2.86376953125, 3.599609375, 4.33544921875, 5.0712890625, 5.80712890625, 6.54296875, 7.27880859375, 8.0146484375, 8.75048828125, 9.486328125, 10.22216796875, 10.9580078125, 11.69384765625, 12.4296875, 13.16552734375, 13.9013671875, 14.63720703125, 15.373046875, 16.10888671875, 16.8447265625, 17.58056640625, 18.31640625, 19.05224609375, 19.7880859375, 20.52392578125, 21.259765625, 21.99560546875, 22.7314453125, 23.46728515625, 24.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 9.0, 10.0, 16.0, 17.0, 27.0, 41.0, 44.0, 79.0, 109.0, 137.0, 107.0, 106.0, 65.0, 53.0, 31.0, 31.0, 27.0, 11.0, 15.0, 11.0, 5.0, 9.0, 3.0, 0.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.5, -18.92529296875, -18.3505859375, -17.77587890625, -17.201171875, -16.62646484375, -16.0517578125, -15.47705078125, -14.90234375, -14.32763671875, -13.7529296875, -13.17822265625, -12.603515625, -12.02880859375, -11.4541015625, -10.87939453125, -10.3046875, -9.72998046875, -9.1552734375, -8.58056640625, -8.005859375, -7.43115234375, -6.8564453125, -6.28173828125, -5.70703125, -5.13232421875, -4.5576171875, -3.98291015625, -3.408203125, -2.83349609375, -2.2587890625, -1.68408203125, -1.109375, -0.53466796875, 0.0400390625, 0.61474609375, 1.189453125, 1.76416015625, 2.3388671875, 2.91357421875, 3.48828125, 4.06298828125, 4.6376953125, 5.21240234375, 5.787109375, 6.36181640625, 6.9365234375, 7.51123046875, 8.0859375, 8.66064453125, 9.2353515625, 9.81005859375, 10.384765625, 10.95947265625, 11.5341796875, 12.10888671875, 12.68359375, 13.25830078125, 13.8330078125, 14.40771484375, 14.982421875, 15.55712890625, 16.1318359375, 16.70654296875, 17.28125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 13.0, 45.0, 97.0, 208.0, 244.0, 191.0, 116.0, 52.0, 14.0, 13.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-414.6982421875, -399.5536804199219, -384.40911865234375, -369.2645568847656, -354.1199951171875, -338.97540283203125, -323.8308410644531, -308.686279296875, -293.5417175292969, -278.39715576171875, -263.2525939941406, -248.10801696777344, -232.9634552001953, -217.8188934326172, -202.67431640625, -187.52975463867188, -172.38519287109375, -157.24063110351562, -142.0960693359375, -126.95149230957031, -111.80693054199219, -96.66236877441406, -81.5177993774414, -66.37322998046875, -51.228668212890625, -36.084102630615234, -20.939537048339844, -5.794971466064453, 9.349594116210938, 24.494155883789062, 39.63872528076172, 54.783294677734375, 69.9278564453125, 85.07241821289062, 100.21698760986328, 115.36155700683594, 130.50611877441406, 145.6506805419922, 160.79525756835938, 175.9398193359375, 191.08438110351562, 206.22894287109375, 221.37350463867188, 236.51808166503906, 251.6626434326172, 266.80718994140625, 281.9517822265625, 297.0963439941406, 312.24090576171875, 327.3854675292969, 342.530029296875, 357.6745910644531, 372.81915283203125, 387.9637451171875, 403.1083068847656, 418.25286865234375, 433.3974304199219, 448.5419921875, 463.6865539550781, 478.83111572265625, 493.9757080078125, 509.1202392578125, 524.2648315429688, 539.409423828125, 554.553955078125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 6.0, 9.0, 13.0, 8.0, 13.0, 10.0, 14.0, 20.0, 13.0, 21.0, 36.0, 31.0, 47.0, 36.0, 44.0, 43.0, 55.0, 51.0, 38.0, 39.0, 42.0, 47.0, 42.0, 40.0, 38.0, 26.0, 27.0, 30.0, 29.0, 18.0, 16.0, 14.0, 18.0, 12.0, 11.0, 3.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-152.98780822753906, -148.5850067138672, -144.1822052001953, -139.77940368652344, -135.37661743164062, -130.97381591796875, -126.57101440429688, -122.168212890625, -117.76541137695312, -113.36260986328125, -108.95980834960938, -104.55701446533203, -100.15421295166016, -95.75141143798828, -91.34861755371094, -86.94581604003906, -82.54301452636719, -78.14021301269531, -73.73741149902344, -69.3346176147461, -64.93181610107422, -60.529014587402344, -56.126216888427734, -51.723419189453125, -47.32061767578125, -42.917816162109375, -38.515018463134766, -34.112220764160156, -29.70941925048828, -25.30661964416504, -20.903820037841797, -16.501020431518555, -12.098236083984375, -7.695436477661133, -3.2926368713378906, 1.1101627349853516, 5.512962341308594, 9.915761947631836, 14.318561553955078, 18.72136116027832, 23.124160766601562, 27.526960372924805, 31.929759979248047, 36.332557678222656, 40.73535919189453, 45.138160705566406, 49.540958404541016, 53.943756103515625, 58.3465576171875, 62.749359130859375, 67.15216064453125, 71.5549545288086, 75.95775604248047, 80.36055755615234, 84.76335144042969, 89.16615295410156, 93.56895446777344, 97.97175598144531, 102.37455749511719, 106.77735137939453, 111.1801528930664, 115.58295440673828, 119.98574829101562, 124.3885498046875, 128.79135131835938]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 12.0, 25.0, 24.0, 36.0, 68.0, 67.0, 82.0, 140.0, 201.0, 284.0, 375.0, 594.0, 986.0, 1781.0, 3856.0, 9840.0, 33559.0, 206592.0, 3610289.0, 265172.0, 39915.0, 11244.0, 4198.0, 1928.0, 1054.0, 652.0, 409.0, 274.0, 177.0, 142.0, 86.0, 66.0, 46.0, 33.0, 26.0, 22.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.34375, -34.92138671875, -33.4990234375, -32.07666015625, -30.654296875, -29.23193359375, -27.8095703125, -26.38720703125, -24.96484375, -23.54248046875, -22.1201171875, -20.69775390625, -19.275390625, -17.85302734375, -16.4306640625, -15.00830078125, -13.5859375, -12.16357421875, -10.7412109375, -9.31884765625, -7.896484375, -6.47412109375, -5.0517578125, -3.62939453125, -2.20703125, -0.78466796875, 0.6376953125, 2.06005859375, 3.482421875, 4.90478515625, 6.3271484375, 7.74951171875, 9.171875, 10.59423828125, 12.0166015625, 13.43896484375, 14.861328125, 16.28369140625, 17.7060546875, 19.12841796875, 20.55078125, 21.97314453125, 23.3955078125, 24.81787109375, 26.240234375, 27.66259765625, 29.0849609375, 30.50732421875, 31.9296875, 33.35205078125, 34.7744140625, 36.19677734375, 37.619140625, 39.04150390625, 40.4638671875, 41.88623046875, 43.30859375, 44.73095703125, 46.1533203125, 47.57568359375, 48.998046875, 50.42041015625, 51.8427734375, 53.26513671875, 54.6875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 8.0, 11.0, 8.0, 17.0, 19.0, 23.0, 34.0, 42.0, 46.0, 51.0, 58.0, 60.0, 47.0, 61.0, 55.0, 64.0, 66.0, 52.0, 51.0, 36.0, 31.0, 33.0, 34.0, 19.0, 23.0, 11.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.171875, -7.9315185546875, -7.691162109375, -7.4508056640625, -7.21044921875, -6.9700927734375, -6.729736328125, -6.4893798828125, -6.2490234375, -6.0086669921875, -5.768310546875, -5.5279541015625, -5.28759765625, -5.0472412109375, -4.806884765625, -4.5665283203125, -4.326171875, -4.0858154296875, -3.845458984375, -3.6051025390625, -3.36474609375, -3.1243896484375, -2.884033203125, -2.6436767578125, -2.4033203125, -2.1629638671875, -1.922607421875, -1.6822509765625, -1.44189453125, -1.2015380859375, -0.961181640625, -0.7208251953125, -0.48046875, -0.2401123046875, 0.000244140625, 0.2406005859375, 0.48095703125, 0.7213134765625, 0.961669921875, 1.2020263671875, 1.4423828125, 1.6827392578125, 1.923095703125, 2.1634521484375, 2.40380859375, 2.6441650390625, 2.884521484375, 3.1248779296875, 3.365234375, 3.6055908203125, 3.845947265625, 4.0863037109375, 4.32666015625, 4.5670166015625, 4.807373046875, 5.0477294921875, 5.2880859375, 5.5284423828125, 5.768798828125, 6.0091552734375, 6.24951171875, 6.4898681640625, 6.730224609375, 6.9705810546875, 7.2109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 0.0, 4.0, 2.0, 6.0, 10.0, 11.0, 16.0, 29.0, 54.0, 88.0, 180.0, 226.0, 345.0, 634.0, 1021.0, 2077.0, 4211.0, 10500.0, 32807.0, 146166.0, 2740757.0, 1101585.0, 109699.0, 26939.0, 8978.0, 3737.0, 1838.0, 961.0, 539.0, 334.0, 220.0, 107.0, 82.0, 42.0, 30.0, 10.0, 10.0, 12.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.58837890625, -32.4267578125, -31.26513671875, -30.103515625, -28.94189453125, -27.7802734375, -26.61865234375, -25.45703125, -24.29541015625, -23.1337890625, -21.97216796875, -20.810546875, -19.64892578125, -18.4873046875, -17.32568359375, -16.1640625, -15.00244140625, -13.8408203125, -12.67919921875, -11.517578125, -10.35595703125, -9.1943359375, -8.03271484375, -6.87109375, -5.70947265625, -4.5478515625, -3.38623046875, -2.224609375, -1.06298828125, 0.0986328125, 1.26025390625, 2.421875, 3.58349609375, 4.7451171875, 5.90673828125, 7.068359375, 8.22998046875, 9.3916015625, 10.55322265625, 11.71484375, 12.87646484375, 14.0380859375, 15.19970703125, 16.361328125, 17.52294921875, 18.6845703125, 19.84619140625, 21.0078125, 22.16943359375, 23.3310546875, 24.49267578125, 25.654296875, 26.81591796875, 27.9775390625, 29.13916015625, 30.30078125, 31.46240234375, 32.6240234375, 33.78564453125, 34.947265625, 36.10888671875, 37.2705078125, 38.43212890625, 39.59375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 6.0, 15.0, 17.0, 24.0, 30.0, 43.0, 77.0, 134.0, 218.0, 524.0, 1898.0, 581.0, 217.0, 101.0, 73.0, 28.0, 21.0, 19.0, 12.0, 5.0, 7.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.961669921875, -20.25146484375, -19.541259765625, -18.8310546875, -18.120849609375, -17.41064453125, -16.700439453125, -15.990234375, -15.280029296875, -14.56982421875, -13.859619140625, -13.1494140625, -12.439208984375, -11.72900390625, -11.018798828125, -10.30859375, -9.598388671875, -8.88818359375, -8.177978515625, -7.4677734375, -6.757568359375, -6.04736328125, -5.337158203125, -4.626953125, -3.916748046875, -3.20654296875, -2.496337890625, -1.7861328125, -1.075927734375, -0.36572265625, 0.344482421875, 1.0546875, 1.764892578125, 2.47509765625, 3.185302734375, 3.8955078125, 4.605712890625, 5.31591796875, 6.026123046875, 6.736328125, 7.446533203125, 8.15673828125, 8.866943359375, 9.5771484375, 10.287353515625, 10.99755859375, 11.707763671875, 12.41796875, 13.128173828125, 13.83837890625, 14.548583984375, 15.2587890625, 15.968994140625, 16.67919921875, 17.389404296875, 18.099609375, 18.809814453125, 19.52001953125, 20.230224609375, 20.9404296875, 21.650634765625, 22.36083984375, 23.071044921875, 23.78125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 10.0, 16.0, 56.0, 160.0, 308.0, 280.0, 126.0, 32.0, 9.0, 7.0, 5.0], "bins": [-618.598876953125, -607.9883422851562, -597.3778686523438, -586.767333984375, -576.1568603515625, -565.5463256835938, -554.9358520507812, -544.3253173828125, -533.71484375, -523.1043090820312, -512.4938354492188, -501.8833312988281, -491.2728271484375, -480.66229248046875, -470.0517883300781, -459.4412841796875, -448.83074951171875, -438.2202453613281, -427.6097412109375, -416.9992370605469, -406.38873291015625, -395.7781982421875, -385.1676940917969, -374.55718994140625, -363.9466857910156, -353.336181640625, -342.7256774902344, -332.11517333984375, -321.504638671875, -310.8941345214844, -300.28363037109375, -289.6731262207031, -279.0625915527344, -268.45208740234375, -257.8415832519531, -247.23106384277344, -236.6205596923828, -226.0100555419922, -215.3995361328125, -204.78903198242188, -194.17852783203125, -183.56802368164062, -172.95751953125, -162.3470001220703, -151.7364959716797, -141.12599182128906, -130.51547241210938, -119.90496826171875, -109.29446411132812, -98.6839599609375, -88.07344818115234, -77.46293640136719, -66.85243225097656, -56.24192428588867, -45.63141632080078, -35.020904541015625, -24.410404205322266, -13.799896240234375, -3.1893882751464844, 7.421119689941406, 18.031627655029297, 28.642135620117188, 39.25264358520508, 49.863155364990234, 60.47365951538086]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 10.0, 3.0, 3.0, 8.0, 10.0, 10.0, 10.0, 10.0, 13.0, 24.0, 28.0, 25.0, 21.0, 27.0, 30.0, 35.0, 26.0, 44.0, 39.0, 35.0, 42.0, 28.0, 39.0, 35.0, 31.0, 36.0, 26.0, 32.0, 39.0, 34.0, 37.0, 24.0, 19.0, 29.0, 30.0, 20.0, 15.0, 14.0, 13.0, 8.0, 9.0, 8.0, 7.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0], "bins": [-72.7452163696289, -70.65095520019531, -68.55668640136719, -66.4624252319336, -64.36815643310547, -62.27389144897461, -60.17962646484375, -58.085365295410156, -55.99109649658203, -53.89683151245117, -51.80256652832031, -49.70830154418945, -47.614036560058594, -45.519771575927734, -43.425506591796875, -41.33124542236328, -39.23698043823242, -37.14271545410156, -35.0484504699707, -32.954185485839844, -30.859920501708984, -28.765655517578125, -26.6713924407959, -24.57712745666504, -22.48286247253418, -20.38859748840332, -18.29433250427246, -16.200069427490234, -14.105803489685059, -12.0115385055542, -9.917274475097656, -7.823009490966797, -5.728748321533203, -3.634483575820923, -1.5402188301086426, 0.5540456771850586, 2.648310661315918, 4.742575645446777, 6.83683967590332, 8.93110466003418, 11.025369644165039, 13.119634628295898, 15.213899612426758, 17.308162689208984, 19.402427673339844, 21.496692657470703, 23.590957641601562, 25.685222625732422, 27.77948760986328, 29.87375259399414, 31.968017578125, 34.06228256225586, 36.15654754638672, 38.25081253051758, 40.34507751464844, 42.43933868408203, 44.533607482910156, 46.627872467041016, 48.722137451171875, 50.816402435302734, 52.910667419433594, 55.00493240356445, 57.09919738769531, 59.193458557128906, 61.287723541259766]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 18.0, 23.0, 25.0, 37.0, 76.0, 126.0, 194.0, 321.0, 657.0, 1263.0, 3010.0, 7436.0, 21931.0, 78690.0, 325153.0, 440808.0, 119841.0, 31662.0, 10140.0, 3730.0, 1603.0, 770.0, 398.0, 225.0, 142.0, 88.0, 53.0, 35.0, 27.0, 18.0, 14.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78125, -32.73046875, -31.6796875, -30.62890625, -29.578125, -28.52734375, -27.4765625, -26.42578125, -25.375, -24.32421875, -23.2734375, -22.22265625, -21.171875, -20.12109375, -19.0703125, -18.01953125, -16.96875, -15.91796875, -14.8671875, -13.81640625, -12.765625, -11.71484375, -10.6640625, -9.61328125, -8.5625, -7.51171875, -6.4609375, -5.41015625, -4.359375, -3.30859375, -2.2578125, -1.20703125, -0.15625, 0.89453125, 1.9453125, 2.99609375, 4.046875, 5.09765625, 6.1484375, 7.19921875, 8.25, 9.30078125, 10.3515625, 11.40234375, 12.453125, 13.50390625, 14.5546875, 15.60546875, 16.65625, 17.70703125, 18.7578125, 19.80859375, 20.859375, 21.91015625, 22.9609375, 24.01171875, 25.0625, 26.11328125, 27.1640625, 28.21484375, 29.265625, 30.31640625, 31.3671875, 32.41796875, 33.46875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 2.0, 9.0, 7.0, 8.0, 14.0, 17.0, 24.0, 24.0, 25.0, 44.0, 32.0, 50.0, 59.0, 65.0, 64.0, 59.0, 49.0, 69.0, 60.0, 57.0, 53.0, 44.0, 36.0, 26.0, 29.0, 19.0, 13.0, 15.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.09375, -8.8250732421875, -8.556396484375, -8.2877197265625, -8.01904296875, -7.7503662109375, -7.481689453125, -7.2130126953125, -6.9443359375, -6.6756591796875, -6.406982421875, -6.1383056640625, -5.86962890625, -5.6009521484375, -5.332275390625, -5.0635986328125, -4.794921875, -4.5262451171875, -4.257568359375, -3.9888916015625, -3.72021484375, -3.4515380859375, -3.182861328125, -2.9141845703125, -2.6455078125, -2.3768310546875, -2.108154296875, -1.8394775390625, -1.57080078125, -1.3021240234375, -1.033447265625, -0.7647705078125, -0.49609375, -0.2274169921875, 0.041259765625, 0.3099365234375, 0.57861328125, 0.8472900390625, 1.115966796875, 1.3846435546875, 1.6533203125, 1.9219970703125, 2.190673828125, 2.4593505859375, 2.72802734375, 2.9967041015625, 3.265380859375, 3.5340576171875, 3.802734375, 4.0714111328125, 4.340087890625, 4.6087646484375, 4.87744140625, 5.1461181640625, 5.414794921875, 5.6834716796875, 5.9521484375, 6.2208251953125, 6.489501953125, 6.7581787109375, 7.02685546875, 7.2955322265625, 7.564208984375, 7.8328857421875, 8.1015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 9.0, 10.0, 15.0, 18.0, 16.0, 33.0, 38.0, 52.0, 90.0, 113.0, 188.0, 274.0, 427.0, 748.0, 1444.0, 3542.0, 10633.0, 41238.0, 199154.0, 576426.0, 163597.0, 34712.0, 9417.0, 3141.0, 1357.0, 654.0, 396.0, 240.0, 159.0, 109.0, 81.0, 67.0, 51.0, 24.0, 17.0, 19.0, 11.0, 8.0, 6.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.96875, -33.923095703125, -32.87744140625, -31.831787109375, -30.7861328125, -29.740478515625, -28.69482421875, -27.649169921875, -26.603515625, -25.557861328125, -24.51220703125, -23.466552734375, -22.4208984375, -21.375244140625, -20.32958984375, -19.283935546875, -18.23828125, -17.192626953125, -16.14697265625, -15.101318359375, -14.0556640625, -13.010009765625, -11.96435546875, -10.918701171875, -9.873046875, -8.827392578125, -7.78173828125, -6.736083984375, -5.6904296875, -4.644775390625, -3.59912109375, -2.553466796875, -1.5078125, -0.462158203125, 0.58349609375, 1.629150390625, 2.6748046875, 3.720458984375, 4.76611328125, 5.811767578125, 6.857421875, 7.903076171875, 8.94873046875, 9.994384765625, 11.0400390625, 12.085693359375, 13.13134765625, 14.177001953125, 15.22265625, 16.268310546875, 17.31396484375, 18.359619140625, 19.4052734375, 20.450927734375, 21.49658203125, 22.542236328125, 23.587890625, 24.633544921875, 25.67919921875, 26.724853515625, 27.7705078125, 28.816162109375, 29.86181640625, 30.907470703125, 31.953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 14.0, 15.0, 13.0, 16.0, 11.0, 21.0, 36.0, 30.0, 33.0, 29.0, 37.0, 46.0, 44.0, 51.0, 36.0, 32.0, 49.0, 54.0, 44.0, 36.0, 43.0, 43.0, 36.0, 36.0, 31.0, 26.0, 20.0, 18.0, 23.0, 10.0, 6.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.40625, -29.46875, -28.53125, -27.59375, -26.65625, -25.71875, -24.78125, -23.84375, -22.90625, -21.96875, -21.03125, -20.09375, -19.15625, -18.21875, -17.28125, -16.34375, -15.40625, -14.46875, -13.53125, -12.59375, -11.65625, -10.71875, -9.78125, -8.84375, -7.90625, -6.96875, -6.03125, -5.09375, -4.15625, -3.21875, -2.28125, -1.34375, -0.40625, 0.53125, 1.46875, 2.40625, 3.34375, 4.28125, 5.21875, 6.15625, 7.09375, 8.03125, 8.96875, 9.90625, 10.84375, 11.78125, 12.71875, 13.65625, 14.59375, 15.53125, 16.46875, 17.40625, 18.34375, 19.28125, 20.21875, 21.15625, 22.09375, 23.03125, 23.96875, 24.90625, 25.84375, 26.78125, 27.71875, 28.65625, 29.59375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 14.0, 24.0, 25.0, 37.0, 46.0, 101.0, 184.0, 318.0, 675.0, 1673.0, 5436.0, 22380.0, 117454.0, 467897.0, 340689.0, 71253.0, 14226.0, 3679.0, 1207.0, 532.0, 273.0, 147.0, 101.0, 67.0, 32.0, 15.0, 20.0, 9.0, 6.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2481689453125, -10.871337890625, -10.4945068359375, -10.11767578125, -9.7408447265625, -9.364013671875, -8.9871826171875, -8.6103515625, -8.2335205078125, -7.856689453125, -7.4798583984375, -7.10302734375, -6.7261962890625, -6.349365234375, -5.9725341796875, -5.595703125, -5.2188720703125, -4.842041015625, -4.4652099609375, -4.08837890625, -3.7115478515625, -3.334716796875, -2.9578857421875, -2.5810546875, -2.2042236328125, -1.827392578125, -1.4505615234375, -1.07373046875, -0.6968994140625, -0.320068359375, 0.0567626953125, 0.43359375, 0.8104248046875, 1.187255859375, 1.5640869140625, 1.94091796875, 2.3177490234375, 2.694580078125, 3.0714111328125, 3.4482421875, 3.8250732421875, 4.201904296875, 4.5787353515625, 4.95556640625, 5.3323974609375, 5.709228515625, 6.0860595703125, 6.462890625, 6.8397216796875, 7.216552734375, 7.5933837890625, 7.97021484375, 8.3470458984375, 8.723876953125, 9.1007080078125, 9.4775390625, 9.8543701171875, 10.231201171875, 10.6080322265625, 10.98486328125, 11.3616943359375, 11.738525390625, 12.1153564453125, 12.4921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 17.0, 7.0, 11.0, 12.0, 29.0, 42.0, 43.0, 65.0, 73.0, 116.0, 101.0, 94.0, 87.0, 77.0, 60.0, 41.0, 26.0, 27.0, 18.0, 17.0, 5.0, 5.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020580291748046875, -0.001984149217605591, -0.0019102692604064941, -0.0018363893032073975, -0.0017625093460083008, -0.001688629388809204, -0.0016147494316101074, -0.0015408694744110107, -0.001466989517211914, -0.0013931095600128174, -0.0013192296028137207, -0.001245349645614624, -0.0011714696884155273, -0.0010975897312164307, -0.001023709774017334, -0.0009498298168182373, -0.0008759498596191406, -0.0008020699024200439, -0.0007281899452209473, -0.0006543099880218506, -0.0005804300308227539, -0.0005065500736236572, -0.00043267011642456055, -0.00035879015922546387, -0.0002849102020263672, -0.0002110302448272705, -0.00013715028762817383, -6.327033042907715e-05, 1.0609626770019531e-05, 8.448958396911621e-05, 0.0001583695411682129, 0.00023224949836730957, 0.00030612945556640625, 0.00038000941276550293, 0.0004538893699645996, 0.0005277693271636963, 0.000601649284362793, 0.0006755292415618896, 0.0007494091987609863, 0.000823289155960083, 0.0008971691131591797, 0.0009710490703582764, 0.001044929027557373, 0.0011188089847564697, 0.0011926889419555664, 0.001266568899154663, 0.0013404488563537598, 0.0014143288135528564, 0.0014882087707519531, 0.0015620887279510498, 0.0016359686851501465, 0.0017098486423492432, 0.0017837285995483398, 0.0018576085567474365, 0.0019314885139465332, 0.00200536847114563, 0.0020792484283447266, 0.0021531283855438232, 0.00222700834274292, 0.0023008882999420166, 0.0023747682571411133, 0.00244864821434021, 0.0025225281715393066, 0.0025964081287384033, 0.0026702880859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 8.0, 10.0, 5.0, 24.0, 33.0, 42.0, 72.0, 151.0, 272.0, 556.0, 1499.0, 4754.0, 24267.0, 242288.0, 659321.0, 97915.0, 12301.0, 3078.0, 994.0, 427.0, 205.0, 112.0, 73.0, 48.0, 25.0, 17.0, 9.0, 7.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.328125, -20.72412109375, -20.1201171875, -19.51611328125, -18.912109375, -18.30810546875, -17.7041015625, -17.10009765625, -16.49609375, -15.89208984375, -15.2880859375, -14.68408203125, -14.080078125, -13.47607421875, -12.8720703125, -12.26806640625, -11.6640625, -11.06005859375, -10.4560546875, -9.85205078125, -9.248046875, -8.64404296875, -8.0400390625, -7.43603515625, -6.83203125, -6.22802734375, -5.6240234375, -5.02001953125, -4.416015625, -3.81201171875, -3.2080078125, -2.60400390625, -2.0, -1.39599609375, -0.7919921875, -0.18798828125, 0.416015625, 1.02001953125, 1.6240234375, 2.22802734375, 2.83203125, 3.43603515625, 4.0400390625, 4.64404296875, 5.248046875, 5.85205078125, 6.4560546875, 7.06005859375, 7.6640625, 8.26806640625, 8.8720703125, 9.47607421875, 10.080078125, 10.68408203125, 11.2880859375, 11.89208984375, 12.49609375, 13.10009765625, 13.7041015625, 14.30810546875, 14.912109375, 15.51611328125, 16.1201171875, 16.72412109375, 17.328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 19.0, 16.0, 14.0, 23.0, 37.0, 45.0, 56.0, 38.0, 65.0, 70.0, 79.0, 68.0, 76.0, 59.0, 70.0, 50.0, 39.0, 36.0, 25.0, 17.0, 16.0, 14.0, 14.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.6328125, -10.34381103515625, -10.0548095703125, -9.76580810546875, -9.476806640625, -9.18780517578125, -8.8988037109375, -8.60980224609375, -8.32080078125, -8.03179931640625, -7.7427978515625, -7.45379638671875, -7.164794921875, -6.87579345703125, -6.5867919921875, -6.29779052734375, -6.0087890625, -5.71978759765625, -5.4307861328125, -5.14178466796875, -4.852783203125, -4.56378173828125, -4.2747802734375, -3.98577880859375, -3.69677734375, -3.40777587890625, -3.1187744140625, -2.82977294921875, -2.540771484375, -2.25177001953125, -1.9627685546875, -1.67376708984375, -1.384765625, -1.09576416015625, -0.8067626953125, -0.51776123046875, -0.228759765625, 0.06024169921875, 0.3492431640625, 0.63824462890625, 0.92724609375, 1.21624755859375, 1.5052490234375, 1.79425048828125, 2.083251953125, 2.37225341796875, 2.6612548828125, 2.95025634765625, 3.2392578125, 3.52825927734375, 3.8172607421875, 4.10626220703125, 4.395263671875, 4.68426513671875, 4.9732666015625, 5.26226806640625, 5.55126953125, 5.84027099609375, 6.1292724609375, 6.41827392578125, 6.707275390625, 6.99627685546875, 7.2852783203125, 7.57427978515625, 7.86328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 19.0, 19.0, 81.0, 172.0, 250.0, 211.0, 149.0, 61.0, 22.0, 14.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.75823974609375, -119.47874450683594, -107.1992416381836, -94.91973876953125, -82.64024353027344, -70.36074829101562, -58.08124542236328, -45.80174255371094, -33.522247314453125, -21.242748260498047, -8.963249206542969, 3.3162498474121094, 15.595748901367188, 27.875247955322266, 40.154747009277344, 52.43424987792969, 64.7137451171875, 76.99324035644531, 89.27274322509766, 101.55224609375, 113.83174133300781, 126.11123657226562, 138.3907470703125, 150.6702423095703, 162.94973754882812, 175.22923278808594, 187.50872802734375, 199.78823852539062, 212.06773376464844, 224.34722900390625, 236.62673950195312, 248.90623474121094, 261.18572998046875, 273.4652404785156, 285.7447204589844, 298.02423095703125, 310.3037109375, 322.5832214355469, 334.86273193359375, 347.1422119140625, 359.4217224121094, 371.70123291015625, 383.980712890625, 396.2602233886719, 408.53973388671875, 420.8192138671875, 433.0987243652344, 445.37823486328125, 457.65771484375, 469.9372253417969, 482.2167053222656, 494.4962158203125, 506.77569580078125, 519.0552368164062, 531.334716796875, 543.6141967773438, 555.8936767578125, 568.1731567382812, 580.4526977539062, 592.732177734375, 605.0116577148438, 617.2911987304688, 629.5706787109375, 641.8501586914062, 654.1296997070312]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 4.0, 8.0, 11.0, 10.0, 5.0, 12.0, 14.0, 25.0, 20.0, 25.0, 34.0, 37.0, 42.0, 50.0, 51.0, 49.0, 38.0, 49.0, 44.0, 42.0, 66.0, 50.0, 38.0, 36.0, 34.0, 36.0, 21.0, 23.0, 20.0, 15.0, 17.0, 19.0, 11.0, 12.0, 7.0, 1.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.80227661132812, -142.89404296875, -137.98580932617188, -133.0775604248047, -128.16932678222656, -123.26109313964844, -118.35285949707031, -113.44462585449219, -108.53638458251953, -103.6281509399414, -98.71990966796875, -93.81167602539062, -88.9034423828125, -83.99520111083984, -79.08696746826172, -74.17872619628906, -69.27049255371094, -64.36225891113281, -59.454017639160156, -54.54578399658203, -49.63754653930664, -44.72930908203125, -39.821075439453125, -34.912837982177734, -30.004600524902344, -25.096363067626953, -20.188127517700195, -15.279891014099121, -10.371654510498047, -5.463417053222656, -0.5551815032958984, 4.353054046630859, 9.261276245117188, 14.169512748718262, 19.077749252319336, 23.985984802246094, 28.894222259521484, 33.802459716796875, 38.710693359375, 43.61893081665039, 48.52716827392578, 53.43540573120117, 58.34364318847656, 63.25187683105469, 68.16011047363281, 73.06835174560547, 77.9765853881836, 82.88482666015625, 87.79306030273438, 92.7012939453125, 97.60953521728516, 102.51776885986328, 107.42601013183594, 112.33424377441406, 117.24247741699219, 122.15071105957031, 127.05895233154297, 131.96719360351562, 136.87542724609375, 141.78366088867188, 146.69189453125, 151.60012817382812, 156.5083770751953, 161.41661071777344, 166.32484436035156]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 7.0, 14.0, 14.0, 17.0, 27.0, 26.0, 34.0, 51.0, 65.0, 89.0, 121.0, 171.0, 255.0, 403.0, 737.0, 1389.0, 2873.0, 7261.0, 25073.0, 3794483.0, 327325.0, 21368.0, 6558.0, 2616.0, 1300.0, 713.0, 423.0, 261.0, 160.0, 118.0, 93.0, 70.0, 46.0, 29.0, 24.0, 18.0, 10.0, 10.0, 15.0, 5.0, 3.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.84375, -44.31298828125, -42.7822265625, -41.25146484375, -39.720703125, -38.18994140625, -36.6591796875, -35.12841796875, -33.59765625, -32.06689453125, -30.5361328125, -29.00537109375, -27.474609375, -25.94384765625, -24.4130859375, -22.88232421875, -21.3515625, -19.82080078125, -18.2900390625, -16.75927734375, -15.228515625, -13.69775390625, -12.1669921875, -10.63623046875, -9.10546875, -7.57470703125, -6.0439453125, -4.51318359375, -2.982421875, -1.45166015625, 0.0791015625, 1.60986328125, 3.140625, 4.67138671875, 6.2021484375, 7.73291015625, 9.263671875, 10.79443359375, 12.3251953125, 13.85595703125, 15.38671875, 16.91748046875, 18.4482421875, 19.97900390625, 21.509765625, 23.04052734375, 24.5712890625, 26.10205078125, 27.6328125, 29.16357421875, 30.6943359375, 32.22509765625, 33.755859375, 35.28662109375, 36.8173828125, 38.34814453125, 39.87890625, 41.40966796875, 42.9404296875, 44.47119140625, 46.001953125, 47.53271484375, 49.0634765625, 50.59423828125, 52.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 0.0, 5.0, 9.0, 6.0, 5.0, 7.0, 14.0, 26.0, 30.0, 33.0, 37.0, 34.0, 54.0, 47.0, 51.0, 57.0, 45.0, 56.0, 52.0, 57.0, 62.0, 48.0, 41.0, 27.0, 36.0, 32.0, 26.0, 16.0, 19.0, 15.0, 15.0, 11.0, 7.0, 9.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.359375, -9.08990478515625, -8.8204345703125, -8.55096435546875, -8.281494140625, -8.01202392578125, -7.7425537109375, -7.47308349609375, -7.20361328125, -6.93414306640625, -6.6646728515625, -6.39520263671875, -6.125732421875, -5.85626220703125, -5.5867919921875, -5.31732177734375, -5.0478515625, -4.77838134765625, -4.5089111328125, -4.23944091796875, -3.969970703125, -3.70050048828125, -3.4310302734375, -3.16156005859375, -2.89208984375, -2.62261962890625, -2.3531494140625, -2.08367919921875, -1.814208984375, -1.54473876953125, -1.2752685546875, -1.00579833984375, -0.736328125, -0.46685791015625, -0.1973876953125, 0.07208251953125, 0.341552734375, 0.61102294921875, 0.8804931640625, 1.14996337890625, 1.41943359375, 1.68890380859375, 1.9583740234375, 2.22784423828125, 2.497314453125, 2.76678466796875, 3.0362548828125, 3.30572509765625, 3.5751953125, 3.84466552734375, 4.1141357421875, 4.38360595703125, 4.653076171875, 4.92254638671875, 5.1920166015625, 5.46148681640625, 5.73095703125, 6.00042724609375, 6.2698974609375, 6.53936767578125, 6.808837890625, 7.07830810546875, 7.3477783203125, 7.61724853515625, 7.88671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 20.0, 22.0, 40.0, 79.0, 137.0, 239.0, 426.0, 770.0, 1407.0, 2961.0, 7840.0, 35541.0, 3986952.0, 133873.0, 14976.0, 4558.0, 2039.0, 1063.0, 568.0, 317.0, 187.0, 99.0, 59.0, 46.0, 22.0, 13.0, 4.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.34375, -38.77685546875, -37.2099609375, -35.64306640625, -34.076171875, -32.50927734375, -30.9423828125, -29.37548828125, -27.80859375, -26.24169921875, -24.6748046875, -23.10791015625, -21.541015625, -19.97412109375, -18.4072265625, -16.84033203125, -15.2734375, -13.70654296875, -12.1396484375, -10.57275390625, -9.005859375, -7.43896484375, -5.8720703125, -4.30517578125, -2.73828125, -1.17138671875, 0.3955078125, 1.96240234375, 3.529296875, 5.09619140625, 6.6630859375, 8.22998046875, 9.796875, 11.36376953125, 12.9306640625, 14.49755859375, 16.064453125, 17.63134765625, 19.1982421875, 20.76513671875, 22.33203125, 23.89892578125, 25.4658203125, 27.03271484375, 28.599609375, 30.16650390625, 31.7333984375, 33.30029296875, 34.8671875, 36.43408203125, 38.0009765625, 39.56787109375, 41.134765625, 42.70166015625, 44.2685546875, 45.83544921875, 47.40234375, 48.96923828125, 50.5361328125, 52.10302734375, 53.669921875, 55.23681640625, 56.8037109375, 58.37060546875, 59.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 8.0, 9.0, 17.0, 21.0, 53.0, 144.0, 3382.0, 241.0, 87.0, 41.0, 29.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7421875, -10.46453857421875, -10.1868896484375, -9.90924072265625, -9.631591796875, -9.35394287109375, -9.0762939453125, -8.79864501953125, -8.52099609375, -8.24334716796875, -7.9656982421875, -7.68804931640625, -7.410400390625, -7.13275146484375, -6.8551025390625, -6.57745361328125, -6.2998046875, -6.02215576171875, -5.7445068359375, -5.46685791015625, -5.189208984375, -4.91156005859375, -4.6339111328125, -4.35626220703125, -4.07861328125, -3.80096435546875, -3.5233154296875, -3.24566650390625, -2.968017578125, -2.69036865234375, -2.4127197265625, -2.13507080078125, -1.857421875, -1.57977294921875, -1.3021240234375, -1.02447509765625, -0.746826171875, -0.46917724609375, -0.1915283203125, 0.08612060546875, 0.36376953125, 0.64141845703125, 0.9190673828125, 1.19671630859375, 1.474365234375, 1.75201416015625, 2.0296630859375, 2.30731201171875, 2.5849609375, 2.86260986328125, 3.1402587890625, 3.41790771484375, 3.695556640625, 3.97320556640625, 4.2508544921875, 4.52850341796875, 4.80615234375, 5.08380126953125, 5.3614501953125, 5.63909912109375, 5.916748046875, 6.19439697265625, 6.4720458984375, 6.74969482421875, 7.02734375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 12.0, 29.0, 49.0, 68.0, 126.0, 135.0, 165.0, 122.0, 92.0, 75.0, 40.0, 29.0, 20.0, 16.0, 7.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.60188865661621, -20.338390350341797, -19.074892044067383, -17.81139373779297, -16.547895431518555, -15.28439712524414, -14.020898818969727, -12.757400512695312, -11.493902206420898, -10.230403900146484, -8.96690559387207, -7.703407287597656, -6.439908981323242, -5.176410675048828, -3.912912368774414, -2.6494140625, -1.385915756225586, -0.12241744995117188, 1.1410808563232422, 2.4045791625976562, 3.6680774688720703, 4.931575775146484, 6.195074081420898, 7.4585723876953125, 8.722070693969727, 9.98556900024414, 11.249067306518555, 12.512565612792969, 13.776063919067383, 15.039562225341797, 16.30306053161621, 17.566558837890625, 18.830055236816406, 20.09355354309082, 21.357051849365234, 22.62055015563965, 23.884048461914062, 25.147546768188477, 26.41104507446289, 27.674543380737305, 28.93804168701172, 30.201539993286133, 31.465038299560547, 32.728538513183594, 33.992034912109375, 35.255531311035156, 36.5190315246582, 37.78253173828125, 39.04602813720703, 40.30952453613281, 41.57302474975586, 42.836524963378906, 44.10002136230469, 45.36351776123047, 46.627017974853516, 47.89051818847656, 49.154014587402344, 50.417510986328125, 51.68101119995117, 52.94451141357422, 54.2080078125, 55.47150421142578, 56.73500442504883, 57.998504638671875, 59.262001037597656]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 9.0, 3.0, 7.0, 12.0, 13.0, 16.0, 11.0, 12.0, 17.0, 16.0, 27.0, 28.0, 38.0, 33.0, 29.0, 22.0, 27.0, 34.0, 33.0, 29.0, 32.0, 48.0, 32.0, 44.0, 45.0, 40.0, 36.0, 38.0, 43.0, 35.0, 26.0, 30.0, 19.0, 17.0, 18.0, 21.0, 13.0, 11.0, 6.0, 13.0, 4.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.117809295654297, -13.632817268371582, -13.14782428741455, -12.662832260131836, -12.177839279174805, -11.69284725189209, -11.207855224609375, -10.722862243652344, -10.237870216369629, -9.752878189086914, -9.267885208129883, -8.782893180847168, -8.297901153564453, -7.812908172607422, -7.327916145324707, -6.842923641204834, -6.357931137084961, -5.872938632965088, -5.387946128845215, -4.9029541015625, -4.417961597442627, -3.932969093322754, -3.44797682762146, -2.962984561920166, -2.477992057800293, -1.9929996728897095, -1.508007287979126, -1.0230149030685425, -0.538022518157959, -0.05303001403808594, 0.431962251663208, 0.916954517364502, 1.401947021484375, 1.8869394063949585, 2.371931791305542, 2.856924057006836, 3.341916561126709, 3.826909065246582, 4.311901092529297, 4.79689359664917, 5.281886100769043, 5.766878604888916, 6.251871109008789, 6.736863136291504, 7.221855640411377, 7.70684814453125, 8.191840171813965, 8.67683219909668, 9.161825180053711, 9.646817207336426, 10.131810188293457, 10.616802215576172, 11.101795196533203, 11.586787223815918, 12.071779251098633, 12.556772232055664, 13.041764259338379, 13.526756286621094, 14.011749267578125, 14.49674129486084, 14.981733322143555, 15.466726303100586, 15.9517183303833, 16.436710357666016, 16.921703338623047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 11.0, 8.0, 17.0, 15.0, 30.0, 35.0, 52.0, 111.0, 141.0, 249.0, 434.0, 843.0, 1487.0, 2995.0, 6023.0, 13103.0, 29019.0, 67449.0, 170950.0, 354317.0, 236705.0, 92761.0, 38502.0, 17335.0, 7988.0, 3660.0, 1934.0, 1011.0, 540.0, 313.0, 175.0, 118.0, 73.0, 50.0, 25.0, 26.0, 18.0, 12.0, 4.0, 5.0, 6.0, 4.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.475830078125, -17.87353515625, -17.271240234375, -16.6689453125, -16.066650390625, -15.46435546875, -14.862060546875, -14.259765625, -13.657470703125, -13.05517578125, -12.452880859375, -11.8505859375, -11.248291015625, -10.64599609375, -10.043701171875, -9.44140625, -8.839111328125, -8.23681640625, -7.634521484375, -7.0322265625, -6.429931640625, -5.82763671875, -5.225341796875, -4.623046875, -4.020751953125, -3.41845703125, -2.816162109375, -2.2138671875, -1.611572265625, -1.00927734375, -0.406982421875, 0.1953125, 0.797607421875, 1.39990234375, 2.002197265625, 2.6044921875, 3.206787109375, 3.80908203125, 4.411376953125, 5.013671875, 5.615966796875, 6.21826171875, 6.820556640625, 7.4228515625, 8.025146484375, 8.62744140625, 9.229736328125, 9.83203125, 10.434326171875, 11.03662109375, 11.638916015625, 12.2412109375, 12.843505859375, 13.44580078125, 14.048095703125, 14.650390625, 15.252685546875, 15.85498046875, 16.457275390625, 17.0595703125, 17.661865234375, 18.26416015625, 18.866455078125, 19.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 6.0, 8.0, 12.0, 11.0, 27.0, 23.0, 30.0, 38.0, 40.0, 46.0, 44.0, 47.0, 51.0, 66.0, 47.0, 62.0, 54.0, 47.0, 46.0, 40.0, 32.0, 43.0, 26.0, 22.0, 24.0, 17.0, 13.0, 20.0, 10.0, 5.0, 13.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.09375, -8.8251953125, -8.556640625, -8.2880859375, -8.01953125, -7.7509765625, -7.482421875, -7.2138671875, -6.9453125, -6.6767578125, -6.408203125, -6.1396484375, -5.87109375, -5.6025390625, -5.333984375, -5.0654296875, -4.796875, -4.5283203125, -4.259765625, -3.9912109375, -3.72265625, -3.4541015625, -3.185546875, -2.9169921875, -2.6484375, -2.3798828125, -2.111328125, -1.8427734375, -1.57421875, -1.3056640625, -1.037109375, -0.7685546875, -0.5, -0.2314453125, 0.037109375, 0.3056640625, 0.57421875, 0.8427734375, 1.111328125, 1.3798828125, 1.6484375, 1.9169921875, 2.185546875, 2.4541015625, 2.72265625, 2.9912109375, 3.259765625, 3.5283203125, 3.796875, 4.0654296875, 4.333984375, 4.6025390625, 4.87109375, 5.1396484375, 5.408203125, 5.6767578125, 5.9453125, 6.2138671875, 6.482421875, 6.7509765625, 7.01953125, 7.2880859375, 7.556640625, 7.8251953125, 8.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 8.0, 10.0, 16.0, 13.0, 14.0, 22.0, 38.0, 54.0, 60.0, 72.0, 105.0, 142.0, 204.0, 286.0, 456.0, 640.0, 1091.0, 2459.0, 7254.0, 26149.0, 112527.0, 604931.0, 228375.0, 44293.0, 11759.0, 3701.0, 1483.0, 769.0, 496.0, 286.0, 220.0, 146.0, 117.0, 84.0, 57.0, 60.0, 34.0, 29.0, 23.0, 16.0, 16.0, 4.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.765869140625, -27.82861328125, -26.891357421875, -25.9541015625, -25.016845703125, -24.07958984375, -23.142333984375, -22.205078125, -21.267822265625, -20.33056640625, -19.393310546875, -18.4560546875, -17.518798828125, -16.58154296875, -15.644287109375, -14.70703125, -13.769775390625, -12.83251953125, -11.895263671875, -10.9580078125, -10.020751953125, -9.08349609375, -8.146240234375, -7.208984375, -6.271728515625, -5.33447265625, -4.397216796875, -3.4599609375, -2.522705078125, -1.58544921875, -0.648193359375, 0.2890625, 1.226318359375, 2.16357421875, 3.100830078125, 4.0380859375, 4.975341796875, 5.91259765625, 6.849853515625, 7.787109375, 8.724365234375, 9.66162109375, 10.598876953125, 11.5361328125, 12.473388671875, 13.41064453125, 14.347900390625, 15.28515625, 16.222412109375, 17.15966796875, 18.096923828125, 19.0341796875, 19.971435546875, 20.90869140625, 21.845947265625, 22.783203125, 23.720458984375, 24.65771484375, 25.594970703125, 26.5322265625, 27.469482421875, 28.40673828125, 29.343994140625, 30.28125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 10.0, 4.0, 9.0, 17.0, 12.0, 12.0, 16.0, 15.0, 22.0, 32.0, 28.0, 31.0, 37.0, 34.0, 37.0, 26.0, 36.0, 40.0, 44.0, 38.0, 39.0, 46.0, 43.0, 46.0, 35.0, 36.0, 35.0, 26.0, 20.0, 29.0, 23.0, 15.0, 17.0, 11.0, 10.0, 12.0, 11.0, 3.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.87109375, -24.9609375, -24.05078125, -23.140625, -22.23046875, -21.3203125, -20.41015625, -19.5, -18.58984375, -17.6796875, -16.76953125, -15.859375, -14.94921875, -14.0390625, -13.12890625, -12.21875, -11.30859375, -10.3984375, -9.48828125, -8.578125, -7.66796875, -6.7578125, -5.84765625, -4.9375, -4.02734375, -3.1171875, -2.20703125, -1.296875, -0.38671875, 0.5234375, 1.43359375, 2.34375, 3.25390625, 4.1640625, 5.07421875, 5.984375, 6.89453125, 7.8046875, 8.71484375, 9.625, 10.53515625, 11.4453125, 12.35546875, 13.265625, 14.17578125, 15.0859375, 15.99609375, 16.90625, 17.81640625, 18.7265625, 19.63671875, 20.546875, 21.45703125, 22.3671875, 23.27734375, 24.1875, 25.09765625, 26.0078125, 26.91796875, 27.828125, 28.73828125, 29.6484375, 30.55859375, 31.46875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 18.0, 23.0, 32.0, 64.0, 76.0, 129.0, 227.0, 365.0, 670.0, 1345.0, 2857.0, 7664.0, 27087.0, 146372.0, 635943.0, 178835.0, 32021.0, 8602.0, 3194.0, 1386.0, 661.0, 350.0, 209.0, 115.0, 86.0, 60.0, 40.0, 27.0, 17.0, 14.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.96875, -11.563720703125, -11.15869140625, -10.753662109375, -10.3486328125, -9.943603515625, -9.53857421875, -9.133544921875, -8.728515625, -8.323486328125, -7.91845703125, -7.513427734375, -7.1083984375, -6.703369140625, -6.29833984375, -5.893310546875, -5.48828125, -5.083251953125, -4.67822265625, -4.273193359375, -3.8681640625, -3.463134765625, -3.05810546875, -2.653076171875, -2.248046875, -1.843017578125, -1.43798828125, -1.032958984375, -0.6279296875, -0.222900390625, 0.18212890625, 0.587158203125, 0.9921875, 1.397216796875, 1.80224609375, 2.207275390625, 2.6123046875, 3.017333984375, 3.42236328125, 3.827392578125, 4.232421875, 4.637451171875, 5.04248046875, 5.447509765625, 5.8525390625, 6.257568359375, 6.66259765625, 7.067626953125, 7.47265625, 7.877685546875, 8.28271484375, 8.687744140625, 9.0927734375, 9.497802734375, 9.90283203125, 10.307861328125, 10.712890625, 11.117919921875, 11.52294921875, 11.927978515625, 12.3330078125, 12.738037109375, 13.14306640625, 13.548095703125, 13.953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 12.0, 11.0, 10.0, 22.0, 38.0, 32.0, 42.0, 56.0, 59.0, 110.0, 88.0, 85.0, 85.0, 71.0, 66.0, 51.0, 36.0, 27.0, 22.0, 17.0, 7.0, 10.0, 5.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017385482788085938, -0.001680418848991394, -0.0016222894191741943, -0.0015641599893569946, -0.001506030559539795, -0.0014479011297225952, -0.0013897716999053955, -0.0013316422700881958, -0.001273512840270996, -0.0012153834104537964, -0.0011572539806365967, -0.001099124550819397, -0.0010409951210021973, -0.0009828656911849976, -0.0009247362613677979, -0.0008666068315505981, -0.0008084774017333984, -0.0007503479719161987, -0.000692218542098999, -0.0006340891122817993, -0.0005759596824645996, -0.0005178302526473999, -0.0004597008228302002, -0.0004015713930130005, -0.0003434419631958008, -0.0002853125333786011, -0.00022718310356140137, -0.00016905367374420166, -0.00011092424392700195, -5.2794814109802246e-05, 5.334615707397461e-06, 6.346404552459717e-05, 0.00012159347534179688, 0.00017972290515899658, 0.0002378523349761963, 0.000295981764793396, 0.0003541111946105957, 0.0004122406244277954, 0.0004703700542449951, 0.0005284994840621948, 0.0005866289138793945, 0.0006447583436965942, 0.0007028877735137939, 0.0007610172033309937, 0.0008191466331481934, 0.0008772760629653931, 0.0009354054927825928, 0.0009935349225997925, 0.0010516643524169922, 0.001109793782234192, 0.0011679232120513916, 0.0012260526418685913, 0.001284182071685791, 0.0013423115015029907, 0.0014004409313201904, 0.0014585703611373901, 0.0015166997909545898, 0.0015748292207717896, 0.0016329586505889893, 0.001691088080406189, 0.0017492175102233887, 0.0018073469400405884, 0.001865476369857788, 0.0019236057996749878, 0.0019817352294921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 8.0, 15.0, 16.0, 30.0, 45.0, 72.0, 140.0, 348.0, 786.0, 2244.0, 9250.0, 88147.0, 802580.0, 128874.0, 11732.0, 2620.0, 883.0, 386.0, 160.0, 93.0, 43.0, 36.0, 20.0, 10.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.4375, -22.7177734375, -21.998046875, -21.2783203125, -20.55859375, -19.8388671875, -19.119140625, -18.3994140625, -17.6796875, -16.9599609375, -16.240234375, -15.5205078125, -14.80078125, -14.0810546875, -13.361328125, -12.6416015625, -11.921875, -11.2021484375, -10.482421875, -9.7626953125, -9.04296875, -8.3232421875, -7.603515625, -6.8837890625, -6.1640625, -5.4443359375, -4.724609375, -4.0048828125, -3.28515625, -2.5654296875, -1.845703125, -1.1259765625, -0.40625, 0.3134765625, 1.033203125, 1.7529296875, 2.47265625, 3.1923828125, 3.912109375, 4.6318359375, 5.3515625, 6.0712890625, 6.791015625, 7.5107421875, 8.23046875, 8.9501953125, 9.669921875, 10.3896484375, 11.109375, 11.8291015625, 12.548828125, 13.2685546875, 13.98828125, 14.7080078125, 15.427734375, 16.1474609375, 16.8671875, 17.5869140625, 18.306640625, 19.0263671875, 19.74609375, 20.4658203125, 21.185546875, 21.9052734375, 22.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 0.0, 10.0, 14.0, 15.0, 20.0, 17.0, 58.0, 77.0, 96.0, 122.0, 121.0, 122.0, 97.0, 74.0, 51.0, 38.0, 17.0, 17.0, 13.0, 10.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.703125, -17.142578125, -16.58203125, -16.021484375, -15.4609375, -14.900390625, -14.33984375, -13.779296875, -13.21875, -12.658203125, -12.09765625, -11.537109375, -10.9765625, -10.416015625, -9.85546875, -9.294921875, -8.734375, -8.173828125, -7.61328125, -7.052734375, -6.4921875, -5.931640625, -5.37109375, -4.810546875, -4.25, -3.689453125, -3.12890625, -2.568359375, -2.0078125, -1.447265625, -0.88671875, -0.326171875, 0.234375, 0.794921875, 1.35546875, 1.916015625, 2.4765625, 3.037109375, 3.59765625, 4.158203125, 4.71875, 5.279296875, 5.83984375, 6.400390625, 6.9609375, 7.521484375, 8.08203125, 8.642578125, 9.203125, 9.763671875, 10.32421875, 10.884765625, 11.4453125, 12.005859375, 12.56640625, 13.126953125, 13.6875, 14.248046875, 14.80859375, 15.369140625, 15.9296875, 16.490234375, 17.05078125, 17.611328125, 18.171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 24.0, 120.0, 343.0, 359.0, 120.0, 30.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1158.416015625, -1135.703369140625, -1112.9908447265625, -1090.2781982421875, -1067.565673828125, -1044.85302734375, -1022.1404418945312, -999.4278564453125, -976.7152709960938, -954.002685546875, -931.2901000976562, -908.5775146484375, -885.8648681640625, -863.1522827148438, -840.439697265625, -817.7271118164062, -795.0145263671875, -772.3019409179688, -749.58935546875, -726.876708984375, -704.1641235351562, -681.4515380859375, -658.7389526367188, -636.0263671875, -613.313720703125, -590.6011352539062, -567.8885498046875, -545.1759033203125, -522.4633178710938, -499.750732421875, -477.03814697265625, -454.3255615234375, -431.61297607421875, -408.900390625, -386.1877746582031, -363.4751892089844, -340.7626037597656, -318.04998779296875, -295.33740234375, -272.62481689453125, -249.91221618652344, -227.19961547851562, -204.48703002929688, -181.77442932128906, -159.06182861328125, -136.3492431640625, -113.63664245605469, -90.92405700683594, -68.21145629882812, -45.498863220214844, -22.786266326904297, -0.07366943359375, 22.63892364501953, 45.35151672363281, 68.06411743164062, 90.77670288085938, 113.48930358886719, 136.201904296875, 158.91448974609375, 181.62709045410156, 204.33969116210938, 227.05227661132812, 249.76487731933594, 272.47747802734375, 295.1900634765625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 4.0, 4.0, 7.0, 9.0, 6.0, 10.0, 14.0, 14.0, 22.0, 26.0, 20.0, 33.0, 28.0, 41.0, 41.0, 31.0, 47.0, 38.0, 33.0, 39.0, 42.0, 60.0, 43.0, 41.0, 42.0, 35.0, 27.0, 28.0, 31.0, 25.0, 15.0, 15.0, 16.0, 19.0, 16.0, 8.0, 10.0, 9.0, 8.0, 8.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-173.44593811035156, -168.6623992919922, -163.87884521484375, -159.09530639648438, -154.311767578125, -149.52821350097656, -144.7446746826172, -139.96112060546875, -135.17758178710938, -130.39404296875, -125.61048889160156, -120.82695007324219, -116.04340362548828, -111.25985717773438, -106.476318359375, -101.6927719116211, -96.90922546386719, -92.12567901611328, -87.34213256835938, -82.55859375, -77.7750473022461, -72.99150085449219, -68.20796203613281, -63.424415588378906, -58.640869140625, -53.857322692871094, -49.07378005981445, -44.29023742675781, -39.506690979003906, -34.72314453125, -29.93960189819336, -25.15605926513672, -20.37249755859375, -15.588953018188477, -10.805408477783203, -6.02186393737793, -1.2383193969726562, 3.545225143432617, 8.32876968383789, 13.112312316894531, 17.895858764648438, 22.67940330505371, 27.462947845458984, 32.246490478515625, 37.03003692626953, 41.81358337402344, 46.59712600708008, 51.38066864013672, 56.164215087890625, 60.94776153564453, 65.73130798339844, 70.51484680175781, 75.29839324951172, 80.08193969726562, 84.865478515625, 89.6490249633789, 94.43257141113281, 99.21611785888672, 103.99966430664062, 108.783203125, 113.5667495727539, 118.35029602050781, 123.13383483886719, 127.9173812866211, 132.700927734375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 10.0, 10.0, 14.0, 20.0, 23.0, 51.0, 63.0, 112.0, 202.0, 326.0, 524.0, 857.0, 1738.0, 4685.0, 20238.0, 635856.0, 3499471.0, 21315.0, 4890.0, 1718.0, 830.0, 517.0, 297.0, 182.0, 143.0, 71.0, 43.0, 32.0, 15.0, 9.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.86767578125, -49.1728515625, -47.47802734375, -45.783203125, -44.08837890625, -42.3935546875, -40.69873046875, -39.00390625, -37.30908203125, -35.6142578125, -33.91943359375, -32.224609375, -30.52978515625, -28.8349609375, -27.14013671875, -25.4453125, -23.75048828125, -22.0556640625, -20.36083984375, -18.666015625, -16.97119140625, -15.2763671875, -13.58154296875, -11.88671875, -10.19189453125, -8.4970703125, -6.80224609375, -5.107421875, -3.41259765625, -1.7177734375, -0.02294921875, 1.671875, 3.36669921875, 5.0615234375, 6.75634765625, 8.451171875, 10.14599609375, 11.8408203125, 13.53564453125, 15.23046875, 16.92529296875, 18.6201171875, 20.31494140625, 22.009765625, 23.70458984375, 25.3994140625, 27.09423828125, 28.7890625, 30.48388671875, 32.1787109375, 33.87353515625, 35.568359375, 37.26318359375, 38.9580078125, 40.65283203125, 42.34765625, 44.04248046875, 45.7373046875, 47.43212890625, 49.126953125, 50.82177734375, 52.5166015625, 54.21142578125, 55.90625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 11.0, 12.0, 12.0, 26.0, 32.0, 30.0, 35.0, 35.0, 53.0, 56.0, 52.0, 59.0, 43.0, 45.0, 70.0, 54.0, 39.0, 52.0, 38.0, 39.0, 32.0, 26.0, 18.0, 26.0, 21.0, 11.0, 9.0, 12.0, 8.0, 8.0, 0.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.96875, -8.70831298828125, -8.4478759765625, -8.18743896484375, -7.927001953125, -7.66656494140625, -7.4061279296875, -7.14569091796875, -6.88525390625, -6.62481689453125, -6.3643798828125, -6.10394287109375, -5.843505859375, -5.58306884765625, -5.3226318359375, -5.06219482421875, -4.8017578125, -4.54132080078125, -4.2808837890625, -4.02044677734375, -3.760009765625, -3.49957275390625, -3.2391357421875, -2.97869873046875, -2.71826171875, -2.45782470703125, -2.1973876953125, -1.93695068359375, -1.676513671875, -1.41607666015625, -1.1556396484375, -0.89520263671875, -0.634765625, -0.37432861328125, -0.1138916015625, 0.14654541015625, 0.406982421875, 0.66741943359375, 0.9278564453125, 1.18829345703125, 1.44873046875, 1.70916748046875, 1.9696044921875, 2.23004150390625, 2.490478515625, 2.75091552734375, 3.0113525390625, 3.27178955078125, 3.5322265625, 3.79266357421875, 4.0531005859375, 4.31353759765625, 4.573974609375, 4.83441162109375, 5.0948486328125, 5.35528564453125, 5.61572265625, 5.87615966796875, 6.1365966796875, 6.39703369140625, 6.657470703125, 6.91790771484375, 7.1783447265625, 7.43878173828125, 7.69921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 5.0, 14.0, 12.0, 18.0, 20.0, 40.0, 51.0, 55.0, 89.0, 139.0, 233.0, 307.0, 493.0, 819.0, 1199.0, 2143.0, 3784.0, 8293.0, 21800.0, 93944.0, 3830560.0, 177907.0, 30493.0, 10628.0, 4718.0, 2471.0, 1484.0, 883.0, 511.0, 389.0, 227.0, 144.0, 102.0, 83.0, 67.0, 31.0, 29.0, 20.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.8125, -30.919921875, -30.02734375, -29.134765625, -28.2421875, -27.349609375, -26.45703125, -25.564453125, -24.671875, -23.779296875, -22.88671875, -21.994140625, -21.1015625, -20.208984375, -19.31640625, -18.423828125, -17.53125, -16.638671875, -15.74609375, -14.853515625, -13.9609375, -13.068359375, -12.17578125, -11.283203125, -10.390625, -9.498046875, -8.60546875, -7.712890625, -6.8203125, -5.927734375, -5.03515625, -4.142578125, -3.25, -2.357421875, -1.46484375, -0.572265625, 0.3203125, 1.212890625, 2.10546875, 2.998046875, 3.890625, 4.783203125, 5.67578125, 6.568359375, 7.4609375, 8.353515625, 9.24609375, 10.138671875, 11.03125, 11.923828125, 12.81640625, 13.708984375, 14.6015625, 15.494140625, 16.38671875, 17.279296875, 18.171875, 19.064453125, 19.95703125, 20.849609375, 21.7421875, 22.634765625, 23.52734375, 24.419921875, 25.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 7.0, 8.0, 21.0, 15.0, 27.0, 34.0, 76.0, 113.0, 331.0, 2887.0, 218.0, 120.0, 59.0, 29.0, 34.0, 21.0, 10.0, 5.0, 1.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.66796875, -6.494140625, -6.3203125, -6.146484375, -5.97265625, -5.798828125, -5.625, -5.451171875, -5.27734375, -5.103515625, -4.9296875, -4.755859375, -4.58203125, -4.408203125, -4.234375, -4.060546875, -3.88671875, -3.712890625, -3.5390625, -3.365234375, -3.19140625, -3.017578125, -2.84375, -2.669921875, -2.49609375, -2.322265625, -2.1484375, -1.974609375, -1.80078125, -1.626953125, -1.453125, -1.279296875, -1.10546875, -0.931640625, -0.7578125, -0.583984375, -0.41015625, -0.236328125, -0.0625, 0.111328125, 0.28515625, 0.458984375, 0.6328125, 0.806640625, 0.98046875, 1.154296875, 1.328125, 1.501953125, 1.67578125, 1.849609375, 2.0234375, 2.197265625, 2.37109375, 2.544921875, 2.71875, 2.892578125, 3.06640625, 3.240234375, 3.4140625, 3.587890625, 3.76171875, 3.935546875, 4.109375, 4.283203125, 4.45703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 10.0, 25.0, 42.0, 58.0, 100.0, 133.0, 144.0, 153.0, 136.0, 88.0, 64.0, 18.0, 7.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.17774963378906, -66.56575775146484, -64.9537582397461, -63.341766357421875, -61.729774475097656, -60.11777877807617, -58.50578308105469, -56.89379119873047, -55.281795501708984, -53.6697998046875, -52.05780792236328, -50.4458122253418, -48.83381652832031, -47.221824645996094, -45.60982894897461, -43.997833251953125, -42.385841369628906, -40.77384567260742, -39.1618537902832, -37.54985809326172, -35.9378662109375, -34.325870513916016, -32.71387481689453, -31.10188102722168, -29.489887237548828, -27.877893447875977, -26.265899658203125, -24.65390396118164, -23.04191017150879, -21.429916381835938, -19.817920684814453, -18.2059268951416, -16.593929290771484, -14.981935501098633, -13.369940757751465, -11.757946014404297, -10.145952224731445, -8.533958435058594, -6.921963691711426, -5.309968948364258, -3.6979751586914062, -2.0859808921813965, -0.4739866256713867, 1.138007640838623, 2.750001907348633, 4.361995697021484, 5.973990440368652, 7.58598518371582, 9.197978973388672, 10.809972763061523, 12.421967506408691, 14.03396224975586, 15.645956039428711, 17.257949829101562, 18.869945526123047, 20.4819393157959, 22.09393310546875, 23.7059268951416, 25.317920684814453, 26.929916381835938, 28.54191017150879, 30.15390396118164, 31.765899658203125, 33.377891540527344, 34.98988723754883]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 3.0, 5.0, 8.0, 8.0, 13.0, 9.0, 13.0, 22.0, 16.0, 17.0, 21.0, 24.0, 33.0, 29.0, 26.0, 37.0, 34.0, 50.0, 36.0, 39.0, 43.0, 52.0, 43.0, 44.0, 40.0, 41.0, 28.0, 30.0, 31.0, 29.0, 24.0, 16.0, 30.0, 17.0, 16.0, 10.0, 11.0, 7.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.808642387390137, -14.319196701049805, -13.829750061035156, -13.340304374694824, -12.850858688354492, -12.36141300201416, -11.871967315673828, -11.38252067565918, -10.893074989318848, -10.403629302978516, -9.914182662963867, -9.424736976623535, -8.935291290283203, -8.445845603942871, -7.956399440765381, -7.466953277587891, -6.977507591247559, -6.488061904907227, -5.998615741729736, -5.509169578552246, -5.019723892211914, -4.530278205871582, -4.040832042694092, -3.5513861179351807, -3.0619401931762695, -2.5724942684173584, -2.0830483436584473, -1.5936024188995361, -1.104156494140625, -0.6147105693817139, -0.12526464462280273, 0.3641812801361084, 0.8536262512207031, 1.3430721759796143, 1.8325181007385254, 2.3219640254974365, 2.8114099502563477, 3.300855875015259, 3.79030179977417, 4.27974796295166, 4.769193649291992, 5.258639335632324, 5.7480854988098145, 6.237531661987305, 6.726977348327637, 7.216423034667969, 7.705869197845459, 8.19531536102295, 8.684761047363281, 9.174206733703613, 9.663652420043945, 10.153099060058594, 10.642544746398926, 11.131990432739258, 11.621437072753906, 12.110882759094238, 12.60032844543457, 13.089774131774902, 13.579219818115234, 14.068666458129883, 14.558112144470215, 15.047557830810547, 15.537004470825195, 16.02644920349121, 16.51589584350586]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 11.0, 13.0, 29.0, 53.0, 66.0, 116.0, 178.0, 317.0, 616.0, 1122.0, 2361.0, 5023.0, 12176.0, 31638.0, 92347.0, 260286.0, 371581.0, 174353.0, 59004.0, 21354.0, 8452.0, 3755.0, 1717.0, 870.0, 462.0, 251.0, 139.0, 73.0, 60.0, 41.0, 20.0, 14.0, 7.0, 9.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3515625, -13.8057861328125, -13.260009765625, -12.7142333984375, -12.16845703125, -11.6226806640625, -11.076904296875, -10.5311279296875, -9.9853515625, -9.4395751953125, -8.893798828125, -8.3480224609375, -7.80224609375, -7.2564697265625, -6.710693359375, -6.1649169921875, -5.619140625, -5.0733642578125, -4.527587890625, -3.9818115234375, -3.43603515625, -2.8902587890625, -2.344482421875, -1.7987060546875, -1.2529296875, -0.7071533203125, -0.161376953125, 0.3843994140625, 0.93017578125, 1.4759521484375, 2.021728515625, 2.5675048828125, 3.11328125, 3.6590576171875, 4.204833984375, 4.7506103515625, 5.29638671875, 5.8421630859375, 6.387939453125, 6.9337158203125, 7.4794921875, 8.0252685546875, 8.571044921875, 9.1168212890625, 9.66259765625, 10.2083740234375, 10.754150390625, 11.2999267578125, 11.845703125, 12.3914794921875, 12.937255859375, 13.4830322265625, 14.02880859375, 14.5745849609375, 15.120361328125, 15.6661376953125, 16.2119140625, 16.7576904296875, 17.303466796875, 17.8492431640625, 18.39501953125, 18.9407958984375, 19.486572265625, 20.0323486328125, 20.578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 8.0, 1.0, 6.0, 8.0, 8.0, 10.0, 23.0, 22.0, 22.0, 28.0, 25.0, 42.0, 40.0, 55.0, 49.0, 65.0, 46.0, 56.0, 51.0, 37.0, 50.0, 47.0, 52.0, 27.0, 36.0, 28.0, 30.0, 20.0, 25.0, 21.0, 16.0, 11.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.1484375, -8.88055419921875, -8.6126708984375, -8.34478759765625, -8.076904296875, -7.80902099609375, -7.5411376953125, -7.27325439453125, -7.00537109375, -6.73748779296875, -6.4696044921875, -6.20172119140625, -5.933837890625, -5.66595458984375, -5.3980712890625, -5.13018798828125, -4.8623046875, -4.59442138671875, -4.3265380859375, -4.05865478515625, -3.790771484375, -3.52288818359375, -3.2550048828125, -2.98712158203125, -2.71923828125, -2.45135498046875, -2.1834716796875, -1.91558837890625, -1.647705078125, -1.37982177734375, -1.1119384765625, -0.84405517578125, -0.576171875, -0.30828857421875, -0.0404052734375, 0.22747802734375, 0.495361328125, 0.76324462890625, 1.0311279296875, 1.29901123046875, 1.56689453125, 1.83477783203125, 2.1026611328125, 2.37054443359375, 2.638427734375, 2.90631103515625, 3.1741943359375, 3.44207763671875, 3.7099609375, 3.97784423828125, 4.2457275390625, 4.51361083984375, 4.781494140625, 5.04937744140625, 5.3172607421875, 5.58514404296875, 5.85302734375, 6.12091064453125, 6.3887939453125, 6.65667724609375, 6.924560546875, 7.19244384765625, 7.4603271484375, 7.72821044921875, 7.99609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 10.0, 10.0, 8.0, 15.0, 17.0, 33.0, 43.0, 50.0, 80.0, 85.0, 123.0, 178.0, 258.0, 454.0, 649.0, 1048.0, 2004.0, 5086.0, 20642.0, 134873.0, 668993.0, 177468.0, 25107.0, 5997.0, 2168.0, 1104.0, 667.0, 420.0, 278.0, 212.0, 138.0, 80.0, 71.0, 37.0, 38.0, 27.0, 24.0, 11.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-29.015625, -28.12451171875, -27.2333984375, -26.34228515625, -25.451171875, -24.56005859375, -23.6689453125, -22.77783203125, -21.88671875, -20.99560546875, -20.1044921875, -19.21337890625, -18.322265625, -17.43115234375, -16.5400390625, -15.64892578125, -14.7578125, -13.86669921875, -12.9755859375, -12.08447265625, -11.193359375, -10.30224609375, -9.4111328125, -8.52001953125, -7.62890625, -6.73779296875, -5.8466796875, -4.95556640625, -4.064453125, -3.17333984375, -2.2822265625, -1.39111328125, -0.5, 0.39111328125, 1.2822265625, 2.17333984375, 3.064453125, 3.95556640625, 4.8466796875, 5.73779296875, 6.62890625, 7.52001953125, 8.4111328125, 9.30224609375, 10.193359375, 11.08447265625, 11.9755859375, 12.86669921875, 13.7578125, 14.64892578125, 15.5400390625, 16.43115234375, 17.322265625, 18.21337890625, 19.1044921875, 19.99560546875, 20.88671875, 21.77783203125, 22.6689453125, 23.56005859375, 24.451171875, 25.34228515625, 26.2333984375, 27.12451171875, 28.015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 6.0, 11.0, 7.0, 12.0, 19.0, 18.0, 27.0, 28.0, 21.0, 18.0, 38.0, 31.0, 31.0, 32.0, 35.0, 41.0, 43.0, 43.0, 57.0, 39.0, 41.0, 41.0, 44.0, 37.0, 28.0, 30.0, 35.0, 24.0, 22.0, 25.0, 20.0, 16.0, 11.0, 9.0, 11.0, 10.0, 4.0, 6.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.359375, -28.4501953125, -27.541015625, -26.6318359375, -25.72265625, -24.8134765625, -23.904296875, -22.9951171875, -22.0859375, -21.1767578125, -20.267578125, -19.3583984375, -18.44921875, -17.5400390625, -16.630859375, -15.7216796875, -14.8125, -13.9033203125, -12.994140625, -12.0849609375, -11.17578125, -10.2666015625, -9.357421875, -8.4482421875, -7.5390625, -6.6298828125, -5.720703125, -4.8115234375, -3.90234375, -2.9931640625, -2.083984375, -1.1748046875, -0.265625, 0.6435546875, 1.552734375, 2.4619140625, 3.37109375, 4.2802734375, 5.189453125, 6.0986328125, 7.0078125, 7.9169921875, 8.826171875, 9.7353515625, 10.64453125, 11.5537109375, 12.462890625, 13.3720703125, 14.28125, 15.1904296875, 16.099609375, 17.0087890625, 17.91796875, 18.8271484375, 19.736328125, 20.6455078125, 21.5546875, 22.4638671875, 23.373046875, 24.2822265625, 25.19140625, 26.1005859375, 27.009765625, 27.9189453125, 28.828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 11.0, 10.0, 13.0, 16.0, 23.0, 36.0, 55.0, 102.0, 192.0, 387.0, 1225.0, 6108.0, 117767.0, 883883.0, 34132.0, 3141.0, 783.0, 283.0, 131.0, 94.0, 55.0, 37.0, 15.0, 9.0, 16.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.359130859375, -20.57763671875, -19.796142578125, -19.0146484375, -18.233154296875, -17.45166015625, -16.670166015625, -15.888671875, -15.107177734375, -14.32568359375, -13.544189453125, -12.7626953125, -11.981201171875, -11.19970703125, -10.418212890625, -9.63671875, -8.855224609375, -8.07373046875, -7.292236328125, -6.5107421875, -5.729248046875, -4.94775390625, -4.166259765625, -3.384765625, -2.603271484375, -1.82177734375, -1.040283203125, -0.2587890625, 0.522705078125, 1.30419921875, 2.085693359375, 2.8671875, 3.648681640625, 4.43017578125, 5.211669921875, 5.9931640625, 6.774658203125, 7.55615234375, 8.337646484375, 9.119140625, 9.900634765625, 10.68212890625, 11.463623046875, 12.2451171875, 13.026611328125, 13.80810546875, 14.589599609375, 15.37109375, 16.152587890625, 16.93408203125, 17.715576171875, 18.4970703125, 19.278564453125, 20.06005859375, 20.841552734375, 21.623046875, 22.404541015625, 23.18603515625, 23.967529296875, 24.7490234375, 25.530517578125, 26.31201171875, 27.093505859375, 27.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 6.0, 3.0, 3.0, 6.0, 12.0, 23.0, 45.0, 59.0, 110.0, 204.0, 240.0, 134.0, 73.0, 46.0, 17.0, 9.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005207061767578125, -0.0050890445709228516, -0.004971027374267578, -0.004853010177612305, -0.004734992980957031, -0.004616975784301758, -0.004498958587646484, -0.004380941390991211, -0.0042629241943359375, -0.004144906997680664, -0.004026889801025391, -0.003908872604370117, -0.0037908554077148438, -0.0036728382110595703, -0.003554821014404297, -0.0034368038177490234, -0.00331878662109375, -0.0032007694244384766, -0.003082752227783203, -0.0029647350311279297, -0.0028467178344726562, -0.002728700637817383, -0.0026106834411621094, -0.002492666244506836, -0.0023746490478515625, -0.002256631851196289, -0.0021386146545410156, -0.002020597457885742, -0.0019025802612304688, -0.0017845630645751953, -0.0016665458679199219, -0.0015485286712646484, -0.001430511474609375, -0.0013124942779541016, -0.0011944770812988281, -0.0010764598846435547, -0.0009584426879882812, -0.0008404254913330078, -0.0007224082946777344, -0.0006043910980224609, -0.0004863739013671875, -0.00036835670471191406, -0.0002503395080566406, -0.0001323223114013672, -1.430511474609375e-05, 0.00010371208190917969, 0.00022172927856445312, 0.00033974647521972656, 0.000457763671875, 0.0005757808685302734, 0.0006937980651855469, 0.0008118152618408203, 0.0009298324584960938, 0.0010478496551513672, 0.0011658668518066406, 0.001283884048461914, 0.0014019012451171875, 0.001519918441772461, 0.0016379356384277344, 0.0017559528350830078, 0.0018739700317382812, 0.0019919872283935547, 0.002110004425048828, 0.0022280216217041016, 0.002346038818359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 18.0, 24.0, 43.0, 119.0, 308.0, 936.0, 4988.0, 323514.0, 709428.0, 7243.0, 1235.0, 401.0, 133.0, 65.0, 32.0, 20.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.21875, -37.99609375, -36.7734375, -35.55078125, -34.328125, -33.10546875, -31.8828125, -30.66015625, -29.4375, -28.21484375, -26.9921875, -25.76953125, -24.546875, -23.32421875, -22.1015625, -20.87890625, -19.65625, -18.43359375, -17.2109375, -15.98828125, -14.765625, -13.54296875, -12.3203125, -11.09765625, -9.875, -8.65234375, -7.4296875, -6.20703125, -4.984375, -3.76171875, -2.5390625, -1.31640625, -0.09375, 1.12890625, 2.3515625, 3.57421875, 4.796875, 6.01953125, 7.2421875, 8.46484375, 9.6875, 10.91015625, 12.1328125, 13.35546875, 14.578125, 15.80078125, 17.0234375, 18.24609375, 19.46875, 20.69140625, 21.9140625, 23.13671875, 24.359375, 25.58203125, 26.8046875, 28.02734375, 29.25, 30.47265625, 31.6953125, 32.91796875, 34.140625, 35.36328125, 36.5859375, 37.80859375, 39.03125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 14.0, 27.0, 39.0, 85.0, 145.0, 181.0, 193.0, 151.0, 79.0, 30.0, 26.0, 11.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.796875, -28.016845703125, -27.23681640625, -26.456787109375, -25.6767578125, -24.896728515625, -24.11669921875, -23.336669921875, -22.556640625, -21.776611328125, -20.99658203125, -20.216552734375, -19.4365234375, -18.656494140625, -17.87646484375, -17.096435546875, -16.31640625, -15.536376953125, -14.75634765625, -13.976318359375, -13.1962890625, -12.416259765625, -11.63623046875, -10.856201171875, -10.076171875, -9.296142578125, -8.51611328125, -7.736083984375, -6.9560546875, -6.176025390625, -5.39599609375, -4.615966796875, -3.8359375, -3.055908203125, -2.27587890625, -1.495849609375, -0.7158203125, 0.064208984375, 0.84423828125, 1.624267578125, 2.404296875, 3.184326171875, 3.96435546875, 4.744384765625, 5.5244140625, 6.304443359375, 7.08447265625, 7.864501953125, 8.64453125, 9.424560546875, 10.20458984375, 10.984619140625, 11.7646484375, 12.544677734375, 13.32470703125, 14.104736328125, 14.884765625, 15.664794921875, 16.44482421875, 17.224853515625, 18.0048828125, 18.784912109375, 19.56494140625, 20.344970703125, 21.125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 19.0, 104.0, 289.0, 370.0, 156.0, 41.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-451.2337646484375, -432.5804138183594, -413.92706298828125, -395.2737121582031, -376.620361328125, -357.967041015625, -339.3136901855469, -320.66033935546875, -302.0069885253906, -283.3536376953125, -264.7002868652344, -246.0469512939453, -227.3936004638672, -208.74024963378906, -190.0869140625, -171.43356323242188, -152.78021240234375, -134.12686157226562, -115.47351837158203, -96.82017517089844, -78.16682434082031, -59.51347351074219, -40.860130310058594, -22.206787109375, -3.553436279296875, 15.099910736083984, 33.753257751464844, 52.4066047668457, 71.05995178222656, 89.71330261230469, 108.36664581298828, 127.01998901367188, 145.67333984375, 164.32669067382812, 182.98004150390625, 201.6333770751953, 220.28672790527344, 238.94007873535156, 257.5934143066406, 276.24676513671875, 294.9001159667969, 313.553466796875, 332.2068176269531, 350.86016845703125, 369.51348876953125, 388.1668701171875, 406.8201904296875, 425.4735412597656, 444.12689208984375, 462.7802429199219, 481.43359375, 500.0869445800781, 518.7402954101562, 537.3936157226562, 556.0469970703125, 574.7003173828125, 593.3536376953125, 612.0069580078125, 630.6603393554688, 649.3136596679688, 667.967041015625, 686.620361328125, 705.2737426757812, 723.9270629882812, 742.5804443359375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 7.0, 4.0, 6.0, 14.0, 12.0, 24.0, 18.0, 15.0, 23.0, 30.0, 25.0, 37.0, 45.0, 38.0, 47.0, 50.0, 37.0, 46.0, 50.0, 42.0, 39.0, 46.0, 31.0, 40.0, 39.0, 40.0, 25.0, 32.0, 30.0, 22.0, 13.0, 6.0, 11.0, 5.0, 5.0, 12.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.65960693359375, -136.95567321777344, -132.2517547607422, -127.54782104492188, -122.84388732910156, -118.13996124267578, -113.43603515625, -108.73210144042969, -104.0281753540039, -99.32424926757812, -94.62031555175781, -89.91638946533203, -85.21246337890625, -80.50852966308594, -75.80460357666016, -71.10067749023438, -66.39674377441406, -61.692813873291016, -56.98888397216797, -52.28495788574219, -47.58102798461914, -42.877098083496094, -38.17317199707031, -33.469242095947266, -28.76531219482422, -24.061382293701172, -19.357454299926758, -14.653525352478027, -9.949596405029297, -5.24566650390625, -0.5417385101318359, 4.162189483642578, 8.866119384765625, 13.570048332214355, 18.273977279663086, 22.9779052734375, 27.681835174560547, 32.385765075683594, 37.089691162109375, 41.79362106323242, 46.49755096435547, 51.201480865478516, 55.90541076660156, 60.609336853027344, 65.31326293945312, 70.01719665527344, 74.72112274169922, 79.425048828125, 84.12898254394531, 88.8329086303711, 93.5368423461914, 98.24076843261719, 102.9447021484375, 107.64862823486328, 112.35255432128906, 117.05648803710938, 121.76041412353516, 126.46434020996094, 131.16827392578125, 135.87220764160156, 140.5761260986328, 145.28005981445312, 149.98399353027344, 154.6879119873047, 159.391845703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 12.0, 18.0, 17.0, 30.0, 40.0, 65.0, 76.0, 123.0, 196.0, 308.0, 475.0, 785.0, 1412.0, 2894.0, 7077.0, 25976.0, 4085553.0, 51623.0, 9607.0, 3754.0, 1780.0, 912.0, 550.0, 338.0, 202.0, 156.0, 84.0, 60.0, 41.0, 31.0, 28.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.740234375, -34.57421875, -33.408203125, -32.2421875, -31.076171875, -29.91015625, -28.744140625, -27.578125, -26.412109375, -25.24609375, -24.080078125, -22.9140625, -21.748046875, -20.58203125, -19.416015625, -18.25, -17.083984375, -15.91796875, -14.751953125, -13.5859375, -12.419921875, -11.25390625, -10.087890625, -8.921875, -7.755859375, -6.58984375, -5.423828125, -4.2578125, -3.091796875, -1.92578125, -0.759765625, 0.40625, 1.572265625, 2.73828125, 3.904296875, 5.0703125, 6.236328125, 7.40234375, 8.568359375, 9.734375, 10.900390625, 12.06640625, 13.232421875, 14.3984375, 15.564453125, 16.73046875, 17.896484375, 19.0625, 20.228515625, 21.39453125, 22.560546875, 23.7265625, 24.892578125, 26.05859375, 27.224609375, 28.390625, 29.556640625, 30.72265625, 31.888671875, 33.0546875, 34.220703125, 35.38671875, 36.552734375, 37.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 11.0, 12.0, 23.0, 20.0, 29.0, 26.0, 34.0, 43.0, 46.0, 59.0, 73.0, 46.0, 59.0, 52.0, 54.0, 53.0, 44.0, 41.0, 48.0, 44.0, 35.0, 16.0, 18.0, 19.0, 24.0, 13.0, 13.0, 5.0, 5.0, 4.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7115478515625, -8.415283203125, -8.1190185546875, -7.82275390625, -7.5264892578125, -7.230224609375, -6.9339599609375, -6.6376953125, -6.3414306640625, -6.045166015625, -5.7489013671875, -5.45263671875, -5.1563720703125, -4.860107421875, -4.5638427734375, -4.267578125, -3.9713134765625, -3.675048828125, -3.3787841796875, -3.08251953125, -2.7862548828125, -2.489990234375, -2.1937255859375, -1.8974609375, -1.6011962890625, -1.304931640625, -1.0086669921875, -0.71240234375, -0.4161376953125, -0.119873046875, 0.1763916015625, 0.47265625, 0.7689208984375, 1.065185546875, 1.3614501953125, 1.65771484375, 1.9539794921875, 2.250244140625, 2.5465087890625, 2.8427734375, 3.1390380859375, 3.435302734375, 3.7315673828125, 4.02783203125, 4.3240966796875, 4.620361328125, 4.9166259765625, 5.212890625, 5.5091552734375, 5.805419921875, 6.1016845703125, 6.39794921875, 6.6942138671875, 6.990478515625, 7.2867431640625, 7.5830078125, 7.8792724609375, 8.175537109375, 8.4718017578125, 8.76806640625, 9.0643310546875, 9.360595703125, 9.6568603515625, 9.953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 13.0, 16.0, 17.0, 34.0, 35.0, 54.0, 78.0, 98.0, 161.0, 253.0, 398.0, 634.0, 1291.0, 2620.0, 6843.0, 31868.0, 4089768.0, 45885.0, 7922.0, 2942.0, 1378.0, 729.0, 426.0, 284.0, 177.0, 111.0, 57.0, 57.0, 45.0, 29.0, 16.0, 19.0, 12.0, 5.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.52880859375, -33.2763671875, -32.02392578125, -30.771484375, -29.51904296875, -28.2666015625, -27.01416015625, -25.76171875, -24.50927734375, -23.2568359375, -22.00439453125, -20.751953125, -19.49951171875, -18.2470703125, -16.99462890625, -15.7421875, -14.48974609375, -13.2373046875, -11.98486328125, -10.732421875, -9.47998046875, -8.2275390625, -6.97509765625, -5.72265625, -4.47021484375, -3.2177734375, -1.96533203125, -0.712890625, 0.53955078125, 1.7919921875, 3.04443359375, 4.296875, 5.54931640625, 6.8017578125, 8.05419921875, 9.306640625, 10.55908203125, 11.8115234375, 13.06396484375, 14.31640625, 15.56884765625, 16.8212890625, 18.07373046875, 19.326171875, 20.57861328125, 21.8310546875, 23.08349609375, 24.3359375, 25.58837890625, 26.8408203125, 28.09326171875, 29.345703125, 30.59814453125, 31.8505859375, 33.10302734375, 34.35546875, 35.60791015625, 36.8603515625, 38.11279296875, 39.365234375, 40.61767578125, 41.8701171875, 43.12255859375, 44.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 7.0, 20.0, 30.0, 73.0, 3504.0, 281.0, 68.0, 31.0, 15.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8828125, -7.642822265625, -7.40283203125, -7.162841796875, -6.9228515625, -6.682861328125, -6.44287109375, -6.202880859375, -5.962890625, -5.722900390625, -5.48291015625, -5.242919921875, -5.0029296875, -4.762939453125, -4.52294921875, -4.282958984375, -4.04296875, -3.802978515625, -3.56298828125, -3.322998046875, -3.0830078125, -2.843017578125, -2.60302734375, -2.363037109375, -2.123046875, -1.883056640625, -1.64306640625, -1.403076171875, -1.1630859375, -0.923095703125, -0.68310546875, -0.443115234375, -0.203125, 0.036865234375, 0.27685546875, 0.516845703125, 0.7568359375, 0.996826171875, 1.23681640625, 1.476806640625, 1.716796875, 1.956787109375, 2.19677734375, 2.436767578125, 2.6767578125, 2.916748046875, 3.15673828125, 3.396728515625, 3.63671875, 3.876708984375, 4.11669921875, 4.356689453125, 4.5966796875, 4.836669921875, 5.07666015625, 5.316650390625, 5.556640625, 5.796630859375, 6.03662109375, 6.276611328125, 6.5166015625, 6.756591796875, 6.99658203125, 7.236572265625, 7.4765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 12.0, 17.0, 30.0, 44.0, 57.0, 103.0, 140.0, 142.0, 125.0, 119.0, 73.0, 49.0, 29.0, 24.0, 8.0, 6.0, 10.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.08169174194336, -35.12140655517578, -34.1611213684082, -33.200836181640625, -32.24055099487305, -31.28026580810547, -30.31998062133789, -29.359697341918945, -28.399412155151367, -27.43912696838379, -26.47884178161621, -25.518556594848633, -24.558271408081055, -23.59798812866211, -22.63770294189453, -21.677417755126953, -20.717132568359375, -19.756847381591797, -18.79656219482422, -17.83627700805664, -16.875991821289062, -15.9157075881958, -14.955422401428223, -13.995138168334961, -13.03485107421875, -12.074565887451172, -11.114280700683594, -10.153995513916016, -9.193711280822754, -8.233426094055176, -7.273140907287598, -6.312856197357178, -5.352571487426758, -4.39228630065918, -3.4320015907287598, -2.4717164039611816, -1.5114314556121826, -0.5511465072631836, 0.40913867950439453, 1.3694233894348145, 2.3297085762023926, 3.2899935245513916, 4.250278472900391, 5.210563659667969, 6.170848846435547, 7.131133556365967, 8.091419219970703, 9.051703453063965, 10.011988639831543, 10.972273826599121, 11.9325590133667, 12.892843246459961, 13.853128433227539, 14.813413619995117, 15.773698806762695, 16.733983993530273, 17.69426918029785, 18.65455436706543, 19.614839553833008, 20.575124740600586, 21.535409927368164, 22.49569320678711, 23.455978393554688, 24.416263580322266, 25.376548767089844]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 11.0, 10.0, 19.0, 13.0, 10.0, 13.0, 20.0, 15.0, 19.0, 29.0, 35.0, 29.0, 44.0, 35.0, 43.0, 30.0, 33.0, 47.0, 59.0, 46.0, 41.0, 38.0, 39.0, 41.0, 35.0, 32.0, 26.0, 17.0, 29.0, 21.0, 24.0, 14.0, 16.0, 12.0, 13.0, 10.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.810247421264648, -11.466096878051758, -11.121946334838867, -10.777795791625977, -10.433645248413086, -10.089493751525879, -9.745343208312988, -9.401192665100098, -9.057042121887207, -8.712891578674316, -8.368741035461426, -8.024590492248535, -7.680439472198486, -7.336288928985596, -6.992137908935547, -6.647987365722656, -6.303836822509766, -5.959686279296875, -5.615535736083984, -5.2713847160339355, -4.927234172821045, -4.583083629608154, -4.2389326095581055, -3.894782066345215, -3.550631523132324, -3.2064809799194336, -2.862330198287964, -2.518179416656494, -2.1740288734436035, -1.8298782110214233, -1.4857275485992432, -1.1415767669677734, -0.7974262237548828, -0.45327556133270264, -0.10912489891052246, 0.23502576351165771, 0.5791764259338379, 0.9233270883560181, 1.2674777507781982, 1.611628532409668, 1.9557790756225586, 2.299929618835449, 2.644080400466919, 2.9882311820983887, 3.3323817253112793, 3.67653226852417, 4.020683288574219, 4.364833831787109, 4.708984375, 5.053134918212891, 5.397285461425781, 5.74143648147583, 6.085587024688721, 6.429737567901611, 6.77388858795166, 7.118039131164551, 7.462189674377441, 7.806340217590332, 8.150490760803223, 8.494641304016113, 8.83879280090332, 9.182943344116211, 9.527093887329102, 9.871244430541992, 10.215394973754883]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 11.0, 16.0, 22.0, 22.0, 40.0, 57.0, 97.0, 133.0, 202.0, 323.0, 535.0, 966.0, 1679.0, 3256.0, 6022.0, 11914.0, 23626.0, 48173.0, 98052.0, 184844.0, 259787.0, 196305.0, 106227.0, 53019.0, 26002.0, 12729.0, 6527.0, 3367.0, 1921.0, 1033.0, 614.0, 371.0, 225.0, 161.0, 80.0, 63.0, 39.0, 25.0, 24.0, 10.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.7578125, -11.4176025390625, -11.077392578125, -10.7371826171875, -10.39697265625, -10.0567626953125, -9.716552734375, -9.3763427734375, -9.0361328125, -8.6959228515625, -8.355712890625, -8.0155029296875, -7.67529296875, -7.3350830078125, -6.994873046875, -6.6546630859375, -6.314453125, -5.9742431640625, -5.634033203125, -5.2938232421875, -4.95361328125, -4.6134033203125, -4.273193359375, -3.9329833984375, -3.5927734375, -3.2525634765625, -2.912353515625, -2.5721435546875, -2.23193359375, -1.8917236328125, -1.551513671875, -1.2113037109375, -0.87109375, -0.5308837890625, -0.190673828125, 0.1495361328125, 0.48974609375, 0.8299560546875, 1.170166015625, 1.5103759765625, 1.8505859375, 2.1907958984375, 2.531005859375, 2.8712158203125, 3.21142578125, 3.5516357421875, 3.891845703125, 4.2320556640625, 4.572265625, 4.9124755859375, 5.252685546875, 5.5928955078125, 5.93310546875, 6.2733154296875, 6.613525390625, 6.9537353515625, 7.2939453125, 7.6341552734375, 7.974365234375, 8.3145751953125, 8.65478515625, 8.9949951171875, 9.335205078125, 9.6754150390625, 10.015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 12.0, 17.0, 29.0, 22.0, 28.0, 37.0, 37.0, 40.0, 61.0, 48.0, 67.0, 50.0, 45.0, 54.0, 53.0, 44.0, 47.0, 44.0, 41.0, 35.0, 30.0, 19.0, 22.0, 19.0, 20.0, 15.0, 11.0, 7.0, 6.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.556884765625, -8.26220703125, -7.967529296875, -7.6728515625, -7.378173828125, -7.08349609375, -6.788818359375, -6.494140625, -6.199462890625, -5.90478515625, -5.610107421875, -5.3154296875, -5.020751953125, -4.72607421875, -4.431396484375, -4.13671875, -3.842041015625, -3.54736328125, -3.252685546875, -2.9580078125, -2.663330078125, -2.36865234375, -2.073974609375, -1.779296875, -1.484619140625, -1.18994140625, -0.895263671875, -0.6005859375, -0.305908203125, -0.01123046875, 0.283447265625, 0.578125, 0.872802734375, 1.16748046875, 1.462158203125, 1.7568359375, 2.051513671875, 2.34619140625, 2.640869140625, 2.935546875, 3.230224609375, 3.52490234375, 3.819580078125, 4.1142578125, 4.408935546875, 4.70361328125, 4.998291015625, 5.29296875, 5.587646484375, 5.88232421875, 6.177001953125, 6.4716796875, 6.766357421875, 7.06103515625, 7.355712890625, 7.650390625, 7.945068359375, 8.23974609375, 8.534423828125, 8.8291015625, 9.123779296875, 9.41845703125, 9.713134765625, 10.0078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 8.0, 9.0, 10.0, 17.0, 10.0, 24.0, 26.0, 33.0, 48.0, 55.0, 105.0, 134.0, 237.0, 336.0, 518.0, 818.0, 1583.0, 4695.0, 25586.0, 280993.0, 658637.0, 61123.0, 8342.0, 2307.0, 1062.0, 618.0, 358.0, 249.0, 181.0, 129.0, 85.0, 71.0, 46.0, 34.0, 18.0, 13.0, 11.0, 12.0, 7.0, 1.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.25, -32.305419921875, -31.36083984375, -30.416259765625, -29.4716796875, -28.527099609375, -27.58251953125, -26.637939453125, -25.693359375, -24.748779296875, -23.80419921875, -22.859619140625, -21.9150390625, -20.970458984375, -20.02587890625, -19.081298828125, -18.13671875, -17.192138671875, -16.24755859375, -15.302978515625, -14.3583984375, -13.413818359375, -12.46923828125, -11.524658203125, -10.580078125, -9.635498046875, -8.69091796875, -7.746337890625, -6.8017578125, -5.857177734375, -4.91259765625, -3.968017578125, -3.0234375, -2.078857421875, -1.13427734375, -0.189697265625, 0.7548828125, 1.699462890625, 2.64404296875, 3.588623046875, 4.533203125, 5.477783203125, 6.42236328125, 7.366943359375, 8.3115234375, 9.256103515625, 10.20068359375, 11.145263671875, 12.08984375, 13.034423828125, 13.97900390625, 14.923583984375, 15.8681640625, 16.812744140625, 17.75732421875, 18.701904296875, 19.646484375, 20.591064453125, 21.53564453125, 22.480224609375, 23.4248046875, 24.369384765625, 25.31396484375, 26.258544921875, 27.203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 13.0, 10.0, 9.0, 10.0, 23.0, 25.0, 17.0, 24.0, 23.0, 37.0, 27.0, 36.0, 44.0, 33.0, 42.0, 40.0, 43.0, 50.0, 32.0, 33.0, 37.0, 35.0, 27.0, 38.0, 36.0, 32.0, 36.0, 27.0, 22.0, 18.0, 11.0, 14.0, 12.0, 7.0, 6.0, 12.0, 3.0, 5.0, 8.0, 8.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.9375, -26.0185546875, -25.099609375, -24.1806640625, -23.26171875, -22.3427734375, -21.423828125, -20.5048828125, -19.5859375, -18.6669921875, -17.748046875, -16.8291015625, -15.91015625, -14.9912109375, -14.072265625, -13.1533203125, -12.234375, -11.3154296875, -10.396484375, -9.4775390625, -8.55859375, -7.6396484375, -6.720703125, -5.8017578125, -4.8828125, -3.9638671875, -3.044921875, -2.1259765625, -1.20703125, -0.2880859375, 0.630859375, 1.5498046875, 2.46875, 3.3876953125, 4.306640625, 5.2255859375, 6.14453125, 7.0634765625, 7.982421875, 8.9013671875, 9.8203125, 10.7392578125, 11.658203125, 12.5771484375, 13.49609375, 14.4150390625, 15.333984375, 16.2529296875, 17.171875, 18.0908203125, 19.009765625, 19.9287109375, 20.84765625, 21.7666015625, 22.685546875, 23.6044921875, 24.5234375, 25.4423828125, 26.361328125, 27.2802734375, 28.19921875, 29.1181640625, 30.037109375, 30.9560546875, 31.875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 12.0, 11.0, 14.0, 19.0, 28.0, 39.0, 51.0, 88.0, 141.0, 216.0, 348.0, 683.0, 1489.0, 4015.0, 14966.0, 109660.0, 776941.0, 117002.0, 15669.0, 4037.0, 1496.0, 643.0, 380.0, 193.0, 134.0, 82.0, 48.0, 35.0, 40.0, 17.0, 8.0, 18.0, 8.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8046875, -11.3231201171875, -10.841552734375, -10.3599853515625, -9.87841796875, -9.3968505859375, -8.915283203125, -8.4337158203125, -7.9521484375, -7.4705810546875, -6.989013671875, -6.5074462890625, -6.02587890625, -5.5443115234375, -5.062744140625, -4.5811767578125, -4.099609375, -3.6180419921875, -3.136474609375, -2.6549072265625, -2.17333984375, -1.6917724609375, -1.210205078125, -0.7286376953125, -0.2470703125, 0.2344970703125, 0.716064453125, 1.1976318359375, 1.67919921875, 2.1607666015625, 2.642333984375, 3.1239013671875, 3.60546875, 4.0870361328125, 4.568603515625, 5.0501708984375, 5.53173828125, 6.0133056640625, 6.494873046875, 6.9764404296875, 7.4580078125, 7.9395751953125, 8.421142578125, 8.9027099609375, 9.38427734375, 9.8658447265625, 10.347412109375, 10.8289794921875, 11.310546875, 11.7921142578125, 12.273681640625, 12.7552490234375, 13.23681640625, 13.7183837890625, 14.199951171875, 14.6815185546875, 15.1630859375, 15.6446533203125, 16.126220703125, 16.6077880859375, 17.08935546875, 17.5709228515625, 18.052490234375, 18.5340576171875, 19.015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 10.0, 9.0, 20.0, 22.0, 30.0, 42.0, 59.0, 95.0, 100.0, 126.0, 124.0, 113.0, 71.0, 44.0, 37.0, 31.0, 14.0, 13.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002185821533203125, -0.0021143555641174316, -0.0020428895950317383, -0.001971423625946045, -0.0018999576568603516, -0.0018284916877746582, -0.0017570257186889648, -0.0016855597496032715, -0.0016140937805175781, -0.0015426278114318848, -0.0014711618423461914, -0.001399695873260498, -0.0013282299041748047, -0.0012567639350891113, -0.001185297966003418, -0.0011138319969177246, -0.0010423660278320312, -0.0009709000587463379, -0.0008994340896606445, -0.0008279681205749512, -0.0007565021514892578, -0.0006850361824035645, -0.0006135702133178711, -0.0005421042442321777, -0.0004706382751464844, -0.000399172306060791, -0.00032770633697509766, -0.0002562403678894043, -0.00018477439880371094, -0.00011330842971801758, -4.184246063232422e-05, 2.962350845336914e-05, 0.0001010894775390625, 0.00017255544662475586, 0.00024402141571044922, 0.0003154873847961426, 0.00038695335388183594, 0.0004584193229675293, 0.0005298852920532227, 0.000601351261138916, 0.0006728172302246094, 0.0007442831993103027, 0.0008157491683959961, 0.0008872151374816895, 0.0009586811065673828, 0.0010301470756530762, 0.0011016130447387695, 0.0011730790138244629, 0.0012445449829101562, 0.0013160109519958496, 0.001387476921081543, 0.0014589428901672363, 0.0015304088592529297, 0.001601874828338623, 0.0016733407974243164, 0.0017448067665100098, 0.0018162727355957031, 0.0018877387046813965, 0.00195920467376709, 0.002030670642852783, 0.0021021366119384766, 0.00217360258102417, 0.0022450685501098633, 0.0023165345191955566, 0.00238800048828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 10.0, 8.0, 17.0, 26.0, 43.0, 113.0, 184.0, 454.0, 1099.0, 3422.0, 19349.0, 346485.0, 640951.0, 29653.0, 4460.0, 1230.0, 534.0, 253.0, 118.0, 62.0, 28.0, 24.0, 17.0, 7.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.796875, -28.11279296875, -27.4287109375, -26.74462890625, -26.060546875, -25.37646484375, -24.6923828125, -24.00830078125, -23.32421875, -22.64013671875, -21.9560546875, -21.27197265625, -20.587890625, -19.90380859375, -19.2197265625, -18.53564453125, -17.8515625, -17.16748046875, -16.4833984375, -15.79931640625, -15.115234375, -14.43115234375, -13.7470703125, -13.06298828125, -12.37890625, -11.69482421875, -11.0107421875, -10.32666015625, -9.642578125, -8.95849609375, -8.2744140625, -7.59033203125, -6.90625, -6.22216796875, -5.5380859375, -4.85400390625, -4.169921875, -3.48583984375, -2.8017578125, -2.11767578125, -1.43359375, -0.74951171875, -0.0654296875, 0.61865234375, 1.302734375, 1.98681640625, 2.6708984375, 3.35498046875, 4.0390625, 4.72314453125, 5.4072265625, 6.09130859375, 6.775390625, 7.45947265625, 8.1435546875, 8.82763671875, 9.51171875, 10.19580078125, 10.8798828125, 11.56396484375, 12.248046875, 12.93212890625, 13.6162109375, 14.30029296875, 14.984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 4.0, 6.0, 13.0, 10.0, 10.0, 15.0, 24.0, 29.0, 46.0, 60.0, 59.0, 77.0, 84.0, 113.0, 85.0, 80.0, 67.0, 58.0, 42.0, 25.0, 17.0, 23.0, 9.0, 9.0, 6.0, 13.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.58740234375, -13.2060546875, -12.82470703125, -12.443359375, -12.06201171875, -11.6806640625, -11.29931640625, -10.91796875, -10.53662109375, -10.1552734375, -9.77392578125, -9.392578125, -9.01123046875, -8.6298828125, -8.24853515625, -7.8671875, -7.48583984375, -7.1044921875, -6.72314453125, -6.341796875, -5.96044921875, -5.5791015625, -5.19775390625, -4.81640625, -4.43505859375, -4.0537109375, -3.67236328125, -3.291015625, -2.90966796875, -2.5283203125, -2.14697265625, -1.765625, -1.38427734375, -1.0029296875, -0.62158203125, -0.240234375, 0.14111328125, 0.5224609375, 0.90380859375, 1.28515625, 1.66650390625, 2.0478515625, 2.42919921875, 2.810546875, 3.19189453125, 3.5732421875, 3.95458984375, 4.3359375, 4.71728515625, 5.0986328125, 5.47998046875, 5.861328125, 6.24267578125, 6.6240234375, 7.00537109375, 7.38671875, 7.76806640625, 8.1494140625, 8.53076171875, 8.912109375, 9.29345703125, 9.6748046875, 10.05615234375, 10.4375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 11.0, 23.0, 57.0, 123.0, 193.0, 235.0, 169.0, 98.0, 37.0, 25.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-412.002197265625, -401.8043212890625, -391.6064453125, -381.4085693359375, -371.210693359375, -361.0128173828125, -350.81494140625, -340.6170959472656, -330.4192199707031, -320.2213439941406, -310.0234680175781, -299.8255920410156, -289.6277160644531, -279.42987060546875, -269.23199462890625, -259.03411865234375, -248.8362274169922, -238.6383514404297, -228.4404754638672, -218.24261474609375, -208.04473876953125, -197.84686279296875, -187.64898681640625, -177.45111083984375, -167.25323486328125, -157.05535888671875, -146.85748291015625, -136.65960693359375, -126.46174621582031, -116.26387023925781, -106.06599426269531, -95.86812591552734, -85.67027282714844, -75.47239685058594, -65.27452850341797, -55.07665252685547, -44.878780364990234, -34.680908203125, -24.4830322265625, -14.285163879394531, -4.087287902832031, 6.1105852127075195, 16.30845832824707, 26.506332397460938, 36.70420455932617, 46.902076721191406, 57.099952697753906, 67.29782104492188, 77.49569702148438, 87.69357299804688, 97.89144134521484, 108.08931732177734, 118.28718566894531, 128.4850616455078, 138.6829376220703, 148.88079833984375, 159.07867431640625, 169.27655029296875, 179.47442626953125, 189.67230224609375, 199.8701629638672, 210.0680389404297, 220.2659149169922, 230.46377563476562, 240.6616668701172]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 7.0, 10.0, 11.0, 5.0, 11.0, 14.0, 14.0, 17.0, 18.0, 19.0, 21.0, 37.0, 31.0, 36.0, 35.0, 31.0, 44.0, 50.0, 52.0, 44.0, 50.0, 53.0, 45.0, 27.0, 29.0, 27.0, 33.0, 33.0, 26.0, 27.0, 21.0, 25.0, 13.0, 11.0, 9.0, 8.0, 5.0, 8.0, 6.0, 9.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-129.1451873779297, -124.88058471679688, -120.61598205566406, -116.35137176513672, -112.0867691040039, -107.8221664428711, -103.55755615234375, -99.29295349121094, -95.02835083007812, -90.76374816894531, -86.4991455078125, -82.23453521728516, -77.96993255615234, -73.70532989501953, -69.44071960449219, -65.17611694335938, -60.91151428222656, -56.64691162109375, -52.38230514526367, -48.117698669433594, -43.85309600830078, -39.58849334716797, -35.32388687133789, -31.059282302856445, -26.794677734375, -22.530073165893555, -18.26546859741211, -14.000864028930664, -9.736259460449219, -5.471654891967773, -1.2070503234863281, 3.057554244995117, 7.322174072265625, 11.58677864074707, 15.851383209228516, 20.11598777770996, 24.380592346191406, 28.64519691467285, 32.9098014831543, 37.174407958984375, 41.43901062011719, 45.70361328125, 49.96821975708008, 54.232826232910156, 58.49742889404297, 62.76203155517578, 67.02664184570312, 71.29124450683594, 75.55584716796875, 79.82044982910156, 84.08505249023438, 88.34966278076172, 92.61426544189453, 96.87886810302734, 101.14347839355469, 105.4080810546875, 109.67268371582031, 113.93728637695312, 118.20188903808594, 122.46649932861328, 126.7311019897461, 130.99571228027344, 135.26031494140625, 139.52491760253906, 143.78952026367188]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 10.0, 13.0, 40.0, 43.0, 62.0, 70.0, 92.0, 142.0, 250.0, 367.0, 547.0, 1114.0, 2461.0, 6130.0, 21557.0, 235625.0, 3880712.0, 30915.0, 7967.0, 2963.0, 1272.0, 710.0, 423.0, 231.0, 154.0, 125.0, 68.0, 57.0, 35.0, 35.0, 21.0, 16.0, 9.0, 14.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.84375, -29.8525390625, -28.861328125, -27.8701171875, -26.87890625, -25.8876953125, -24.896484375, -23.9052734375, -22.9140625, -21.9228515625, -20.931640625, -19.9404296875, -18.94921875, -17.9580078125, -16.966796875, -15.9755859375, -14.984375, -13.9931640625, -13.001953125, -12.0107421875, -11.01953125, -10.0283203125, -9.037109375, -8.0458984375, -7.0546875, -6.0634765625, -5.072265625, -4.0810546875, -3.08984375, -2.0986328125, -1.107421875, -0.1162109375, 0.875, 1.8662109375, 2.857421875, 3.8486328125, 4.83984375, 5.8310546875, 6.822265625, 7.8134765625, 8.8046875, 9.7958984375, 10.787109375, 11.7783203125, 12.76953125, 13.7607421875, 14.751953125, 15.7431640625, 16.734375, 17.7255859375, 18.716796875, 19.7080078125, 20.69921875, 21.6904296875, 22.681640625, 23.6728515625, 24.6640625, 25.6552734375, 26.646484375, 27.6376953125, 28.62890625, 29.6201171875, 30.611328125, 31.6025390625, 32.59375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 6.0, 10.0, 13.0, 19.0, 11.0, 41.0, 53.0, 60.0, 67.0, 67.0, 75.0, 87.0, 81.0, 74.0, 48.0, 49.0, 58.0, 42.0, 27.0, 23.0, 23.0, 15.0, 8.0, 9.0, 11.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.584716796875, -9.20068359375, -8.816650390625, -8.4326171875, -8.048583984375, -7.66455078125, -7.280517578125, -6.896484375, -6.512451171875, -6.12841796875, -5.744384765625, -5.3603515625, -4.976318359375, -4.59228515625, -4.208251953125, -3.82421875, -3.440185546875, -3.05615234375, -2.672119140625, -2.2880859375, -1.904052734375, -1.52001953125, -1.135986328125, -0.751953125, -0.367919921875, 0.01611328125, 0.400146484375, 0.7841796875, 1.168212890625, 1.55224609375, 1.936279296875, 2.3203125, 2.704345703125, 3.08837890625, 3.472412109375, 3.8564453125, 4.240478515625, 4.62451171875, 5.008544921875, 5.392578125, 5.776611328125, 6.16064453125, 6.544677734375, 6.9287109375, 7.312744140625, 7.69677734375, 8.080810546875, 8.46484375, 8.848876953125, 9.23291015625, 9.616943359375, 10.0009765625, 10.385009765625, 10.76904296875, 11.153076171875, 11.537109375, 11.921142578125, 12.30517578125, 12.689208984375, 13.0732421875, 13.457275390625, 13.84130859375, 14.225341796875, 14.609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 16.0, 16.0, 18.0, 41.0, 89.0, 156.0, 336.0, 697.0, 1724.0, 4607.0, 19055.0, 3005311.0, 1135415.0, 19231.0, 4470.0, 1628.0, 717.0, 324.0, 182.0, 89.0, 56.0, 31.0, 33.0, 14.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.90625, -34.66796875, -33.4296875, -32.19140625, -30.953125, -29.71484375, -28.4765625, -27.23828125, -26.0, -24.76171875, -23.5234375, -22.28515625, -21.046875, -19.80859375, -18.5703125, -17.33203125, -16.09375, -14.85546875, -13.6171875, -12.37890625, -11.140625, -9.90234375, -8.6640625, -7.42578125, -6.1875, -4.94921875, -3.7109375, -2.47265625, -1.234375, 0.00390625, 1.2421875, 2.48046875, 3.71875, 4.95703125, 6.1953125, 7.43359375, 8.671875, 9.91015625, 11.1484375, 12.38671875, 13.625, 14.86328125, 16.1015625, 17.33984375, 18.578125, 19.81640625, 21.0546875, 22.29296875, 23.53125, 24.76953125, 26.0078125, 27.24609375, 28.484375, 29.72265625, 30.9609375, 32.19921875, 33.4375, 34.67578125, 35.9140625, 37.15234375, 38.390625, 39.62890625, 40.8671875, 42.10546875, 43.34375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 13.0, 24.0, 40.0, 78.0, 214.0, 3137.0, 287.0, 108.0, 49.0, 24.0, 14.0, 14.0, 12.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.035400390625, -8.71923828125, -8.403076171875, -8.0869140625, -7.770751953125, -7.45458984375, -7.138427734375, -6.822265625, -6.506103515625, -6.18994140625, -5.873779296875, -5.5576171875, -5.241455078125, -4.92529296875, -4.609130859375, -4.29296875, -3.976806640625, -3.66064453125, -3.344482421875, -3.0283203125, -2.712158203125, -2.39599609375, -2.079833984375, -1.763671875, -1.447509765625, -1.13134765625, -0.815185546875, -0.4990234375, -0.182861328125, 0.13330078125, 0.449462890625, 0.765625, 1.081787109375, 1.39794921875, 1.714111328125, 2.0302734375, 2.346435546875, 2.66259765625, 2.978759765625, 3.294921875, 3.611083984375, 3.92724609375, 4.243408203125, 4.5595703125, 4.875732421875, 5.19189453125, 5.508056640625, 5.82421875, 6.140380859375, 6.45654296875, 6.772705078125, 7.0888671875, 7.405029296875, 7.72119140625, 8.037353515625, 8.353515625, 8.669677734375, 8.98583984375, 9.302001953125, 9.6181640625, 9.934326171875, 10.25048828125, 10.566650390625, 10.8828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 29.0, 66.0, 142.0, 230.0, 240.0, 131.0, 86.0, 41.0, 14.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.39588928222656, -54.76677322387695, -52.13766098022461, -49.508544921875, -46.879432678222656, -44.25031661987305, -41.62120056152344, -38.992088317871094, -36.362972259521484, -33.733856201171875, -31.10474395751953, -28.475627899169922, -25.846513748168945, -23.21739959716797, -20.58828353881836, -17.959169387817383, -15.330055236816406, -12.70094108581543, -10.071825981140137, -7.442711353302002, -4.813596725463867, -2.1844825744628906, 0.44463253021240234, 3.0737476348876953, 5.702861785888672, 8.331975936889648, 10.961091041564941, 13.590206146240234, 16.21932029724121, 18.848434448242188, 21.477550506591797, 24.106664657592773, 26.73577880859375, 29.364892959594727, 31.994007110595703, 34.62312316894531, 37.252235412597656, 39.881351470947266, 42.510467529296875, 45.13957977294922, 47.76869583129883, 50.39781188964844, 53.02692413330078, 55.65604019165039, 58.28515625, 60.914268493652344, 63.54338455200195, 66.17250061035156, 68.8016128540039, 71.43072509765625, 74.05984497070312, 76.68895721435547, 79.31806945800781, 81.94718933105469, 84.57630157470703, 87.20541381835938, 89.83453369140625, 92.4636459350586, 95.09276580810547, 97.72187805175781, 100.35099029541016, 102.9801025390625, 105.60922241210938, 108.23833465576172, 110.86744689941406]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 8.0, 11.0, 11.0, 11.0, 10.0, 22.0, 23.0, 15.0, 27.0, 27.0, 31.0, 38.0, 37.0, 36.0, 48.0, 38.0, 34.0, 48.0, 49.0, 48.0, 38.0, 45.0, 41.0, 27.0, 37.0, 31.0, 28.0, 31.0, 23.0, 23.0, 13.0, 13.0, 8.0, 8.0, 11.0, 7.0, 7.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.982872009277344, -18.310510635375977, -17.63814926147461, -16.965789794921875, -16.293428421020508, -15.62106704711914, -14.948705673217773, -14.276344299316406, -13.603983879089355, -12.931622505187988, -12.259262084960938, -11.58690071105957, -10.914539337158203, -10.242178916931152, -9.569817543029785, -8.897457122802734, -8.225095748901367, -7.552734851837158, -6.880373954772949, -6.208012580871582, -5.535651683807373, -4.863290786743164, -4.190929412841797, -3.518568515777588, -2.846207618713379, -2.17384672164917, -1.5014855861663818, -0.8291244506835938, -0.15676355361938477, 0.5155973434448242, 1.1879587173461914, 1.8603196144104004, 2.5326805114746094, 3.2050414085388184, 3.8774025440216064, 4.5497636795043945, 5.2221245765686035, 5.8944854736328125, 6.56684684753418, 7.239207744598389, 7.911568641662598, 8.583930015563965, 9.256290435791016, 9.928651809692383, 10.60101318359375, 11.2733736038208, 11.945734977722168, 12.618095397949219, 13.290456771850586, 13.962818145751953, 14.635178565979004, 15.307539939880371, 15.979900360107422, 16.65226173400879, 17.324623107910156, 17.996984481811523, 18.66934585571289, 19.341707229614258, 20.014068603515625, 20.68642807006836, 21.358789443969727, 22.031150817871094, 22.70351219177246, 23.375873565673828, 24.048233032226562]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 12.0, 15.0, 19.0, 23.0, 43.0, 46.0, 64.0, 88.0, 174.0, 237.0, 380.0, 660.0, 1124.0, 2085.0, 3953.0, 7979.0, 17222.0, 38232.0, 85917.0, 189971.0, 332801.0, 200608.0, 90612.0, 40365.0, 18044.0, 8391.0, 4190.0, 2242.0, 1198.0, 673.0, 394.0, 237.0, 161.0, 123.0, 76.0, 58.0, 40.0, 26.0, 11.0, 16.0, 11.0, 7.0, 4.0, 6.0, 2.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.90625, -17.31982421875, -16.7333984375, -16.14697265625, -15.560546875, -14.97412109375, -14.3876953125, -13.80126953125, -13.21484375, -12.62841796875, -12.0419921875, -11.45556640625, -10.869140625, -10.28271484375, -9.6962890625, -9.10986328125, -8.5234375, -7.93701171875, -7.3505859375, -6.76416015625, -6.177734375, -5.59130859375, -5.0048828125, -4.41845703125, -3.83203125, -3.24560546875, -2.6591796875, -2.07275390625, -1.486328125, -0.89990234375, -0.3134765625, 0.27294921875, 0.859375, 1.44580078125, 2.0322265625, 2.61865234375, 3.205078125, 3.79150390625, 4.3779296875, 4.96435546875, 5.55078125, 6.13720703125, 6.7236328125, 7.31005859375, 7.896484375, 8.48291015625, 9.0693359375, 9.65576171875, 10.2421875, 10.82861328125, 11.4150390625, 12.00146484375, 12.587890625, 13.17431640625, 13.7607421875, 14.34716796875, 14.93359375, 15.52001953125, 16.1064453125, 16.69287109375, 17.279296875, 17.86572265625, 18.4521484375, 19.03857421875, 19.625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 12.0, 13.0, 12.0, 26.0, 37.0, 49.0, 64.0, 84.0, 57.0, 85.0, 86.0, 78.0, 78.0, 57.0, 47.0, 54.0, 35.0, 27.0, 24.0, 17.0, 13.0, 8.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.2274169921875, -9.814208984375, -9.4010009765625, -8.98779296875, -8.5745849609375, -8.161376953125, -7.7481689453125, -7.3349609375, -6.9217529296875, -6.508544921875, -6.0953369140625, -5.68212890625, -5.2689208984375, -4.855712890625, -4.4425048828125, -4.029296875, -3.6160888671875, -3.202880859375, -2.7896728515625, -2.37646484375, -1.9632568359375, -1.550048828125, -1.1368408203125, -0.7236328125, -0.3104248046875, 0.102783203125, 0.5159912109375, 0.92919921875, 1.3424072265625, 1.755615234375, 2.1688232421875, 2.58203125, 2.9952392578125, 3.408447265625, 3.8216552734375, 4.23486328125, 4.6480712890625, 5.061279296875, 5.4744873046875, 5.8876953125, 6.3009033203125, 6.714111328125, 7.1273193359375, 7.54052734375, 7.9537353515625, 8.366943359375, 8.7801513671875, 9.193359375, 9.6065673828125, 10.019775390625, 10.4329833984375, 10.84619140625, 11.2593994140625, 11.672607421875, 12.0858154296875, 12.4990234375, 12.9122314453125, 13.325439453125, 13.7386474609375, 14.15185546875, 14.5650634765625, 14.978271484375, 15.3914794921875, 15.8046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 11.0, 5.0, 10.0, 14.0, 19.0, 32.0, 58.0, 86.0, 132.0, 184.0, 271.0, 494.0, 950.0, 2101.0, 6928.0, 41130.0, 525026.0, 425251.0, 35409.0, 6247.0, 1914.0, 935.0, 510.0, 279.0, 165.0, 103.0, 78.0, 57.0, 35.0, 33.0, 23.0, 15.0, 13.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.26123046875, -35.9287109375, -34.59619140625, -33.263671875, -31.93115234375, -30.5986328125, -29.26611328125, -27.93359375, -26.60107421875, -25.2685546875, -23.93603515625, -22.603515625, -21.27099609375, -19.9384765625, -18.60595703125, -17.2734375, -15.94091796875, -14.6083984375, -13.27587890625, -11.943359375, -10.61083984375, -9.2783203125, -7.94580078125, -6.61328125, -5.28076171875, -3.9482421875, -2.61572265625, -1.283203125, 0.04931640625, 1.3818359375, 2.71435546875, 4.046875, 5.37939453125, 6.7119140625, 8.04443359375, 9.376953125, 10.70947265625, 12.0419921875, 13.37451171875, 14.70703125, 16.03955078125, 17.3720703125, 18.70458984375, 20.037109375, 21.36962890625, 22.7021484375, 24.03466796875, 25.3671875, 26.69970703125, 28.0322265625, 29.36474609375, 30.697265625, 32.02978515625, 33.3623046875, 34.69482421875, 36.02734375, 37.35986328125, 38.6923828125, 40.02490234375, 41.357421875, 42.68994140625, 44.0224609375, 45.35498046875, 46.6875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 12.0, 12.0, 17.0, 17.0, 20.0, 20.0, 25.0, 40.0, 38.0, 28.0, 37.0, 50.0, 52.0, 45.0, 45.0, 47.0, 52.0, 42.0, 52.0, 54.0, 48.0, 25.0, 34.0, 31.0, 28.0, 22.0, 12.0, 17.0, 9.0, 6.0, 9.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.59326171875, -31.5302734375, -30.46728515625, -29.404296875, -28.34130859375, -27.2783203125, -26.21533203125, -25.15234375, -24.08935546875, -23.0263671875, -21.96337890625, -20.900390625, -19.83740234375, -18.7744140625, -17.71142578125, -16.6484375, -15.58544921875, -14.5224609375, -13.45947265625, -12.396484375, -11.33349609375, -10.2705078125, -9.20751953125, -8.14453125, -7.08154296875, -6.0185546875, -4.95556640625, -3.892578125, -2.82958984375, -1.7666015625, -0.70361328125, 0.359375, 1.42236328125, 2.4853515625, 3.54833984375, 4.611328125, 5.67431640625, 6.7373046875, 7.80029296875, 8.86328125, 9.92626953125, 10.9892578125, 12.05224609375, 13.115234375, 14.17822265625, 15.2412109375, 16.30419921875, 17.3671875, 18.43017578125, 19.4931640625, 20.55615234375, 21.619140625, 22.68212890625, 23.7451171875, 24.80810546875, 25.87109375, 26.93408203125, 27.9970703125, 29.06005859375, 30.123046875, 31.18603515625, 32.2490234375, 33.31201171875, 34.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 3.0, 10.0, 10.0, 12.0, 24.0, 30.0, 54.0, 66.0, 107.0, 179.0, 239.0, 473.0, 835.0, 1825.0, 4250.0, 12211.0, 42918.0, 179146.0, 566067.0, 177707.0, 42329.0, 12192.0, 4147.0, 1674.0, 839.0, 422.0, 250.0, 149.0, 105.0, 73.0, 49.0, 39.0, 21.0, 20.0, 16.0, 11.0, 13.0, 6.0, 7.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.31829833984375, -7.0701904296875, -6.82208251953125, -6.573974609375, -6.32586669921875, -6.0777587890625, -5.82965087890625, -5.58154296875, -5.33343505859375, -5.0853271484375, -4.83721923828125, -4.589111328125, -4.34100341796875, -4.0928955078125, -3.84478759765625, -3.5966796875, -3.34857177734375, -3.1004638671875, -2.85235595703125, -2.604248046875, -2.35614013671875, -2.1080322265625, -1.85992431640625, -1.61181640625, -1.36370849609375, -1.1156005859375, -0.86749267578125, -0.619384765625, -0.37127685546875, -0.1231689453125, 0.12493896484375, 0.373046875, 0.62115478515625, 0.8692626953125, 1.11737060546875, 1.365478515625, 1.61358642578125, 1.8616943359375, 2.10980224609375, 2.35791015625, 2.60601806640625, 2.8541259765625, 3.10223388671875, 3.350341796875, 3.59844970703125, 3.8465576171875, 4.09466552734375, 4.3427734375, 4.59088134765625, 4.8389892578125, 5.08709716796875, 5.335205078125, 5.58331298828125, 5.8314208984375, 6.07952880859375, 6.32763671875, 6.57574462890625, 6.8238525390625, 7.07196044921875, 7.320068359375, 7.56817626953125, 7.8162841796875, 8.06439208984375, 8.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 7.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 12.0, 22.0, 13.0, 19.0, 25.0, 32.0, 34.0, 33.0, 41.0, 45.0, 97.0, 87.0, 83.0, 73.0, 64.0, 44.0, 40.0, 28.0, 14.0, 24.0, 18.0, 16.0, 14.0, 16.0, 11.0, 12.0, 3.0, 4.0, 5.0, 4.0, 1.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015697479248046875, -0.001520305871963501, -0.0014708638191223145, -0.001421421766281128, -0.0013719797134399414, -0.0013225376605987549, -0.0012730956077575684, -0.0012236535549163818, -0.0011742115020751953, -0.0011247694492340088, -0.0010753273963928223, -0.0010258853435516357, -0.0009764432907104492, -0.0009270012378692627, -0.0008775591850280762, -0.0008281171321868896, -0.0007786750793457031, -0.0007292330265045166, -0.0006797909736633301, -0.0006303489208221436, -0.000580906867980957, -0.0005314648151397705, -0.000482022762298584, -0.00043258070945739746, -0.00038313865661621094, -0.0003336966037750244, -0.0002842545509338379, -0.00023481249809265137, -0.00018537044525146484, -0.00013592839241027832, -8.64863395690918e-05, -3.7044286727905273e-05, 1.239776611328125e-05, 6.183981895446777e-05, 0.0001112818717956543, 0.00016072392463684082, 0.00021016597747802734, 0.00025960803031921387, 0.0003090500831604004, 0.0003584921360015869, 0.00040793418884277344, 0.00045737624168395996, 0.0005068182945251465, 0.000556260347366333, 0.0006057024002075195, 0.0006551444530487061, 0.0007045865058898926, 0.0007540285587310791, 0.0008034706115722656, 0.0008529126644134521, 0.0009023547172546387, 0.0009517967700958252, 0.0010012388229370117, 0.0010506808757781982, 0.0011001229286193848, 0.0011495649814605713, 0.0011990070343017578, 0.0012484490871429443, 0.0012978911399841309, 0.0013473331928253174, 0.001396775245666504, 0.0014462172985076904, 0.001495659351348877, 0.0015451014041900635, 0.00159454345703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 9.0, 14.0, 28.0, 31.0, 64.0, 117.0, 235.0, 457.0, 1095.0, 3201.0, 16257.0, 202389.0, 747214.0, 66361.0, 7619.0, 1937.0, 772.0, 328.0, 178.0, 108.0, 58.0, 25.0, 16.0, 11.0, 8.0, 10.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.0703125, -13.5731201171875, -13.075927734375, -12.5787353515625, -12.08154296875, -11.5843505859375, -11.087158203125, -10.5899658203125, -10.0927734375, -9.5955810546875, -9.098388671875, -8.6011962890625, -8.10400390625, -7.6068115234375, -7.109619140625, -6.6124267578125, -6.115234375, -5.6180419921875, -5.120849609375, -4.6236572265625, -4.12646484375, -3.6292724609375, -3.132080078125, -2.6348876953125, -2.1376953125, -1.6405029296875, -1.143310546875, -0.6461181640625, -0.14892578125, 0.3482666015625, 0.845458984375, 1.3426513671875, 1.83984375, 2.3370361328125, 2.834228515625, 3.3314208984375, 3.82861328125, 4.3258056640625, 4.822998046875, 5.3201904296875, 5.8173828125, 6.3145751953125, 6.811767578125, 7.3089599609375, 7.80615234375, 8.3033447265625, 8.800537109375, 9.2977294921875, 9.794921875, 10.2921142578125, 10.789306640625, 11.2864990234375, 11.78369140625, 12.2808837890625, 12.778076171875, 13.2752685546875, 13.7724609375, 14.2696533203125, 14.766845703125, 15.2640380859375, 15.76123046875, 16.2584228515625, 16.755615234375, 17.2528076171875, 17.75]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 1.0, 2.0, 2.0, 10.0, 9.0, 5.0, 9.0, 12.0, 25.0, 19.0, 26.0, 26.0, 34.0, 51.0, 45.0, 62.0, 56.0, 83.0, 75.0, 68.0, 67.0, 55.0, 38.0, 31.0, 30.0, 20.0, 27.0, 26.0, 12.0, 9.0, 10.0, 11.0, 9.0, 8.0, 8.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.671875, -8.4390869140625, -8.206298828125, -7.9735107421875, -7.74072265625, -7.5079345703125, -7.275146484375, -7.0423583984375, -6.8095703125, -6.5767822265625, -6.343994140625, -6.1112060546875, -5.87841796875, -5.6456298828125, -5.412841796875, -5.1800537109375, -4.947265625, -4.7144775390625, -4.481689453125, -4.2489013671875, -4.01611328125, -3.7833251953125, -3.550537109375, -3.3177490234375, -3.0849609375, -2.8521728515625, -2.619384765625, -2.3865966796875, -2.15380859375, -1.9210205078125, -1.688232421875, -1.4554443359375, -1.22265625, -0.9898681640625, -0.757080078125, -0.5242919921875, -0.29150390625, -0.0587158203125, 0.174072265625, 0.4068603515625, 0.6396484375, 0.8724365234375, 1.105224609375, 1.3380126953125, 1.57080078125, 1.8035888671875, 2.036376953125, 2.2691650390625, 2.501953125, 2.7347412109375, 2.967529296875, 3.2003173828125, 3.43310546875, 3.6658935546875, 3.898681640625, 4.1314697265625, 4.3642578125, 4.5970458984375, 4.829833984375, 5.0626220703125, 5.29541015625, 5.5281982421875, 5.760986328125, 5.9937744140625, 6.2265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 16.0, 16.0, 36.0, 51.0, 81.0, 115.0, 171.0, 160.0, 112.0, 82.0, 58.0, 41.0, 12.0, 17.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.3588562011719, -272.6461181640625, -264.93341064453125, -257.2206726074219, -249.5079345703125, -241.7952117919922, -234.0824737548828, -226.3697509765625, -218.65701293945312, -210.9442901611328, -203.23155212402344, -195.51882934570312, -187.80609130859375, -180.09336853027344, -172.38063049316406, -164.66790771484375, -156.95516967773438, -149.24244689941406, -141.5297088623047, -133.81698608398438, -126.104248046875, -118.39152526855469, -110.67878723144531, -102.966064453125, -95.25334167480469, -87.54061126708984, -79.827880859375, -72.11515045166016, -64.40242004394531, -56.689693450927734, -48.97696304321289, -41.26423263549805, -33.55149841308594, -25.838768005371094, -18.12603759765625, -10.413309097290039, -2.7005786895751953, 5.012149810791016, 12.72488021850586, 20.437610626220703, 28.150341033935547, 35.86307144165039, 43.575801849365234, 51.28852844238281, 59.001258850097656, 66.7139892578125, 74.42671966552734, 82.13945007324219, 89.85218048095703, 97.56491088867188, 105.27764129638672, 112.99037170410156, 120.7031021118164, 128.41583251953125, 136.12855529785156, 143.84129333496094, 151.55401611328125, 159.26673889160156, 166.97947692871094, 174.69219970703125, 182.40493774414062, 190.11766052246094, 197.8303985595703, 205.54312133789062, 213.255859375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 12.0, 7.0, 9.0, 12.0, 16.0, 21.0, 23.0, 27.0, 41.0, 33.0, 42.0, 47.0, 52.0, 49.0, 61.0, 60.0, 55.0, 56.0, 47.0, 47.0, 38.0, 34.0, 43.0, 26.0, 24.0, 19.0, 17.0, 23.0, 10.0, 5.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.3222198486328, -148.1531982421875, -142.98419189453125, -137.81517028808594, -132.6461639404297, -127.47714233398438, -122.3081283569336, -117.13911437988281, -111.97010040283203, -106.80108642578125, -101.63207244873047, -96.46305847167969, -91.29403686523438, -86.12503051757812, -80.95600891113281, -75.78699493408203, -70.61798095703125, -65.44896697998047, -60.27995300292969, -55.11093521118164, -49.94192123413086, -44.77290725708008, -39.60388946533203, -34.43487548828125, -29.26586151123047, -24.096847534179688, -18.927831649780273, -13.758816719055176, -8.589801788330078, -3.420787811279297, 1.7482280731201172, 6.917243957519531, 12.08624267578125, 17.25525665283203, 22.424272537231445, 27.59328842163086, 32.76230239868164, 37.93131637573242, 43.10033416748047, 48.26934814453125, 53.43836212158203, 58.60737609863281, 63.776390075683594, 68.94540405273438, 74.11442565917969, 79.28343200683594, 84.45245361328125, 89.62146759033203, 94.79048156738281, 99.9594955444336, 105.12850952148438, 110.29752349853516, 115.46653747558594, 120.63555908203125, 125.80457305908203, 130.9735870361328, 136.14260864257812, 141.31163024902344, 146.4806365966797, 151.649658203125, 156.81866455078125, 161.98768615722656, 167.1566925048828, 172.32571411132812, 177.49472045898438]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 12.0, 8.0, 20.0, 25.0, 47.0, 65.0, 78.0, 107.0, 176.0, 257.0, 384.0, 589.0, 937.0, 1598.0, 2726.0, 4856.0, 9444.0, 20445.0, 52049.0, 196381.0, 2520412.0, 1181906.0, 127138.0, 39450.0, 16281.0, 8061.0, 4290.0, 2384.0, 1441.0, 925.0, 586.0, 344.0, 249.0, 185.0, 108.0, 77.0, 74.0, 37.0, 28.0, 23.0, 12.0, 13.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0], "bins": [-14.578125, -14.090087890625, -13.60205078125, -13.114013671875, -12.6259765625, -12.137939453125, -11.64990234375, -11.161865234375, -10.673828125, -10.185791015625, -9.69775390625, -9.209716796875, -8.7216796875, -8.233642578125, -7.74560546875, -7.257568359375, -6.76953125, -6.281494140625, -5.79345703125, -5.305419921875, -4.8173828125, -4.329345703125, -3.84130859375, -3.353271484375, -2.865234375, -2.377197265625, -1.88916015625, -1.401123046875, -0.9130859375, -0.425048828125, 0.06298828125, 0.551025390625, 1.0390625, 1.527099609375, 2.01513671875, 2.503173828125, 2.9912109375, 3.479248046875, 3.96728515625, 4.455322265625, 4.943359375, 5.431396484375, 5.91943359375, 6.407470703125, 6.8955078125, 7.383544921875, 7.87158203125, 8.359619140625, 8.84765625, 9.335693359375, 9.82373046875, 10.311767578125, 10.7998046875, 11.287841796875, 11.77587890625, 12.263916015625, 12.751953125, 13.239990234375, 13.72802734375, 14.216064453125, 14.7041015625, 15.192138671875, 15.68017578125, 16.168212890625, 16.65625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 15.0, 17.0, 19.0, 22.0, 34.0, 41.0, 43.0, 42.0, 63.0, 54.0, 59.0, 63.0, 61.0, 56.0, 80.0, 47.0, 40.0, 39.0, 32.0, 30.0, 18.0, 20.0, 22.0, 16.0, 7.0, 11.0, 8.0, 7.0, 11.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.54345703125, -8.2431640625, -7.94287109375, -7.642578125, -7.34228515625, -7.0419921875, -6.74169921875, -6.44140625, -6.14111328125, -5.8408203125, -5.54052734375, -5.240234375, -4.93994140625, -4.6396484375, -4.33935546875, -4.0390625, -3.73876953125, -3.4384765625, -3.13818359375, -2.837890625, -2.53759765625, -2.2373046875, -1.93701171875, -1.63671875, -1.33642578125, -1.0361328125, -0.73583984375, -0.435546875, -0.13525390625, 0.1650390625, 0.46533203125, 0.765625, 1.06591796875, 1.3662109375, 1.66650390625, 1.966796875, 2.26708984375, 2.5673828125, 2.86767578125, 3.16796875, 3.46826171875, 3.7685546875, 4.06884765625, 4.369140625, 4.66943359375, 4.9697265625, 5.27001953125, 5.5703125, 5.87060546875, 6.1708984375, 6.47119140625, 6.771484375, 7.07177734375, 7.3720703125, 7.67236328125, 7.97265625, 8.27294921875, 8.5732421875, 8.87353515625, 9.173828125, 9.47412109375, 9.7744140625, 10.07470703125, 10.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 7.0, 2.0, 9.0, 10.0, 15.0, 18.0, 28.0, 37.0, 69.0, 105.0, 230.0, 531.0, 1354.0, 4354.0, 16588.0, 90127.0, 3301631.0, 715300.0, 48815.0, 10239.0, 2953.0, 1005.0, 408.0, 179.0, 93.0, 61.0, 40.0, 23.0, 8.0, 8.0, 8.0, 6.0, 1.0, 3.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.90625, -36.8486328125, -35.791015625, -34.7333984375, -33.67578125, -32.6181640625, -31.560546875, -30.5029296875, -29.4453125, -28.3876953125, -27.330078125, -26.2724609375, -25.21484375, -24.1572265625, -23.099609375, -22.0419921875, -20.984375, -19.9267578125, -18.869140625, -17.8115234375, -16.75390625, -15.6962890625, -14.638671875, -13.5810546875, -12.5234375, -11.4658203125, -10.408203125, -9.3505859375, -8.29296875, -7.2353515625, -6.177734375, -5.1201171875, -4.0625, -3.0048828125, -1.947265625, -0.8896484375, 0.16796875, 1.2255859375, 2.283203125, 3.3408203125, 4.3984375, 5.4560546875, 6.513671875, 7.5712890625, 8.62890625, 9.6865234375, 10.744140625, 11.8017578125, 12.859375, 13.9169921875, 14.974609375, 16.0322265625, 17.08984375, 18.1474609375, 19.205078125, 20.2626953125, 21.3203125, 22.3779296875, 23.435546875, 24.4931640625, 25.55078125, 26.6083984375, 27.666015625, 28.7236328125, 29.78125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 15.0, 13.0, 27.0, 16.0, 30.0, 46.0, 53.0, 91.0, 139.0, 242.0, 466.0, 1067.0, 939.0, 370.0, 186.0, 89.0, 67.0, 58.0, 31.0, 22.0, 17.0, 15.0, 7.0, 4.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.421875, -20.67822265625, -19.9345703125, -19.19091796875, -18.447265625, -17.70361328125, -16.9599609375, -16.21630859375, -15.47265625, -14.72900390625, -13.9853515625, -13.24169921875, -12.498046875, -11.75439453125, -11.0107421875, -10.26708984375, -9.5234375, -8.77978515625, -8.0361328125, -7.29248046875, -6.548828125, -5.80517578125, -5.0615234375, -4.31787109375, -3.57421875, -2.83056640625, -2.0869140625, -1.34326171875, -0.599609375, 0.14404296875, 0.8876953125, 1.63134765625, 2.375, 3.11865234375, 3.8623046875, 4.60595703125, 5.349609375, 6.09326171875, 6.8369140625, 7.58056640625, 8.32421875, 9.06787109375, 9.8115234375, 10.55517578125, 11.298828125, 12.04248046875, 12.7861328125, 13.52978515625, 14.2734375, 15.01708984375, 15.7607421875, 16.50439453125, 17.248046875, 17.99169921875, 18.7353515625, 19.47900390625, 20.22265625, 20.96630859375, 21.7099609375, 22.45361328125, 23.197265625, 23.94091796875, 24.6845703125, 25.42822265625, 26.171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 13.0, 12.0, 16.0, 31.0, 57.0, 85.0, 133.0, 158.0, 141.0, 111.0, 86.0, 65.0, 33.0, 15.0, 13.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-219.05348205566406, -213.0821075439453, -207.11073303222656, -201.1393585205078, -195.16798400878906, -189.1966094970703, -183.22525024414062, -177.25387573242188, -171.28250122070312, -165.31112670898438, -159.33975219726562, -153.36837768554688, -147.39700317382812, -141.42562866210938, -135.45425415039062, -129.48287963867188, -123.51150512695312, -117.54013061523438, -111.56875610351562, -105.59738159179688, -99.62600708007812, -93.65463256835938, -87.68326568603516, -81.7118911743164, -75.74051666259766, -69.7691421508789, -63.797767639160156, -57.82639694213867, -51.85502243041992, -45.88364791870117, -39.91227722167969, -33.94090270996094, -27.96954345703125, -21.9981689453125, -16.026796340942383, -10.055423736572266, -4.084049224853516, 1.8873252868652344, 7.858695983886719, 13.830070495605469, 19.80144500732422, 25.77281951904297, 31.744192123413086, 37.7155647277832, 43.68693923950195, 49.6583137512207, 55.62968444824219, 61.60105895996094, 67.57243347167969, 73.54380798339844, 79.51518249511719, 85.48655700683594, 91.45793151855469, 97.42930603027344, 103.40067291259766, 109.3720474243164, 115.34342193603516, 121.3147964477539, 127.28617095947266, 133.25753784179688, 139.22891235351562, 145.20028686523438, 151.17166137695312, 157.14303588867188, 163.11441040039062]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 7.0, 6.0, 12.0, 12.0, 7.0, 10.0, 8.0, 13.0, 20.0, 22.0, 22.0, 19.0, 26.0, 26.0, 37.0, 29.0, 27.0, 37.0, 45.0, 39.0, 34.0, 59.0, 36.0, 43.0, 50.0, 37.0, 27.0, 34.0, 33.0, 30.0, 41.0, 23.0, 19.0, 14.0, 22.0, 17.0, 7.0, 11.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-108.81504821777344, -105.65342712402344, -102.49180603027344, -99.33018493652344, -96.16856384277344, -93.00694274902344, -89.84532165527344, -86.68370056152344, -83.52207946777344, -80.36045837402344, -77.19883728027344, -74.03721618652344, -70.87559509277344, -67.71397399902344, -64.55235290527344, -61.3907356262207, -58.22911834716797, -55.06749725341797, -51.90587615966797, -48.74425506591797, -45.58263397216797, -42.42101287841797, -39.259395599365234, -36.097774505615234, -32.936153411865234, -29.774532318115234, -26.612911224365234, -23.451292037963867, -20.289670944213867, -17.128049850463867, -13.9664306640625, -10.8048095703125, -7.6431884765625, -4.481567859649658, -1.3199472427368164, 1.8416728973388672, 5.003293991088867, 8.164915084838867, 11.326534271240234, 14.488155364990234, 17.649776458740234, 20.811397552490234, 23.973018646240234, 27.1346378326416, 30.2962589263916, 33.45787811279297, 36.61949920654297, 39.78112030029297, 42.94274139404297, 46.10436248779297, 49.26598358154297, 52.42760467529297, 55.58922576904297, 58.75084686279297, 61.9124641418457, 65.07408142089844, 68.23570251464844, 71.39732360839844, 74.55894470214844, 77.72056579589844, 80.88218688964844, 84.04380798339844, 87.20542907714844, 90.36705017089844, 93.52867126464844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 11.0, 16.0, 18.0, 26.0, 32.0, 67.0, 86.0, 150.0, 165.0, 301.0, 445.0, 751.0, 1314.0, 2146.0, 4021.0, 7452.0, 15138.0, 32380.0, 73710.0, 184594.0, 367034.0, 206987.0, 81564.0, 35539.0, 16564.0, 7943.0, 4299.0, 2284.0, 1366.0, 723.0, 482.0, 293.0, 209.0, 160.0, 89.0, 55.0, 39.0, 25.0, 23.0, 15.0, 10.0, 10.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.7054443359375, -15.207763671875, -14.7100830078125, -14.21240234375, -13.7147216796875, -13.217041015625, -12.7193603515625, -12.2216796875, -11.7239990234375, -11.226318359375, -10.7286376953125, -10.23095703125, -9.7332763671875, -9.235595703125, -8.7379150390625, -8.240234375, -7.7425537109375, -7.244873046875, -6.7471923828125, -6.24951171875, -5.7518310546875, -5.254150390625, -4.7564697265625, -4.2587890625, -3.7611083984375, -3.263427734375, -2.7657470703125, -2.26806640625, -1.7703857421875, -1.272705078125, -0.7750244140625, -0.27734375, 0.2203369140625, 0.718017578125, 1.2156982421875, 1.71337890625, 2.2110595703125, 2.708740234375, 3.2064208984375, 3.7041015625, 4.2017822265625, 4.699462890625, 5.1971435546875, 5.69482421875, 6.1925048828125, 6.690185546875, 7.1878662109375, 7.685546875, 8.1832275390625, 8.680908203125, 9.1785888671875, 9.67626953125, 10.1739501953125, 10.671630859375, 11.1693115234375, 11.6669921875, 12.1646728515625, 12.662353515625, 13.1600341796875, 13.65771484375, 14.1553955078125, 14.653076171875, 15.1507568359375, 15.6484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 8.0, 12.0, 12.0, 16.0, 14.0, 23.0, 24.0, 28.0, 40.0, 40.0, 41.0, 49.0, 47.0, 51.0, 66.0, 53.0, 51.0, 56.0, 50.0, 51.0, 39.0, 35.0, 27.0, 28.0, 19.0, 25.0, 20.0, 16.0, 12.0, 6.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.109375, -8.8382568359375, -8.567138671875, -8.2960205078125, -8.02490234375, -7.7537841796875, -7.482666015625, -7.2115478515625, -6.9404296875, -6.6693115234375, -6.398193359375, -6.1270751953125, -5.85595703125, -5.5848388671875, -5.313720703125, -5.0426025390625, -4.771484375, -4.5003662109375, -4.229248046875, -3.9581298828125, -3.68701171875, -3.4158935546875, -3.144775390625, -2.8736572265625, -2.6025390625, -2.3314208984375, -2.060302734375, -1.7891845703125, -1.51806640625, -1.2469482421875, -0.975830078125, -0.7047119140625, -0.43359375, -0.1624755859375, 0.108642578125, 0.3797607421875, 0.65087890625, 0.9219970703125, 1.193115234375, 1.4642333984375, 1.7353515625, 2.0064697265625, 2.277587890625, 2.5487060546875, 2.81982421875, 3.0909423828125, 3.362060546875, 3.6331787109375, 3.904296875, 4.1754150390625, 4.446533203125, 4.7176513671875, 4.98876953125, 5.2598876953125, 5.531005859375, 5.8021240234375, 6.0732421875, 6.3443603515625, 6.615478515625, 6.8865966796875, 7.15771484375, 7.4288330078125, 7.699951171875, 7.9710693359375, 8.2421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 14.0, 15.0, 23.0, 35.0, 30.0, 53.0, 83.0, 140.0, 172.0, 333.0, 598.0, 1194.0, 2932.0, 10921.0, 96354.0, 802552.0, 114608.0, 12558.0, 3100.0, 1266.0, 598.0, 321.0, 206.0, 131.0, 77.0, 65.0, 43.0, 26.0, 20.0, 12.0, 14.0, 9.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.71875, -41.44482421875, -40.1708984375, -38.89697265625, -37.623046875, -36.34912109375, -35.0751953125, -33.80126953125, -32.52734375, -31.25341796875, -29.9794921875, -28.70556640625, -27.431640625, -26.15771484375, -24.8837890625, -23.60986328125, -22.3359375, -21.06201171875, -19.7880859375, -18.51416015625, -17.240234375, -15.96630859375, -14.6923828125, -13.41845703125, -12.14453125, -10.87060546875, -9.5966796875, -8.32275390625, -7.048828125, -5.77490234375, -4.5009765625, -3.22705078125, -1.953125, -0.67919921875, 0.5947265625, 1.86865234375, 3.142578125, 4.41650390625, 5.6904296875, 6.96435546875, 8.23828125, 9.51220703125, 10.7861328125, 12.06005859375, 13.333984375, 14.60791015625, 15.8818359375, 17.15576171875, 18.4296875, 19.70361328125, 20.9775390625, 22.25146484375, 23.525390625, 24.79931640625, 26.0732421875, 27.34716796875, 28.62109375, 29.89501953125, 31.1689453125, 32.44287109375, 33.716796875, 34.99072265625, 36.2646484375, 37.53857421875, 38.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 4.0, 5.0, 12.0, 10.0, 10.0, 6.0, 17.0, 17.0, 16.0, 12.0, 20.0, 18.0, 33.0, 36.0, 25.0, 42.0, 34.0, 42.0, 41.0, 47.0, 46.0, 39.0, 46.0, 40.0, 32.0, 45.0, 35.0, 32.0, 33.0, 35.0, 34.0, 24.0, 20.0, 12.0, 12.0, 12.0, 15.0, 12.0, 8.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.301025390625, -25.36767578125, -24.434326171875, -23.5009765625, -22.567626953125, -21.63427734375, -20.700927734375, -19.767578125, -18.834228515625, -17.90087890625, -16.967529296875, -16.0341796875, -15.100830078125, -14.16748046875, -13.234130859375, -12.30078125, -11.367431640625, -10.43408203125, -9.500732421875, -8.5673828125, -7.634033203125, -6.70068359375, -5.767333984375, -4.833984375, -3.900634765625, -2.96728515625, -2.033935546875, -1.1005859375, -0.167236328125, 0.76611328125, 1.699462890625, 2.6328125, 3.566162109375, 4.49951171875, 5.432861328125, 6.3662109375, 7.299560546875, 8.23291015625, 9.166259765625, 10.099609375, 11.032958984375, 11.96630859375, 12.899658203125, 13.8330078125, 14.766357421875, 15.69970703125, 16.633056640625, 17.56640625, 18.499755859375, 19.43310546875, 20.366455078125, 21.2998046875, 22.233154296875, 23.16650390625, 24.099853515625, 25.033203125, 25.966552734375, 26.89990234375, 27.833251953125, 28.7666015625, 29.699951171875, 30.63330078125, 31.566650390625, 32.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 10.0, 4.0, 6.0, 8.0, 18.0, 12.0, 19.0, 29.0, 41.0, 52.0, 80.0, 118.0, 204.0, 364.0, 631.0, 1549.0, 5417.0, 31933.0, 479482.0, 487629.0, 32271.0, 5562.0, 1541.0, 637.0, 330.0, 198.0, 105.0, 78.0, 53.0, 46.0, 25.0, 27.0, 29.0, 10.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.148193359375, -12.69482421875, -12.241455078125, -11.7880859375, -11.334716796875, -10.88134765625, -10.427978515625, -9.974609375, -9.521240234375, -9.06787109375, -8.614501953125, -8.1611328125, -7.707763671875, -7.25439453125, -6.801025390625, -6.34765625, -5.894287109375, -5.44091796875, -4.987548828125, -4.5341796875, -4.080810546875, -3.62744140625, -3.174072265625, -2.720703125, -2.267333984375, -1.81396484375, -1.360595703125, -0.9072265625, -0.453857421875, -0.00048828125, 0.452880859375, 0.90625, 1.359619140625, 1.81298828125, 2.266357421875, 2.7197265625, 3.173095703125, 3.62646484375, 4.079833984375, 4.533203125, 4.986572265625, 5.43994140625, 5.893310546875, 6.3466796875, 6.800048828125, 7.25341796875, 7.706787109375, 8.16015625, 8.613525390625, 9.06689453125, 9.520263671875, 9.9736328125, 10.427001953125, 10.88037109375, 11.333740234375, 11.787109375, 12.240478515625, 12.69384765625, 13.147216796875, 13.6005859375, 14.053955078125, 14.50732421875, 14.960693359375, 15.4140625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 10.0, 11.0, 10.0, 18.0, 28.0, 33.0, 35.0, 53.0, 57.0, 82.0, 98.0, 100.0, 100.0, 77.0, 60.0, 45.0, 34.0, 24.0, 24.0, 13.0, 9.0, 10.0, 11.0, 3.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016164779663085938, -0.0015556365251541138, -0.0014947950839996338, -0.0014339536428451538, -0.0013731122016906738, -0.0013122707605361938, -0.0012514293193817139, -0.0011905878782272339, -0.001129746437072754, -0.001068904995918274, -0.001008063554763794, -0.000947222113609314, -0.000886380672454834, -0.000825539231300354, -0.000764697790145874, -0.000703856348991394, -0.0006430149078369141, -0.0005821734666824341, -0.0005213320255279541, -0.0004604905843734741, -0.00039964914321899414, -0.00033880770206451416, -0.0002779662609100342, -0.0002171248197555542, -0.00015628337860107422, -9.544193744659424e-05, -3.460049629211426e-05, 2.6240944862365723e-05, 8.70823860168457e-05, 0.00014792382717132568, 0.00020876526832580566, 0.00026960670948028564, 0.0003304481506347656, 0.0003912895917892456, 0.0004521310329437256, 0.0005129724740982056, 0.0005738139152526855, 0.0006346553564071655, 0.0006954967975616455, 0.0007563382387161255, 0.0008171796798706055, 0.0008780211210250854, 0.0009388625621795654, 0.0009997040033340454, 0.0010605454444885254, 0.0011213868856430054, 0.0011822283267974854, 0.0012430697679519653, 0.0013039112091064453, 0.0013647526502609253, 0.0014255940914154053, 0.0014864355325698853, 0.0015472769737243652, 0.0016081184148788452, 0.0016689598560333252, 0.0017298012971878052, 0.0017906427383422852, 0.0018514841794967651, 0.0019123256206512451, 0.001973167061805725, 0.002034008502960205, 0.002094849944114685, 0.002155691385269165, 0.002216532826423645, 0.002277374267578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 13.0, 23.0, 33.0, 55.0, 111.0, 184.0, 392.0, 916.0, 2591.0, 13173.0, 231167.0, 761926.0, 31165.0, 4480.0, 1275.0, 482.0, 252.0, 124.0, 71.0, 42.0, 27.0, 19.0, 8.0, 9.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.828125, -21.17041015625, -20.5126953125, -19.85498046875, -19.197265625, -18.53955078125, -17.8818359375, -17.22412109375, -16.56640625, -15.90869140625, -15.2509765625, -14.59326171875, -13.935546875, -13.27783203125, -12.6201171875, -11.96240234375, -11.3046875, -10.64697265625, -9.9892578125, -9.33154296875, -8.673828125, -8.01611328125, -7.3583984375, -6.70068359375, -6.04296875, -5.38525390625, -4.7275390625, -4.06982421875, -3.412109375, -2.75439453125, -2.0966796875, -1.43896484375, -0.78125, -0.12353515625, 0.5341796875, 1.19189453125, 1.849609375, 2.50732421875, 3.1650390625, 3.82275390625, 4.48046875, 5.13818359375, 5.7958984375, 6.45361328125, 7.111328125, 7.76904296875, 8.4267578125, 9.08447265625, 9.7421875, 10.39990234375, 11.0576171875, 11.71533203125, 12.373046875, 13.03076171875, 13.6884765625, 14.34619140625, 15.00390625, 15.66162109375, 16.3193359375, 16.97705078125, 17.634765625, 18.29248046875, 18.9501953125, 19.60791015625, 20.265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 3.0, 9.0, 13.0, 13.0, 24.0, 28.0, 27.0, 39.0, 58.0, 78.0, 59.0, 65.0, 82.0, 90.0, 78.0, 72.0, 56.0, 51.0, 26.0, 26.0, 25.0, 9.0, 10.0, 6.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.3770751953125, -11.027587890625, -10.6781005859375, -10.32861328125, -9.9791259765625, -9.629638671875, -9.2801513671875, -8.9306640625, -8.5811767578125, -8.231689453125, -7.8822021484375, -7.53271484375, -7.1832275390625, -6.833740234375, -6.4842529296875, -6.134765625, -5.7852783203125, -5.435791015625, -5.0863037109375, -4.73681640625, -4.3873291015625, -4.037841796875, -3.6883544921875, -3.3388671875, -2.9893798828125, -2.639892578125, -2.2904052734375, -1.94091796875, -1.5914306640625, -1.241943359375, -0.8924560546875, -0.54296875, -0.1934814453125, 0.156005859375, 0.5054931640625, 0.85498046875, 1.2044677734375, 1.553955078125, 1.9034423828125, 2.2529296875, 2.6024169921875, 2.951904296875, 3.3013916015625, 3.65087890625, 4.0003662109375, 4.349853515625, 4.6993408203125, 5.048828125, 5.3983154296875, 5.747802734375, 6.0972900390625, 6.44677734375, 6.7962646484375, 7.145751953125, 7.4952392578125, 7.8447265625, 8.1942138671875, 8.543701171875, 8.8931884765625, 9.24267578125, 9.5921630859375, 9.941650390625, 10.2911376953125, 10.640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 6.0, 36.0, 131.0, 400.0, 291.0, 103.0, 23.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-543.4518432617188, -527.4437255859375, -511.43560791015625, -495.427490234375, -479.41937255859375, -463.4112548828125, -447.40313720703125, -431.39501953125, -415.38690185546875, -399.3787841796875, -383.37066650390625, -367.362548828125, -351.35443115234375, -335.3463134765625, -319.33819580078125, -303.330078125, -287.3219909667969, -271.3138732910156, -255.30575561523438, -239.29763793945312, -223.28952026367188, -207.28140258789062, -191.27330017089844, -175.2651824951172, -159.25706481933594, -143.2489471435547, -127.24082946777344, -111.23271942138672, -95.22460174560547, -79.21648406982422, -63.2083740234375, -47.20025634765625, -31.192169189453125, -15.184053421020508, 0.8240623474121094, 16.832176208496094, 32.840293884277344, 48.848411560058594, 64.85652160644531, 80.86463928222656, 96.87275695800781, 112.88087463378906, 128.8889923095703, 144.8970947265625, 160.90521240234375, 176.913330078125, 192.92144775390625, 208.9295654296875, 224.93768310546875, 240.94580078125, 256.95391845703125, 272.9620361328125, 288.97015380859375, 304.978271484375, 320.98638916015625, 336.9945068359375, 353.00262451171875, 369.0107421875, 385.01885986328125, 401.0269775390625, 417.03509521484375, 433.043212890625, 449.05133056640625, 465.0594482421875, 481.0675354003906]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 10.0, 14.0, 12.0, 21.0, 24.0, 31.0, 34.0, 34.0, 37.0, 61.0, 66.0, 73.0, 43.0, 62.0, 76.0, 60.0, 48.0, 39.0, 37.0, 28.0, 28.0, 34.0, 15.0, 14.0, 19.0, 9.0, 10.0, 5.0, 5.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-161.8929443359375, -157.3733367919922, -152.8537139892578, -148.3341064453125, -143.8144989013672, -139.29489135742188, -134.7752685546875, -130.2556610107422, -125.73605346679688, -121.21643829345703, -116.69683074951172, -112.17721557617188, -107.65760803222656, -103.13799285888672, -98.61837768554688, -94.09877014160156, -89.57915496826172, -85.05953979492188, -80.53993225097656, -76.02031707763672, -71.5007095336914, -66.98109436035156, -62.461483001708984, -57.941871643066406, -53.42226028442383, -48.90264892578125, -44.38303756713867, -39.863426208496094, -35.34381103515625, -30.824201583862305, -26.304588317871094, -21.784976959228516, -17.265357971191406, -12.745746612548828, -8.226134300231934, -3.706521987915039, 0.8130893707275391, 5.332700729370117, 9.852313995361328, 14.371925354003906, 18.891536712646484, 23.411148071289062, 27.93075942993164, 32.45037078857422, 36.96998596191406, 41.489593505859375, 46.00920867919922, 50.5288200378418, 55.048431396484375, 59.56804275512695, 64.08765411376953, 68.60726928710938, 73.12687683105469, 77.64649200439453, 82.16610717773438, 86.68571472167969, 91.205322265625, 95.72493743896484, 100.24454498291016, 104.76416015625, 109.28376770019531, 113.80338287353516, 118.322998046875, 122.84260559082031, 127.36222076416016]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 3.0, 4.0, 17.0, 12.0, 17.0, 18.0, 19.0, 33.0, 52.0, 62.0, 55.0, 113.0, 145.0, 267.0, 1021.0, 12554.0, 4068233.0, 107501.0, 2971.0, 497.0, 208.0, 135.0, 101.0, 56.0, 45.0, 45.0, 26.0, 24.0, 10.0, 14.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.875, -51.6064453125, -49.337890625, -47.0693359375, -44.80078125, -42.5322265625, -40.263671875, -37.9951171875, -35.7265625, -33.4580078125, -31.189453125, -28.9208984375, -26.65234375, -24.3837890625, -22.115234375, -19.8466796875, -17.578125, -15.3095703125, -13.041015625, -10.7724609375, -8.50390625, -6.2353515625, -3.966796875, -1.6982421875, 0.5703125, 2.8388671875, 5.107421875, 7.3759765625, 9.64453125, 11.9130859375, 14.181640625, 16.4501953125, 18.71875, 20.9873046875, 23.255859375, 25.5244140625, 27.79296875, 30.0615234375, 32.330078125, 34.5986328125, 36.8671875, 39.1357421875, 41.404296875, 43.6728515625, 45.94140625, 48.2099609375, 50.478515625, 52.7470703125, 55.015625, 57.2841796875, 59.552734375, 61.8212890625, 64.08984375, 66.3583984375, 68.626953125, 70.8955078125, 73.1640625, 75.4326171875, 77.701171875, 79.9697265625, 82.23828125, 84.5068359375, 86.775390625, 89.0439453125, 91.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 13.0, 9.0, 26.0, 20.0, 25.0, 30.0, 27.0, 44.0, 45.0, 50.0, 52.0, 56.0, 58.0, 60.0, 71.0, 58.0, 43.0, 45.0, 37.0, 31.0, 36.0, 24.0, 22.0, 20.0, 17.0, 12.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3515625, -9.077392578125, -8.80322265625, -8.529052734375, -8.2548828125, -7.980712890625, -7.70654296875, -7.432373046875, -7.158203125, -6.884033203125, -6.60986328125, -6.335693359375, -6.0615234375, -5.787353515625, -5.51318359375, -5.239013671875, -4.96484375, -4.690673828125, -4.41650390625, -4.142333984375, -3.8681640625, -3.593994140625, -3.31982421875, -3.045654296875, -2.771484375, -2.497314453125, -2.22314453125, -1.948974609375, -1.6748046875, -1.400634765625, -1.12646484375, -0.852294921875, -0.578125, -0.303955078125, -0.02978515625, 0.244384765625, 0.5185546875, 0.792724609375, 1.06689453125, 1.341064453125, 1.615234375, 1.889404296875, 2.16357421875, 2.437744140625, 2.7119140625, 2.986083984375, 3.26025390625, 3.534423828125, 3.80859375, 4.082763671875, 4.35693359375, 4.631103515625, 4.9052734375, 5.179443359375, 5.45361328125, 5.727783203125, 6.001953125, 6.276123046875, 6.55029296875, 6.824462890625, 7.0986328125, 7.372802734375, 7.64697265625, 7.921142578125, 8.1953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 13.0, 13.0, 14.0, 30.0, 51.0, 81.0, 141.0, 263.0, 490.0, 978.0, 2053.0, 4481.0, 11799.0, 35620.0, 195551.0, 3413345.0, 448455.0, 53433.0, 16169.0, 6138.0, 2687.0, 1220.0, 563.0, 282.0, 169.0, 81.0, 60.0, 30.0, 10.0, 20.0, 13.0, 9.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.640380859375, -18.99951171875, -18.358642578125, -17.7177734375, -17.076904296875, -16.43603515625, -15.795166015625, -15.154296875, -14.513427734375, -13.87255859375, -13.231689453125, -12.5908203125, -11.949951171875, -11.30908203125, -10.668212890625, -10.02734375, -9.386474609375, -8.74560546875, -8.104736328125, -7.4638671875, -6.822998046875, -6.18212890625, -5.541259765625, -4.900390625, -4.259521484375, -3.61865234375, -2.977783203125, -2.3369140625, -1.696044921875, -1.05517578125, -0.414306640625, 0.2265625, 0.867431640625, 1.50830078125, 2.149169921875, 2.7900390625, 3.430908203125, 4.07177734375, 4.712646484375, 5.353515625, 5.994384765625, 6.63525390625, 7.276123046875, 7.9169921875, 8.557861328125, 9.19873046875, 9.839599609375, 10.48046875, 11.121337890625, 11.76220703125, 12.403076171875, 13.0439453125, 13.684814453125, 14.32568359375, 14.966552734375, 15.607421875, 16.248291015625, 16.88916015625, 17.530029296875, 18.1708984375, 18.811767578125, 19.45263671875, 20.093505859375, 20.734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 9.0, 10.0, 11.0, 14.0, 17.0, 28.0, 40.0, 82.0, 100.0, 256.0, 633.0, 1358.0, 822.0, 319.0, 135.0, 79.0, 47.0, 25.0, 21.0, 13.0, 11.0, 16.0, 4.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.09375, -20.358154296875, -19.62255859375, -18.886962890625, -18.1513671875, -17.415771484375, -16.68017578125, -15.944580078125, -15.208984375, -14.473388671875, -13.73779296875, -13.002197265625, -12.2666015625, -11.531005859375, -10.79541015625, -10.059814453125, -9.32421875, -8.588623046875, -7.85302734375, -7.117431640625, -6.3818359375, -5.646240234375, -4.91064453125, -4.175048828125, -3.439453125, -2.703857421875, -1.96826171875, -1.232666015625, -0.4970703125, 0.238525390625, 0.97412109375, 1.709716796875, 2.4453125, 3.180908203125, 3.91650390625, 4.652099609375, 5.3876953125, 6.123291015625, 6.85888671875, 7.594482421875, 8.330078125, 9.065673828125, 9.80126953125, 10.536865234375, 11.2724609375, 12.008056640625, 12.74365234375, 13.479248046875, 14.21484375, 14.950439453125, 15.68603515625, 16.421630859375, 17.1572265625, 17.892822265625, 18.62841796875, 19.364013671875, 20.099609375, 20.835205078125, 21.57080078125, 22.306396484375, 23.0419921875, 23.777587890625, 24.51318359375, 25.248779296875, 25.984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 12.0, 34.0, 86.0, 207.0, 289.0, 229.0, 97.0, 26.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.63230895996094, -218.76780700683594, -209.90330505371094, -201.03878784179688, -192.17428588867188, -183.30978393554688, -174.44528198242188, -165.58078002929688, -156.71627807617188, -147.85177612304688, -138.98727416992188, -130.12277221679688, -121.25825500488281, -112.39375305175781, -103.52925109863281, -94.66474914550781, -85.80023193359375, -76.93572998046875, -68.07122039794922, -59.20671844482422, -50.34221267700195, -41.47770690917969, -32.61320495605469, -23.748699188232422, -14.884193420410156, -6.019688606262207, 2.844816207885742, 11.709320068359375, 20.57382583618164, 29.438331604003906, 38.302833557128906, 47.16733932495117, 56.031829833984375, 64.89633178710938, 73.7608413696289, 82.6253433227539, 91.48985290527344, 100.35435485839844, 109.21885681152344, 118.08335876464844, 126.94786834716797, 135.8123779296875, 144.6768798828125, 153.5413818359375, 162.4058837890625, 171.2703857421875, 180.1348876953125, 188.99940490722656, 197.86390686035156, 206.72840881347656, 215.59291076660156, 224.45742797851562, 233.32192993164062, 242.18643188476562, 251.05093383789062, 259.9154357910156, 268.7799377441406, 277.6444396972656, 286.5089416503906, 295.3734436035156, 304.2379455566406, 313.10247802734375, 321.96697998046875, 330.83148193359375, 339.69598388671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 10.0, 19.0, 11.0, 17.0, 27.0, 28.0, 42.0, 31.0, 39.0, 45.0, 52.0, 48.0, 59.0, 64.0, 54.0, 57.0, 51.0, 51.0, 51.0, 37.0, 39.0, 18.0, 32.0, 25.0, 11.0, 17.0, 9.0, 16.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-96.53462219238281, -93.73416137695312, -90.9336929321289, -88.13323211669922, -85.332763671875, -82.53230285644531, -79.73184204101562, -76.9313735961914, -74.13090515136719, -71.3304443359375, -68.52997589111328, -65.7295150756836, -62.929046630859375, -60.12858581542969, -57.328121185302734, -54.52765655517578, -51.727195739746094, -48.92673110961914, -46.12626647949219, -43.3258056640625, -40.52533721923828, -37.724876403808594, -34.92441177368164, -32.12394714355469, -29.323482513427734, -26.52301788330078, -23.722553253173828, -20.922090530395508, -18.121625900268555, -15.321161270141602, -12.520698547363281, -9.720233917236328, -6.919769287109375, -4.11930513381958, -1.3188409805297852, 1.4816226959228516, 4.282087326049805, 7.082551956176758, 9.883014678955078, 12.683479309082031, 15.483943939208984, 18.284408569335938, 21.08487319946289, 23.88533592224121, 26.685800552368164, 29.486265182495117, 32.28672790527344, 35.08719253540039, 37.887657165527344, 40.6881217956543, 43.48858642578125, 46.28904724121094, 49.089515686035156, 51.889976501464844, 54.6904411315918, 57.49090576171875, 60.2913703918457, 63.091835021972656, 65.89229583740234, 68.69276428222656, 71.49322509765625, 74.29369354248047, 77.09415435791016, 79.89462280273438, 82.69508361816406]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 16.0, 27.0, 37.0, 55.0, 98.0, 99.0, 186.0, 283.0, 436.0, 716.0, 1238.0, 2174.0, 3774.0, 6970.0, 12770.0, 25306.0, 51249.0, 110601.0, 250870.0, 304961.0, 144579.0, 65053.0, 31509.0, 15984.0, 8414.0, 4647.0, 2641.0, 1449.0, 859.0, 521.0, 334.0, 239.0, 136.0, 85.0, 56.0, 52.0, 37.0, 20.0, 10.0, 9.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-14.796875, -14.3876953125, -13.978515625, -13.5693359375, -13.16015625, -12.7509765625, -12.341796875, -11.9326171875, -11.5234375, -11.1142578125, -10.705078125, -10.2958984375, -9.88671875, -9.4775390625, -9.068359375, -8.6591796875, -8.25, -7.8408203125, -7.431640625, -7.0224609375, -6.61328125, -6.2041015625, -5.794921875, -5.3857421875, -4.9765625, -4.5673828125, -4.158203125, -3.7490234375, -3.33984375, -2.9306640625, -2.521484375, -2.1123046875, -1.703125, -1.2939453125, -0.884765625, -0.4755859375, -0.06640625, 0.3427734375, 0.751953125, 1.1611328125, 1.5703125, 1.9794921875, 2.388671875, 2.7978515625, 3.20703125, 3.6162109375, 4.025390625, 4.4345703125, 4.84375, 5.2529296875, 5.662109375, 6.0712890625, 6.48046875, 6.8896484375, 7.298828125, 7.7080078125, 8.1171875, 8.5263671875, 8.935546875, 9.3447265625, 9.75390625, 10.1630859375, 10.572265625, 10.9814453125, 11.390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 6.0, 12.0, 9.0, 10.0, 17.0, 27.0, 24.0, 21.0, 38.0, 39.0, 31.0, 48.0, 50.0, 58.0, 61.0, 56.0, 57.0, 56.0, 47.0, 49.0, 49.0, 40.0, 25.0, 30.0, 24.0, 17.0, 17.0, 14.0, 12.0, 7.0, 9.0, 13.0, 3.0, 2.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.296875, -9.0201416015625, -8.743408203125, -8.4666748046875, -8.18994140625, -7.9132080078125, -7.636474609375, -7.3597412109375, -7.0830078125, -6.8062744140625, -6.529541015625, -6.2528076171875, -5.97607421875, -5.6993408203125, -5.422607421875, -5.1458740234375, -4.869140625, -4.5924072265625, -4.315673828125, -4.0389404296875, -3.76220703125, -3.4854736328125, -3.208740234375, -2.9320068359375, -2.6552734375, -2.3785400390625, -2.101806640625, -1.8250732421875, -1.54833984375, -1.2716064453125, -0.994873046875, -0.7181396484375, -0.44140625, -0.1646728515625, 0.112060546875, 0.3887939453125, 0.66552734375, 0.9422607421875, 1.218994140625, 1.4957275390625, 1.7724609375, 2.0491943359375, 2.325927734375, 2.6026611328125, 2.87939453125, 3.1561279296875, 3.432861328125, 3.7095947265625, 3.986328125, 4.2630615234375, 4.539794921875, 4.8165283203125, 5.09326171875, 5.3699951171875, 5.646728515625, 5.9234619140625, 6.2001953125, 6.4769287109375, 6.753662109375, 7.0303955078125, 7.30712890625, 7.5838623046875, 7.860595703125, 8.1373291015625, 8.4140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 10.0, 3.0, 4.0, 10.0, 13.0, 19.0, 26.0, 37.0, 62.0, 70.0, 112.0, 178.0, 269.0, 436.0, 820.0, 1670.0, 4147.0, 13465.0, 57637.0, 344731.0, 523689.0, 75139.0, 17012.0, 4870.0, 1938.0, 878.0, 458.0, 279.0, 187.0, 126.0, 64.0, 51.0, 51.0, 27.0, 25.0, 13.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.46533203125, -19.6494140625, -18.83349609375, -18.017578125, -17.20166015625, -16.3857421875, -15.56982421875, -14.75390625, -13.93798828125, -13.1220703125, -12.30615234375, -11.490234375, -10.67431640625, -9.8583984375, -9.04248046875, -8.2265625, -7.41064453125, -6.5947265625, -5.77880859375, -4.962890625, -4.14697265625, -3.3310546875, -2.51513671875, -1.69921875, -0.88330078125, -0.0673828125, 0.74853515625, 1.564453125, 2.38037109375, 3.1962890625, 4.01220703125, 4.828125, 5.64404296875, 6.4599609375, 7.27587890625, 8.091796875, 8.90771484375, 9.7236328125, 10.53955078125, 11.35546875, 12.17138671875, 12.9873046875, 13.80322265625, 14.619140625, 15.43505859375, 16.2509765625, 17.06689453125, 17.8828125, 18.69873046875, 19.5146484375, 20.33056640625, 21.146484375, 21.96240234375, 22.7783203125, 23.59423828125, 24.41015625, 25.22607421875, 26.0419921875, 26.85791015625, 27.673828125, 28.48974609375, 29.3056640625, 30.12158203125, 30.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 11.0, 16.0, 12.0, 18.0, 18.0, 30.0, 23.0, 40.0, 34.0, 41.0, 42.0, 58.0, 53.0, 56.0, 46.0, 59.0, 48.0, 55.0, 51.0, 48.0, 43.0, 32.0, 26.0, 27.0, 14.0, 24.0, 12.0, 11.0, 7.0, 10.0, 8.0, 3.0, 2.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.21875, -31.11669921875, -30.0146484375, -28.91259765625, -27.810546875, -26.70849609375, -25.6064453125, -24.50439453125, -23.40234375, -22.30029296875, -21.1982421875, -20.09619140625, -18.994140625, -17.89208984375, -16.7900390625, -15.68798828125, -14.5859375, -13.48388671875, -12.3818359375, -11.27978515625, -10.177734375, -9.07568359375, -7.9736328125, -6.87158203125, -5.76953125, -4.66748046875, -3.5654296875, -2.46337890625, -1.361328125, -0.25927734375, 0.8427734375, 1.94482421875, 3.046875, 4.14892578125, 5.2509765625, 6.35302734375, 7.455078125, 8.55712890625, 9.6591796875, 10.76123046875, 11.86328125, 12.96533203125, 14.0673828125, 15.16943359375, 16.271484375, 17.37353515625, 18.4755859375, 19.57763671875, 20.6796875, 21.78173828125, 22.8837890625, 23.98583984375, 25.087890625, 26.18994140625, 27.2919921875, 28.39404296875, 29.49609375, 30.59814453125, 31.7001953125, 32.80224609375, 33.904296875, 35.00634765625, 36.1083984375, 37.21044921875, 38.3125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 8.0, 10.0, 18.0, 19.0, 30.0, 42.0, 73.0, 140.0, 270.0, 598.0, 2033.0, 12132.0, 231929.0, 766416.0, 29572.0, 3605.0, 935.0, 318.0, 140.0, 76.0, 44.0, 38.0, 38.0, 12.0, 11.0, 8.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.609375, -20.9951171875, -20.380859375, -19.7666015625, -19.15234375, -18.5380859375, -17.923828125, -17.3095703125, -16.6953125, -16.0810546875, -15.466796875, -14.8525390625, -14.23828125, -13.6240234375, -13.009765625, -12.3955078125, -11.78125, -11.1669921875, -10.552734375, -9.9384765625, -9.32421875, -8.7099609375, -8.095703125, -7.4814453125, -6.8671875, -6.2529296875, -5.638671875, -5.0244140625, -4.41015625, -3.7958984375, -3.181640625, -2.5673828125, -1.953125, -1.3388671875, -0.724609375, -0.1103515625, 0.50390625, 1.1181640625, 1.732421875, 2.3466796875, 2.9609375, 3.5751953125, 4.189453125, 4.8037109375, 5.41796875, 6.0322265625, 6.646484375, 7.2607421875, 7.875, 8.4892578125, 9.103515625, 9.7177734375, 10.33203125, 10.9462890625, 11.560546875, 12.1748046875, 12.7890625, 13.4033203125, 14.017578125, 14.6318359375, 15.24609375, 15.8603515625, 16.474609375, 17.0888671875, 17.703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 9.0, 10.0, 12.0, 8.0, 15.0, 35.0, 37.0, 44.0, 53.0, 81.0, 93.0, 119.0, 125.0, 74.0, 62.0, 42.0, 35.0, 17.0, 28.0, 9.0, 12.0, 17.0, 6.0, 5.0, 4.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00200653076171875, -0.0019413530826568604, -0.0018761754035949707, -0.001810997724533081, -0.0017458200454711914, -0.0016806423664093018, -0.0016154646873474121, -0.0015502870082855225, -0.0014851093292236328, -0.0014199316501617432, -0.0013547539710998535, -0.0012895762920379639, -0.0012243986129760742, -0.0011592209339141846, -0.001094043254852295, -0.0010288655757904053, -0.0009636878967285156, -0.000898510217666626, -0.0008333325386047363, -0.0007681548595428467, -0.000702977180480957, -0.0006377995014190674, -0.0005726218223571777, -0.0005074441432952881, -0.00044226646423339844, -0.0003770887851715088, -0.00031191110610961914, -0.0002467334270477295, -0.00018155574798583984, -0.0001163780689239502, -5.120038986206055e-05, 1.3977289199829102e-05, 7.915496826171875e-05, 0.0001443326473236084, 0.00020951032638549805, 0.0002746880054473877, 0.00033986568450927734, 0.000405043363571167, 0.00047022104263305664, 0.0005353987216949463, 0.0006005764007568359, 0.0006657540798187256, 0.0007309317588806152, 0.0007961094379425049, 0.0008612871170043945, 0.0009264647960662842, 0.0009916424751281738, 0.0010568201541900635, 0.0011219978332519531, 0.0011871755123138428, 0.0012523531913757324, 0.001317530870437622, 0.0013827085494995117, 0.0014478862285614014, 0.001513063907623291, 0.0015782415866851807, 0.0016434192657470703, 0.00170859694480896, 0.0017737746238708496, 0.0018389523029327393, 0.001904129981994629, 0.0019693076610565186, 0.002034485340118408, 0.002099663019180298, 0.0021648406982421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 8.0, 27.0, 40.0, 83.0, 148.0, 297.0, 647.0, 1810.0, 5744.0, 42279.0, 732097.0, 243018.0, 16765.0, 3447.0, 1143.0, 473.0, 248.0, 115.0, 51.0, 30.0, 25.0, 12.0, 9.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.625, -14.1171875, -13.609375, -13.1015625, -12.59375, -12.0859375, -11.578125, -11.0703125, -10.5625, -10.0546875, -9.546875, -9.0390625, -8.53125, -8.0234375, -7.515625, -7.0078125, -6.5, -5.9921875, -5.484375, -4.9765625, -4.46875, -3.9609375, -3.453125, -2.9453125, -2.4375, -1.9296875, -1.421875, -0.9140625, -0.40625, 0.1015625, 0.609375, 1.1171875, 1.625, 2.1328125, 2.640625, 3.1484375, 3.65625, 4.1640625, 4.671875, 5.1796875, 5.6875, 6.1953125, 6.703125, 7.2109375, 7.71875, 8.2265625, 8.734375, 9.2421875, 9.75, 10.2578125, 10.765625, 11.2734375, 11.78125, 12.2890625, 12.796875, 13.3046875, 13.8125, 14.3203125, 14.828125, 15.3359375, 15.84375, 16.3515625, 16.859375, 17.3671875, 17.875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 3.0, 2.0, 13.0, 9.0, 18.0, 14.0, 16.0, 20.0, 26.0, 47.0, 36.0, 53.0, 48.0, 56.0, 76.0, 78.0, 73.0, 68.0, 66.0, 55.0, 32.0, 31.0, 34.0, 22.0, 25.0, 12.0, 18.0, 8.0, 7.0, 5.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.6580810546875, -7.421630859375, -7.1851806640625, -6.94873046875, -6.7122802734375, -6.475830078125, -6.2393798828125, -6.0029296875, -5.7664794921875, -5.530029296875, -5.2935791015625, -5.05712890625, -4.8206787109375, -4.584228515625, -4.3477783203125, -4.111328125, -3.8748779296875, -3.638427734375, -3.4019775390625, -3.16552734375, -2.9290771484375, -2.692626953125, -2.4561767578125, -2.2197265625, -1.9832763671875, -1.746826171875, -1.5103759765625, -1.27392578125, -1.0374755859375, -0.801025390625, -0.5645751953125, -0.328125, -0.0916748046875, 0.144775390625, 0.3812255859375, 0.61767578125, 0.8541259765625, 1.090576171875, 1.3270263671875, 1.5634765625, 1.7999267578125, 2.036376953125, 2.2728271484375, 2.50927734375, 2.7457275390625, 2.982177734375, 3.2186279296875, 3.455078125, 3.6915283203125, 3.927978515625, 4.1644287109375, 4.40087890625, 4.6373291015625, 4.873779296875, 5.1102294921875, 5.3466796875, 5.5831298828125, 5.819580078125, 6.0560302734375, 6.29248046875, 6.5289306640625, 6.765380859375, 7.0018310546875, 7.23828125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 14.0, 20.0, 29.0, 41.0, 92.0, 93.0, 147.0, 155.0, 143.0, 91.0, 62.0, 39.0, 19.0, 16.0, 10.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-237.98324584960938, -232.77313232421875, -227.5630340576172, -222.35292053222656, -217.14280700683594, -211.93270874023438, -206.72259521484375, -201.51248168945312, -196.3023681640625, -191.09225463867188, -185.8821563720703, -180.6720428466797, -175.46192932128906, -170.2518310546875, -165.04171752929688, -159.83160400390625, -154.6215057373047, -149.41139221191406, -144.2012939453125, -138.99118041992188, -133.78106689453125, -128.57095336914062, -123.36085510253906, -118.15074157714844, -112.94063568115234, -107.73052978515625, -102.52041625976562, -97.31031036376953, -92.10020446777344, -86.89009094238281, -81.67998504638672, -76.46987915039062, -71.25975036621094, -66.04964447021484, -60.83953094482422, -55.629425048828125, -50.419315338134766, -45.209205627441406, -39.99909973144531, -34.78899002075195, -29.578880310058594, -24.368770599365234, -19.158662796020508, -13.948554039001465, -8.738445281982422, -3.5283355712890625, 1.681772232055664, 6.891880035400391, 12.10198974609375, 17.31209945678711, 22.522207260131836, 27.732315063476562, 32.94242477416992, 38.15253448486328, 43.362640380859375, 48.572750091552734, 53.782859802246094, 58.99296951293945, 64.20307922363281, 69.4131851196289, 74.623291015625, 79.83340454101562, 85.04351043701172, 90.25361633300781, 95.46372985839844]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 14.0, 13.0, 17.0, 15.0, 25.0, 37.0, 34.0, 50.0, 59.0, 61.0, 70.0, 102.0, 96.0, 53.0, 63.0, 52.0, 45.0, 29.0, 44.0, 24.0, 23.0, 19.0, 22.0, 7.0, 8.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.56808471679688, -139.45872497558594, -133.349365234375, -127.2400131225586, -121.13065338134766, -115.02129364013672, -108.91194152832031, -102.80258178710938, -96.69322204589844, -90.5838623046875, -84.47450256347656, -78.36515045166016, -72.25579071044922, -66.14643096923828, -60.03707504272461, -53.92771911621094, -47.818359375, -41.70899963378906, -35.59964370727539, -29.490285873413086, -23.38092803955078, -17.271570205688477, -11.162212371826172, -5.0528564453125, 1.0565032958984375, 7.165861129760742, 13.275218963623047, 19.38457679748535, 25.493934631347656, 31.60329246520996, 37.712650299072266, 43.82200622558594, 49.93138122558594, 56.040740966796875, 62.15009689331055, 68.25945281982422, 74.36881256103516, 80.4781723022461, 86.5875244140625, 92.69688415527344, 98.80624389648438, 104.91560363769531, 111.02496337890625, 117.13431549072266, 123.2436752319336, 129.35302734375, 135.46238708496094, 141.57174682617188, 147.6811065673828, 153.79046630859375, 159.8998260498047, 166.00918579101562, 172.1185302734375, 178.22789001464844, 184.33724975585938, 190.4466094970703, 196.55596923828125, 202.6653289794922, 208.77468872070312, 214.88404846191406, 220.993408203125, 227.10275268554688, 233.2121124267578, 239.32147216796875, 245.4308319091797]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 16.0, 25.0, 31.0, 59.0, 92.0, 124.0, 169.0, 379.0, 657.0, 1376.0, 2914.0, 6937.0, 18754.0, 75751.0, 796619.0, 2960958.0, 269440.0, 39960.0, 11370.0, 4353.0, 1911.0, 958.0, 503.0, 287.0, 174.0, 140.0, 83.0, 61.0, 36.0, 23.0, 22.0, 14.0, 16.0, 12.0, 9.0, 5.0, 7.0, 4.0, 0.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -12.99658203125, -12.4619140625, -11.92724609375, -11.392578125, -10.85791015625, -10.3232421875, -9.78857421875, -9.25390625, -8.71923828125, -8.1845703125, -7.64990234375, -7.115234375, -6.58056640625, -6.0458984375, -5.51123046875, -4.9765625, -4.44189453125, -3.9072265625, -3.37255859375, -2.837890625, -2.30322265625, -1.7685546875, -1.23388671875, -0.69921875, -0.16455078125, 0.3701171875, 0.90478515625, 1.439453125, 1.97412109375, 2.5087890625, 3.04345703125, 3.578125, 4.11279296875, 4.6474609375, 5.18212890625, 5.716796875, 6.25146484375, 6.7861328125, 7.32080078125, 7.85546875, 8.39013671875, 8.9248046875, 9.45947265625, 9.994140625, 10.52880859375, 11.0634765625, 11.59814453125, 12.1328125, 12.66748046875, 13.2021484375, 13.73681640625, 14.271484375, 14.80615234375, 15.3408203125, 15.87548828125, 16.41015625, 16.94482421875, 17.4794921875, 18.01416015625, 18.548828125, 19.08349609375, 19.6181640625, 20.15283203125, 20.6875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 21.0, 34.0, 70.0, 81.0, 113.0, 112.0, 139.0, 114.0, 98.0, 90.0, 53.0, 27.0, 24.0, 13.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -8.8812255859375, -8.270263671875, -7.6593017578125, -7.04833984375, -6.4373779296875, -5.826416015625, -5.2154541015625, -4.6044921875, -3.9935302734375, -3.382568359375, -2.7716064453125, -2.16064453125, -1.5496826171875, -0.938720703125, -0.3277587890625, 0.283203125, 0.8941650390625, 1.505126953125, 2.1160888671875, 2.72705078125, 3.3380126953125, 3.948974609375, 4.5599365234375, 5.1708984375, 5.7818603515625, 6.392822265625, 7.0037841796875, 7.61474609375, 8.2257080078125, 8.836669921875, 9.4476318359375, 10.05859375, 10.6695556640625, 11.280517578125, 11.8914794921875, 12.50244140625, 13.1134033203125, 13.724365234375, 14.3353271484375, 14.9462890625, 15.5572509765625, 16.168212890625, 16.7791748046875, 17.39013671875, 18.0010986328125, 18.612060546875, 19.2230224609375, 19.833984375, 20.4449462890625, 21.055908203125, 21.6668701171875, 22.27783203125, 22.8887939453125, 23.499755859375, 24.1107177734375, 24.7216796875, 25.3326416015625, 25.943603515625, 26.5545654296875, 27.16552734375, 27.7764892578125, 28.387451171875, 28.9984130859375, 29.609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 9.0, 4.0, 7.0, 16.0, 19.0, 39.0, 58.0, 87.0, 146.0, 295.0, 601.0, 1453.0, 3857.0, 12232.0, 55707.0, 576816.0, 3290800.0, 207118.0, 31955.0, 8117.0, 2693.0, 1136.0, 488.0, 252.0, 142.0, 60.0, 46.0, 26.0, 21.0, 19.0, 9.0, 16.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.203125, -19.48974609375, -18.7763671875, -18.06298828125, -17.349609375, -16.63623046875, -15.9228515625, -15.20947265625, -14.49609375, -13.78271484375, -13.0693359375, -12.35595703125, -11.642578125, -10.92919921875, -10.2158203125, -9.50244140625, -8.7890625, -8.07568359375, -7.3623046875, -6.64892578125, -5.935546875, -5.22216796875, -4.5087890625, -3.79541015625, -3.08203125, -2.36865234375, -1.6552734375, -0.94189453125, -0.228515625, 0.48486328125, 1.1982421875, 1.91162109375, 2.625, 3.33837890625, 4.0517578125, 4.76513671875, 5.478515625, 6.19189453125, 6.9052734375, 7.61865234375, 8.33203125, 9.04541015625, 9.7587890625, 10.47216796875, 11.185546875, 11.89892578125, 12.6123046875, 13.32568359375, 14.0390625, 14.75244140625, 15.4658203125, 16.17919921875, 16.892578125, 17.60595703125, 18.3193359375, 19.03271484375, 19.74609375, 20.45947265625, 21.1728515625, 21.88623046875, 22.599609375, 23.31298828125, 24.0263671875, 24.73974609375, 25.453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 5.0, 1.0, 5.0, 6.0, 2.0, 2.0, 7.0, 17.0, 21.0, 21.0, 36.0, 36.0, 58.0, 96.0, 135.0, 182.0, 348.0, 527.0, 702.0, 665.0, 423.0, 233.0, 151.0, 99.0, 75.0, 58.0, 35.0, 20.0, 16.0, 22.0, 18.0, 7.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.26904296875, -16.6474609375, -16.02587890625, -15.404296875, -14.78271484375, -14.1611328125, -13.53955078125, -12.91796875, -12.29638671875, -11.6748046875, -11.05322265625, -10.431640625, -9.81005859375, -9.1884765625, -8.56689453125, -7.9453125, -7.32373046875, -6.7021484375, -6.08056640625, -5.458984375, -4.83740234375, -4.2158203125, -3.59423828125, -2.97265625, -2.35107421875, -1.7294921875, -1.10791015625, -0.486328125, 0.13525390625, 0.7568359375, 1.37841796875, 2.0, 2.62158203125, 3.2431640625, 3.86474609375, 4.486328125, 5.10791015625, 5.7294921875, 6.35107421875, 6.97265625, 7.59423828125, 8.2158203125, 8.83740234375, 9.458984375, 10.08056640625, 10.7021484375, 11.32373046875, 11.9453125, 12.56689453125, 13.1884765625, 13.81005859375, 14.431640625, 15.05322265625, 15.6748046875, 16.29638671875, 16.91796875, 17.53955078125, 18.1611328125, 18.78271484375, 19.404296875, 20.02587890625, 20.6474609375, 21.26904296875, 21.890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 23.0, 94.0, 194.0, 283.0, 204.0, 115.0, 38.0, 14.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-252.84799194335938, -242.0911865234375, -231.33436584472656, -220.5775604248047, -209.8207550048828, -199.06393432617188, -188.30712890625, -177.55032348632812, -166.79351806640625, -156.03671264648438, -145.27989196777344, -134.52308654785156, -123.76628112792969, -113.00946807861328, -102.25265502929688, -91.495849609375, -80.73902893066406, -69.98221588134766, -59.22541046142578, -48.468597412109375, -37.711788177490234, -26.954978942871094, -16.198165893554688, -5.4413604736328125, 5.315452575683594, 16.072261810302734, 26.829072952270508, 37.58588409423828, 48.34269332885742, 59.09950256347656, 69.85631561279297, 80.61312103271484, 91.36993408203125, 102.12674713134766, 112.88355255126953, 123.64036560058594, 134.3971710205078, 145.15399169921875, 155.91079711914062, 166.6676025390625, 177.42440795898438, 188.18121337890625, 198.9380340576172, 209.69483947753906, 220.45164489746094, 231.20846557617188, 241.96527099609375, 252.72207641601562, 263.4788818359375, 274.2356872558594, 284.99249267578125, 295.74932861328125, 306.5061340332031, 317.262939453125, 328.0197448730469, 338.77655029296875, 349.53338623046875, 360.2901916503906, 371.0469970703125, 381.8038330078125, 392.5606384277344, 403.31744384765625, 414.0742492675781, 424.8310546875, 435.5878601074219]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 10.0, 11.0, 13.0, 19.0, 27.0, 25.0, 28.0, 40.0, 51.0, 48.0, 50.0, 54.0, 60.0, 49.0, 77.0, 69.0, 58.0, 57.0, 48.0, 46.0, 38.0, 27.0, 19.0, 22.0, 21.0, 5.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-183.96829223632812, -179.79054260253906, -175.61279296875, -171.43505859375, -167.25730895996094, -163.07955932617188, -158.90182495117188, -154.7240753173828, -150.54632568359375, -146.3685760498047, -142.19082641601562, -138.01309204101562, -133.83534240722656, -129.6575927734375, -125.47985076904297, -121.30210876464844, -117.12435913085938, -112.94660949707031, -108.76886749267578, -104.59112548828125, -100.41337585449219, -96.23562622070312, -92.0578842163086, -87.88014221191406, -83.702392578125, -79.52464294433594, -75.3469009399414, -71.16915893554688, -66.99140930175781, -62.813663482666016, -58.63591766357422, -54.45817184448242, -50.280418395996094, -46.1026725769043, -41.9249267578125, -37.7471809387207, -33.569435119628906, -29.39168930053711, -25.213943481445312, -21.036197662353516, -16.85845184326172, -12.680706024169922, -8.502960205078125, -4.325214385986328, -0.14746856689453125, 4.030277252197266, 8.208023071289062, 12.38576889038086, 16.563514709472656, 20.741260528564453, 24.91900634765625, 29.096752166748047, 33.274497985839844, 37.45224380493164, 41.62998962402344, 45.807735443115234, 49.98548126220703, 54.16322708129883, 58.340972900390625, 62.51871871948242, 66.69646453857422, 70.87420654296875, 75.05195617675781, 79.22970581054688, 83.4074478149414]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 6.0, 14.0, 21.0, 34.0, 62.0, 89.0, 169.0, 248.0, 556.0, 1089.0, 2222.0, 4903.0, 12564.0, 32640.0, 89590.0, 244226.0, 395620.0, 165106.0, 61360.0, 22469.0, 8639.0, 3501.0, 1642.0, 759.0, 408.0, 268.0, 128.0, 75.0, 46.0, 26.0, 21.0, 16.0, 1.0, 10.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.78125, -20.23876953125, -19.6962890625, -19.15380859375, -18.611328125, -18.06884765625, -17.5263671875, -16.98388671875, -16.44140625, -15.89892578125, -15.3564453125, -14.81396484375, -14.271484375, -13.72900390625, -13.1865234375, -12.64404296875, -12.1015625, -11.55908203125, -11.0166015625, -10.47412109375, -9.931640625, -9.38916015625, -8.8466796875, -8.30419921875, -7.76171875, -7.21923828125, -6.6767578125, -6.13427734375, -5.591796875, -5.04931640625, -4.5068359375, -3.96435546875, -3.421875, -2.87939453125, -2.3369140625, -1.79443359375, -1.251953125, -0.70947265625, -0.1669921875, 0.37548828125, 0.91796875, 1.46044921875, 2.0029296875, 2.54541015625, 3.087890625, 3.63037109375, 4.1728515625, 4.71533203125, 5.2578125, 5.80029296875, 6.3427734375, 6.88525390625, 7.427734375, 7.97021484375, 8.5126953125, 9.05517578125, 9.59765625, 10.14013671875, 10.6826171875, 11.22509765625, 11.767578125, 12.31005859375, 12.8525390625, 13.39501953125, 13.9375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 16.0, 18.0, 21.0, 17.0, 39.0, 44.0, 47.0, 45.0, 55.0, 62.0, 65.0, 50.0, 64.0, 53.0, 62.0, 57.0, 49.0, 26.0, 32.0, 36.0, 27.0, 20.0, 18.0, 12.0, 11.0, 12.0, 8.0, 8.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.08935546875, -8.7880859375, -8.48681640625, -8.185546875, -7.88427734375, -7.5830078125, -7.28173828125, -6.98046875, -6.67919921875, -6.3779296875, -6.07666015625, -5.775390625, -5.47412109375, -5.1728515625, -4.87158203125, -4.5703125, -4.26904296875, -3.9677734375, -3.66650390625, -3.365234375, -3.06396484375, -2.7626953125, -2.46142578125, -2.16015625, -1.85888671875, -1.5576171875, -1.25634765625, -0.955078125, -0.65380859375, -0.3525390625, -0.05126953125, 0.25, 0.55126953125, 0.8525390625, 1.15380859375, 1.455078125, 1.75634765625, 2.0576171875, 2.35888671875, 2.66015625, 2.96142578125, 3.2626953125, 3.56396484375, 3.865234375, 4.16650390625, 4.4677734375, 4.76904296875, 5.0703125, 5.37158203125, 5.6728515625, 5.97412109375, 6.275390625, 6.57666015625, 6.8779296875, 7.17919921875, 7.48046875, 7.78173828125, 8.0830078125, 8.38427734375, 8.685546875, 8.98681640625, 9.2880859375, 9.58935546875, 9.890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 9.0, 8.0, 8.0, 15.0, 28.0, 31.0, 42.0, 66.0, 104.0, 132.0, 182.0, 264.0, 369.0, 534.0, 896.0, 1516.0, 2994.0, 7796.0, 33010.0, 230458.0, 664242.0, 81063.0, 14843.0, 4437.0, 2131.0, 1145.0, 699.0, 442.0, 326.0, 211.0, 158.0, 111.0, 73.0, 62.0, 45.0, 27.0, 14.0, 22.0, 11.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.875, -26.953369140625, -26.03173828125, -25.110107421875, -24.1884765625, -23.266845703125, -22.34521484375, -21.423583984375, -20.501953125, -19.580322265625, -18.65869140625, -17.737060546875, -16.8154296875, -15.893798828125, -14.97216796875, -14.050537109375, -13.12890625, -12.207275390625, -11.28564453125, -10.364013671875, -9.4423828125, -8.520751953125, -7.59912109375, -6.677490234375, -5.755859375, -4.834228515625, -3.91259765625, -2.990966796875, -2.0693359375, -1.147705078125, -0.22607421875, 0.695556640625, 1.6171875, 2.538818359375, 3.46044921875, 4.382080078125, 5.3037109375, 6.225341796875, 7.14697265625, 8.068603515625, 8.990234375, 9.911865234375, 10.83349609375, 11.755126953125, 12.6767578125, 13.598388671875, 14.52001953125, 15.441650390625, 16.36328125, 17.284912109375, 18.20654296875, 19.128173828125, 20.0498046875, 20.971435546875, 21.89306640625, 22.814697265625, 23.736328125, 24.657958984375, 25.57958984375, 26.501220703125, 27.4228515625, 28.344482421875, 29.26611328125, 30.187744140625, 31.109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 4.0, 4.0, 3.0, 7.0, 3.0, 3.0, 10.0, 6.0, 9.0, 10.0, 10.0, 16.0, 13.0, 33.0, 22.0, 27.0, 37.0, 36.0, 52.0, 37.0, 29.0, 34.0, 45.0, 48.0, 49.0, 38.0, 33.0, 41.0, 41.0, 47.0, 35.0, 32.0, 25.0, 26.0, 29.0, 17.0, 11.0, 13.0, 9.0, 13.0, 4.0, 6.0, 4.0, 5.0, 6.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-31.03125, -30.093017578125, -29.15478515625, -28.216552734375, -27.2783203125, -26.340087890625, -25.40185546875, -24.463623046875, -23.525390625, -22.587158203125, -21.64892578125, -20.710693359375, -19.7724609375, -18.834228515625, -17.89599609375, -16.957763671875, -16.01953125, -15.081298828125, -14.14306640625, -13.204833984375, -12.2666015625, -11.328369140625, -10.39013671875, -9.451904296875, -8.513671875, -7.575439453125, -6.63720703125, -5.698974609375, -4.7607421875, -3.822509765625, -2.88427734375, -1.946044921875, -1.0078125, -0.069580078125, 0.86865234375, 1.806884765625, 2.7451171875, 3.683349609375, 4.62158203125, 5.559814453125, 6.498046875, 7.436279296875, 8.37451171875, 9.312744140625, 10.2509765625, 11.189208984375, 12.12744140625, 13.065673828125, 14.00390625, 14.942138671875, 15.88037109375, 16.818603515625, 17.7568359375, 18.695068359375, 19.63330078125, 20.571533203125, 21.509765625, 22.447998046875, 23.38623046875, 24.324462890625, 25.2626953125, 26.200927734375, 27.13916015625, 28.077392578125, 29.015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 13.0, 17.0, 30.0, 30.0, 59.0, 112.0, 156.0, 322.0, 775.0, 2376.0, 12090.0, 121322.0, 790463.0, 106349.0, 10760.0, 2159.0, 750.0, 320.0, 144.0, 109.0, 50.0, 35.0, 24.0, 19.0, 9.0, 13.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.381103515625, -10.05126953125, -9.721435546875, -9.3916015625, -9.061767578125, -8.73193359375, -8.402099609375, -8.072265625, -7.742431640625, -7.41259765625, -7.082763671875, -6.7529296875, -6.423095703125, -6.09326171875, -5.763427734375, -5.43359375, -5.103759765625, -4.77392578125, -4.444091796875, -4.1142578125, -3.784423828125, -3.45458984375, -3.124755859375, -2.794921875, -2.465087890625, -2.13525390625, -1.805419921875, -1.4755859375, -1.145751953125, -0.81591796875, -0.486083984375, -0.15625, 0.173583984375, 0.50341796875, 0.833251953125, 1.1630859375, 1.492919921875, 1.82275390625, 2.152587890625, 2.482421875, 2.812255859375, 3.14208984375, 3.471923828125, 3.8017578125, 4.131591796875, 4.46142578125, 4.791259765625, 5.12109375, 5.450927734375, 5.78076171875, 6.110595703125, 6.4404296875, 6.770263671875, 7.10009765625, 7.429931640625, 7.759765625, 8.089599609375, 8.41943359375, 8.749267578125, 9.0791015625, 9.408935546875, 9.73876953125, 10.068603515625, 10.3984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 5.0, 14.0, 17.0, 15.0, 22.0, 21.0, 31.0, 41.0, 55.0, 78.0, 79.0, 98.0, 106.0, 70.0, 56.0, 63.0, 39.0, 25.0, 26.0, 20.0, 21.0, 14.0, 9.0, 7.0, 8.0, 4.0, 3.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001720428466796875, -0.0016647577285766602, -0.0016090869903564453, -0.0015534162521362305, -0.0014977455139160156, -0.0014420747756958008, -0.001386404037475586, -0.001330733299255371, -0.0012750625610351562, -0.0012193918228149414, -0.0011637210845947266, -0.0011080503463745117, -0.0010523796081542969, -0.000996708869934082, -0.0009410381317138672, -0.0008853673934936523, -0.0008296966552734375, -0.0007740259170532227, -0.0007183551788330078, -0.000662684440612793, -0.0006070137023925781, -0.0005513429641723633, -0.0004956722259521484, -0.0004400014877319336, -0.00038433074951171875, -0.0003286600112915039, -0.00027298927307128906, -0.00021731853485107422, -0.00016164779663085938, -0.00010597705841064453, -5.030632019042969e-05, 5.364418029785156e-06, 6.103515625e-05, 0.00011670589447021484, 0.0001723766326904297, 0.00022804737091064453, 0.0002837181091308594, 0.0003393888473510742, 0.00039505958557128906, 0.0004507303237915039, 0.0005064010620117188, 0.0005620718002319336, 0.0006177425384521484, 0.0006734132766723633, 0.0007290840148925781, 0.000784754753112793, 0.0008404254913330078, 0.0008960962295532227, 0.0009517669677734375, 0.0010074377059936523, 0.0010631084442138672, 0.001118779182434082, 0.0011744499206542969, 0.0012301206588745117, 0.0012857913970947266, 0.0013414621353149414, 0.0013971328735351562, 0.001452803611755371, 0.001508474349975586, 0.0015641450881958008, 0.0016198158264160156, 0.0016754865646362305, 0.0017311573028564453, 0.0017868280410766602, 0.001842498779296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 17.0, 23.0, 25.0, 41.0, 63.0, 90.0, 142.0, 198.0, 353.0, 610.0, 1243.0, 2783.0, 7989.0, 34742.0, 270588.0, 639759.0, 69381.0, 12740.0, 4042.0, 1727.0, 800.0, 459.0, 254.0, 162.0, 95.0, 72.0, 43.0, 34.0, 18.0, 16.0, 8.0, 2.0, 4.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.9185791015625, -6.673095703125, -6.4276123046875, -6.18212890625, -5.9366455078125, -5.691162109375, -5.4456787109375, -5.2001953125, -4.9547119140625, -4.709228515625, -4.4637451171875, -4.21826171875, -3.9727783203125, -3.727294921875, -3.4818115234375, -3.236328125, -2.9908447265625, -2.745361328125, -2.4998779296875, -2.25439453125, -2.0089111328125, -1.763427734375, -1.5179443359375, -1.2724609375, -1.0269775390625, -0.781494140625, -0.5360107421875, -0.29052734375, -0.0450439453125, 0.200439453125, 0.4459228515625, 0.69140625, 0.9368896484375, 1.182373046875, 1.4278564453125, 1.67333984375, 1.9188232421875, 2.164306640625, 2.4097900390625, 2.6552734375, 2.9007568359375, 3.146240234375, 3.3917236328125, 3.63720703125, 3.8826904296875, 4.128173828125, 4.3736572265625, 4.619140625, 4.8646240234375, 5.110107421875, 5.3555908203125, 5.60107421875, 5.8465576171875, 6.092041015625, 6.3375244140625, 6.5830078125, 6.8284912109375, 7.073974609375, 7.3194580078125, 7.56494140625, 7.8104248046875, 8.055908203125, 8.3013916015625, 8.546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 11.0, 13.0, 12.0, 21.0, 19.0, 26.0, 25.0, 26.0, 29.0, 38.0, 33.0, 46.0, 30.0, 62.0, 41.0, 56.0, 50.0, 55.0, 59.0, 41.0, 40.0, 38.0, 29.0, 23.0, 24.0, 23.0, 16.0, 16.0, 17.0, 6.0, 6.0, 8.0, 6.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.61328125, -4.470703125, -4.328125, -4.185546875, -4.04296875, -3.900390625, -3.7578125, -3.615234375, -3.47265625, -3.330078125, -3.1875, -3.044921875, -2.90234375, -2.759765625, -2.6171875, -2.474609375, -2.33203125, -2.189453125, -2.046875, -1.904296875, -1.76171875, -1.619140625, -1.4765625, -1.333984375, -1.19140625, -1.048828125, -0.90625, -0.763671875, -0.62109375, -0.478515625, -0.3359375, -0.193359375, -0.05078125, 0.091796875, 0.234375, 0.376953125, 0.51953125, 0.662109375, 0.8046875, 0.947265625, 1.08984375, 1.232421875, 1.375, 1.517578125, 1.66015625, 1.802734375, 1.9453125, 2.087890625, 2.23046875, 2.373046875, 2.515625, 2.658203125, 2.80078125, 2.943359375, 3.0859375, 3.228515625, 3.37109375, 3.513671875, 3.65625, 3.798828125, 3.94140625, 4.083984375, 4.2265625, 4.369140625, 4.51171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 14.0, 11.0, 27.0, 53.0, 88.0, 156.0, 233.0, 142.0, 115.0, 77.0, 27.0, 19.0, 14.0, 8.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-147.45614624023438, -141.1963653564453, -134.9365997314453, -128.67681884765625, -122.41703796386719, -116.15726470947266, -109.89749145507812, -103.63771057128906, -97.3779296875, -91.11815643310547, -84.8583755493164, -78.59860229492188, -72.33882141113281, -66.07904815673828, -59.819271087646484, -53.55949401855469, -47.299720764160156, -41.03994369506836, -34.78016662597656, -28.5203914642334, -22.2606143951416, -16.000837326049805, -9.74106216430664, -3.4812850952148438, 2.778491973876953, 9.03826904296875, 15.29804515838623, 21.55782127380371, 27.817598342895508, 34.07737731933594, 40.33715057373047, 46.596927642822266, 52.85670471191406, 59.11648178100586, 65.37625885009766, 71.63603210449219, 77.89581298828125, 84.15558624267578, 90.41535949707031, 96.67514038085938, 102.93492126464844, 109.19469451904297, 115.45447540283203, 121.71424865722656, 127.97402954101562, 134.2338104248047, 140.4935760498047, 146.75335693359375, 153.01312255859375, 159.2729034423828, 165.5326690673828, 171.79244995117188, 178.05223083496094, 184.31201171875, 190.57177734375, 196.83155822753906, 203.09133911132812, 209.3511199951172, 215.6108856201172, 221.87066650390625, 228.1304473876953, 234.39022827148438, 240.64999389648438, 246.90977478027344, 253.1695556640625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 1.0, 11.0, 7.0, 12.0, 8.0, 9.0, 10.0, 9.0, 19.0, 16.0, 23.0, 21.0, 27.0, 37.0, 32.0, 25.0, 45.0, 56.0, 58.0, 74.0, 70.0, 55.0, 40.0, 32.0, 33.0, 26.0, 33.0, 27.0, 23.0, 15.0, 28.0, 25.0, 19.0, 13.0, 10.0, 14.0, 5.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-132.94903564453125, -129.16490173339844, -125.38077545166016, -121.59664154052734, -117.81251525878906, -114.02838134765625, -110.24424743652344, -106.46012115478516, -102.67599487304688, -98.89186096191406, -95.10773468017578, -91.32360076904297, -87.53947448730469, -83.75534057617188, -79.97120666503906, -76.18708038330078, -72.40294647216797, -68.61881256103516, -64.83468627929688, -61.05055236816406, -57.26642608642578, -53.48229217529297, -49.69816207885742, -45.914031982421875, -42.12990188598633, -38.34577178955078, -34.561641693115234, -30.777509689331055, -26.993379592895508, -23.20924949645996, -19.42511749267578, -15.640987396240234, -11.856857299804688, -8.07272720336914, -4.288596153259277, -0.5044651031494141, 3.279664993286133, 7.06379508972168, 10.84792709350586, 14.632057189941406, 18.416187286376953, 22.2003173828125, 25.984447479248047, 29.768579483032227, 33.552711486816406, 37.33683776855469, 41.1209716796875, 44.90510177612305, 48.689231872558594, 52.47336196899414, 56.25749206542969, 60.0416259765625, 63.82575225830078, 67.6098861694336, 71.39401245117188, 75.17814636230469, 78.9622802734375, 82.74641418457031, 86.5305404663086, 90.3146743774414, 94.09880065917969, 97.8829345703125, 101.66706848144531, 105.4511947631836, 109.23532104492188]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 16.0, 12.0, 22.0, 37.0, 71.0, 101.0, 177.0, 292.0, 519.0, 928.0, 1994.0, 4198.0, 9782.0, 26380.0, 93560.0, 582416.0, 2577436.0, 739325.0, 108526.0, 28618.0, 10530.0, 4649.0, 2160.0, 1061.0, 608.0, 323.0, 188.0, 119.0, 70.0, 51.0, 32.0, 19.0, 19.0, 8.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-12.1640625, -11.831298828125, -11.49853515625, -11.165771484375, -10.8330078125, -10.500244140625, -10.16748046875, -9.834716796875, -9.501953125, -9.169189453125, -8.83642578125, -8.503662109375, -8.1708984375, -7.838134765625, -7.50537109375, -7.172607421875, -6.83984375, -6.507080078125, -6.17431640625, -5.841552734375, -5.5087890625, -5.176025390625, -4.84326171875, -4.510498046875, -4.177734375, -3.844970703125, -3.51220703125, -3.179443359375, -2.8466796875, -2.513916015625, -2.18115234375, -1.848388671875, -1.515625, -1.182861328125, -0.85009765625, -0.517333984375, -0.1845703125, 0.148193359375, 0.48095703125, 0.813720703125, 1.146484375, 1.479248046875, 1.81201171875, 2.144775390625, 2.4775390625, 2.810302734375, 3.14306640625, 3.475830078125, 3.80859375, 4.141357421875, 4.47412109375, 4.806884765625, 5.1396484375, 5.472412109375, 5.80517578125, 6.137939453125, 6.470703125, 6.803466796875, 7.13623046875, 7.468994140625, 7.8017578125, 8.134521484375, 8.46728515625, 8.800048828125, 9.1328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 2.0, 5.0, 10.0, 19.0, 26.0, 20.0, 14.0, 24.0, 33.0, 34.0, 34.0, 47.0, 50.0, 52.0, 65.0, 66.0, 49.0, 54.0, 55.0, 50.0, 43.0, 37.0, 39.0, 29.0, 29.0, 20.0, 22.0, 20.0, 15.0, 9.0, 4.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.9320068359375, -8.653076171875, -8.3741455078125, -8.09521484375, -7.8162841796875, -7.537353515625, -7.2584228515625, -6.9794921875, -6.7005615234375, -6.421630859375, -6.1427001953125, -5.86376953125, -5.5848388671875, -5.305908203125, -5.0269775390625, -4.748046875, -4.4691162109375, -4.190185546875, -3.9112548828125, -3.63232421875, -3.3533935546875, -3.074462890625, -2.7955322265625, -2.5166015625, -2.2376708984375, -1.958740234375, -1.6798095703125, -1.40087890625, -1.1219482421875, -0.843017578125, -0.5640869140625, -0.28515625, -0.0062255859375, 0.272705078125, 0.5516357421875, 0.83056640625, 1.1094970703125, 1.388427734375, 1.6673583984375, 1.9462890625, 2.2252197265625, 2.504150390625, 2.7830810546875, 3.06201171875, 3.3409423828125, 3.619873046875, 3.8988037109375, 4.177734375, 4.4566650390625, 4.735595703125, 5.0145263671875, 5.29345703125, 5.5723876953125, 5.851318359375, 6.1302490234375, 6.4091796875, 6.6881103515625, 6.967041015625, 7.2459716796875, 7.52490234375, 7.8038330078125, 8.082763671875, 8.3616943359375, 8.640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 10.0, 20.0, 32.0, 50.0, 71.0, 95.0, 158.0, 282.0, 524.0, 1056.0, 2448.0, 6224.0, 18085.0, 66453.0, 486761.0, 3161403.0, 363379.0, 59230.0, 16937.0, 6051.0, 2479.0, 1139.0, 569.0, 322.0, 176.0, 108.0, 75.0, 41.0, 21.0, 19.0, 10.0, 8.0, 3.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-18.671875, -18.1732177734375, -17.674560546875, -17.1759033203125, -16.67724609375, -16.1785888671875, -15.679931640625, -15.1812744140625, -14.6826171875, -14.1839599609375, -13.685302734375, -13.1866455078125, -12.68798828125, -12.1893310546875, -11.690673828125, -11.1920166015625, -10.693359375, -10.1947021484375, -9.696044921875, -9.1973876953125, -8.69873046875, -8.2000732421875, -7.701416015625, -7.2027587890625, -6.7041015625, -6.2054443359375, -5.706787109375, -5.2081298828125, -4.70947265625, -4.2108154296875, -3.712158203125, -3.2135009765625, -2.71484375, -2.2161865234375, -1.717529296875, -1.2188720703125, -0.72021484375, -0.2215576171875, 0.277099609375, 0.7757568359375, 1.2744140625, 1.7730712890625, 2.271728515625, 2.7703857421875, 3.26904296875, 3.7677001953125, 4.266357421875, 4.7650146484375, 5.263671875, 5.7623291015625, 6.260986328125, 6.7596435546875, 7.25830078125, 7.7569580078125, 8.255615234375, 8.7542724609375, 9.2529296875, 9.7515869140625, 10.250244140625, 10.7489013671875, 11.24755859375, 11.7462158203125, 12.244873046875, 12.7435302734375, 13.2421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 5.0, 15.0, 12.0, 12.0, 14.0, 29.0, 42.0, 52.0, 87.0, 156.0, 230.0, 474.0, 662.0, 785.0, 573.0, 330.0, 173.0, 94.0, 86.0, 63.0, 52.0, 29.0, 15.0, 21.0, 10.0, 9.0, 6.0, 4.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.953125, -20.359375, -19.765625, -19.171875, -18.578125, -17.984375, -17.390625, -16.796875, -16.203125, -15.609375, -15.015625, -14.421875, -13.828125, -13.234375, -12.640625, -12.046875, -11.453125, -10.859375, -10.265625, -9.671875, -9.078125, -8.484375, -7.890625, -7.296875, -6.703125, -6.109375, -5.515625, -4.921875, -4.328125, -3.734375, -3.140625, -2.546875, -1.953125, -1.359375, -0.765625, -0.171875, 0.421875, 1.015625, 1.609375, 2.203125, 2.796875, 3.390625, 3.984375, 4.578125, 5.171875, 5.765625, 6.359375, 6.953125, 7.546875, 8.140625, 8.734375, 9.328125, 9.921875, 10.515625, 11.109375, 11.703125, 12.296875, 12.890625, 13.484375, 14.078125, 14.671875, 15.265625, 15.859375, 16.453125, 17.046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 13.0, 45.0, 152.0, 305.0, 274.0, 120.0, 50.0, 16.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-346.2875671386719, -336.6203918457031, -326.9532165527344, -317.2860412597656, -307.6188659667969, -297.9516906738281, -288.2845153808594, -278.6173400878906, -268.9501647949219, -259.2829895019531, -249.61581420898438, -239.94863891601562, -230.28146362304688, -220.61428833007812, -210.94711303710938, -201.27993774414062, -191.61277770996094, -181.9456024169922, -172.27842712402344, -162.6112518310547, -152.94407653808594, -143.2769012451172, -133.6097412109375, -123.94255828857422, -114.27538299560547, -104.60820770263672, -94.94103240966797, -85.27386474609375, -75.606689453125, -65.93951416015625, -56.2723388671875, -46.60516357421875, -36.93798828125, -27.27081298828125, -17.603639602661133, -7.936466217041016, 1.7307090759277344, 11.397884368896484, 21.06505584716797, 30.73223114013672, 40.39940643310547, 50.06658172607422, 59.73375701904297, 69.40092468261719, 79.06809997558594, 88.73527526855469, 98.40245056152344, 108.06962585449219, 117.73680114746094, 127.40397644042969, 137.07115173339844, 146.7383270263672, 156.40550231933594, 166.0726776123047, 175.73983764648438, 185.40701293945312, 195.07418823242188, 204.74136352539062, 214.40853881835938, 224.07571411132812, 233.74288940429688, 243.41006469726562, 253.07723999023438, 262.7444152832031, 272.4115905761719]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 2.0, 8.0, 3.0, 7.0, 9.0, 7.0, 10.0, 17.0, 19.0, 26.0, 23.0, 29.0, 30.0, 33.0, 42.0, 40.0, 36.0, 48.0, 48.0, 65.0, 47.0, 50.0, 52.0, 48.0, 52.0, 41.0, 32.0, 34.0, 25.0, 15.0, 23.0, 20.0, 12.0, 15.0, 11.0, 9.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.00346374511719, -78.33860778808594, -75.67374420166016, -73.0088882446289, -70.34402465820312, -67.67916870117188, -65.0143051147461, -62.349449157714844, -59.68458938598633, -57.01972961425781, -54.3548698425293, -51.69001007080078, -49.02515411376953, -46.36029052734375, -43.6954345703125, -41.030574798583984, -38.36571502685547, -35.70085525512695, -33.03599548339844, -30.371137619018555, -27.70627784729004, -25.041418075561523, -22.37656021118164, -19.711700439453125, -17.04684066772461, -14.381980895996094, -11.717122077941895, -9.052263259887695, -6.38740348815918, -3.722543716430664, -1.0576848983764648, 1.6071739196777344, 4.27203369140625, 6.936892986297607, 9.601752281188965, 12.266611099243164, 14.93147087097168, 17.596330642700195, 20.261188507080078, 22.926048278808594, 25.59090805053711, 28.255767822265625, 30.92062759399414, 33.585487365722656, 36.250343322753906, 38.91520690917969, 41.58006286621094, 44.24492263793945, 46.90978240966797, 49.574642181396484, 52.239501953125, 54.904361724853516, 57.56922149658203, 60.23407745361328, 62.8989372253418, 65.56379699707031, 68.22865295410156, 70.89350891113281, 73.5583724975586, 76.22322845458984, 78.88809204101562, 81.55294799804688, 84.21781158447266, 86.8826675415039, 89.54753112792969]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 12.0, 18.0, 35.0, 43.0, 80.0, 82.0, 157.0, 227.0, 341.0, 614.0, 977.0, 1667.0, 2882.0, 5210.0, 9757.0, 18537.0, 37535.0, 79118.0, 190094.0, 346687.0, 194200.0, 80409.0, 38135.0, 19251.0, 10119.0, 5294.0, 2878.0, 1635.0, 954.0, 591.0, 358.0, 225.0, 133.0, 83.0, 73.0, 33.0, 31.0, 25.0, 13.0, 9.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.53125, -11.1533203125, -10.775390625, -10.3974609375, -10.01953125, -9.6416015625, -9.263671875, -8.8857421875, -8.5078125, -8.1298828125, -7.751953125, -7.3740234375, -6.99609375, -6.6181640625, -6.240234375, -5.8623046875, -5.484375, -5.1064453125, -4.728515625, -4.3505859375, -3.97265625, -3.5947265625, -3.216796875, -2.8388671875, -2.4609375, -2.0830078125, -1.705078125, -1.3271484375, -0.94921875, -0.5712890625, -0.193359375, 0.1845703125, 0.5625, 0.9404296875, 1.318359375, 1.6962890625, 2.07421875, 2.4521484375, 2.830078125, 3.2080078125, 3.5859375, 3.9638671875, 4.341796875, 4.7197265625, 5.09765625, 5.4755859375, 5.853515625, 6.2314453125, 6.609375, 6.9873046875, 7.365234375, 7.7431640625, 8.12109375, 8.4990234375, 8.876953125, 9.2548828125, 9.6328125, 10.0107421875, 10.388671875, 10.7666015625, 11.14453125, 11.5224609375, 11.900390625, 12.2783203125, 12.65625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 15.0, 16.0, 11.0, 18.0, 15.0, 23.0, 22.0, 33.0, 35.0, 40.0, 57.0, 55.0, 58.0, 47.0, 57.0, 60.0, 62.0, 49.0, 47.0, 31.0, 35.0, 38.0, 28.0, 23.0, 26.0, 21.0, 15.0, 15.0, 6.0, 8.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.8294677734375, -8.549560546875, -8.2696533203125, -7.98974609375, -7.7098388671875, -7.429931640625, -7.1500244140625, -6.8701171875, -6.5902099609375, -6.310302734375, -6.0303955078125, -5.75048828125, -5.4705810546875, -5.190673828125, -4.9107666015625, -4.630859375, -4.3509521484375, -4.071044921875, -3.7911376953125, -3.51123046875, -3.2313232421875, -2.951416015625, -2.6715087890625, -2.3916015625, -2.1116943359375, -1.831787109375, -1.5518798828125, -1.27197265625, -0.9920654296875, -0.712158203125, -0.4322509765625, -0.15234375, 0.1275634765625, 0.407470703125, 0.6873779296875, 0.96728515625, 1.2471923828125, 1.527099609375, 1.8070068359375, 2.0869140625, 2.3668212890625, 2.646728515625, 2.9266357421875, 3.20654296875, 3.4864501953125, 3.766357421875, 4.0462646484375, 4.326171875, 4.6060791015625, 4.885986328125, 5.1658935546875, 5.44580078125, 5.7257080078125, 6.005615234375, 6.2855224609375, 6.5654296875, 6.8453369140625, 7.125244140625, 7.4051513671875, 7.68505859375, 7.9649658203125, 8.244873046875, 8.5247802734375, 8.8046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 10.0, 18.0, 29.0, 37.0, 57.0, 100.0, 142.0, 228.0, 327.0, 561.0, 967.0, 1808.0, 4855.0, 21483.0, 202383.0, 742483.0, 57788.0, 9215.0, 2822.0, 1257.0, 737.0, 434.0, 272.0, 169.0, 113.0, 87.0, 56.0, 25.0, 32.0, 13.0, 14.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.875, -36.76904296875, -35.6630859375, -34.55712890625, -33.451171875, -32.34521484375, -31.2392578125, -30.13330078125, -29.02734375, -27.92138671875, -26.8154296875, -25.70947265625, -24.603515625, -23.49755859375, -22.3916015625, -21.28564453125, -20.1796875, -19.07373046875, -17.9677734375, -16.86181640625, -15.755859375, -14.64990234375, -13.5439453125, -12.43798828125, -11.33203125, -10.22607421875, -9.1201171875, -8.01416015625, -6.908203125, -5.80224609375, -4.6962890625, -3.59033203125, -2.484375, -1.37841796875, -0.2724609375, 0.83349609375, 1.939453125, 3.04541015625, 4.1513671875, 5.25732421875, 6.36328125, 7.46923828125, 8.5751953125, 9.68115234375, 10.787109375, 11.89306640625, 12.9990234375, 14.10498046875, 15.2109375, 16.31689453125, 17.4228515625, 18.52880859375, 19.634765625, 20.74072265625, 21.8466796875, 22.95263671875, 24.05859375, 25.16455078125, 26.2705078125, 27.37646484375, 28.482421875, 29.58837890625, 30.6943359375, 31.80029296875, 32.90625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 11.0, 13.0, 7.0, 19.0, 14.0, 21.0, 32.0, 37.0, 30.0, 29.0, 41.0, 45.0, 56.0, 62.0, 58.0, 49.0, 61.0, 45.0, 43.0, 30.0, 42.0, 32.0, 28.0, 33.0, 27.0, 16.0, 19.0, 18.0, 16.0, 4.0, 13.0, 13.0, 4.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.03125, -34.014404296875, -32.99755859375, -31.980712890625, -30.9638671875, -29.947021484375, -28.93017578125, -27.913330078125, -26.896484375, -25.879638671875, -24.86279296875, -23.845947265625, -22.8291015625, -21.812255859375, -20.79541015625, -19.778564453125, -18.76171875, -17.744873046875, -16.72802734375, -15.711181640625, -14.6943359375, -13.677490234375, -12.66064453125, -11.643798828125, -10.626953125, -9.610107421875, -8.59326171875, -7.576416015625, -6.5595703125, -5.542724609375, -4.52587890625, -3.509033203125, -2.4921875, -1.475341796875, -0.45849609375, 0.558349609375, 1.5751953125, 2.592041015625, 3.60888671875, 4.625732421875, 5.642578125, 6.659423828125, 7.67626953125, 8.693115234375, 9.7099609375, 10.726806640625, 11.74365234375, 12.760498046875, 13.77734375, 14.794189453125, 15.81103515625, 16.827880859375, 17.8447265625, 18.861572265625, 19.87841796875, 20.895263671875, 21.912109375, 22.928955078125, 23.94580078125, 24.962646484375, 25.9794921875, 26.996337890625, 28.01318359375, 29.030029296875, 30.046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 9.0, 17.0, 17.0, 23.0, 43.0, 54.0, 117.0, 217.0, 545.0, 1699.0, 8102.0, 76002.0, 835122.0, 112766.0, 10532.0, 2098.0, 631.0, 236.0, 127.0, 54.0, 49.0, 24.0, 24.0, 10.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.614990234375, -10.22998046875, -9.844970703125, -9.4599609375, -9.074951171875, -8.68994140625, -8.304931640625, -7.919921875, -7.534912109375, -7.14990234375, -6.764892578125, -6.3798828125, -5.994873046875, -5.60986328125, -5.224853515625, -4.83984375, -4.454833984375, -4.06982421875, -3.684814453125, -3.2998046875, -2.914794921875, -2.52978515625, -2.144775390625, -1.759765625, -1.374755859375, -0.98974609375, -0.604736328125, -0.2197265625, 0.165283203125, 0.55029296875, 0.935302734375, 1.3203125, 1.705322265625, 2.09033203125, 2.475341796875, 2.8603515625, 3.245361328125, 3.63037109375, 4.015380859375, 4.400390625, 4.785400390625, 5.17041015625, 5.555419921875, 5.9404296875, 6.325439453125, 6.71044921875, 7.095458984375, 7.48046875, 7.865478515625, 8.25048828125, 8.635498046875, 9.0205078125, 9.405517578125, 9.79052734375, 10.175537109375, 10.560546875, 10.945556640625, 11.33056640625, 11.715576171875, 12.1005859375, 12.485595703125, 12.87060546875, 13.255615234375, 13.640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 8.0, 10.0, 6.0, 10.0, 11.0, 24.0, 29.0, 36.0, 50.0, 63.0, 96.0, 127.0, 151.0, 105.0, 81.0, 49.0, 27.0, 26.0, 11.0, 15.0, 12.0, 8.0, 5.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020961761474609375, -0.0020237863063812256, -0.0019513964653015137, -0.0018790066242218018, -0.0018066167831420898, -0.001734226942062378, -0.001661837100982666, -0.001589447259902954, -0.0015170574188232422, -0.0014446675777435303, -0.0013722777366638184, -0.0012998878955841064, -0.0012274980545043945, -0.0011551082134246826, -0.0010827183723449707, -0.0010103285312652588, -0.0009379386901855469, -0.000865548849105835, -0.000793159008026123, -0.0007207691669464111, -0.0006483793258666992, -0.0005759894847869873, -0.0005035996437072754, -0.0004312098026275635, -0.00035881996154785156, -0.00028643012046813965, -0.00021404027938842773, -0.00014165043830871582, -6.92605972290039e-05, 3.129243850708008e-06, 7.551908493041992e-05, 0.00014790892601013184, 0.00022029876708984375, 0.00029268860816955566, 0.0003650784492492676, 0.0004374682903289795, 0.0005098581314086914, 0.0005822479724884033, 0.0006546378135681152, 0.0007270276546478271, 0.0007994174957275391, 0.000871807336807251, 0.0009441971778869629, 0.0010165870189666748, 0.0010889768600463867, 0.0011613667011260986, 0.0012337565422058105, 0.0013061463832855225, 0.0013785362243652344, 0.0014509260654449463, 0.0015233159065246582, 0.0015957057476043701, 0.001668095588684082, 0.001740485429763794, 0.0018128752708435059, 0.0018852651119232178, 0.0019576549530029297, 0.0020300447940826416, 0.0021024346351623535, 0.0021748244762420654, 0.0022472143173217773, 0.0023196041584014893, 0.002391993999481201, 0.002464383840560913, 0.002536773681640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 0.0, 9.0, 14.0, 27.0, 18.0, 47.0, 67.0, 136.0, 230.0, 446.0, 1161.0, 3077.0, 12616.0, 118930.0, 818246.0, 79287.0, 9830.0, 2593.0, 949.0, 425.0, 197.0, 93.0, 68.0, 32.0, 20.0, 16.0, 5.0, 9.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.56640625, -6.24493408203125, -5.9234619140625, -5.60198974609375, -5.280517578125, -4.95904541015625, -4.6375732421875, -4.31610107421875, -3.99462890625, -3.67315673828125, -3.3516845703125, -3.03021240234375, -2.708740234375, -2.38726806640625, -2.0657958984375, -1.74432373046875, -1.4228515625, -1.10137939453125, -0.7799072265625, -0.45843505859375, -0.136962890625, 0.18450927734375, 0.5059814453125, 0.82745361328125, 1.14892578125, 1.47039794921875, 1.7918701171875, 2.11334228515625, 2.434814453125, 2.75628662109375, 3.0777587890625, 3.39923095703125, 3.720703125, 4.04217529296875, 4.3636474609375, 4.68511962890625, 5.006591796875, 5.32806396484375, 5.6495361328125, 5.97100830078125, 6.29248046875, 6.61395263671875, 6.9354248046875, 7.25689697265625, 7.578369140625, 7.89984130859375, 8.2213134765625, 8.54278564453125, 8.8642578125, 9.18572998046875, 9.5072021484375, 9.82867431640625, 10.150146484375, 10.47161865234375, 10.7930908203125, 11.11456298828125, 11.43603515625, 11.75750732421875, 12.0789794921875, 12.40045166015625, 12.721923828125, 13.04339599609375, 13.3648681640625, 13.68634033203125, 14.0078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 6.0, 15.0, 13.0, 19.0, 25.0, 26.0, 42.0, 46.0, 32.0, 63.0, 63.0, 90.0, 83.0, 76.0, 71.0, 66.0, 49.0, 43.0, 42.0, 39.0, 20.0, 15.0, 8.0, 11.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.65716552734375, -6.4588623046875, -6.26055908203125, -6.062255859375, -5.86395263671875, -5.6656494140625, -5.46734619140625, -5.26904296875, -5.07073974609375, -4.8724365234375, -4.67413330078125, -4.475830078125, -4.27752685546875, -4.0792236328125, -3.88092041015625, -3.6826171875, -3.48431396484375, -3.2860107421875, -3.08770751953125, -2.889404296875, -2.69110107421875, -2.4927978515625, -2.29449462890625, -2.09619140625, -1.89788818359375, -1.6995849609375, -1.50128173828125, -1.302978515625, -1.10467529296875, -0.9063720703125, -0.70806884765625, -0.509765625, -0.31146240234375, -0.1131591796875, 0.08514404296875, 0.283447265625, 0.48175048828125, 0.6800537109375, 0.87835693359375, 1.07666015625, 1.27496337890625, 1.4732666015625, 1.67156982421875, 1.869873046875, 2.06817626953125, 2.2664794921875, 2.46478271484375, 2.6630859375, 2.86138916015625, 3.0596923828125, 3.25799560546875, 3.456298828125, 3.65460205078125, 3.8529052734375, 4.05120849609375, 4.24951171875, 4.44781494140625, 4.6461181640625, 4.84442138671875, 5.042724609375, 5.24102783203125, 5.4393310546875, 5.63763427734375, 5.8359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 14.0, 25.0, 39.0, 72.0, 129.0, 243.0, 228.0, 109.0, 72.0, 29.0, 9.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-258.89837646484375, -252.25265502929688, -245.60691833496094, -238.96119689941406, -232.31546020507812, -225.66973876953125, -219.02401733398438, -212.37828063964844, -205.7325439453125, -199.08682250976562, -192.4410858154297, -185.7953643798828, -179.14962768554688, -172.50390625, -165.85818481445312, -159.2124481201172, -152.5667266845703, -145.92100524902344, -139.2752685546875, -132.62954711914062, -125.98381042480469, -119.33808898925781, -112.6923599243164, -106.046630859375, -99.4009017944336, -92.75517272949219, -86.10944366455078, -79.46371459960938, -72.8179931640625, -66.17225646972656, -59.52653503417969, -52.88080596923828, -46.23509216308594, -39.58936309814453, -32.943634033203125, -26.297908782958984, -19.652179718017578, -13.006450653076172, -6.360725402832031, 0.285003662109375, 6.930732727050781, 13.576460838317871, 20.22218894958496, 26.867916107177734, 33.51364517211914, 40.15937423706055, 46.80509948730469, 53.450828552246094, 60.0965576171875, 66.7422866821289, 73.38801574707031, 80.03373718261719, 86.67947387695312, 93.3251953125, 99.9709243774414, 106.61665344238281, 113.26238250732422, 119.90811157226562, 126.55384063720703, 133.19956970214844, 139.8452911376953, 146.49102783203125, 153.13674926757812, 159.782470703125, 166.42820739746094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 7.0, 10.0, 8.0, 14.0, 17.0, 11.0, 14.0, 19.0, 13.0, 16.0, 26.0, 38.0, 33.0, 27.0, 36.0, 45.0, 71.0, 78.0, 58.0, 49.0, 62.0, 67.0, 33.0, 23.0, 26.0, 18.0, 29.0, 24.0, 18.0, 15.0, 15.0, 16.0, 11.0, 14.0, 6.0, 6.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-117.03082275390625, -113.3010025024414, -109.5711898803711, -105.84136962890625, -102.11155700683594, -98.3817367553711, -94.65192413330078, -90.92210388183594, -87.19229125976562, -83.46247100830078, -79.73265838623047, -76.00283813476562, -72.27302551269531, -68.54320526123047, -64.81339263916016, -61.08357238769531, -57.353755950927734, -53.623939514160156, -49.89412307739258, -46.164306640625, -42.43449020385742, -38.704673767089844, -34.974853515625, -31.245038986206055, -27.515222549438477, -23.7854061126709, -20.05558967590332, -16.32577133178711, -12.595955848693848, -8.866138458251953, -5.136322021484375, -1.4065055847167969, 2.3233108520507812, 6.053127288818359, 9.782943725585938, 13.512761116027832, 17.242576599121094, 20.972394943237305, 24.702211380004883, 28.43202781677246, 32.161842346191406, 35.891658782958984, 39.62147521972656, 43.35129165649414, 47.08110809326172, 50.81092834472656, 54.540740966796875, 58.27056121826172, 62.0003776550293, 65.73019409179688, 69.46001434326172, 73.18982696533203, 76.91964721679688, 80.64945983886719, 84.37928009033203, 88.10909271240234, 91.83891296386719, 95.56873321533203, 99.29854583740234, 103.02836608886719, 106.7581787109375, 110.48799896240234, 114.21781158447266, 117.9476318359375, 121.67744445800781]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 13.0, 13.0, 17.0, 25.0, 41.0, 52.0, 87.0, 134.0, 209.0, 342.0, 596.0, 838.0, 1606.0, 2914.0, 5839.0, 14725.0, 51398.0, 356489.0, 2506174.0, 1092607.0, 117750.0, 24605.0, 8588.0, 3909.0, 2059.0, 1182.0, 727.0, 427.0, 293.0, 182.0, 138.0, 86.0, 65.0, 37.0, 28.0, 19.0, 6.0, 13.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.3515625, -11.0048828125, -10.658203125, -10.3115234375, -9.96484375, -9.6181640625, -9.271484375, -8.9248046875, -8.578125, -8.2314453125, -7.884765625, -7.5380859375, -7.19140625, -6.8447265625, -6.498046875, -6.1513671875, -5.8046875, -5.4580078125, -5.111328125, -4.7646484375, -4.41796875, -4.0712890625, -3.724609375, -3.3779296875, -3.03125, -2.6845703125, -2.337890625, -1.9912109375, -1.64453125, -1.2978515625, -0.951171875, -0.6044921875, -0.2578125, 0.0888671875, 0.435546875, 0.7822265625, 1.12890625, 1.4755859375, 1.822265625, 2.1689453125, 2.515625, 2.8623046875, 3.208984375, 3.5556640625, 3.90234375, 4.2490234375, 4.595703125, 4.9423828125, 5.2890625, 5.6357421875, 5.982421875, 6.3291015625, 6.67578125, 7.0224609375, 7.369140625, 7.7158203125, 8.0625, 8.4091796875, 8.755859375, 9.1025390625, 9.44921875, 9.7958984375, 10.142578125, 10.4892578125, 10.8359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 11.0, 15.0, 19.0, 20.0, 17.0, 33.0, 30.0, 44.0, 36.0, 47.0, 53.0, 39.0, 42.0, 67.0, 67.0, 53.0, 71.0, 49.0, 40.0, 34.0, 34.0, 36.0, 39.0, 24.0, 16.0, 12.0, 15.0, 6.0, 7.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0689697265625, -8.786376953125, -8.5037841796875, -8.22119140625, -7.9385986328125, -7.656005859375, -7.3734130859375, -7.0908203125, -6.8082275390625, -6.525634765625, -6.2430419921875, -5.96044921875, -5.6778564453125, -5.395263671875, -5.1126708984375, -4.830078125, -4.5474853515625, -4.264892578125, -3.9822998046875, -3.69970703125, -3.4171142578125, -3.134521484375, -2.8519287109375, -2.5693359375, -2.2867431640625, -2.004150390625, -1.7215576171875, -1.43896484375, -1.1563720703125, -0.873779296875, -0.5911865234375, -0.30859375, -0.0260009765625, 0.256591796875, 0.5391845703125, 0.82177734375, 1.1043701171875, 1.386962890625, 1.6695556640625, 1.9521484375, 2.2347412109375, 2.517333984375, 2.7999267578125, 3.08251953125, 3.3651123046875, 3.647705078125, 3.9302978515625, 4.212890625, 4.4954833984375, 4.778076171875, 5.0606689453125, 5.34326171875, 5.6258544921875, 5.908447265625, 6.1910400390625, 6.4736328125, 6.7562255859375, 7.038818359375, 7.3214111328125, 7.60400390625, 7.8865966796875, 8.169189453125, 8.4517822265625, 8.734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 3.0, 11.0, 6.0, 13.0, 19.0, 40.0, 40.0, 72.0, 143.0, 288.0, 610.0, 1606.0, 5166.0, 22748.0, 294840.0, 3725461.0, 121905.0, 15209.0, 3710.0, 1313.0, 547.0, 228.0, 124.0, 79.0, 34.0, 19.0, 10.0, 9.0, 3.0, 7.0, 6.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.625, -30.82177734375, -30.0185546875, -29.21533203125, -28.412109375, -27.60888671875, -26.8056640625, -26.00244140625, -25.19921875, -24.39599609375, -23.5927734375, -22.78955078125, -21.986328125, -21.18310546875, -20.3798828125, -19.57666015625, -18.7734375, -17.97021484375, -17.1669921875, -16.36376953125, -15.560546875, -14.75732421875, -13.9541015625, -13.15087890625, -12.34765625, -11.54443359375, -10.7412109375, -9.93798828125, -9.134765625, -8.33154296875, -7.5283203125, -6.72509765625, -5.921875, -5.11865234375, -4.3154296875, -3.51220703125, -2.708984375, -1.90576171875, -1.1025390625, -0.29931640625, 0.50390625, 1.30712890625, 2.1103515625, 2.91357421875, 3.716796875, 4.52001953125, 5.3232421875, 6.12646484375, 6.9296875, 7.73291015625, 8.5361328125, 9.33935546875, 10.142578125, 10.94580078125, 11.7490234375, 12.55224609375, 13.35546875, 14.15869140625, 14.9619140625, 15.76513671875, 16.568359375, 17.37158203125, 18.1748046875, 18.97802734375, 19.78125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 15.0, 25.0, 60.0, 76.0, 158.0, 317.0, 725.0, 1170.0, 789.0, 339.0, 163.0, 77.0, 41.0, 23.0, 21.0, 10.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.28125, -30.4892578125, -29.697265625, -28.9052734375, -28.11328125, -27.3212890625, -26.529296875, -25.7373046875, -24.9453125, -24.1533203125, -23.361328125, -22.5693359375, -21.77734375, -20.9853515625, -20.193359375, -19.4013671875, -18.609375, -17.8173828125, -17.025390625, -16.2333984375, -15.44140625, -14.6494140625, -13.857421875, -13.0654296875, -12.2734375, -11.4814453125, -10.689453125, -9.8974609375, -9.10546875, -8.3134765625, -7.521484375, -6.7294921875, -5.9375, -5.1455078125, -4.353515625, -3.5615234375, -2.76953125, -1.9775390625, -1.185546875, -0.3935546875, 0.3984375, 1.1904296875, 1.982421875, 2.7744140625, 3.56640625, 4.3583984375, 5.150390625, 5.9423828125, 6.734375, 7.5263671875, 8.318359375, 9.1103515625, 9.90234375, 10.6943359375, 11.486328125, 12.2783203125, 13.0703125, 13.8623046875, 14.654296875, 15.4462890625, 16.23828125, 17.0302734375, 17.822265625, 18.6142578125, 19.40625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 13.0, 35.0, 95.0, 210.0, 283.0, 219.0, 81.0, 32.0, 8.0, 4.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.28248596191406, -126.15614318847656, -118.02980041503906, -109.90345764160156, -101.77711486816406, -93.65077209472656, -85.5244369506836, -77.3980941772461, -69.2717514038086, -61.145408630371094, -53.019065856933594, -44.89272689819336, -36.76638412475586, -28.64004135131836, -20.513702392578125, -12.387359619140625, -4.261016845703125, 3.8653249740600586, 11.991666793823242, 20.11800765991211, 28.24435043334961, 36.37069320678711, 44.497032165527344, 52.623374938964844, 60.749717712402344, 68.87606048583984, 77.00240325927734, 85.12873840332031, 93.25508117675781, 101.38142395019531, 109.50776672363281, 117.63410949707031, 125.76046752929688, 133.88681030273438, 142.01315307617188, 150.13949584960938, 158.26583862304688, 166.39218139648438, 174.51852416992188, 182.64486694335938, 190.77120971679688, 198.89755249023438, 207.02389526367188, 215.15023803710938, 223.27658081054688, 231.40292358398438, 239.52926635742188, 247.65560913085938, 255.7819366455078, 263.90826416015625, 272.03460693359375, 280.16094970703125, 288.28729248046875, 296.41363525390625, 304.53997802734375, 312.66632080078125, 320.79266357421875, 328.91900634765625, 337.04534912109375, 345.17169189453125, 353.29803466796875, 361.42437744140625, 369.55072021484375, 377.67706298828125, 385.80340576171875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 4.0, 13.0, 19.0, 21.0, 25.0, 26.0, 26.0, 36.0, 32.0, 39.0, 38.0, 41.0, 46.0, 50.0, 44.0, 48.0, 58.0, 52.0, 41.0, 40.0, 46.0, 40.0, 28.0, 20.0, 24.0, 26.0, 13.0, 12.0, 17.0, 14.0, 11.0, 3.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-81.655029296875, -79.3887710571289, -77.12251281738281, -74.85626220703125, -72.59000396728516, -70.32374572753906, -68.05748748779297, -65.79122924804688, -63.52497482299805, -61.25871658325195, -58.992462158203125, -56.72620391845703, -54.45994567871094, -52.19369125366211, -49.927433013916016, -47.66117858886719, -45.394920349121094, -43.128662109375, -40.86240768432617, -38.59614944458008, -36.32989501953125, -34.063636779785156, -31.797378540039062, -29.5311222076416, -27.26486587524414, -24.99860954284668, -22.73235321044922, -20.466094970703125, -18.199838638305664, -15.933582305908203, -13.667325019836426, -11.401067733764648, -9.134807586669922, -6.868550777435303, -4.602293968200684, -2.3360371589660645, -0.06978034973144531, 2.1964759826660156, 4.462733268737793, 6.72899055480957, 8.995246887207031, 11.261503219604492, 13.52776050567627, 15.794017791748047, 18.060274124145508, 20.32653045654297, 22.592788696289062, 24.859045028686523, 27.125301361083984, 29.391557693481445, 31.657814025878906, 33.924072265625, 36.190330505371094, 38.45658493041992, 40.722843170166016, 42.989097595214844, 45.25535583496094, 47.52161407470703, 49.78786849975586, 52.05412673950195, 54.32038116455078, 56.586639404296875, 58.85289764404297, 61.11915588378906, 63.38541030883789]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 11.0, 10.0, 27.0, 48.0, 66.0, 97.0, 176.0, 285.0, 523.0, 909.0, 1756.0, 3431.0, 7393.0, 16771.0, 42912.0, 120397.0, 305338.0, 327572.0, 137274.0, 48565.0, 18891.0, 8021.0, 3801.0, 1911.0, 1051.0, 538.0, 336.0, 169.0, 106.0, 60.0, 37.0, 20.0, 16.0, 10.0, 4.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.7354736328125, -10.400634765625, -10.0657958984375, -9.73095703125, -9.3961181640625, -9.061279296875, -8.7264404296875, -8.3916015625, -8.0567626953125, -7.721923828125, -7.3870849609375, -7.05224609375, -6.7174072265625, -6.382568359375, -6.0477294921875, -5.712890625, -5.3780517578125, -5.043212890625, -4.7083740234375, -4.37353515625, -4.0386962890625, -3.703857421875, -3.3690185546875, -3.0341796875, -2.6993408203125, -2.364501953125, -2.0296630859375, -1.69482421875, -1.3599853515625, -1.025146484375, -0.6903076171875, -0.35546875, -0.0206298828125, 0.314208984375, 0.6490478515625, 0.98388671875, 1.3187255859375, 1.653564453125, 1.9884033203125, 2.3232421875, 2.6580810546875, 2.992919921875, 3.3277587890625, 3.66259765625, 3.9974365234375, 4.332275390625, 4.6671142578125, 5.001953125, 5.3367919921875, 5.671630859375, 6.0064697265625, 6.34130859375, 6.6761474609375, 7.010986328125, 7.3458251953125, 7.6806640625, 8.0155029296875, 8.350341796875, 8.6851806640625, 9.02001953125, 9.3548583984375, 9.689697265625, 10.0245361328125, 10.359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 10.0, 15.0, 9.0, 13.0, 19.0, 17.0, 24.0, 25.0, 36.0, 38.0, 38.0, 46.0, 65.0, 54.0, 58.0, 51.0, 63.0, 50.0, 56.0, 64.0, 46.0, 25.0, 35.0, 21.0, 24.0, 16.0, 14.0, 16.0, 12.0, 9.0, 10.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.117919921875, -8.83740234375, -8.556884765625, -8.2763671875, -7.995849609375, -7.71533203125, -7.434814453125, -7.154296875, -6.873779296875, -6.59326171875, -6.312744140625, -6.0322265625, -5.751708984375, -5.47119140625, -5.190673828125, -4.91015625, -4.629638671875, -4.34912109375, -4.068603515625, -3.7880859375, -3.507568359375, -3.22705078125, -2.946533203125, -2.666015625, -2.385498046875, -2.10498046875, -1.824462890625, -1.5439453125, -1.263427734375, -0.98291015625, -0.702392578125, -0.421875, -0.141357421875, 0.13916015625, 0.419677734375, 0.7001953125, 0.980712890625, 1.26123046875, 1.541748046875, 1.822265625, 2.102783203125, 2.38330078125, 2.663818359375, 2.9443359375, 3.224853515625, 3.50537109375, 3.785888671875, 4.06640625, 4.346923828125, 4.62744140625, 4.907958984375, 5.1884765625, 5.468994140625, 5.74951171875, 6.030029296875, 6.310546875, 6.591064453125, 6.87158203125, 7.152099609375, 7.4326171875, 7.713134765625, 7.99365234375, 8.274169921875, 8.5546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 21.0, 36.0, 37.0, 67.0, 108.0, 192.0, 445.0, 1062.0, 2841.0, 10910.0, 64164.0, 674427.0, 254628.0, 29921.0, 6290.0, 1859.0, 716.0, 326.0, 189.0, 90.0, 64.0, 39.0, 33.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.738525390625, -19.99267578125, -19.246826171875, -18.5009765625, -17.755126953125, -17.00927734375, -16.263427734375, -15.517578125, -14.771728515625, -14.02587890625, -13.280029296875, -12.5341796875, -11.788330078125, -11.04248046875, -10.296630859375, -9.55078125, -8.804931640625, -8.05908203125, -7.313232421875, -6.5673828125, -5.821533203125, -5.07568359375, -4.329833984375, -3.583984375, -2.838134765625, -2.09228515625, -1.346435546875, -0.6005859375, 0.145263671875, 0.89111328125, 1.636962890625, 2.3828125, 3.128662109375, 3.87451171875, 4.620361328125, 5.3662109375, 6.112060546875, 6.85791015625, 7.603759765625, 8.349609375, 9.095458984375, 9.84130859375, 10.587158203125, 11.3330078125, 12.078857421875, 12.82470703125, 13.570556640625, 14.31640625, 15.062255859375, 15.80810546875, 16.553955078125, 17.2998046875, 18.045654296875, 18.79150390625, 19.537353515625, 20.283203125, 21.029052734375, 21.77490234375, 22.520751953125, 23.2666015625, 24.012451171875, 24.75830078125, 25.504150390625, 26.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 6.0, 8.0, 14.0, 20.0, 15.0, 40.0, 35.0, 37.0, 55.0, 45.0, 64.0, 57.0, 61.0, 70.0, 56.0, 61.0, 52.0, 51.0, 46.0, 27.0, 45.0, 26.0, 23.0, 20.0, 17.0, 12.0, 7.0, 5.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.546875, -30.484619140625, -29.42236328125, -28.360107421875, -27.2978515625, -26.235595703125, -25.17333984375, -24.111083984375, -23.048828125, -21.986572265625, -20.92431640625, -19.862060546875, -18.7998046875, -17.737548828125, -16.67529296875, -15.613037109375, -14.55078125, -13.488525390625, -12.42626953125, -11.364013671875, -10.3017578125, -9.239501953125, -8.17724609375, -7.114990234375, -6.052734375, -4.990478515625, -3.92822265625, -2.865966796875, -1.8037109375, -0.741455078125, 0.32080078125, 1.383056640625, 2.4453125, 3.507568359375, 4.56982421875, 5.632080078125, 6.6943359375, 7.756591796875, 8.81884765625, 9.881103515625, 10.943359375, 12.005615234375, 13.06787109375, 14.130126953125, 15.1923828125, 16.254638671875, 17.31689453125, 18.379150390625, 19.44140625, 20.503662109375, 21.56591796875, 22.628173828125, 23.6904296875, 24.752685546875, 25.81494140625, 26.877197265625, 27.939453125, 29.001708984375, 30.06396484375, 31.126220703125, 32.1884765625, 33.250732421875, 34.31298828125, 35.375244140625, 36.4375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 10.0, 5.0, 11.0, 21.0, 27.0, 44.0, 71.0, 91.0, 194.0, 356.0, 792.0, 1686.0, 4264.0, 11410.0, 37192.0, 150402.0, 618754.0, 163025.0, 39941.0, 12299.0, 4352.0, 1836.0, 809.0, 418.0, 195.0, 102.0, 81.0, 36.0, 21.0, 21.0, 14.0, 12.0, 6.0, 9.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.95703125, -4.8175048828125, -4.677978515625, -4.5384521484375, -4.39892578125, -4.2593994140625, -4.119873046875, -3.9803466796875, -3.8408203125, -3.7012939453125, -3.561767578125, -3.4222412109375, -3.28271484375, -3.1431884765625, -3.003662109375, -2.8641357421875, -2.724609375, -2.5850830078125, -2.445556640625, -2.3060302734375, -2.16650390625, -2.0269775390625, -1.887451171875, -1.7479248046875, -1.6083984375, -1.4688720703125, -1.329345703125, -1.1898193359375, -1.05029296875, -0.9107666015625, -0.771240234375, -0.6317138671875, -0.4921875, -0.3526611328125, -0.213134765625, -0.0736083984375, 0.06591796875, 0.2054443359375, 0.344970703125, 0.4844970703125, 0.6240234375, 0.7635498046875, 0.903076171875, 1.0426025390625, 1.18212890625, 1.3216552734375, 1.461181640625, 1.6007080078125, 1.740234375, 1.8797607421875, 2.019287109375, 2.1588134765625, 2.29833984375, 2.4378662109375, 2.577392578125, 2.7169189453125, 2.8564453125, 2.9959716796875, 3.135498046875, 3.2750244140625, 3.41455078125, 3.5540771484375, 3.693603515625, 3.8331298828125, 3.97265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 15.0, 40.0, 40.0, 72.0, 121.0, 182.0, 158.0, 129.0, 84.0, 42.0, 31.0, 13.0, 10.0, 7.0, 3.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020465850830078125, -0.0019785165786743164, -0.0019104480743408203, -0.0018423795700073242, -0.0017743110656738281, -0.001706242561340332, -0.001638174057006836, -0.0015701055526733398, -0.0015020370483398438, -0.0014339685440063477, -0.0013659000396728516, -0.0012978315353393555, -0.0012297630310058594, -0.0011616945266723633, -0.0010936260223388672, -0.001025557518005371, -0.000957489013671875, -0.0008894205093383789, -0.0008213520050048828, -0.0007532835006713867, -0.0006852149963378906, -0.0006171464920043945, -0.0005490779876708984, -0.00048100948333740234, -0.00041294097900390625, -0.00034487247467041016, -0.00027680397033691406, -0.00020873546600341797, -0.00014066696166992188, -7.259845733642578e-05, -4.5299530029296875e-06, 6.35385513305664e-05, 0.0001316070556640625, 0.0001996755599975586, 0.0002677440643310547, 0.0003358125686645508, 0.0004038810729980469, 0.00047194957733154297, 0.0005400180816650391, 0.0006080865859985352, 0.0006761550903320312, 0.0007442235946655273, 0.0008122920989990234, 0.0008803606033325195, 0.0009484291076660156, 0.0010164976119995117, 0.0010845661163330078, 0.001152634620666504, 0.001220703125, 0.001288771629333496, 0.0013568401336669922, 0.0014249086380004883, 0.0014929771423339844, 0.0015610456466674805, 0.0016291141510009766, 0.0016971826553344727, 0.0017652511596679688, 0.0018333196640014648, 0.001901388168334961, 0.001969456672668457, 0.002037525177001953, 0.0021055936813354492, 0.0021736621856689453, 0.0022417306900024414, 0.0023097991943359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 10.0, 17.0, 19.0, 19.0, 21.0, 43.0, 86.0, 125.0, 210.0, 387.0, 680.0, 1472.0, 3288.0, 8444.0, 25513.0, 89178.0, 477685.0, 321155.0, 82327.0, 23733.0, 7965.0, 3135.0, 1472.0, 685.0, 322.0, 198.0, 123.0, 89.0, 42.0, 33.0, 23.0, 12.0, 14.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3046875, -4.1700439453125, -4.035400390625, -3.9007568359375, -3.76611328125, -3.6314697265625, -3.496826171875, -3.3621826171875, -3.2275390625, -3.0928955078125, -2.958251953125, -2.8236083984375, -2.68896484375, -2.5543212890625, -2.419677734375, -2.2850341796875, -2.150390625, -2.0157470703125, -1.881103515625, -1.7464599609375, -1.61181640625, -1.4771728515625, -1.342529296875, -1.2078857421875, -1.0732421875, -0.9385986328125, -0.803955078125, -0.6693115234375, -0.53466796875, -0.4000244140625, -0.265380859375, -0.1307373046875, 0.00390625, 0.1385498046875, 0.273193359375, 0.4078369140625, 0.54248046875, 0.6771240234375, 0.811767578125, 0.9464111328125, 1.0810546875, 1.2156982421875, 1.350341796875, 1.4849853515625, 1.61962890625, 1.7542724609375, 1.888916015625, 2.0235595703125, 2.158203125, 2.2928466796875, 2.427490234375, 2.5621337890625, 2.69677734375, 2.8314208984375, 2.966064453125, 3.1007080078125, 3.2353515625, 3.3699951171875, 3.504638671875, 3.6392822265625, 3.77392578125, 3.9085693359375, 4.043212890625, 4.1778564453125, 4.3125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 14.0, 16.0, 20.0, 20.0, 46.0, 55.0, 76.0, 84.0, 97.0, 102.0, 116.0, 80.0, 63.0, 52.0, 43.0, 25.0, 20.0, 18.0, 11.0, 8.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.97308349609375, -5.7821044921875, -5.59112548828125, -5.400146484375, -5.20916748046875, -5.0181884765625, -4.82720947265625, -4.63623046875, -4.44525146484375, -4.2542724609375, -4.06329345703125, -3.872314453125, -3.68133544921875, -3.4903564453125, -3.29937744140625, -3.1083984375, -2.91741943359375, -2.7264404296875, -2.53546142578125, -2.344482421875, -2.15350341796875, -1.9625244140625, -1.77154541015625, -1.58056640625, -1.38958740234375, -1.1986083984375, -1.00762939453125, -0.816650390625, -0.62567138671875, -0.4346923828125, -0.24371337890625, -0.052734375, 0.13824462890625, 0.3292236328125, 0.52020263671875, 0.711181640625, 0.90216064453125, 1.0931396484375, 1.28411865234375, 1.47509765625, 1.66607666015625, 1.8570556640625, 2.04803466796875, 2.239013671875, 2.42999267578125, 2.6209716796875, 2.81195068359375, 3.0029296875, 3.19390869140625, 3.3848876953125, 3.57586669921875, 3.766845703125, 3.95782470703125, 4.1488037109375, 4.33978271484375, 4.53076171875, 4.72174072265625, 4.9127197265625, 5.10369873046875, 5.294677734375, 5.48565673828125, 5.6766357421875, 5.86761474609375, 6.05859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 7.0, 8.0, 17.0, 39.0, 54.0, 94.0, 162.0, 245.0, 149.0, 92.0, 54.0, 33.0, 22.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-186.63433837890625, -182.4351043701172, -178.23587036132812, -174.03663635253906, -169.83740234375, -165.63818359375, -161.43894958496094, -157.23971557617188, -153.0404815673828, -148.84124755859375, -144.6420135498047, -140.44277954101562, -136.24356079101562, -132.04432678222656, -127.8450927734375, -123.64585876464844, -119.44662475585938, -115.24739074707031, -111.04815673828125, -106.84893035888672, -102.64969635009766, -98.4504623413086, -94.25123596191406, -90.052001953125, -85.85276794433594, -81.65353393554688, -77.45429992675781, -73.25507354736328, -69.05583953857422, -64.85660552978516, -60.65737533569336, -56.45814514160156, -52.25889587402344, -48.059661865234375, -43.86043167114258, -39.66120147705078, -35.46196746826172, -31.26273536682129, -27.06350326538086, -22.86427116394043, -18.6650390625, -14.46580696105957, -10.26657485961914, -6.067342758178711, -1.8681106567382812, 2.3311214447021484, 6.530353546142578, 10.729585647583008, 14.928817749023438, 19.128049850463867, 23.327281951904297, 27.526514053344727, 31.725746154785156, 35.92498016357422, 40.124210357666016, 44.32344055175781, 48.522674560546875, 52.72190856933594, 56.921138763427734, 61.12036895751953, 65.3196029663086, 69.51883697509766, 73.71806335449219, 77.91729736328125, 82.11653137207031]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 3.0, 5.0, 4.0, 5.0, 10.0, 8.0, 13.0, 16.0, 17.0, 13.0, 28.0, 32.0, 36.0, 23.0, 36.0, 48.0, 59.0, 78.0, 82.0, 80.0, 60.0, 40.0, 36.0, 36.0, 34.0, 34.0, 28.0, 28.0, 14.0, 16.0, 17.0, 13.0, 10.0, 10.0, 4.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.71212005615234, -97.30599975585938, -93.8998794555664, -90.49375915527344, -87.08763122558594, -83.6815185546875, -80.275390625, -76.86927032470703, -73.46315002441406, -70.0570297241211, -66.65090942382812, -63.24478530883789, -59.83866500854492, -56.43254470825195, -53.02642059326172, -49.62030029296875, -46.21417999267578, -42.80805969238281, -39.401939392089844, -35.99581527709961, -32.58969497680664, -29.183574676513672, -25.77745246887207, -22.37133026123047, -18.9652099609375, -15.559088706970215, -12.15296745300293, -8.746846199035645, -5.340724945068359, -1.9346046447753906, 1.471517562866211, 4.8776397705078125, 8.283767700195312, 11.689888954162598, 15.096010208129883, 18.502132415771484, 21.908252716064453, 25.314373016357422, 28.720495223999023, 32.126617431640625, 35.532737731933594, 38.93885803222656, 42.34497833251953, 45.751102447509766, 49.157222747802734, 52.5633430480957, 55.96946716308594, 59.375587463378906, 62.781707763671875, 66.18782806396484, 69.59394836425781, 73.00006866455078, 76.40618896484375, 79.81231689453125, 83.21843719482422, 86.62455749511719, 90.03067779541016, 93.43679809570312, 96.8429183959961, 100.24903869628906, 103.65516662597656, 107.061279296875, 110.4674072265625, 113.87352752685547, 117.27964782714844]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 8.0, 16.0, 21.0, 24.0, 31.0, 64.0, 71.0, 100.0, 154.0, 241.0, 369.0, 580.0, 933.0, 1605.0, 3020.0, 6119.0, 13948.0, 40644.0, 158466.0, 719975.0, 2028410.0, 939753.0, 200943.0, 48460.0, 15652.0, 6740.0, 3284.0, 1796.0, 916.0, 651.0, 399.0, 273.0, 146.0, 128.0, 90.0, 57.0, 43.0, 37.0, 24.0, 21.0, 15.0, 12.0, 7.0, 1.0, 5.0, 7.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.9375, -6.7030029296875, -6.468505859375, -6.2340087890625, -5.99951171875, -5.7650146484375, -5.530517578125, -5.2960205078125, -5.0615234375, -4.8270263671875, -4.592529296875, -4.3580322265625, -4.12353515625, -3.8890380859375, -3.654541015625, -3.4200439453125, -3.185546875, -2.9510498046875, -2.716552734375, -2.4820556640625, -2.24755859375, -2.0130615234375, -1.778564453125, -1.5440673828125, -1.3095703125, -1.0750732421875, -0.840576171875, -0.6060791015625, -0.37158203125, -0.1370849609375, 0.097412109375, 0.3319091796875, 0.56640625, 0.8009033203125, 1.035400390625, 1.2698974609375, 1.50439453125, 1.7388916015625, 1.973388671875, 2.2078857421875, 2.4423828125, 2.6768798828125, 2.911376953125, 3.1458740234375, 3.38037109375, 3.6148681640625, 3.849365234375, 4.0838623046875, 4.318359375, 4.5528564453125, 4.787353515625, 5.0218505859375, 5.25634765625, 5.4908447265625, 5.725341796875, 5.9598388671875, 6.1943359375, 6.4288330078125, 6.663330078125, 6.8978271484375, 7.13232421875, 7.3668212890625, 7.601318359375, 7.8358154296875, 8.0703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 14.0, 10.0, 15.0, 26.0, 32.0, 20.0, 41.0, 45.0, 37.0, 55.0, 49.0, 59.0, 66.0, 65.0, 62.0, 42.0, 39.0, 47.0, 56.0, 34.0, 35.0, 28.0, 28.0, 26.0, 7.0, 14.0, 11.0, 5.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.46875, -9.1864013671875, -8.904052734375, -8.6217041015625, -8.33935546875, -8.0570068359375, -7.774658203125, -7.4923095703125, -7.2099609375, -6.9276123046875, -6.645263671875, -6.3629150390625, -6.08056640625, -5.7982177734375, -5.515869140625, -5.2335205078125, -4.951171875, -4.6688232421875, -4.386474609375, -4.1041259765625, -3.82177734375, -3.5394287109375, -3.257080078125, -2.9747314453125, -2.6923828125, -2.4100341796875, -2.127685546875, -1.8453369140625, -1.56298828125, -1.2806396484375, -0.998291015625, -0.7159423828125, -0.43359375, -0.1512451171875, 0.131103515625, 0.4134521484375, 0.69580078125, 0.9781494140625, 1.260498046875, 1.5428466796875, 1.8251953125, 2.1075439453125, 2.389892578125, 2.6722412109375, 2.95458984375, 3.2369384765625, 3.519287109375, 3.8016357421875, 4.083984375, 4.3663330078125, 4.648681640625, 4.9310302734375, 5.21337890625, 5.4957275390625, 5.778076171875, 6.0604248046875, 6.3427734375, 6.6251220703125, 6.907470703125, 7.1898193359375, 7.47216796875, 7.7545166015625, 8.036865234375, 8.3192138671875, 8.6015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 7.0, 2.0, 9.0, 7.0, 15.0, 21.0, 29.0, 36.0, 66.0, 85.0, 179.0, 389.0, 987.0, 3573.0, 19038.0, 269286.0, 3714934.0, 166110.0, 14939.0, 3001.0, 784.0, 342.0, 175.0, 99.0, 41.0, 39.0, 20.0, 21.0, 10.0, 8.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.515625, -23.82373046875, -23.1318359375, -22.43994140625, -21.748046875, -21.05615234375, -20.3642578125, -19.67236328125, -18.98046875, -18.28857421875, -17.5966796875, -16.90478515625, -16.212890625, -15.52099609375, -14.8291015625, -14.13720703125, -13.4453125, -12.75341796875, -12.0615234375, -11.36962890625, -10.677734375, -9.98583984375, -9.2939453125, -8.60205078125, -7.91015625, -7.21826171875, -6.5263671875, -5.83447265625, -5.142578125, -4.45068359375, -3.7587890625, -3.06689453125, -2.375, -1.68310546875, -0.9912109375, -0.29931640625, 0.392578125, 1.08447265625, 1.7763671875, 2.46826171875, 3.16015625, 3.85205078125, 4.5439453125, 5.23583984375, 5.927734375, 6.61962890625, 7.3115234375, 8.00341796875, 8.6953125, 9.38720703125, 10.0791015625, 10.77099609375, 11.462890625, 12.15478515625, 12.8466796875, 13.53857421875, 14.23046875, 14.92236328125, 15.6142578125, 16.30615234375, 16.998046875, 17.68994140625, 18.3818359375, 19.07373046875, 19.765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 3.0, 6.0, 9.0, 6.0, 12.0, 21.0, 20.0, 22.0, 51.0, 62.0, 104.0, 176.0, 262.0, 437.0, 608.0, 737.0, 549.0, 328.0, 217.0, 133.0, 110.0, 63.0, 37.0, 26.0, 17.0, 10.0, 12.0, 7.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.125, -12.642578125, -12.16015625, -11.677734375, -11.1953125, -10.712890625, -10.23046875, -9.748046875, -9.265625, -8.783203125, -8.30078125, -7.818359375, -7.3359375, -6.853515625, -6.37109375, -5.888671875, -5.40625, -4.923828125, -4.44140625, -3.958984375, -3.4765625, -2.994140625, -2.51171875, -2.029296875, -1.546875, -1.064453125, -0.58203125, -0.099609375, 0.3828125, 0.865234375, 1.34765625, 1.830078125, 2.3125, 2.794921875, 3.27734375, 3.759765625, 4.2421875, 4.724609375, 5.20703125, 5.689453125, 6.171875, 6.654296875, 7.13671875, 7.619140625, 8.1015625, 8.583984375, 9.06640625, 9.548828125, 10.03125, 10.513671875, 10.99609375, 11.478515625, 11.9609375, 12.443359375, 12.92578125, 13.408203125, 13.890625, 14.373046875, 14.85546875, 15.337890625, 15.8203125, 16.302734375, 16.78515625, 17.267578125, 17.75]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 28.0, 48.0, 118.0, 198.0, 211.0, 168.0, 117.0, 52.0, 18.0, 15.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-202.45848083496094, -197.18507385253906, -191.9116668701172, -186.6382598876953, -181.36485290527344, -176.09144592285156, -170.8180389404297, -165.54464721679688, -160.271240234375, -154.99783325195312, -149.72442626953125, -144.45101928710938, -139.1776123046875, -133.90420532226562, -128.63079833984375, -123.3573989868164, -118.083984375, -112.81057739257812, -107.53717041015625, -102.26376342773438, -96.9903564453125, -91.71694946289062, -86.44355010986328, -81.1701431274414, -75.89673614501953, -70.62332916259766, -65.34992218017578, -60.07651901245117, -54.8031120300293, -49.52970504760742, -44.25630187988281, -38.98289489746094, -33.70948791503906, -28.436080932617188, -23.162675857543945, -17.889270782470703, -12.615863800048828, -7.342456817626953, -2.069051742553711, 3.2043533325195312, 8.477760314941406, 13.751166343688965, 19.024572372436523, 24.297977447509766, 29.57138442993164, 34.844791412353516, 40.118194580078125, 45.3916015625, 50.665008544921875, 55.93841552734375, 61.211822509765625, 66.4852294921875, 71.75863647460938, 77.03204345703125, 82.3054428100586, 87.57884979248047, 92.85225677490234, 98.12566375732422, 103.3990707397461, 108.67247772216797, 113.94587707519531, 119.21928405761719, 124.49269104003906, 129.76609802246094, 135.0395050048828]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 14.0, 12.0, 13.0, 5.0, 10.0, 15.0, 19.0, 19.0, 22.0, 32.0, 37.0, 25.0, 38.0, 38.0, 45.0, 46.0, 37.0, 35.0, 47.0, 46.0, 46.0, 49.0, 36.0, 35.0, 43.0, 36.0, 27.0, 25.0, 20.0, 23.0, 10.0, 16.0, 12.0, 7.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.35954284667969, -58.442535400390625, -56.5255241394043, -54.608516693115234, -52.691505432128906, -50.774497985839844, -48.85749053955078, -46.94047927856445, -45.02347183227539, -43.10646438598633, -41.189453125, -39.27244567871094, -37.35543441772461, -35.43842697143555, -33.52141571044922, -31.604408264160156, -29.68739891052246, -27.770389556884766, -25.85338020324707, -23.936370849609375, -22.019363403320312, -20.102354049682617, -18.185344696044922, -16.26833724975586, -14.351326942443848, -12.434317588806152, -10.517309188842773, -8.600299835205078, -6.683290958404541, -4.766282081604004, -2.8492727279663086, -0.9322643280029297, 0.9847450256347656, 2.9017539024353027, 4.81876277923584, 6.735772132873535, 8.652780532836914, 10.56978988647461, 12.486799240112305, 14.403807640075684, 16.320816040039062, 18.237825393676758, 20.154834747314453, 22.071842193603516, 23.98885154724121, 25.905860900878906, 27.8228702545166, 29.739879608154297, 31.656888961791992, 33.57389831542969, 35.49090576171875, 37.40791702270508, 39.32492446899414, 41.24193572998047, 43.15894317626953, 45.075950622558594, 46.99296188354492, 48.909969329833984, 50.82698059082031, 52.743988037109375, 54.6609992980957, 56.578006744384766, 58.495018005371094, 60.412025451660156, 62.32903289794922]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 9.0, 11.0, 24.0, 33.0, 51.0, 73.0, 120.0, 196.0, 304.0, 538.0, 959.0, 1805.0, 3726.0, 8510.0, 20422.0, 53131.0, 147753.0, 355475.0, 284496.0, 104991.0, 38155.0, 15028.0, 6465.0, 2908.0, 1465.0, 745.0, 396.0, 257.0, 156.0, 115.0, 71.0, 46.0, 28.0, 23.0, 13.0, 12.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7265625, -9.4210205078125, -9.115478515625, -8.8099365234375, -8.50439453125, -8.1988525390625, -7.893310546875, -7.5877685546875, -7.2822265625, -6.9766845703125, -6.671142578125, -6.3656005859375, -6.06005859375, -5.7545166015625, -5.448974609375, -5.1434326171875, -4.837890625, -4.5323486328125, -4.226806640625, -3.9212646484375, -3.61572265625, -3.3101806640625, -3.004638671875, -2.6990966796875, -2.3935546875, -2.0880126953125, -1.782470703125, -1.4769287109375, -1.17138671875, -0.8658447265625, -0.560302734375, -0.2547607421875, 0.05078125, 0.3563232421875, 0.661865234375, 0.9674072265625, 1.27294921875, 1.5784912109375, 1.884033203125, 2.1895751953125, 2.4951171875, 2.8006591796875, 3.106201171875, 3.4117431640625, 3.71728515625, 4.0228271484375, 4.328369140625, 4.6339111328125, 4.939453125, 5.2449951171875, 5.550537109375, 5.8560791015625, 6.16162109375, 6.4671630859375, 6.772705078125, 7.0782470703125, 7.3837890625, 7.6893310546875, 7.994873046875, 8.3004150390625, 8.60595703125, 8.9114990234375, 9.217041015625, 9.5225830078125, 9.828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 3.0, 2.0, 10.0, 5.0, 9.0, 12.0, 21.0, 28.0, 26.0, 32.0, 47.0, 38.0, 44.0, 44.0, 44.0, 59.0, 61.0, 62.0, 59.0, 49.0, 42.0, 50.0, 44.0, 43.0, 28.0, 22.0, 26.0, 18.0, 17.0, 16.0, 13.0, 10.0, 2.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.34375, -9.0635986328125, -8.783447265625, -8.5032958984375, -8.22314453125, -7.9429931640625, -7.662841796875, -7.3826904296875, -7.1025390625, -6.8223876953125, -6.542236328125, -6.2620849609375, -5.98193359375, -5.7017822265625, -5.421630859375, -5.1414794921875, -4.861328125, -4.5811767578125, -4.301025390625, -4.0208740234375, -3.74072265625, -3.4605712890625, -3.180419921875, -2.9002685546875, -2.6201171875, -2.3399658203125, -2.059814453125, -1.7796630859375, -1.49951171875, -1.2193603515625, -0.939208984375, -0.6590576171875, -0.37890625, -0.0987548828125, 0.181396484375, 0.4615478515625, 0.74169921875, 1.0218505859375, 1.302001953125, 1.5821533203125, 1.8623046875, 2.1424560546875, 2.422607421875, 2.7027587890625, 2.98291015625, 3.2630615234375, 3.543212890625, 3.8233642578125, 4.103515625, 4.3836669921875, 4.663818359375, 4.9439697265625, 5.22412109375, 5.5042724609375, 5.784423828125, 6.0645751953125, 6.3447265625, 6.6248779296875, 6.905029296875, 7.1851806640625, 7.46533203125, 7.7454833984375, 8.025634765625, 8.3057861328125, 8.5859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 12.0, 13.0, 24.0, 27.0, 26.0, 54.0, 62.0, 95.0, 115.0, 157.0, 255.0, 393.0, 648.0, 1249.0, 2850.0, 8355.0, 32536.0, 190092.0, 693059.0, 89739.0, 18566.0, 5460.0, 2080.0, 989.0, 562.0, 306.0, 234.0, 146.0, 125.0, 79.0, 59.0, 44.0, 37.0, 22.0, 17.0, 13.0, 9.0, 10.0, 9.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.091552734375, -15.54248046875, -14.993408203125, -14.4443359375, -13.895263671875, -13.34619140625, -12.797119140625, -12.248046875, -11.698974609375, -11.14990234375, -10.600830078125, -10.0517578125, -9.502685546875, -8.95361328125, -8.404541015625, -7.85546875, -7.306396484375, -6.75732421875, -6.208251953125, -5.6591796875, -5.110107421875, -4.56103515625, -4.011962890625, -3.462890625, -2.913818359375, -2.36474609375, -1.815673828125, -1.2666015625, -0.717529296875, -0.16845703125, 0.380615234375, 0.9296875, 1.478759765625, 2.02783203125, 2.576904296875, 3.1259765625, 3.675048828125, 4.22412109375, 4.773193359375, 5.322265625, 5.871337890625, 6.42041015625, 6.969482421875, 7.5185546875, 8.067626953125, 8.61669921875, 9.165771484375, 9.71484375, 10.263916015625, 10.81298828125, 11.362060546875, 11.9111328125, 12.460205078125, 13.00927734375, 13.558349609375, 14.107421875, 14.656494140625, 15.20556640625, 15.754638671875, 16.3037109375, 16.852783203125, 17.40185546875, 17.950927734375, 18.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 3.0, 8.0, 8.0, 10.0, 10.0, 12.0, 26.0, 14.0, 29.0, 34.0, 27.0, 35.0, 32.0, 50.0, 42.0, 46.0, 51.0, 60.0, 42.0, 51.0, 57.0, 49.0, 41.0, 39.0, 40.0, 19.0, 20.0, 28.0, 19.0, 14.0, 11.0, 10.0, 8.0, 11.0, 9.0, 6.0, 2.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-27.453125, -26.60791015625, -25.7626953125, -24.91748046875, -24.072265625, -23.22705078125, -22.3818359375, -21.53662109375, -20.69140625, -19.84619140625, -19.0009765625, -18.15576171875, -17.310546875, -16.46533203125, -15.6201171875, -14.77490234375, -13.9296875, -13.08447265625, -12.2392578125, -11.39404296875, -10.548828125, -9.70361328125, -8.8583984375, -8.01318359375, -7.16796875, -6.32275390625, -5.4775390625, -4.63232421875, -3.787109375, -2.94189453125, -2.0966796875, -1.25146484375, -0.40625, 0.43896484375, 1.2841796875, 2.12939453125, 2.974609375, 3.81982421875, 4.6650390625, 5.51025390625, 6.35546875, 7.20068359375, 8.0458984375, 8.89111328125, 9.736328125, 10.58154296875, 11.4267578125, 12.27197265625, 13.1171875, 13.96240234375, 14.8076171875, 15.65283203125, 16.498046875, 17.34326171875, 18.1884765625, 19.03369140625, 19.87890625, 20.72412109375, 21.5693359375, 22.41455078125, 23.259765625, 24.10498046875, 24.9501953125, 25.79541015625, 26.640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 9.0, 14.0, 13.0, 24.0, 34.0, 40.0, 55.0, 102.0, 173.0, 309.0, 515.0, 994.0, 2159.0, 5141.0, 14299.0, 47284.0, 274060.0, 611300.0, 63014.0, 17587.0, 6234.0, 2643.0, 1169.0, 578.0, 302.0, 169.0, 96.0, 70.0, 51.0, 27.0, 18.0, 15.0, 5.0, 5.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.11328125, -3.971923828125, -3.83056640625, -3.689208984375, -3.5478515625, -3.406494140625, -3.26513671875, -3.123779296875, -2.982421875, -2.841064453125, -2.69970703125, -2.558349609375, -2.4169921875, -2.275634765625, -2.13427734375, -1.992919921875, -1.8515625, -1.710205078125, -1.56884765625, -1.427490234375, -1.2861328125, -1.144775390625, -1.00341796875, -0.862060546875, -0.720703125, -0.579345703125, -0.43798828125, -0.296630859375, -0.1552734375, -0.013916015625, 0.12744140625, 0.268798828125, 0.41015625, 0.551513671875, 0.69287109375, 0.834228515625, 0.9755859375, 1.116943359375, 1.25830078125, 1.399658203125, 1.541015625, 1.682373046875, 1.82373046875, 1.965087890625, 2.1064453125, 2.247802734375, 2.38916015625, 2.530517578125, 2.671875, 2.813232421875, 2.95458984375, 3.095947265625, 3.2373046875, 3.378662109375, 3.52001953125, 3.661376953125, 3.802734375, 3.944091796875, 4.08544921875, 4.226806640625, 4.3681640625, 4.509521484375, 4.65087890625, 4.792236328125, 4.93359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 7.0, 7.0, 6.0, 13.0, 18.0, 24.0, 35.0, 66.0, 62.0, 117.0, 141.0, 154.0, 87.0, 65.0, 43.0, 28.0, 21.0, 19.0, 16.0, 10.0, 9.0, 5.0, 7.0, 6.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015840530395507812, -0.0015386193990707397, -0.0014931857585906982, -0.0014477521181106567, -0.0014023184776306152, -0.0013568848371505737, -0.0013114511966705322, -0.0012660175561904907, -0.0012205839157104492, -0.0011751502752304077, -0.0011297166347503662, -0.0010842829942703247, -0.0010388493537902832, -0.0009934157133102417, -0.0009479820728302002, -0.0009025484323501587, -0.0008571147918701172, -0.0008116811513900757, -0.0007662475109100342, -0.0007208138704299927, -0.0006753802299499512, -0.0006299465894699097, -0.0005845129489898682, -0.0005390793085098267, -0.0004936456680297852, -0.00044821202754974365, -0.00040277838706970215, -0.00035734474658966064, -0.00031191110610961914, -0.00026647746562957764, -0.00022104382514953613, -0.00017561018466949463, -0.00013017654418945312, -8.474290370941162e-05, -3.930926322937012e-05, 6.124377250671387e-06, 5.155801773071289e-05, 9.69916582107544e-05, 0.0001424252986907959, 0.0001878589391708374, 0.0002332925796508789, 0.0002787262201309204, 0.0003241598606109619, 0.0003695935010910034, 0.0004150271415710449, 0.0004604607820510864, 0.0005058944225311279, 0.0005513280630111694, 0.0005967617034912109, 0.0006421953439712524, 0.0006876289844512939, 0.0007330626249313354, 0.000778496265411377, 0.0008239299058914185, 0.00086936354637146, 0.0009147971868515015, 0.000960230827331543, 0.0010056644678115845, 0.001051098108291626, 0.0010965317487716675, 0.001141965389251709, 0.0011873990297317505, 0.001232832670211792, 0.0012782663106918335, 0.001323699951171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 9.0, 13.0, 14.0, 23.0, 36.0, 49.0, 57.0, 103.0, 158.0, 266.0, 396.0, 760.0, 1556.0, 3337.0, 8129.0, 23589.0, 86725.0, 648448.0, 206486.0, 44417.0, 13965.0, 5256.0, 2260.0, 991.0, 589.0, 344.0, 193.0, 111.0, 72.0, 50.0, 36.0, 25.0, 18.0, 12.0, 14.0, 8.0, 3.0, 10.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.97198486328125, -3.8385009765625, -3.70501708984375, -3.571533203125, -3.43804931640625, -3.3045654296875, -3.17108154296875, -3.03759765625, -2.90411376953125, -2.7706298828125, -2.63714599609375, -2.503662109375, -2.37017822265625, -2.2366943359375, -2.10321044921875, -1.9697265625, -1.83624267578125, -1.7027587890625, -1.56927490234375, -1.435791015625, -1.30230712890625, -1.1688232421875, -1.03533935546875, -0.90185546875, -0.76837158203125, -0.6348876953125, -0.50140380859375, -0.367919921875, -0.23443603515625, -0.1009521484375, 0.03253173828125, 0.166015625, 0.29949951171875, 0.4329833984375, 0.56646728515625, 0.699951171875, 0.83343505859375, 0.9669189453125, 1.10040283203125, 1.23388671875, 1.36737060546875, 1.5008544921875, 1.63433837890625, 1.767822265625, 1.90130615234375, 2.0347900390625, 2.16827392578125, 2.3017578125, 2.43524169921875, 2.5687255859375, 2.70220947265625, 2.835693359375, 2.96917724609375, 3.1026611328125, 3.23614501953125, 3.36962890625, 3.50311279296875, 3.6365966796875, 3.77008056640625, 3.903564453125, 4.03704833984375, 4.1705322265625, 4.30401611328125, 4.4375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 10.0, 6.0, 15.0, 10.0, 21.0, 12.0, 23.0, 39.0, 40.0, 59.0, 86.0, 114.0, 112.0, 98.0, 99.0, 65.0, 42.0, 35.0, 22.0, 19.0, 12.0, 10.0, 12.0, 10.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.89453125, -5.71942138671875, -5.5443115234375, -5.36920166015625, -5.194091796875, -5.01898193359375, -4.8438720703125, -4.66876220703125, -4.49365234375, -4.31854248046875, -4.1434326171875, -3.96832275390625, -3.793212890625, -3.61810302734375, -3.4429931640625, -3.26788330078125, -3.0927734375, -2.91766357421875, -2.7425537109375, -2.56744384765625, -2.392333984375, -2.21722412109375, -2.0421142578125, -1.86700439453125, -1.69189453125, -1.51678466796875, -1.3416748046875, -1.16656494140625, -0.991455078125, -0.81634521484375, -0.6412353515625, -0.46612548828125, -0.291015625, -0.11590576171875, 0.0592041015625, 0.23431396484375, 0.409423828125, 0.58453369140625, 0.7596435546875, 0.93475341796875, 1.10986328125, 1.28497314453125, 1.4600830078125, 1.63519287109375, 1.810302734375, 1.98541259765625, 2.1605224609375, 2.33563232421875, 2.5107421875, 2.68585205078125, 2.8609619140625, 3.03607177734375, 3.211181640625, 3.38629150390625, 3.5614013671875, 3.73651123046875, 3.91162109375, 4.08673095703125, 4.2618408203125, 4.43695068359375, 4.612060546875, 4.78717041015625, 4.9622802734375, 5.13739013671875, 5.3125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 17.0, 36.0, 75.0, 138.0, 327.0, 182.0, 91.0, 52.0, 22.0, 16.0, 7.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-226.6300506591797, -221.7748565673828, -216.91964721679688, -212.064453125, -207.20925903320312, -202.35406494140625, -197.49887084960938, -192.64366149902344, -187.78846740722656, -182.9332733154297, -178.07806396484375, -173.22286987304688, -168.36767578125, -163.51248168945312, -158.65728759765625, -153.8020782470703, -148.94688415527344, -144.09169006347656, -139.23648071289062, -134.38128662109375, -129.52609252929688, -124.6708984375, -119.8156967163086, -114.96049499511719, -110.10530090332031, -105.25010681152344, -100.39490509033203, -95.53970336914062, -90.68450927734375, -85.82931518554688, -80.97411346435547, -76.11891174316406, -71.26371002197266, -66.40850830078125, -61.553314208984375, -56.698116302490234, -51.842918395996094, -46.98772048950195, -42.13252258300781, -37.27732467651367, -32.42212677001953, -27.56692886352539, -22.71173095703125, -17.85653305053711, -13.001335144042969, -8.146137237548828, -3.2909393310546875, 1.5642585754394531, 6.419456481933594, 11.274654388427734, 16.129852294921875, 20.985050201416016, 25.840248107910156, 30.695446014404297, 35.55064392089844, 40.40584182739258, 45.26103973388672, 50.11623764038086, 54.971435546875, 59.82663345336914, 64.68183135986328, 69.53703308105469, 74.39222717285156, 79.24742126464844, 84.10262298583984]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 11.0, 12.0, 5.0, 15.0, 16.0, 17.0, 21.0, 22.0, 27.0, 35.0, 41.0, 50.0, 45.0, 82.0, 100.0, 103.0, 72.0, 42.0, 47.0, 32.0, 31.0, 29.0, 17.0, 15.0, 20.0, 13.0, 11.0, 7.0, 14.0, 10.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-136.49073791503906, -132.78094482421875, -129.07113647460938, -125.36134338378906, -121.65154266357422, -117.94174194335938, -114.23194885253906, -110.52214813232422, -106.81234741210938, -103.10254669189453, -99.39275360107422, -95.68295288085938, -91.97315216064453, -88.26335144042969, -84.55355834960938, -80.84375762939453, -77.13395690917969, -73.42415618896484, -69.71436309814453, -66.00456237792969, -62.294761657714844, -58.584964752197266, -54.87516784667969, -51.165367126464844, -47.45557403564453, -43.74577713012695, -40.03597640991211, -36.32617950439453, -32.61637878417969, -28.90658187866211, -25.1967830657959, -21.486984252929688, -17.777183532714844, -14.067384719848633, -10.357585906982422, -6.647788047790527, -2.9379892349243164, 0.7718086242675781, 4.481607437133789, 8.19140625, 11.901205062866211, 15.611003875732422, 19.320802688598633, 23.030601501464844, 26.740398406982422, 30.450197219848633, 34.159996032714844, 37.86979675292969, 41.579593658447266, 45.289390563964844, 48.99919128417969, 52.708988189697266, 56.41878890991211, 60.12858581542969, 63.83838653564453, 67.54818725585938, 71.25798034667969, 74.96778106689453, 78.67757415771484, 82.38737487792969, 86.09717559814453, 89.80697631835938, 93.51676940917969, 97.22657012939453, 100.93637084960938]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 8.0, 12.0, 17.0, 18.0, 28.0, 51.0, 60.0, 95.0, 147.0, 198.0, 284.0, 503.0, 777.0, 1271.0, 2440.0, 5682.0, 14637.0, 50989.0, 245215.0, 1301696.0, 1999037.0, 451983.0, 82330.0, 21774.0, 7607.0, 3237.0, 1589.0, 966.0, 523.0, 366.0, 241.0, 148.0, 98.0, 79.0, 42.0, 24.0, 30.0, 20.0, 10.0, 11.0, 9.0, 9.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.8389892578125, -7.560791015625, -7.2825927734375, -7.00439453125, -6.7261962890625, -6.447998046875, -6.1697998046875, -5.8916015625, -5.6134033203125, -5.335205078125, -5.0570068359375, -4.77880859375, -4.5006103515625, -4.222412109375, -3.9442138671875, -3.666015625, -3.3878173828125, -3.109619140625, -2.8314208984375, -2.55322265625, -2.2750244140625, -1.996826171875, -1.7186279296875, -1.4404296875, -1.1622314453125, -0.884033203125, -0.6058349609375, -0.32763671875, -0.0494384765625, 0.228759765625, 0.5069580078125, 0.78515625, 1.0633544921875, 1.341552734375, 1.6197509765625, 1.89794921875, 2.1761474609375, 2.454345703125, 2.7325439453125, 3.0107421875, 3.2889404296875, 3.567138671875, 3.8453369140625, 4.12353515625, 4.4017333984375, 4.679931640625, 4.9581298828125, 5.236328125, 5.5145263671875, 5.792724609375, 6.0709228515625, 6.34912109375, 6.6273193359375, 6.905517578125, 7.1837158203125, 7.4619140625, 7.7401123046875, 8.018310546875, 8.2965087890625, 8.57470703125, 8.8529052734375, 9.131103515625, 9.4093017578125, 9.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 8.0, 25.0, 23.0, 29.0, 31.0, 41.0, 45.0, 47.0, 54.0, 48.0, 45.0, 50.0, 60.0, 70.0, 53.0, 51.0, 45.0, 46.0, 44.0, 29.0, 20.0, 25.0, 20.0, 17.0, 19.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0726318359375, -8.793701171875, -8.5147705078125, -8.23583984375, -7.9569091796875, -7.677978515625, -7.3990478515625, -7.1201171875, -6.8411865234375, -6.562255859375, -6.2833251953125, -6.00439453125, -5.7254638671875, -5.446533203125, -5.1676025390625, -4.888671875, -4.6097412109375, -4.330810546875, -4.0518798828125, -3.77294921875, -3.4940185546875, -3.215087890625, -2.9361572265625, -2.6572265625, -2.3782958984375, -2.099365234375, -1.8204345703125, -1.54150390625, -1.2625732421875, -0.983642578125, -0.7047119140625, -0.42578125, -0.1468505859375, 0.132080078125, 0.4110107421875, 0.68994140625, 0.9688720703125, 1.247802734375, 1.5267333984375, 1.8056640625, 2.0845947265625, 2.363525390625, 2.6424560546875, 2.92138671875, 3.2003173828125, 3.479248046875, 3.7581787109375, 4.037109375, 4.3160400390625, 4.594970703125, 4.8739013671875, 5.15283203125, 5.4317626953125, 5.710693359375, 5.9896240234375, 6.2685546875, 6.5474853515625, 6.826416015625, 7.1053466796875, 7.38427734375, 7.6632080078125, 7.942138671875, 8.2210693359375, 8.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 11.0, 10.0, 13.0, 16.0, 28.0, 37.0, 48.0, 97.0, 163.0, 361.0, 807.0, 2546.0, 13247.0, 197194.0, 3823638.0, 141040.0, 11211.0, 2298.0, 714.0, 376.0, 172.0, 96.0, 54.0, 37.0, 22.0, 17.0, 14.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.953125, -21.181640625, -20.41015625, -19.638671875, -18.8671875, -18.095703125, -17.32421875, -16.552734375, -15.78125, -15.009765625, -14.23828125, -13.466796875, -12.6953125, -11.923828125, -11.15234375, -10.380859375, -9.609375, -8.837890625, -8.06640625, -7.294921875, -6.5234375, -5.751953125, -4.98046875, -4.208984375, -3.4375, -2.666015625, -1.89453125, -1.123046875, -0.3515625, 0.419921875, 1.19140625, 1.962890625, 2.734375, 3.505859375, 4.27734375, 5.048828125, 5.8203125, 6.591796875, 7.36328125, 8.134765625, 8.90625, 9.677734375, 10.44921875, 11.220703125, 11.9921875, 12.763671875, 13.53515625, 14.306640625, 15.078125, 15.849609375, 16.62109375, 17.392578125, 18.1640625, 18.935546875, 19.70703125, 20.478515625, 21.25, 22.021484375, 22.79296875, 23.564453125, 24.3359375, 25.107421875, 25.87890625, 26.650390625, 27.421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 14.0, 31.0, 38.0, 85.0, 132.0, 242.0, 416.0, 704.0, 863.0, 659.0, 372.0, 185.0, 100.0, 58.0, 51.0, 23.0, 21.0, 19.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.074462890625, -23.43017578125, -22.785888671875, -22.1416015625, -21.497314453125, -20.85302734375, -20.208740234375, -19.564453125, -18.920166015625, -18.27587890625, -17.631591796875, -16.9873046875, -16.343017578125, -15.69873046875, -15.054443359375, -14.41015625, -13.765869140625, -13.12158203125, -12.477294921875, -11.8330078125, -11.188720703125, -10.54443359375, -9.900146484375, -9.255859375, -8.611572265625, -7.96728515625, -7.322998046875, -6.6787109375, -6.034423828125, -5.39013671875, -4.745849609375, -4.1015625, -3.457275390625, -2.81298828125, -2.168701171875, -1.5244140625, -0.880126953125, -0.23583984375, 0.408447265625, 1.052734375, 1.697021484375, 2.34130859375, 2.985595703125, 3.6298828125, 4.274169921875, 4.91845703125, 5.562744140625, 6.20703125, 6.851318359375, 7.49560546875, 8.139892578125, 8.7841796875, 9.428466796875, 10.07275390625, 10.717041015625, 11.361328125, 12.005615234375, 12.64990234375, 13.294189453125, 13.9384765625, 14.582763671875, 15.22705078125, 15.871337890625, 16.515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 9.0, 7.0, 10.0, 34.0, 53.0, 139.0, 249.0, 226.0, 144.0, 76.0, 29.0, 10.0, 10.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.17324829101562, -157.8883056640625, -151.60337829589844, -145.3184356689453, -139.03350830078125, -132.74856567382812, -126.463623046875, -120.1786880493164, -113.89375305175781, -107.60881805419922, -101.32388305664062, -95.0389404296875, -88.7540054321289, -82.46907043457031, -76.18412780761719, -69.8991928100586, -63.6142578125, -57.329322814941406, -51.04438400268555, -44.75944519042969, -38.474510192871094, -32.1895751953125, -25.90463638305664, -19.61969757080078, -13.334762573242188, -7.049825668334961, -0.7648887634277344, 5.520048141479492, 11.804985046386719, 18.089921951293945, 24.374858856201172, 30.65979766845703, 36.94474792480469, 43.22968292236328, 49.51462173461914, 55.799560546875, 62.084495544433594, 68.36943054199219, 74.65437316894531, 80.9393081665039, 87.2242431640625, 93.5091781616211, 99.79411315917969, 106.07905578613281, 112.3639907836914, 118.64892578125, 124.93386840820312, 131.21881103515625, 137.5037384033203, 143.78868103027344, 150.0736083984375, 156.35855102539062, 162.64349365234375, 168.9284210205078, 175.21336364746094, 181.498291015625, 187.78323364257812, 194.06817626953125, 200.3531036376953, 206.63804626464844, 212.9229736328125, 219.20791625976562, 225.49285888671875, 231.77780151367188, 238.06272888183594]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 7.0, 13.0, 8.0, 14.0, 12.0, 11.0, 13.0, 18.0, 24.0, 25.0, 39.0, 16.0, 29.0, 40.0, 40.0, 44.0, 70.0, 69.0, 59.0, 66.0, 44.0, 35.0, 45.0, 34.0, 28.0, 26.0, 23.0, 19.0, 19.0, 16.0, 24.0, 12.0, 14.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.90861892700195, -60.680538177490234, -58.45246124267578, -56.22438049316406, -53.996299743652344, -51.768218994140625, -49.540138244628906, -47.31206130981445, -45.083980560302734, -42.855899810791016, -40.62782287597656, -38.399742126464844, -36.171661376953125, -33.943580627441406, -31.71550178527832, -29.487422943115234, -27.259342193603516, -25.031261444091797, -22.80318260192871, -20.575103759765625, -18.347023010253906, -16.118942260742188, -13.890863418579102, -11.6627836227417, -9.434703826904297, -7.2066240310668945, -4.978544235229492, -2.75046443939209, -0.5223846435546875, 1.7056951522827148, 3.933774948120117, 6.1618547439575195, 8.389930725097656, 10.618010520935059, 12.846090316772461, 15.074170112609863, 17.302249908447266, 19.530330657958984, 21.75840950012207, 23.986488342285156, 26.214569091796875, 28.442649841308594, 30.67072868347168, 32.898807525634766, 35.126888275146484, 37.3549690246582, 39.583045959472656, 41.811126708984375, 44.039207458496094, 46.26728820800781, 48.49536895751953, 50.723445892333984, 52.9515266418457, 55.17960739135742, 57.407684326171875, 59.635765075683594, 61.86384582519531, 64.09192657470703, 66.32000732421875, 68.54808807373047, 70.77616882324219, 73.00424194335938, 75.2323226928711, 77.46040344238281, 79.68848419189453]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 9.0, 9.0, 13.0, 25.0, 28.0, 48.0, 64.0, 117.0, 175.0, 263.0, 460.0, 773.0, 1595.0, 2848.0, 5855.0, 12275.0, 27993.0, 67971.0, 182314.0, 380960.0, 221138.0, 82149.0, 33008.0, 14371.0, 6691.0, 3455.0, 1706.0, 930.0, 509.0, 326.0, 173.0, 102.0, 61.0, 46.0, 34.0, 19.0, 11.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.51708984375, -9.2060546875, -8.89501953125, -8.583984375, -8.27294921875, -7.9619140625, -7.65087890625, -7.33984375, -7.02880859375, -6.7177734375, -6.40673828125, -6.095703125, -5.78466796875, -5.4736328125, -5.16259765625, -4.8515625, -4.54052734375, -4.2294921875, -3.91845703125, -3.607421875, -3.29638671875, -2.9853515625, -2.67431640625, -2.36328125, -2.05224609375, -1.7412109375, -1.43017578125, -1.119140625, -0.80810546875, -0.4970703125, -0.18603515625, 0.125, 0.43603515625, 0.7470703125, 1.05810546875, 1.369140625, 1.68017578125, 1.9912109375, 2.30224609375, 2.61328125, 2.92431640625, 3.2353515625, 3.54638671875, 3.857421875, 4.16845703125, 4.4794921875, 4.79052734375, 5.1015625, 5.41259765625, 5.7236328125, 6.03466796875, 6.345703125, 6.65673828125, 6.9677734375, 7.27880859375, 7.58984375, 7.90087890625, 8.2119140625, 8.52294921875, 8.833984375, 9.14501953125, 9.4560546875, 9.76708984375, 10.078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 17.0, 14.0, 22.0, 33.0, 41.0, 37.0, 40.0, 46.0, 48.0, 39.0, 44.0, 63.0, 54.0, 49.0, 65.0, 54.0, 43.0, 47.0, 36.0, 30.0, 24.0, 25.0, 18.0, 15.0, 13.0, 12.0, 12.0, 9.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.09716796875, -8.8193359375, -8.54150390625, -8.263671875, -7.98583984375, -7.7080078125, -7.43017578125, -7.15234375, -6.87451171875, -6.5966796875, -6.31884765625, -6.041015625, -5.76318359375, -5.4853515625, -5.20751953125, -4.9296875, -4.65185546875, -4.3740234375, -4.09619140625, -3.818359375, -3.54052734375, -3.2626953125, -2.98486328125, -2.70703125, -2.42919921875, -2.1513671875, -1.87353515625, -1.595703125, -1.31787109375, -1.0400390625, -0.76220703125, -0.484375, -0.20654296875, 0.0712890625, 0.34912109375, 0.626953125, 0.90478515625, 1.1826171875, 1.46044921875, 1.73828125, 2.01611328125, 2.2939453125, 2.57177734375, 2.849609375, 3.12744140625, 3.4052734375, 3.68310546875, 3.9609375, 4.23876953125, 4.5166015625, 4.79443359375, 5.072265625, 5.35009765625, 5.6279296875, 5.90576171875, 6.18359375, 6.46142578125, 6.7392578125, 7.01708984375, 7.294921875, 7.57275390625, 7.8505859375, 8.12841796875, 8.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 7.0, 3.0, 9.0, 18.0, 28.0, 45.0, 47.0, 62.0, 64.0, 150.0, 187.0, 272.0, 450.0, 675.0, 1218.0, 2337.0, 5994.0, 23962.0, 168678.0, 757221.0, 66455.0, 12537.0, 3890.0, 1687.0, 935.0, 568.0, 332.0, 232.0, 134.0, 112.0, 65.0, 44.0, 42.0, 24.0, 20.0, 11.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.65234375, -19.9921875, -19.33203125, -18.671875, -18.01171875, -17.3515625, -16.69140625, -16.03125, -15.37109375, -14.7109375, -14.05078125, -13.390625, -12.73046875, -12.0703125, -11.41015625, -10.75, -10.08984375, -9.4296875, -8.76953125, -8.109375, -7.44921875, -6.7890625, -6.12890625, -5.46875, -4.80859375, -4.1484375, -3.48828125, -2.828125, -2.16796875, -1.5078125, -0.84765625, -0.1875, 0.47265625, 1.1328125, 1.79296875, 2.453125, 3.11328125, 3.7734375, 4.43359375, 5.09375, 5.75390625, 6.4140625, 7.07421875, 7.734375, 8.39453125, 9.0546875, 9.71484375, 10.375, 11.03515625, 11.6953125, 12.35546875, 13.015625, 13.67578125, 14.3359375, 14.99609375, 15.65625, 16.31640625, 16.9765625, 17.63671875, 18.296875, 18.95703125, 19.6171875, 20.27734375, 20.9375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 2.0, 1.0, 6.0, 5.0, 10.0, 17.0, 16.0, 20.0, 24.0, 28.0, 25.0, 28.0, 51.0, 47.0, 53.0, 63.0, 82.0, 71.0, 50.0, 67.0, 60.0, 40.0, 44.0, 40.0, 34.0, 26.0, 20.0, 17.0, 11.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -36.35205078125, -35.2353515625, -34.11865234375, -33.001953125, -31.88525390625, -30.7685546875, -29.65185546875, -28.53515625, -27.41845703125, -26.3017578125, -25.18505859375, -24.068359375, -22.95166015625, -21.8349609375, -20.71826171875, -19.6015625, -18.48486328125, -17.3681640625, -16.25146484375, -15.134765625, -14.01806640625, -12.9013671875, -11.78466796875, -10.66796875, -9.55126953125, -8.4345703125, -7.31787109375, -6.201171875, -5.08447265625, -3.9677734375, -2.85107421875, -1.734375, -0.61767578125, 0.4990234375, 1.61572265625, 2.732421875, 3.84912109375, 4.9658203125, 6.08251953125, 7.19921875, 8.31591796875, 9.4326171875, 10.54931640625, 11.666015625, 12.78271484375, 13.8994140625, 15.01611328125, 16.1328125, 17.24951171875, 18.3662109375, 19.48291015625, 20.599609375, 21.71630859375, 22.8330078125, 23.94970703125, 25.06640625, 26.18310546875, 27.2998046875, 28.41650390625, 29.533203125, 30.64990234375, 31.7666015625, 32.88330078125, 34.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 12.0, 6.0, 12.0, 25.0, 18.0, 45.0, 93.0, 162.0, 347.0, 780.0, 2268.0, 9506.0, 79436.0, 878019.0, 65720.0, 8550.0, 2085.0, 716.0, 330.0, 165.0, 85.0, 56.0, 31.0, 16.0, 10.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 7.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.53271484375, -7.3076171875, -7.08251953125, -6.857421875, -6.63232421875, -6.4072265625, -6.18212890625, -5.95703125, -5.73193359375, -5.5068359375, -5.28173828125, -5.056640625, -4.83154296875, -4.6064453125, -4.38134765625, -4.15625, -3.93115234375, -3.7060546875, -3.48095703125, -3.255859375, -3.03076171875, -2.8056640625, -2.58056640625, -2.35546875, -2.13037109375, -1.9052734375, -1.68017578125, -1.455078125, -1.22998046875, -1.0048828125, -0.77978515625, -0.5546875, -0.32958984375, -0.1044921875, 0.12060546875, 0.345703125, 0.57080078125, 0.7958984375, 1.02099609375, 1.24609375, 1.47119140625, 1.6962890625, 1.92138671875, 2.146484375, 2.37158203125, 2.5966796875, 2.82177734375, 3.046875, 3.27197265625, 3.4970703125, 3.72216796875, 3.947265625, 4.17236328125, 4.3974609375, 4.62255859375, 4.84765625, 5.07275390625, 5.2978515625, 5.52294921875, 5.748046875, 5.97314453125, 6.1982421875, 6.42333984375, 6.6484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 11.0, 13.0, 23.0, 39.0, 31.0, 53.0, 96.0, 175.0, 185.0, 111.0, 63.0, 44.0, 25.0, 21.0, 17.0, 9.0, 7.0, 13.0, 11.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001689910888671875, -0.001631706953048706, -0.0015735030174255371, -0.0015152990818023682, -0.0014570951461791992, -0.0013988912105560303, -0.0013406872749328613, -0.0012824833393096924, -0.0012242794036865234, -0.0011660754680633545, -0.0011078715324401855, -0.0010496675968170166, -0.0009914636611938477, -0.0009332597255706787, -0.0008750557899475098, -0.0008168518543243408, -0.0007586479187011719, -0.0007004439830780029, -0.000642240047454834, -0.000584036111831665, -0.0005258321762084961, -0.00046762824058532715, -0.0004094243049621582, -0.00035122036933898926, -0.0002930164337158203, -0.00023481249809265137, -0.00017660856246948242, -0.00011840462684631348, -6.020069122314453e-05, -1.996755599975586e-06, 5.620718002319336e-05, 0.0001144111156463623, 0.00017261505126953125, 0.0002308189868927002, 0.00028902292251586914, 0.0003472268581390381, 0.00040543079376220703, 0.000463634729385376, 0.0005218386650085449, 0.0005800426006317139, 0.0006382465362548828, 0.0006964504718780518, 0.0007546544075012207, 0.0008128583431243896, 0.0008710622787475586, 0.0009292662143707275, 0.0009874701499938965, 0.0010456740856170654, 0.0011038780212402344, 0.0011620819568634033, 0.0012202858924865723, 0.0012784898281097412, 0.0013366937637329102, 0.001394897699356079, 0.001453101634979248, 0.001511305570602417, 0.001569509506225586, 0.0016277134418487549, 0.0016859173774719238, 0.0017441213130950928, 0.0018023252487182617, 0.0018605291843414307, 0.0019187331199645996, 0.0019769370555877686, 0.0020351409912109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 10.0, 16.0, 22.0, 40.0, 55.0, 103.0, 151.0, 272.0, 490.0, 1077.0, 2327.0, 6338.0, 23367.0, 147471.0, 766412.0, 77313.0, 14931.0, 4484.0, 1734.0, 810.0, 455.0, 228.0, 153.0, 69.0, 67.0, 40.0, 19.0, 14.0, 17.0, 10.0, 3.0, 9.0, 4.0, 1.0, 9.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.882080078125, -4.72119140625, -4.560302734375, -4.3994140625, -4.238525390625, -4.07763671875, -3.916748046875, -3.755859375, -3.594970703125, -3.43408203125, -3.273193359375, -3.1123046875, -2.951416015625, -2.79052734375, -2.629638671875, -2.46875, -2.307861328125, -2.14697265625, -1.986083984375, -1.8251953125, -1.664306640625, -1.50341796875, -1.342529296875, -1.181640625, -1.020751953125, -0.85986328125, -0.698974609375, -0.5380859375, -0.377197265625, -0.21630859375, -0.055419921875, 0.10546875, 0.266357421875, 0.42724609375, 0.588134765625, 0.7490234375, 0.909912109375, 1.07080078125, 1.231689453125, 1.392578125, 1.553466796875, 1.71435546875, 1.875244140625, 2.0361328125, 2.197021484375, 2.35791015625, 2.518798828125, 2.6796875, 2.840576171875, 3.00146484375, 3.162353515625, 3.3232421875, 3.484130859375, 3.64501953125, 3.805908203125, 3.966796875, 4.127685546875, 4.28857421875, 4.449462890625, 4.6103515625, 4.771240234375, 4.93212890625, 5.093017578125, 5.25390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 9.0, 16.0, 18.0, 30.0, 41.0, 51.0, 65.0, 122.0, 148.0, 131.0, 83.0, 73.0, 56.0, 45.0, 30.0, 17.0, 11.0, 10.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.4825439453125, -6.297119140625, -6.1116943359375, -5.92626953125, -5.7408447265625, -5.555419921875, -5.3699951171875, -5.1845703125, -4.9991455078125, -4.813720703125, -4.6282958984375, -4.44287109375, -4.2574462890625, -4.072021484375, -3.8865966796875, -3.701171875, -3.5157470703125, -3.330322265625, -3.1448974609375, -2.95947265625, -2.7740478515625, -2.588623046875, -2.4031982421875, -2.2177734375, -2.0323486328125, -1.846923828125, -1.6614990234375, -1.47607421875, -1.2906494140625, -1.105224609375, -0.9197998046875, -0.734375, -0.5489501953125, -0.363525390625, -0.1781005859375, 0.00732421875, 0.1927490234375, 0.378173828125, 0.5635986328125, 0.7490234375, 0.9344482421875, 1.119873046875, 1.3052978515625, 1.49072265625, 1.6761474609375, 1.861572265625, 2.0469970703125, 2.232421875, 2.4178466796875, 2.603271484375, 2.7886962890625, 2.97412109375, 3.1595458984375, 3.344970703125, 3.5303955078125, 3.7158203125, 3.9012451171875, 4.086669921875, 4.2720947265625, 4.45751953125, 4.6429443359375, 4.828369140625, 5.0137939453125, 5.19921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 7.0, 15.0, 55.0, 171.0, 480.0, 172.0, 62.0, 23.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-420.51397705078125, -411.8282165527344, -403.1424865722656, -394.45672607421875, -385.77099609375, -377.0852355957031, -368.3995056152344, -359.7137451171875, -351.02801513671875, -342.3422546386719, -333.6565246582031, -324.97076416015625, -316.2850341796875, -307.5992736816406, -298.9135437011719, -290.227783203125, -281.5420227050781, -272.85626220703125, -264.1705322265625, -255.4847869873047, -246.79904174804688, -238.11328125, -229.4275360107422, -220.74179077148438, -212.05604553222656, -203.37030029296875, -194.68455505371094, -185.99880981445312, -177.31304931640625, -168.6273193359375, -159.94155883789062, -151.2558135986328, -142.57008361816406, -133.88433837890625, -125.19859313964844, -116.5128402709961, -107.82709503173828, -99.14134979248047, -90.45559692382812, -81.76985168457031, -73.0841064453125, -64.39836120605469, -55.71261215209961, -47.02686309814453, -38.34111785888672, -29.655372619628906, -20.969623565673828, -12.28387451171875, -3.5981292724609375, 5.087617874145508, 13.773365020751953, 22.4591121673584, 31.144859313964844, 39.830604553222656, 48.516353607177734, 57.20210266113281, 65.88784790039062, 74.57359313964844, 83.25933837890625, 91.9450912475586, 100.6308364868164, 109.31658172607422, 118.00233459472656, 126.68807983398438, 135.3738250732422]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 11.0, 13.0, 10.0, 18.0, 10.0, 15.0, 13.0, 16.0, 13.0, 29.0, 35.0, 39.0, 41.0, 49.0, 101.0, 114.0, 121.0, 63.0, 53.0, 39.0, 21.0, 29.0, 24.0, 15.0, 20.0, 14.0, 7.0, 15.0, 12.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-118.04840087890625, -114.33404541015625, -110.61968231201172, -106.90532684326172, -103.19097137451172, -99.47660827636719, -95.76225280761719, -92.04789733886719, -88.33353424072266, -84.61917877197266, -80.90481567382812, -77.19046020507812, -73.47610473632812, -69.7617416381836, -66.0473861694336, -62.33302688598633, -58.61867141723633, -54.90431213378906, -51.18995666503906, -47.4755973815918, -43.76123809814453, -40.04688262939453, -36.332523345947266, -32.6181640625, -28.903806686401367, -25.189449310302734, -21.47509002685547, -17.760732650756836, -14.046374320983887, -10.332015991210938, -6.617658615112305, -2.903299331665039, 0.8110580444335938, 4.525416374206543, 8.239774703979492, 11.954132080078125, 15.668490409851074, 19.382848739624023, 23.097206115722656, 26.811565399169922, 30.525922775268555, 34.24028015136719, 37.95463943481445, 41.66899871826172, 45.38335418701172, 49.097713470458984, 52.81207275390625, 56.52642822265625, 60.240787506103516, 63.95514678955078, 67.66950225830078, 71.38386535644531, 75.09822082519531, 78.81257629394531, 82.52693176269531, 86.24129486083984, 89.95565032958984, 93.67000579833984, 97.38436889648438, 101.09872436523438, 104.81307983398438, 108.5274429321289, 112.2417984008789, 115.95616149902344, 119.67051696777344]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 12.0, 9.0, 18.0, 27.0, 37.0, 65.0, 103.0, 177.0, 373.0, 842.0, 1965.0, 5442.0, 22283.0, 171352.0, 1504604.0, 2192646.0, 253025.0, 29797.0, 7072.0, 2379.0, 1028.0, 465.0, 205.0, 120.0, 81.0, 48.0, 33.0, 16.0, 11.0, 11.0, 10.0, 5.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.6229248046875, -11.159912109375, -10.6968994140625, -10.23388671875, -9.7708740234375, -9.307861328125, -8.8448486328125, -8.3818359375, -7.9188232421875, -7.455810546875, -6.9927978515625, -6.52978515625, -6.0667724609375, -5.603759765625, -5.1407470703125, -4.677734375, -4.2147216796875, -3.751708984375, -3.2886962890625, -2.82568359375, -2.3626708984375, -1.899658203125, -1.4366455078125, -0.9736328125, -0.5106201171875, -0.047607421875, 0.4154052734375, 0.87841796875, 1.3414306640625, 1.804443359375, 2.2674560546875, 2.73046875, 3.1934814453125, 3.656494140625, 4.1195068359375, 4.58251953125, 5.0455322265625, 5.508544921875, 5.9715576171875, 6.4345703125, 6.8975830078125, 7.360595703125, 7.8236083984375, 8.28662109375, 8.7496337890625, 9.212646484375, 9.6756591796875, 10.138671875, 10.6016845703125, 11.064697265625, 11.5277099609375, 11.99072265625, 12.4537353515625, 12.916748046875, 13.3797607421875, 13.8427734375, 14.3057861328125, 14.768798828125, 15.2318115234375, 15.69482421875, 16.1578369140625, 16.620849609375, 17.0838623046875, 17.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 10.0, 21.0, 21.0, 20.0, 40.0, 32.0, 48.0, 71.0, 53.0, 49.0, 48.0, 67.0, 53.0, 65.0, 49.0, 48.0, 49.0, 58.0, 33.0, 34.0, 24.0, 18.0, 22.0, 9.0, 6.0, 10.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0548095703125, -8.773681640625, -8.4925537109375, -8.21142578125, -7.9302978515625, -7.649169921875, -7.3680419921875, -7.0869140625, -6.8057861328125, -6.524658203125, -6.2435302734375, -5.96240234375, -5.6812744140625, -5.400146484375, -5.1190185546875, -4.837890625, -4.5567626953125, -4.275634765625, -3.9945068359375, -3.71337890625, -3.4322509765625, -3.151123046875, -2.8699951171875, -2.5888671875, -2.3077392578125, -2.026611328125, -1.7454833984375, -1.46435546875, -1.1832275390625, -0.902099609375, -0.6209716796875, -0.33984375, -0.0587158203125, 0.222412109375, 0.5035400390625, 0.78466796875, 1.0657958984375, 1.346923828125, 1.6280517578125, 1.9091796875, 2.1903076171875, 2.471435546875, 2.7525634765625, 3.03369140625, 3.3148193359375, 3.595947265625, 3.8770751953125, 4.158203125, 4.4393310546875, 4.720458984375, 5.0015869140625, 5.28271484375, 5.5638427734375, 5.844970703125, 6.1260986328125, 6.4072265625, 6.6883544921875, 6.969482421875, 7.2506103515625, 7.53173828125, 7.8128662109375, 8.093994140625, 8.3751220703125, 8.65625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 4.0, 6.0, 7.0, 9.0, 11.0, 11.0, 26.0, 38.0, 59.0, 75.0, 97.0, 151.0, 248.0, 441.0, 805.0, 1603.0, 4211.0, 18885.0, 446685.0, 3650624.0, 57068.0, 7962.0, 2550.0, 1153.0, 565.0, 346.0, 211.0, 131.0, 78.0, 56.0, 48.0, 33.0, 21.0, 15.0, 12.0, 8.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-31.9375, -30.9462890625, -29.955078125, -28.9638671875, -27.97265625, -26.9814453125, -25.990234375, -24.9990234375, -24.0078125, -23.0166015625, -22.025390625, -21.0341796875, -20.04296875, -19.0517578125, -18.060546875, -17.0693359375, -16.078125, -15.0869140625, -14.095703125, -13.1044921875, -12.11328125, -11.1220703125, -10.130859375, -9.1396484375, -8.1484375, -7.1572265625, -6.166015625, -5.1748046875, -4.18359375, -3.1923828125, -2.201171875, -1.2099609375, -0.21875, 0.7724609375, 1.763671875, 2.7548828125, 3.74609375, 4.7373046875, 5.728515625, 6.7197265625, 7.7109375, 8.7021484375, 9.693359375, 10.6845703125, 11.67578125, 12.6669921875, 13.658203125, 14.6494140625, 15.640625, 16.6318359375, 17.623046875, 18.6142578125, 19.60546875, 20.5966796875, 21.587890625, 22.5791015625, 23.5703125, 24.5615234375, 25.552734375, 26.5439453125, 27.53515625, 28.5263671875, 29.517578125, 30.5087890625, 31.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 11.0, 15.0, 16.0, 35.0, 36.0, 86.0, 114.0, 176.0, 324.0, 569.0, 752.0, 627.0, 439.0, 292.0, 174.0, 109.0, 85.0, 54.0, 31.0, 32.0, 16.0, 15.0, 10.0, 8.0, 10.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.779052734375, -23.99560546875, -23.212158203125, -22.4287109375, -21.645263671875, -20.86181640625, -20.078369140625, -19.294921875, -18.511474609375, -17.72802734375, -16.944580078125, -16.1611328125, -15.377685546875, -14.59423828125, -13.810791015625, -13.02734375, -12.243896484375, -11.46044921875, -10.677001953125, -9.8935546875, -9.110107421875, -8.32666015625, -7.543212890625, -6.759765625, -5.976318359375, -5.19287109375, -4.409423828125, -3.6259765625, -2.842529296875, -2.05908203125, -1.275634765625, -0.4921875, 0.291259765625, 1.07470703125, 1.858154296875, 2.6416015625, 3.425048828125, 4.20849609375, 4.991943359375, 5.775390625, 6.558837890625, 7.34228515625, 8.125732421875, 8.9091796875, 9.692626953125, 10.47607421875, 11.259521484375, 12.04296875, 12.826416015625, 13.60986328125, 14.393310546875, 15.1767578125, 15.960205078125, 16.74365234375, 17.527099609375, 18.310546875, 19.093994140625, 19.87744140625, 20.660888671875, 21.4443359375, 22.227783203125, 23.01123046875, 23.794677734375, 24.578125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 9.0, 13.0, 14.0, 32.0, 56.0, 121.0, 186.0, 197.0, 143.0, 79.0, 52.0, 22.0, 14.0, 9.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-195.37460327148438, -187.87167358398438, -180.3687286376953, -172.8657989501953, -165.36285400390625, -157.85992431640625, -150.35699462890625, -142.8540496826172, -135.3511199951172, -127.84818267822266, -120.34524536132812, -112.84231567382812, -105.3393783569336, -97.83644104003906, -90.33350372314453, -82.83056640625, -75.32762908935547, -67.82469177246094, -60.32175827026367, -52.81882095336914, -45.315887451171875, -37.812950134277344, -30.310012817382812, -22.807079315185547, -15.304141998291016, -7.801206111907959, -0.29827022552490234, 7.2046661376953125, 14.707601547241211, 22.21053695678711, 29.71347427368164, 37.216407775878906, 44.71934509277344, 52.22228240966797, 59.725215911865234, 67.2281494140625, 74.73108673095703, 82.23402404785156, 89.7369613647461, 97.23989868164062, 104.74282836914062, 112.24576568603516, 119.74870300292969, 127.25163269042969, 134.75457763671875, 142.25750732421875, 149.76043701171875, 157.2633819580078, 164.76632690429688, 172.26925659179688, 179.77220153808594, 187.27513122558594, 194.778076171875, 202.281005859375, 209.783935546875, 217.28688049316406, 224.78981018066406, 232.29273986816406, 239.79568481445312, 247.29861450195312, 254.8015594482422, 262.30450439453125, 269.80743408203125, 277.31036376953125, 284.81329345703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 8.0, 6.0, 10.0, 4.0, 13.0, 18.0, 17.0, 18.0, 12.0, 29.0, 35.0, 28.0, 30.0, 41.0, 30.0, 40.0, 56.0, 50.0, 61.0, 85.0, 66.0, 43.0, 46.0, 54.0, 35.0, 28.0, 25.0, 32.0, 17.0, 13.0, 9.0, 17.0, 7.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-147.8236846923828, -143.45022583007812, -139.07676696777344, -134.70330810546875, -130.32986450195312, -125.9563980102539, -121.58294677734375, -117.20948791503906, -112.83602905273438, -108.46257019042969, -104.089111328125, -99.71566009521484, -95.34220123291016, -90.96874237060547, -86.59529113769531, -82.22183227539062, -77.84837341308594, -73.47491455078125, -69.10145568847656, -64.7280044555664, -60.35454559326172, -55.98108673095703, -51.60763168334961, -47.23417663574219, -42.8607177734375, -38.48725891113281, -34.11380386352539, -29.740346908569336, -25.36688995361328, -20.993432998657227, -16.619976043701172, -12.246519088745117, -7.8730621337890625, -3.499605178833008, 0.8738517761230469, 5.247308731079102, 9.620765686035156, 13.994222640991211, 18.367679595947266, 22.74113655090332, 27.114593505859375, 31.48805046081543, 35.861507415771484, 40.234962463378906, 44.608421325683594, 48.98188018798828, 53.3553352355957, 57.728790283203125, 62.10224914550781, 66.4757080078125, 70.84916687011719, 75.22261810302734, 79.59607696533203, 83.96953582763672, 88.34298706054688, 92.71644592285156, 97.08990478515625, 101.46336364746094, 105.83682250976562, 110.21027374267578, 114.58373260498047, 118.95719146728516, 123.33064270019531, 127.7041015625, 132.0775604248047]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 11.0, 13.0, 20.0, 32.0, 34.0, 56.0, 63.0, 106.0, 163.0, 265.0, 422.0, 683.0, 1280.0, 2309.0, 4740.0, 10502.0, 27111.0, 85213.0, 354054.0, 412137.0, 96642.0, 30291.0, 11477.0, 4994.0, 2593.0, 1397.0, 754.0, 441.0, 269.0, 181.0, 89.0, 71.0, 38.0, 27.0, 17.0, 12.0, 12.0, 8.0, 5.0, 10.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.381103515625, -10.03564453125, -9.690185546875, -9.3447265625, -8.999267578125, -8.65380859375, -8.308349609375, -7.962890625, -7.617431640625, -7.27197265625, -6.926513671875, -6.5810546875, -6.235595703125, -5.89013671875, -5.544677734375, -5.19921875, -4.853759765625, -4.50830078125, -4.162841796875, -3.8173828125, -3.471923828125, -3.12646484375, -2.781005859375, -2.435546875, -2.090087890625, -1.74462890625, -1.399169921875, -1.0537109375, -0.708251953125, -0.36279296875, -0.017333984375, 0.328125, 0.673583984375, 1.01904296875, 1.364501953125, 1.7099609375, 2.055419921875, 2.40087890625, 2.746337890625, 3.091796875, 3.437255859375, 3.78271484375, 4.128173828125, 4.4736328125, 4.819091796875, 5.16455078125, 5.510009765625, 5.85546875, 6.200927734375, 6.54638671875, 6.891845703125, 7.2373046875, 7.582763671875, 7.92822265625, 8.273681640625, 8.619140625, 8.964599609375, 9.31005859375, 9.655517578125, 10.0009765625, 10.346435546875, 10.69189453125, 11.037353515625, 11.3828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 10.0, 8.0, 9.0, 17.0, 25.0, 21.0, 19.0, 38.0, 50.0, 38.0, 58.0, 70.0, 57.0, 55.0, 81.0, 45.0, 49.0, 56.0, 51.0, 41.0, 39.0, 34.0, 21.0, 25.0, 17.0, 17.0, 19.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.5838623046875, -8.269287109375, -7.9547119140625, -7.64013671875, -7.3255615234375, -7.010986328125, -6.6964111328125, -6.3818359375, -6.0672607421875, -5.752685546875, -5.4381103515625, -5.12353515625, -4.8089599609375, -4.494384765625, -4.1798095703125, -3.865234375, -3.5506591796875, -3.236083984375, -2.9215087890625, -2.60693359375, -2.2923583984375, -1.977783203125, -1.6632080078125, -1.3486328125, -1.0340576171875, -0.719482421875, -0.4049072265625, -0.09033203125, 0.2242431640625, 0.538818359375, 0.8533935546875, 1.16796875, 1.4825439453125, 1.797119140625, 2.1116943359375, 2.42626953125, 2.7408447265625, 3.055419921875, 3.3699951171875, 3.6845703125, 3.9991455078125, 4.313720703125, 4.6282958984375, 4.94287109375, 5.2574462890625, 5.572021484375, 5.8865966796875, 6.201171875, 6.5157470703125, 6.830322265625, 7.1448974609375, 7.45947265625, 7.7740478515625, 8.088623046875, 8.4031982421875, 8.7177734375, 9.0323486328125, 9.346923828125, 9.6614990234375, 9.97607421875, 10.2906494140625, 10.605224609375, 10.9197998046875, 11.234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 17.0, 17.0, 15.0, 26.0, 45.0, 39.0, 72.0, 109.0, 176.0, 244.0, 447.0, 841.0, 2094.0, 9213.0, 127827.0, 859903.0, 39420.0, 5059.0, 1431.0, 588.0, 338.0, 202.0, 135.0, 88.0, 48.0, 41.0, 28.0, 25.0, 13.0, 15.0, 12.0, 6.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.9140625, -15.3712158203125, -14.828369140625, -14.2855224609375, -13.74267578125, -13.1998291015625, -12.656982421875, -12.1141357421875, -11.5712890625, -11.0284423828125, -10.485595703125, -9.9427490234375, -9.39990234375, -8.8570556640625, -8.314208984375, -7.7713623046875, -7.228515625, -6.6856689453125, -6.142822265625, -5.5999755859375, -5.05712890625, -4.5142822265625, -3.971435546875, -3.4285888671875, -2.8857421875, -2.3428955078125, -1.800048828125, -1.2572021484375, -0.71435546875, -0.1715087890625, 0.371337890625, 0.9141845703125, 1.45703125, 1.9998779296875, 2.542724609375, 3.0855712890625, 3.62841796875, 4.1712646484375, 4.714111328125, 5.2569580078125, 5.7998046875, 6.3426513671875, 6.885498046875, 7.4283447265625, 7.97119140625, 8.5140380859375, 9.056884765625, 9.5997314453125, 10.142578125, 10.6854248046875, 11.228271484375, 11.7711181640625, 12.31396484375, 12.8568115234375, 13.399658203125, 13.9425048828125, 14.4853515625, 15.0281982421875, 15.571044921875, 16.1138916015625, 16.65673828125, 17.1995849609375, 17.742431640625, 18.2852783203125, 18.828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 7.0, 6.0, 8.0, 9.0, 15.0, 13.0, 19.0, 11.0, 29.0, 17.0, 27.0, 41.0, 31.0, 31.0, 31.0, 54.0, 60.0, 68.0, 68.0, 55.0, 47.0, 51.0, 42.0, 29.0, 32.0, 32.0, 26.0, 22.0, 22.0, 15.0, 14.0, 11.0, 10.0, 4.0, 3.0, 7.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0, -24.143310546875, -23.28662109375, -22.429931640625, -21.5732421875, -20.716552734375, -19.85986328125, -19.003173828125, -18.146484375, -17.289794921875, -16.43310546875, -15.576416015625, -14.7197265625, -13.863037109375, -13.00634765625, -12.149658203125, -11.29296875, -10.436279296875, -9.57958984375, -8.722900390625, -7.8662109375, -7.009521484375, -6.15283203125, -5.296142578125, -4.439453125, -3.582763671875, -2.72607421875, -1.869384765625, -1.0126953125, -0.156005859375, 0.70068359375, 1.557373046875, 2.4140625, 3.270751953125, 4.12744140625, 4.984130859375, 5.8408203125, 6.697509765625, 7.55419921875, 8.410888671875, 9.267578125, 10.124267578125, 10.98095703125, 11.837646484375, 12.6943359375, 13.551025390625, 14.40771484375, 15.264404296875, 16.12109375, 16.977783203125, 17.83447265625, 18.691162109375, 19.5478515625, 20.404541015625, 21.26123046875, 22.117919921875, 22.974609375, 23.831298828125, 24.68798828125, 25.544677734375, 26.4013671875, 27.258056640625, 28.11474609375, 28.971435546875, 29.828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 8.0, 11.0, 9.0, 20.0, 17.0, 44.0, 59.0, 82.0, 156.0, 204.0, 377.0, 725.0, 1582.0, 4013.0, 13451.0, 76381.0, 871274.0, 61597.0, 11775.0, 3667.0, 1511.0, 647.0, 313.0, 182.0, 124.0, 90.0, 60.0, 40.0, 26.0, 20.0, 20.0, 14.0, 11.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.412109375, -2.339996337890625, -2.26788330078125, -2.195770263671875, -2.1236572265625, -2.051544189453125, -1.97943115234375, -1.907318115234375, -1.835205078125, -1.763092041015625, -1.69097900390625, -1.618865966796875, -1.5467529296875, -1.474639892578125, -1.40252685546875, -1.330413818359375, -1.25830078125, -1.186187744140625, -1.11407470703125, -1.041961669921875, -0.9698486328125, -0.897735595703125, -0.82562255859375, -0.753509521484375, -0.681396484375, -0.609283447265625, -0.53717041015625, -0.465057373046875, -0.3929443359375, -0.320831298828125, -0.24871826171875, -0.176605224609375, -0.1044921875, -0.032379150390625, 0.03973388671875, 0.111846923828125, 0.1839599609375, 0.256072998046875, 0.32818603515625, 0.400299072265625, 0.472412109375, 0.544525146484375, 0.61663818359375, 0.688751220703125, 0.7608642578125, 0.832977294921875, 0.90509033203125, 0.977203369140625, 1.04931640625, 1.121429443359375, 1.19354248046875, 1.265655517578125, 1.3377685546875, 1.409881591796875, 1.48199462890625, 1.554107666015625, 1.626220703125, 1.698333740234375, 1.77044677734375, 1.842559814453125, 1.9146728515625, 1.986785888671875, 2.05889892578125, 2.131011962890625, 2.203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 3.0, 8.0, 10.0, 10.0, 11.0, 16.0, 18.0, 20.0, 18.0, 47.0, 45.0, 93.0, 140.0, 152.0, 129.0, 67.0, 50.0, 31.0, 33.0, 18.0, 22.0, 4.0, 7.0, 4.0, 4.0, 5.0, 2.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0009822845458984375, -0.0009566321969032288, -0.00093097984790802, -0.0009053274989128113, -0.0008796751499176025, -0.0008540228009223938, -0.0008283704519271851, -0.0008027181029319763, -0.0007770657539367676, -0.0007514134049415588, -0.0007257610559463501, -0.0007001087069511414, -0.0006744563579559326, -0.0006488040089607239, -0.0006231516599655151, -0.0005974993109703064, -0.0005718469619750977, -0.0005461946129798889, -0.0005205422639846802, -0.0004948899149894714, -0.0004692375659942627, -0.00044358521699905396, -0.0004179328680038452, -0.0003922805190086365, -0.00036662817001342773, -0.000340975821018219, -0.00031532347202301025, -0.0002896711230278015, -0.0002640187740325928, -0.00023836642503738403, -0.0002127140760421753, -0.00018706172704696655, -0.0001614093780517578, -0.00013575702905654907, -0.00011010468006134033, -8.445233106613159e-05, -5.879998207092285e-05, -3.314763307571411e-05, -7.495284080505371e-06, 1.815706491470337e-05, 4.380941390991211e-05, 6.946176290512085e-05, 9.511411190032959e-05, 0.00012076646089553833, 0.00014641880989074707, 0.0001720711588859558, 0.00019772350788116455, 0.0002233758568763733, 0.00024902820587158203, 0.00027468055486679077, 0.0003003329038619995, 0.00032598525285720825, 0.000351637601852417, 0.00037728995084762573, 0.00040294229984283447, 0.0004285946488380432, 0.00045424699783325195, 0.0004798993468284607, 0.0005055516958236694, 0.0005312040448188782, 0.0005568563938140869, 0.0005825087428092957, 0.0006081610918045044, 0.0006338134407997131, 0.0006594657897949219]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 10.0, 9.0, 8.0, 11.0, 16.0, 25.0, 33.0, 55.0, 71.0, 108.0, 152.0, 208.0, 421.0, 614.0, 1116.0, 2070.0, 3917.0, 8362.0, 19488.0, 57229.0, 619179.0, 261171.0, 43552.0, 16031.0, 6973.0, 3205.0, 1813.0, 996.0, 622.0, 366.0, 238.0, 147.0, 95.0, 69.0, 45.0, 28.0, 28.0, 15.0, 11.0, 11.0, 12.0, 10.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3994140625, -1.3541107177734375, -1.308807373046875, -1.2635040283203125, -1.21820068359375, -1.1728973388671875, -1.127593994140625, -1.0822906494140625, -1.0369873046875, -0.9916839599609375, -0.946380615234375, -0.9010772705078125, -0.85577392578125, -0.8104705810546875, -0.765167236328125, -0.7198638916015625, -0.674560546875, -0.6292572021484375, -0.583953857421875, -0.5386505126953125, -0.49334716796875, -0.4480438232421875, -0.402740478515625, -0.3574371337890625, -0.3121337890625, -0.2668304443359375, -0.221527099609375, -0.1762237548828125, -0.13092041015625, -0.0856170654296875, -0.040313720703125, 0.0049896240234375, 0.05029296875, 0.0955963134765625, 0.140899658203125, 0.1862030029296875, 0.23150634765625, 0.2768096923828125, 0.322113037109375, 0.3674163818359375, 0.4127197265625, 0.4580230712890625, 0.503326416015625, 0.5486297607421875, 0.59393310546875, 0.6392364501953125, 0.684539794921875, 0.7298431396484375, 0.775146484375, 0.8204498291015625, 0.865753173828125, 0.9110565185546875, 0.95635986328125, 1.0016632080078125, 1.046966552734375, 1.0922698974609375, 1.1375732421875, 1.1828765869140625, 1.228179931640625, 1.2734832763671875, 1.31878662109375, 1.3640899658203125, 1.409393310546875, 1.4546966552734375, 1.5]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 23.0, 12.0, 17.0, 32.0, 39.0, 53.0, 70.0, 95.0, 142.0, 121.0, 84.0, 70.0, 41.0, 35.0, 38.0, 16.0, 19.0, 16.0, 8.0, 14.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.296356201171875, -2.21966552734375, -2.142974853515625, -2.0662841796875, -1.989593505859375, -1.91290283203125, -1.836212158203125, -1.759521484375, -1.682830810546875, -1.60614013671875, -1.529449462890625, -1.4527587890625, -1.376068115234375, -1.29937744140625, -1.222686767578125, -1.14599609375, -1.069305419921875, -0.99261474609375, -0.915924072265625, -0.8392333984375, -0.762542724609375, -0.68585205078125, -0.609161376953125, -0.532470703125, -0.455780029296875, -0.37908935546875, -0.302398681640625, -0.2257080078125, -0.149017333984375, -0.07232666015625, 0.004364013671875, 0.0810546875, 0.157745361328125, 0.23443603515625, 0.311126708984375, 0.3878173828125, 0.464508056640625, 0.54119873046875, 0.617889404296875, 0.694580078125, 0.771270751953125, 0.84796142578125, 0.924652099609375, 1.0013427734375, 1.078033447265625, 1.15472412109375, 1.231414794921875, 1.30810546875, 1.384796142578125, 1.46148681640625, 1.538177490234375, 1.6148681640625, 1.691558837890625, 1.76824951171875, 1.844940185546875, 1.921630859375, 1.998321533203125, 2.07501220703125, 2.151702880859375, 2.2283935546875, 2.305084228515625, 2.38177490234375, 2.458465576171875, 2.53515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 19.0, 31.0, 43.0, 166.0, 410.0, 187.0, 58.0, 37.0, 13.0, 8.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.36531829833984, -103.95246887207031, -99.53961181640625, -95.12676239013672, -90.71391296386719, -86.30105590820312, -81.8882064819336, -77.47535705566406, -73.0625, -68.64965057373047, -64.2367935180664, -59.823944091796875, -55.411094665527344, -50.99824142456055, -46.58538818359375, -42.17253875732422, -37.75968933105469, -33.34683609008789, -28.93398666381836, -24.521133422851562, -20.1082820892334, -15.695430755615234, -11.282577514648438, -6.869726181030273, -2.4568748474121094, 1.955976963043213, 6.368828773498535, 10.781681060791016, 15.19453239440918, 19.607383728027344, 24.02023696899414, 28.433088302612305, 32.845947265625, 37.2588005065918, 41.67164993286133, 46.084503173828125, 50.497352600097656, 54.91020584106445, 59.32305908203125, 63.73590850830078, 68.14875793457031, 72.56160736083984, 76.9744644165039, 81.38731384277344, 85.80016326904297, 90.2130126953125, 94.62586975097656, 99.0387191772461, 103.45157623291016, 107.86442565917969, 112.27728271484375, 116.69013214111328, 121.10298156738281, 125.51583862304688, 129.92868041992188, 134.34153747558594, 138.75439453125, 143.16725158691406, 147.58009338378906, 151.99295043945312, 156.4058074951172, 160.8186492919922, 165.23150634765625, 169.6443634033203, 174.0572052001953]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 8.0, 10.0, 11.0, 12.0, 10.0, 10.0, 16.0, 15.0, 17.0, 24.0, 21.0, 25.0, 43.0, 112.0, 98.0, 57.0, 111.0, 138.0, 50.0, 23.0, 19.0, 19.0, 22.0, 7.0, 14.0, 11.0, 18.0, 12.0, 12.0, 6.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.00067138671875, -90.29997253417969, -87.59927368164062, -84.89857482910156, -82.1978759765625, -79.49717712402344, -76.79647827148438, -74.09577941894531, -71.39508056640625, -68.69438171386719, -65.99368286132812, -63.29298400878906, -60.59228515625, -57.89158630371094, -55.190887451171875, -52.49018859863281, -49.789485931396484, -47.08878707885742, -44.38808822631836, -41.6873893737793, -38.986690521240234, -36.28599166870117, -33.585289001464844, -30.884592056274414, -28.18389320373535, -25.48319435119629, -22.782495498657227, -20.08179473876953, -17.38109588623047, -14.680397987365723, -11.979698181152344, -9.278999328613281, -6.578300476074219, -3.877601385116577, -1.1769022941589355, 1.5237970352172852, 4.224495887756348, 6.92519474029541, 9.625894546508789, 12.326593399047852, 15.027292251586914, 17.727991104125977, 20.42868995666504, 23.129390716552734, 25.830089569091797, 28.53078842163086, 31.231487274169922, 33.932186126708984, 36.63288497924805, 39.33358383178711, 42.03428268432617, 44.734981536865234, 47.4356803894043, 50.13637924194336, 52.83708190917969, 55.53778076171875, 58.23847961425781, 60.939178466796875, 63.63987731933594, 66.340576171875, 69.04127502441406, 71.74197387695312, 74.44267272949219, 77.14337158203125, 79.84407043457031]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 6.0, 3.0, 5.0, 4.0, 7.0, 11.0, 14.0, 12.0, 13.0, 15.0, 21.0, 29.0, 30.0, 27.0, 30.0, 41.0, 87.0, 252.0, 85.0, 34.0, 29.0, 25.0, 19.0, 26.0, 19.0, 28.0, 21.0, 17.0, 14.0, 10.0, 9.0, 5.0, 6.0, 5.0, 8.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.25390625, -7.03167724609375, -6.8094482421875, -6.58721923828125, -6.364990234375, -6.14276123046875, -5.9205322265625, -5.69830322265625, -5.47607421875, -5.25384521484375, -5.0316162109375, -4.80938720703125, -4.587158203125, -4.36492919921875, -4.1427001953125, -3.92047119140625, -3.6982421875, -3.47601318359375, -3.2537841796875, -3.03155517578125, -2.809326171875, -2.58709716796875, -2.3648681640625, -2.14263916015625, -1.92041015625, -1.69818115234375, -1.4759521484375, -1.25372314453125, -1.031494140625, -0.80926513671875, -0.5870361328125, -0.36480712890625, -0.142578125, 0.07965087890625, 0.3018798828125, 0.52410888671875, 0.746337890625, 0.96856689453125, 1.1907958984375, 1.41302490234375, 1.63525390625, 1.85748291015625, 2.0797119140625, 2.30194091796875, 2.524169921875, 2.74639892578125, 2.9686279296875, 3.19085693359375, 3.4130859375, 3.63531494140625, 3.8575439453125, 4.07977294921875, 4.302001953125, 4.52423095703125, 4.7464599609375, 4.96868896484375, 5.19091796875, 5.41314697265625, 5.6353759765625, 5.85760498046875, 6.079833984375, 6.30206298828125, 6.5242919921875, 6.74652099609375, 6.96875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 4.0, 2.0, 11.0, 18.0, 21.0, 25.0, 63.0, 89.0, 79.0, 214.0, 595.0, 2002.0, 9564.0, 8338266.0, 32156.0, 3777.0, 938.0, 335.0, 149.0, 78.0, 55.0, 36.0, 25.0, 12.0, 10.0, 13.0, 4.0, 7.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-107.97128295898438, -104.94878387451172, -101.92628479003906, -98.9037857055664, -95.88128662109375, -92.8587875366211, -89.83628845214844, -86.81378173828125, -83.79129028320312, -80.76879119873047, -77.74629211425781, -74.72379302978516, -71.7012939453125, -68.67879486083984, -65.65629577636719, -62.633792877197266, -59.611289978027344, -56.58879089355469, -53.56629180908203, -50.543792724609375, -47.52129364013672, -44.49879455566406, -41.47629165649414, -38.453792572021484, -35.43129348754883, -32.40879440307617, -29.386295318603516, -26.363794326782227, -23.34129524230957, -20.318796157836914, -17.296295166015625, -14.273796081542969, -11.251296997070312, -8.228797912597656, -5.206297874450684, -2.183797836303711, 0.8387012481689453, 3.8612003326416016, 6.883701324462891, 9.906200408935547, 12.928699493408203, 15.95119857788086, 18.973697662353516, 21.996198654174805, 25.01869773864746, 28.041196823120117, 31.063697814941406, 34.08619689941406, 37.10869598388672, 40.131195068359375, 43.15369415283203, 46.17619323730469, 49.198692321777344, 52.22119140625, 55.24369430541992, 58.26619338989258, 61.288692474365234, 64.31119537353516, 67.33369445800781, 70.35619354248047, 73.37869262695312, 76.40119171142578, 79.42369079589844, 82.4461898803711, 85.46868896484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 2.0, 5.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-120.77578735351562, -116.64141082763672, -112.50702667236328, -108.37265014648438, -104.23826599121094, -100.10388946533203, -95.96951293945312, -91.83512878417969, -87.70075225830078, -83.56637573242188, -79.43199157714844, -75.29761505126953, -71.16323852539062, -67.02885437011719, -62.89447784423828, -58.76009750366211, -54.62571716308594, -50.491336822509766, -46.356956481933594, -42.22257995605469, -38.088199615478516, -33.953819274902344, -29.819440841674805, -25.685062408447266, -21.550682067871094, -17.416301727294922, -13.281923294067383, -9.147543907165527, -5.013164520263672, -0.8787841796875, 3.255594253540039, 7.389972686767578, 11.52435302734375, 15.658732414245605, 19.79311180114746, 23.927490234375, 28.061870574951172, 32.196250915527344, 36.33062744140625, 40.46500778198242, 44.599388122558594, 48.733768463134766, 52.86814880371094, 57.002525329589844, 61.136905670166016, 65.27128601074219, 69.4056625366211, 73.5400390625, 77.67442321777344, 81.80879974365234, 85.94318389892578, 90.07756042480469, 94.21194458007812, 98.34632110595703, 102.48069763183594, 106.61508178710938, 110.74945831298828, 114.88383483886719, 119.01821899414062, 123.15259552001953, 127.28697204589844, 131.42135620117188, 135.5557403564453, 139.6901092529297, 143.82449340820312]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 6.0, 12.0, 19.0, 19.0, 37.0, 42.0, 70.0, 110.0, 159.0, 268.0, 454.0, 846.0, 1751.0, 3570.0, 8308.0, 21293.0, 57069.0, 149801.0, 169267.0, 68736.0, 24864.0, 9665.0, 3970.0, 1801.0, 888.0, 465.0, 289.0, 145.0, 106.0, 82.0, 46.0, 31.0, 14.0, 13.0, 12.0, 4.0, 4.0, 5.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-57.0625, -55.166015625, -53.26953125, -51.373046875, -49.4765625, -47.580078125, -45.68359375, -43.787109375, -41.890625, -39.994140625, -38.09765625, -36.201171875, -34.3046875, -32.408203125, -30.51171875, -28.615234375, -26.71875, -24.822265625, -22.92578125, -21.029296875, -19.1328125, -17.236328125, -15.33984375, -13.443359375, -11.546875, -9.650390625, -7.75390625, -5.857421875, -3.9609375, -2.064453125, -0.16796875, 1.728515625, 3.625, 5.521484375, 7.41796875, 9.314453125, 11.2109375, 13.107421875, 15.00390625, 16.900390625, 18.796875, 20.693359375, 22.58984375, 24.486328125, 26.3828125, 28.279296875, 30.17578125, 32.072265625, 33.96875, 35.865234375, 37.76171875, 39.658203125, 41.5546875, 43.451171875, 45.34765625, 47.244140625, 49.140625, 51.037109375, 52.93359375, 54.830078125, 56.7265625, 58.623046875, 60.51953125, 62.416015625, 64.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 5.0, 6.0, 8.0, 9.0, 20.0, 19.0, 17.0, 27.0, 30.0, 39.0, 42.0, 60.0, 51.0, 68.0, 63.0, 69.0, 78.0, 76.0, 50.0, 54.0, 44.0, 28.0, 33.0, 13.0, 15.0, 16.0, 14.0, 6.0, 9.0, 6.0, 6.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.25048828125, -8.9462890625, -8.64208984375, -8.337890625, -8.03369140625, -7.7294921875, -7.42529296875, -7.12109375, -6.81689453125, -6.5126953125, -6.20849609375, -5.904296875, -5.60009765625, -5.2958984375, -4.99169921875, -4.6875, -4.38330078125, -4.0791015625, -3.77490234375, -3.470703125, -3.16650390625, -2.8623046875, -2.55810546875, -2.25390625, -1.94970703125, -1.6455078125, -1.34130859375, -1.037109375, -0.73291015625, -0.4287109375, -0.12451171875, 0.1796875, 0.48388671875, 0.7880859375, 1.09228515625, 1.396484375, 1.70068359375, 2.0048828125, 2.30908203125, 2.61328125, 2.91748046875, 3.2216796875, 3.52587890625, 3.830078125, 4.13427734375, 4.4384765625, 4.74267578125, 5.046875, 5.35107421875, 5.6552734375, 5.95947265625, 6.263671875, 6.56787109375, 6.8720703125, 7.17626953125, 7.48046875, 7.78466796875, 8.0888671875, 8.39306640625, 8.697265625, 9.00146484375, 9.3056640625, 9.60986328125, 9.9140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 17.0, 45.0, 54.0, 112.0, 86.0, 60.0, 45.0, 19.0, 13.0, 5.0, 4.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.49837875366211, -29.815095901489258, -27.131813049316406, -24.448528289794922, -21.76524543762207, -19.08196258544922, -16.398677825927734, -13.715394973754883, -11.032112121582031, -8.34882926940918, -5.665545463562012, -2.9822616577148438, -0.2989788055419922, 2.3843040466308594, 5.067588806152344, 7.750871658325195, 10.434154510498047, 13.117437362670898, 15.800721168518066, 18.484004974365234, 21.167287826538086, 23.850570678710938, 26.533855438232422, 29.217138290405273, 31.900421142578125, 34.58370590209961, 37.26698684692383, 39.95027160644531, 42.63355255126953, 45.316837310791016, 48.0001220703125, 50.68340301513672, 53.36668395996094, 56.04996871948242, 58.73324966430664, 61.416534423828125, 64.09981536865234, 66.78309631347656, 69.46638488769531, 72.14966583251953, 74.83294677734375, 77.51622772216797, 80.19951629638672, 82.88279724121094, 85.56607818603516, 88.24935913085938, 90.93264770507812, 93.61592864990234, 96.2992172241211, 98.98249816894531, 101.66578674316406, 104.34906768798828, 107.0323486328125, 109.71563720703125, 112.39891815185547, 115.08219909667969, 117.76548767089844, 120.44876861572266, 123.1320571899414, 125.81533813476562, 128.49862670898438, 131.18190002441406, 133.8651885986328, 136.54847717285156, 139.23175048828125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 7.0, 10.0, 8.0, 15.0, 19.0, 38.0, 67.0, 79.0, 86.0, 55.0, 32.0, 16.0, 8.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.633628845214844, -50.882179260253906, -49.130733489990234, -47.3792839050293, -45.62783432006836, -43.87638854980469, -42.12493896484375, -40.37348937988281, -38.622039794921875, -36.87059020996094, -35.119144439697266, -33.36769485473633, -31.61624526977539, -29.864797592163086, -28.11334991455078, -26.361900329589844, -24.610454559326172, -22.859006881713867, -21.10755729675293, -19.356109619140625, -17.604660034179688, -15.853212356567383, -14.101764678955078, -12.350316047668457, -10.598867416381836, -8.847418785095215, -7.095970630645752, -5.344522476196289, -3.593073844909668, -1.8416252136230469, -0.09017753601074219, 1.661271095275879, 3.4127235412597656, 5.164172172546387, 6.91562032699585, 8.667068481445312, 10.418517112731934, 12.169965744018555, 13.92141342163086, 15.67286205291748, 17.4243106842041, 19.175758361816406, 20.927207946777344, 22.67865562438965, 24.430103302001953, 26.18155288696289, 27.933000564575195, 29.6844482421875, 31.435897827148438, 33.187347412109375, 34.93879318237305, 36.690242767333984, 38.44169235229492, 40.193138122558594, 41.94458770751953, 43.69603729248047, 45.447486877441406, 47.198936462402344, 48.950382232666016, 50.70183181762695, 52.45328140258789, 54.20472717285156, 55.9561767578125, 57.70762634277344, 59.45907211303711]}, "eval/loss": 0.8383785486221313, "eval/wer": 0.1366748020715519, "eval/runtime": 1219.9567, "eval/samples_per_second": 2.166, "eval/steps_per_second": 0.271} \ No newline at end of file +{"train/loss": 0.2499, "train/learning_rate": 8.907363420427554e-09, "train/epoch": 20.0, "train/global_step": 17840, "_runtime": 122858, "_timestamp": 1647497135, "_step": 17851, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 10.0, 14.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 5.0, 4.0, 9.0, 18.0, 29525.0, 875.0, 16.0, 6.0, 7.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.125, -168.603515625, -165.08203125, -161.560546875, -158.0390625, -154.517578125, -150.99609375, -147.474609375, -143.953125, -140.431640625, -136.91015625, -133.388671875, -129.8671875, -126.345703125, -122.82421875, -119.302734375, -115.78125, -112.259765625, -108.73828125, -105.216796875, -101.6953125, -98.173828125, -94.65234375, -91.130859375, -87.609375, -84.087890625, -80.56640625, -77.044921875, -73.5234375, -70.001953125, -66.48046875, -62.958984375, -59.4375, -55.916015625, -52.39453125, -48.873046875, -45.3515625, -41.830078125, -38.30859375, -34.787109375, -31.265625, -27.744140625, -24.22265625, -20.701171875, -17.1796875, -13.658203125, -10.13671875, -6.615234375, -3.09375, 0.427734375, 3.94921875, 7.470703125, 10.9921875, 14.513671875, 18.03515625, 21.556640625, 25.078125, 28.599609375, 32.12109375, 35.642578125, 39.1640625, 42.685546875, 46.20703125, 49.728515625, 53.25]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 7.0, 3.0, 3.0, 6.0, 8.0, 6.0, 5.0, 13.0, 13.0, 17.0, 19.0, 24.0, 24.0, 22.0, 21.0, 35.0, 37.0, 47.0, 27.0, 39.0, 42.0, 41.0, 58.0, 41.0, 38.0, 43.0, 42.0, 39.0, 39.0, 38.0, 29.0, 20.0, 24.0, 26.0, 15.0, 15.0, 13.0, 6.0, 10.0, 10.0, 4.0, 7.0, 7.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-37.44131088256836, -36.594993591308594, -35.74867630004883, -34.90236282348633, -34.05604553222656, -33.2097282409668, -32.36341094970703, -31.5170955657959, -30.670780181884766, -29.824462890625, -28.978147506713867, -28.1318302154541, -27.28551483154297, -26.439197540283203, -25.592880249023438, -24.746564865112305, -23.90024757385254, -23.053930282592773, -22.20761489868164, -21.361297607421875, -20.514982223510742, -19.668664932250977, -18.822349548339844, -17.976032257080078, -17.129714965820312, -16.283397674560547, -15.437082290649414, -14.590764999389648, -13.744449615478516, -12.89813232421875, -12.0518159866333, -11.205499649047852, -10.359186172485352, -9.512869834899902, -8.666553497314453, -7.820236682891846, -6.9739203453063965, -6.127604007720947, -5.28128719329834, -4.434970855712891, -3.5886545181274414, -2.742338180541992, -1.8960216045379639, -1.0497050285339355, -0.20338869094848633, 0.6429276466369629, 1.4892444610595703, 2.3355607986450195, 3.1818771362304688, 4.028193473815918, 4.874509811401367, 5.720826625823975, 6.567142963409424, 7.413459300994873, 8.25977611541748, 9.10609245300293, 9.952408790588379, 10.798725128173828, 11.645041465759277, 12.491357803344727, 13.337675094604492, 14.183990478515625, 15.03030776977539, 15.87662410736084, 16.72294044494629]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 8.0, 6.0, 9.0, 6.0, 11.0, 9.0, 17.0, 14.0, 31.0, 26.0, 29.0, 23.0, 36.0, 51.0, 43.0, 34.0, 44.0, 50.0, 42.0, 32.0, 52.0, 35.0, 40.0, 48.0, 33.0, 29.0, 20.0, 31.0, 30.0, 16.0, 24.0, 27.0, 13.0, 17.0, 17.0, 10.0, 9.0, 4.0, 4.0, 8.0, 8.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.865875244140625, -26.000263214111328, -25.13465118408203, -24.269039154052734, -23.403425216674805, -22.537813186645508, -21.67220115661621, -20.806589126586914, -19.940975189208984, -19.075363159179688, -18.20975112915039, -17.344139099121094, -16.478525161743164, -15.612913131713867, -14.74730110168457, -13.881689071655273, -13.016077041625977, -12.15046501159668, -11.284852027893066, -10.41923999786377, -9.553627014160156, -8.68801498413086, -7.8224029541015625, -6.956790447235107, -6.091177940368652, -5.225565433502197, -4.359952926635742, -3.4943408966064453, -2.6287283897399902, -1.7631158828735352, -0.8975038528442383, -0.0318913459777832, 0.8337230682373047, 1.6993354558944702, 2.5649478435516357, 3.4305601119995117, 4.296172618865967, 5.161785125732422, 6.027397155761719, 6.893009662628174, 7.758622169494629, 8.624234199523926, 9.489847183227539, 10.355459213256836, 11.221071243286133, 12.086684226989746, 12.952296257019043, 13.817909240722656, 14.683521270751953, 15.54913330078125, 16.414745330810547, 17.280357360839844, 18.145971298217773, 19.01158332824707, 19.877195358276367, 20.742807388305664, 21.608421325683594, 22.47403335571289, 23.339645385742188, 24.205257415771484, 25.070871353149414, 25.93648338317871, 26.802095413208008, 27.667707443237305, 28.5333194732666]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 13.0, 11.0, 18.0, 35.0, 61.0, 87.0, 144.0, 236.0, 381.0, 558.0, 930.0, 1512.0, 2314.0, 3589.0, 5697.0, 8750.0, 12940.0, 19432.0, 27520.0, 38987.0, 51489.0, 67133.0, 81702.0, 94353.0, 120262.0, 107531.0, 91995.0, 79255.0, 64688.0, 50098.0, 37011.0, 26422.0, 18287.0, 12305.0, 8119.0, 5403.0, 3480.0, 2149.0, 1360.0, 858.0, 533.0, 316.0, 200.0, 140.0, 90.0, 56.0, 41.0, 28.0, 18.0, 9.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.25, -85.396484375, -82.54296875, -79.689453125, -76.8359375, -73.982421875, -71.12890625, -68.275390625, -65.421875, -62.568359375, -59.71484375, -56.861328125, -54.0078125, -51.154296875, -48.30078125, -45.447265625, -42.59375, -39.740234375, -36.88671875, -34.033203125, -31.1796875, -28.326171875, -25.47265625, -22.619140625, -19.765625, -16.912109375, -14.05859375, -11.205078125, -8.3515625, -5.498046875, -2.64453125, 0.208984375, 3.0625, 5.916015625, 8.76953125, 11.623046875, 14.4765625, 17.330078125, 20.18359375, 23.037109375, 25.890625, 28.744140625, 31.59765625, 34.451171875, 37.3046875, 40.158203125, 43.01171875, 45.865234375, 48.71875, 51.572265625, 54.42578125, 57.279296875, 60.1328125, 62.986328125, 65.83984375, 68.693359375, 71.546875, 74.400390625, 77.25390625, 80.107421875, 82.9609375, 85.814453125, 88.66796875, 91.521484375, 94.375]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 11.0, 6.0, 13.0, 20.0, 24.0, 14.0, 25.0, 33.0, 35.0, 52.0, 42.0, 43.0, 50.0, 43.0, 73.0, 84.0, 53.0, 57.0, 36.0, 45.0, 46.0, 32.0, 39.0, 16.0, 15.0, 17.0, 18.0, 13.0, 9.0, 11.0, 4.0, 7.0, 6.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5, -52.84619140625, -51.1923828125, -49.53857421875, -47.884765625, -46.23095703125, -44.5771484375, -42.92333984375, -41.26953125, -39.61572265625, -37.9619140625, -36.30810546875, -34.654296875, -33.00048828125, -31.3466796875, -29.69287109375, -28.0390625, -26.38525390625, -24.7314453125, -23.07763671875, -21.423828125, -19.77001953125, -18.1162109375, -16.46240234375, -14.80859375, -13.15478515625, -11.5009765625, -9.84716796875, -8.193359375, -6.53955078125, -4.8857421875, -3.23193359375, -1.578125, 0.07568359375, 1.7294921875, 3.38330078125, 5.037109375, 6.69091796875, 8.3447265625, 9.99853515625, 11.65234375, 13.30615234375, 14.9599609375, 16.61376953125, 18.267578125, 19.92138671875, 21.5751953125, 23.22900390625, 24.8828125, 26.53662109375, 28.1904296875, 29.84423828125, 31.498046875, 33.15185546875, 34.8056640625, 36.45947265625, 38.11328125, 39.76708984375, 41.4208984375, 43.07470703125, 44.728515625, 46.38232421875, 48.0361328125, 49.68994140625, 51.34375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 3.0, 12.0, 5.0, 7.0, 4.0, 18.0, 19.0, 24.0, 31.0, 37.0, 40.0, 42.0, 53.0, 33.0, 37.0, 45.0, 41.0, 56.0, 48.0, 60.0, 46.0, 43.0, 32.0, 37.0, 29.0, 25.0, 29.0, 25.0, 17.0, 12.0, 21.0, 17.0, 12.0, 5.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.385425567626953, -25.43740463256836, -24.489383697509766, -23.541362762451172, -22.59334373474121, -21.645322799682617, -20.697301864624023, -19.74928092956543, -18.80126190185547, -17.853240966796875, -16.90522003173828, -15.957200050354004, -15.009180068969727, -14.061159133911133, -13.113138198852539, -12.165117263793945, -11.217096328735352, -10.269075393676758, -9.32105541229248, -8.373034477233887, -7.425014019012451, -6.476993560791016, -5.528972625732422, -4.580952167510986, -3.632931709289551, -2.6849112510681152, -1.7368905544281006, -0.7888698577880859, 0.1591506004333496, 1.1071710586547852, 2.055191993713379, 3.0032124519348145, 3.95123291015625, 4.8992533683776855, 5.847273826599121, 6.795294761657715, 7.74331521987915, 8.691335678100586, 9.63935661315918, 10.587377548217773, 11.53539752960205, 12.483418464660645, 13.431438446044922, 14.379459381103516, 15.32748031616211, 16.275501251220703, 17.223522186279297, 18.171541213989258, 19.11956214904785, 20.067583084106445, 21.01560401916504, 21.963623046875, 22.911643981933594, 23.859664916992188, 24.80768585205078, 25.755706787109375, 26.70372772216797, 27.651748657226562, 28.599769592285156, 29.54779052734375, 30.49580955505371, 31.443830490112305, 32.39185333251953, 33.33987045288086, 34.28789138793945]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 8.0, 10.0, 13.0, 15.0, 18.0, 18.0, 13.0, 19.0, 24.0, 17.0, 28.0, 28.0, 27.0, 33.0, 37.0, 38.0, 38.0, 34.0, 37.0, 29.0, 32.0, 34.0, 50.0, 35.0, 29.0, 39.0, 29.0, 23.0, 26.0, 23.0, 22.0, 25.0, 22.0, 16.0, 13.0, 16.0, 13.0, 13.0, 7.0, 3.0, 11.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.41060447692871, -23.645917892456055, -22.881229400634766, -22.11654281616211, -21.351856231689453, -20.587169647216797, -19.822481155395508, -19.05779457092285, -18.293106079101562, -17.528419494628906, -16.763731002807617, -15.999044418334961, -15.234357833862305, -14.469670295715332, -13.70498275756836, -12.940296173095703, -12.175609588623047, -11.410922050476074, -10.646235466003418, -9.881547927856445, -9.116861343383789, -8.352173805236816, -7.587486267089844, -6.822799205780029, -6.058112144470215, -5.2934250831604, -4.528738021850586, -3.7640504837036133, -2.999363422393799, -2.2346763610839844, -1.4699888229370117, -0.7053017616271973, 0.059383392333984375, 0.8240705728530884, 1.5887577533721924, 2.353445053100586, 3.1181321144104004, 3.882819175720215, 4.6475067138671875, 5.412193775177002, 6.176880836486816, 6.941567897796631, 7.706254959106445, 8.470942497253418, 9.23563003540039, 10.000316619873047, 10.76500415802002, 11.529691696166992, 12.294378280639648, 13.059065818786621, 13.823752403259277, 14.58843994140625, 15.353126525878906, 16.117813110351562, 16.88250160217285, 17.647188186645508, 18.411876678466797, 19.176563262939453, 19.941251754760742, 20.7059383392334, 21.470624923706055, 22.235313415527344, 23.0, 23.764686584472656, 24.529373168945312]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 0.0, 3.0, 8.0, 18.0, 32.0, 34.0, 52.0, 100.0, 157.0, 221.0, 375.0, 630.0, 1037.0, 1504.0, 2432.0, 3798.0, 5961.0, 9766.0, 15600.0, 24875.0, 39892.0, 65460.0, 105003.0, 171497.0, 273961.0, 430752.0, 634959.0, 751476.0, 601193.0, 398115.0, 250380.0, 154641.0, 95080.0, 58549.0, 35874.0, 22552.0, 13783.0, 8724.0, 5604.0, 3651.0, 2317.0, 1469.0, 901.0, 638.0, 386.0, 280.0, 207.0, 125.0, 71.0, 59.0, 37.0, 16.0, 16.0, 6.0, 3.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-41.5, -40.1357421875, -38.771484375, -37.4072265625, -36.04296875, -34.6787109375, -33.314453125, -31.9501953125, -30.5859375, -29.2216796875, -27.857421875, -26.4931640625, -25.12890625, -23.7646484375, -22.400390625, -21.0361328125, -19.671875, -18.3076171875, -16.943359375, -15.5791015625, -14.21484375, -12.8505859375, -11.486328125, -10.1220703125, -8.7578125, -7.3935546875, -6.029296875, -4.6650390625, -3.30078125, -1.9365234375, -0.572265625, 0.7919921875, 2.15625, 3.5205078125, 4.884765625, 6.2490234375, 7.61328125, 8.9775390625, 10.341796875, 11.7060546875, 13.0703125, 14.4345703125, 15.798828125, 17.1630859375, 18.52734375, 19.8916015625, 21.255859375, 22.6201171875, 23.984375, 25.3486328125, 26.712890625, 28.0771484375, 29.44140625, 30.8056640625, 32.169921875, 33.5341796875, 34.8984375, 36.2626953125, 37.626953125, 38.9912109375, 40.35546875, 41.7197265625, 43.083984375, 44.4482421875, 45.8125]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 12.0, 10.0, 22.0, 13.0, 16.0, 19.0, 23.0, 22.0, 19.0, 30.0, 23.0, 24.0, 40.0, 30.0, 45.0, 34.0, 31.0, 31.0, 27.0, 42.0, 40.0, 39.0, 26.0, 39.0, 27.0, 32.0, 27.0, 14.0, 31.0, 22.0, 26.0, 12.0, 21.0, 16.0, 16.0, 12.0, 18.0, 12.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-20.96875, -20.309326171875, -19.64990234375, -18.990478515625, -18.3310546875, -17.671630859375, -17.01220703125, -16.352783203125, -15.693359375, -15.033935546875, -14.37451171875, -13.715087890625, -13.0556640625, -12.396240234375, -11.73681640625, -11.077392578125, -10.41796875, -9.758544921875, -9.09912109375, -8.439697265625, -7.7802734375, -7.120849609375, -6.46142578125, -5.802001953125, -5.142578125, -4.483154296875, -3.82373046875, -3.164306640625, -2.5048828125, -1.845458984375, -1.18603515625, -0.526611328125, 0.1328125, 0.792236328125, 1.45166015625, 2.111083984375, 2.7705078125, 3.429931640625, 4.08935546875, 4.748779296875, 5.408203125, 6.067626953125, 6.72705078125, 7.386474609375, 8.0458984375, 8.705322265625, 9.36474609375, 10.024169921875, 10.68359375, 11.343017578125, 12.00244140625, 12.661865234375, 13.3212890625, 13.980712890625, 14.64013671875, 15.299560546875, 15.958984375, 16.618408203125, 17.27783203125, 17.937255859375, 18.5966796875, 19.256103515625, 19.91552734375, 20.574951171875, 21.234375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 11.0, 13.0, 5.0, 29.0, 44.0, 67.0, 103.0, 168.0, 251.0, 365.0, 604.0, 976.0, 1532.0, 2343.0, 3750.0, 5927.0, 9563.0, 14926.0, 23821.0, 37469.0, 59351.0, 92981.0, 144844.0, 219601.0, 324507.0, 455309.0, 581203.0, 610101.0, 505410.0, 370667.0, 255806.0, 169993.0, 110137.0, 70691.0, 45003.0, 28529.0, 17916.0, 11100.0, 7026.0, 4359.0, 2848.0, 1764.0, 1187.0, 706.0, 465.0, 323.0, 183.0, 115.0, 74.0, 50.0, 25.0, 18.0, 14.0, 14.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-27.90625, -27.039306640625, -26.17236328125, -25.305419921875, -24.4384765625, -23.571533203125, -22.70458984375, -21.837646484375, -20.970703125, -20.103759765625, -19.23681640625, -18.369873046875, -17.5029296875, -16.635986328125, -15.76904296875, -14.902099609375, -14.03515625, -13.168212890625, -12.30126953125, -11.434326171875, -10.5673828125, -9.700439453125, -8.83349609375, -7.966552734375, -7.099609375, -6.232666015625, -5.36572265625, -4.498779296875, -3.6318359375, -2.764892578125, -1.89794921875, -1.031005859375, -0.1640625, 0.702880859375, 1.56982421875, 2.436767578125, 3.3037109375, 4.170654296875, 5.03759765625, 5.904541015625, 6.771484375, 7.638427734375, 8.50537109375, 9.372314453125, 10.2392578125, 11.106201171875, 11.97314453125, 12.840087890625, 13.70703125, 14.573974609375, 15.44091796875, 16.307861328125, 17.1748046875, 18.041748046875, 18.90869140625, 19.775634765625, 20.642578125, 21.509521484375, 22.37646484375, 23.243408203125, 24.1103515625, 24.977294921875, 25.84423828125, 26.711181640625, 27.578125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 9.0, 10.0, 17.0, 17.0, 27.0, 30.0, 41.0, 40.0, 49.0, 75.0, 94.0, 122.0, 135.0, 163.0, 175.0, 177.0, 235.0, 248.0, 258.0, 237.0, 241.0, 216.0, 218.0, 181.0, 191.0, 135.0, 127.0, 99.0, 92.0, 64.0, 71.0, 49.0, 40.0, 40.0, 27.0, 22.0, 16.0, 26.0, 15.0, 6.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.9765625, -11.58203125, -11.1875, -10.79296875, -10.3984375, -10.00390625, -9.609375, -9.21484375, -8.8203125, -8.42578125, -8.03125, -7.63671875, -7.2421875, -6.84765625, -6.453125, -6.05859375, -5.6640625, -5.26953125, -4.875, -4.48046875, -4.0859375, -3.69140625, -3.296875, -2.90234375, -2.5078125, -2.11328125, -1.71875, -1.32421875, -0.9296875, -0.53515625, -0.140625, 0.25390625, 0.6484375, 1.04296875, 1.4375, 1.83203125, 2.2265625, 2.62109375, 3.015625, 3.41015625, 3.8046875, 4.19921875, 4.59375, 4.98828125, 5.3828125, 5.77734375, 6.171875, 6.56640625, 6.9609375, 7.35546875, 7.75, 8.14453125, 8.5390625, 8.93359375, 9.328125, 9.72265625, 10.1171875, 10.51171875, 10.90625, 11.30078125, 11.6953125, 12.08984375, 12.484375, 12.87890625, 13.2734375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 18.0, 21.0, 17.0, 31.0, 19.0, 31.0, 17.0, 35.0, 53.0, 36.0, 50.0, 47.0, 61.0, 61.0, 54.0, 60.0, 58.0, 47.0, 56.0, 32.0, 30.0, 31.0, 27.0, 18.0, 13.0, 15.0, 16.0, 11.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.50990104675293, -29.452804565429688, -28.395709991455078, -27.338613510131836, -26.281517028808594, -25.224422454833984, -24.167325973510742, -23.1102294921875, -22.05313491821289, -20.99603843688965, -19.93894386291504, -18.881847381591797, -17.824750900268555, -16.767654418945312, -15.710559844970703, -14.653463363647461, -13.596366882324219, -12.539271354675293, -11.48217487335205, -10.425079345703125, -9.367982864379883, -8.310887336730957, -7.253791809082031, -6.196695804595947, -5.139599800109863, -4.082503795623779, -3.0254080295562744, -1.9683122634887695, -0.9112162590026855, 0.14587974548339844, 1.2029752731323242, 2.260071277618408, 3.317169189453125, 4.374265193939209, 5.431361198425293, 6.488456726074219, 7.545552730560303, 8.602648735046387, 9.659744262695312, 10.716840744018555, 11.77393627166748, 12.831031799316406, 13.888128280639648, 14.945223808288574, 16.0023193359375, 17.059415817260742, 18.116512298583984, 19.173606872558594, 20.230703353881836, 21.287799835205078, 22.344894409179688, 23.40199089050293, 24.459087371826172, 25.51618194580078, 26.573278427124023, 27.630374908447266, 28.687469482421875, 29.744565963745117, 30.801660537719727, 31.85875701904297, 32.91585159301758, 33.97294998168945, 35.03004455566406, 36.08713912963867, 37.14423751831055]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 13.0, 7.0, 18.0, 20.0, 21.0, 21.0, 28.0, 26.0, 34.0, 36.0, 38.0, 40.0, 37.0, 38.0, 36.0, 39.0, 50.0, 46.0, 43.0, 31.0, 37.0, 35.0, 25.0, 25.0, 32.0, 29.0, 25.0, 31.0, 19.0, 22.0, 8.0, 17.0, 11.0, 7.0, 11.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.82933235168457, -25.998638153076172, -25.16794204711914, -24.337247848510742, -23.50655174255371, -22.675857543945312, -21.84516143798828, -21.014467239379883, -20.183773040771484, -19.353078842163086, -18.522382736206055, -17.691688537597656, -16.860992431640625, -16.030298233032227, -15.199603080749512, -14.368907928466797, -13.538211822509766, -12.70751667022705, -11.876821517944336, -11.046127319335938, -10.215431213378906, -9.384737014770508, -8.554041862487793, -7.723346710205078, -6.892651557922363, -6.061956405639648, -5.231261253356934, -4.400566577911377, -3.569871425628662, -2.7391762733459473, -1.9084815979003906, -1.0777864456176758, -0.24708938598632812, 0.5836056470870972, 1.4143006801605225, 2.244995594024658, 3.075690746307373, 3.906385898590088, 4.7370805740356445, 5.567775726318359, 6.398470878601074, 7.229166030883789, 8.059861183166504, 8.890556335449219, 9.721250534057617, 10.551946640014648, 11.382640838623047, 12.213335990905762, 13.044031143188477, 13.874726295471191, 14.705421447753906, 15.536115646362305, 16.366811752319336, 17.197505950927734, 18.028202056884766, 18.858896255493164, 19.689590454101562, 20.52028465270996, 21.350980758666992, 22.18167495727539, 23.012371063232422, 23.84306526184082, 24.67375946044922, 25.50445556640625, 26.33515167236328]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 17.0, 19.0, 31.0, 43.0, 77.0, 87.0, 147.0, 224.0, 339.0, 516.0, 854.0, 1359.0, 1890.0, 3049.0, 4505.0, 6896.0, 10347.0, 15084.0, 22622.0, 33123.0, 47921.0, 67835.0, 91363.0, 115509.0, 131494.0, 125950.0, 105654.0, 79613.0, 57718.0, 40394.0, 27504.0, 18776.0, 12876.0, 8414.0, 5651.0, 3673.0, 2466.0, 1545.0, 1020.0, 697.0, 445.0, 323.0, 165.0, 103.0, 83.0, 52.0, 31.0, 23.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-14.734375, -14.28466796875, -13.8349609375, -13.38525390625, -12.935546875, -12.48583984375, -12.0361328125, -11.58642578125, -11.13671875, -10.68701171875, -10.2373046875, -9.78759765625, -9.337890625, -8.88818359375, -8.4384765625, -7.98876953125, -7.5390625, -7.08935546875, -6.6396484375, -6.18994140625, -5.740234375, -5.29052734375, -4.8408203125, -4.39111328125, -3.94140625, -3.49169921875, -3.0419921875, -2.59228515625, -2.142578125, -1.69287109375, -1.2431640625, -0.79345703125, -0.34375, 0.10595703125, 0.5556640625, 1.00537109375, 1.455078125, 1.90478515625, 2.3544921875, 2.80419921875, 3.25390625, 3.70361328125, 4.1533203125, 4.60302734375, 5.052734375, 5.50244140625, 5.9521484375, 6.40185546875, 6.8515625, 7.30126953125, 7.7509765625, 8.20068359375, 8.650390625, 9.10009765625, 9.5498046875, 9.99951171875, 10.44921875, 10.89892578125, 11.3486328125, 11.79833984375, 12.248046875, 12.69775390625, 13.1474609375, 13.59716796875, 14.046875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 6.0, 6.0, 8.0, 10.0, 17.0, 17.0, 16.0, 17.0, 16.0, 29.0, 34.0, 41.0, 37.0, 37.0, 45.0, 36.0, 46.0, 47.0, 38.0, 53.0, 43.0, 36.0, 27.0, 32.0, 38.0, 27.0, 34.0, 34.0, 25.0, 23.0, 20.0, 27.0, 19.0, 12.0, 13.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.796875, -23.990478515625, -23.18408203125, -22.377685546875, -21.5712890625, -20.764892578125, -19.95849609375, -19.152099609375, -18.345703125, -17.539306640625, -16.73291015625, -15.926513671875, -15.1201171875, -14.313720703125, -13.50732421875, -12.700927734375, -11.89453125, -11.088134765625, -10.28173828125, -9.475341796875, -8.6689453125, -7.862548828125, -7.05615234375, -6.249755859375, -5.443359375, -4.636962890625, -3.83056640625, -3.024169921875, -2.2177734375, -1.411376953125, -0.60498046875, 0.201416015625, 1.0078125, 1.814208984375, 2.62060546875, 3.427001953125, 4.2333984375, 5.039794921875, 5.84619140625, 6.652587890625, 7.458984375, 8.265380859375, 9.07177734375, 9.878173828125, 10.6845703125, 11.490966796875, 12.29736328125, 13.103759765625, 13.91015625, 14.716552734375, 15.52294921875, 16.329345703125, 17.1357421875, 17.942138671875, 18.74853515625, 19.554931640625, 20.361328125, 21.167724609375, 21.97412109375, 22.780517578125, 23.5869140625, 24.393310546875, 25.19970703125, 26.006103515625, 26.8125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 6.0, 9.0, 13.0, 11.0, 25.0, 23.0, 42.0, 65.0, 63.0, 132.0, 151.0, 209.0, 301.0, 444.0, 662.0, 951.0, 1321.0, 2091.0, 3223.0, 5351.0, 8662.0, 15274.0, 32503.0, 724323.0, 193773.0, 24985.0, 13108.0, 7510.0, 4683.0, 2910.0, 1873.0, 1240.0, 817.0, 555.0, 355.0, 261.0, 191.0, 125.0, 89.0, 66.0, 57.0, 39.0, 18.0, 19.0, 7.0, 8.0, 6.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.0, -33.86572265625, -32.7314453125, -31.59716796875, -30.462890625, -29.32861328125, -28.1943359375, -27.06005859375, -25.92578125, -24.79150390625, -23.6572265625, -22.52294921875, -21.388671875, -20.25439453125, -19.1201171875, -17.98583984375, -16.8515625, -15.71728515625, -14.5830078125, -13.44873046875, -12.314453125, -11.18017578125, -10.0458984375, -8.91162109375, -7.77734375, -6.64306640625, -5.5087890625, -4.37451171875, -3.240234375, -2.10595703125, -0.9716796875, 0.16259765625, 1.296875, 2.43115234375, 3.5654296875, 4.69970703125, 5.833984375, 6.96826171875, 8.1025390625, 9.23681640625, 10.37109375, 11.50537109375, 12.6396484375, 13.77392578125, 14.908203125, 16.04248046875, 17.1767578125, 18.31103515625, 19.4453125, 20.57958984375, 21.7138671875, 22.84814453125, 23.982421875, 25.11669921875, 26.2509765625, 27.38525390625, 28.51953125, 29.65380859375, 30.7880859375, 31.92236328125, 33.056640625, 34.19091796875, 35.3251953125, 36.45947265625, 37.59375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 11.0, 8.0, 8.0, 12.0, 8.0, 18.0, 14.0, 27.0, 20.0, 30.0, 29.0, 36.0, 42.0, 52.0, 47.0, 54.0, 56.0, 60.0, 59.0, 48.0, 49.0, 39.0, 47.0, 37.0, 35.0, 26.0, 20.0, 24.0, 19.0, 14.0, 11.0, 7.0, 9.0, 2.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.546630859375, -22.68701171875, -21.827392578125, -20.9677734375, -20.108154296875, -19.24853515625, -18.388916015625, -17.529296875, -16.669677734375, -15.81005859375, -14.950439453125, -14.0908203125, -13.231201171875, -12.37158203125, -11.511962890625, -10.65234375, -9.792724609375, -8.93310546875, -8.073486328125, -7.2138671875, -6.354248046875, -5.49462890625, -4.635009765625, -3.775390625, -2.915771484375, -2.05615234375, -1.196533203125, -0.3369140625, 0.522705078125, 1.38232421875, 2.241943359375, 3.1015625, 3.961181640625, 4.82080078125, 5.680419921875, 6.5400390625, 7.399658203125, 8.25927734375, 9.118896484375, 9.978515625, 10.838134765625, 11.69775390625, 12.557373046875, 13.4169921875, 14.276611328125, 15.13623046875, 15.995849609375, 16.85546875, 17.715087890625, 18.57470703125, 19.434326171875, 20.2939453125, 21.153564453125, 22.01318359375, 22.872802734375, 23.732421875, 24.592041015625, 25.45166015625, 26.311279296875, 27.1708984375, 28.030517578125, 28.89013671875, 29.749755859375, 30.609375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 11.0, 4.0, 8.0, 6.0, 15.0, 19.0, 27.0, 33.0, 33.0, 78.0, 105.0, 175.0, 242.0, 429.0, 600.0, 998.0, 1839.0, 3163.0, 5787.0, 10821.0, 23013.0, 101112.0, 823349.0, 40568.0, 16720.0, 8463.0, 4579.0, 2451.0, 1461.0, 892.0, 486.0, 365.0, 230.0, 138.0, 95.0, 68.0, 54.0, 36.0, 29.0, 16.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4921875, -7.26019287109375, -7.0281982421875, -6.79620361328125, -6.564208984375, -6.33221435546875, -6.1002197265625, -5.86822509765625, -5.63623046875, -5.40423583984375, -5.1722412109375, -4.94024658203125, -4.708251953125, -4.47625732421875, -4.2442626953125, -4.01226806640625, -3.7802734375, -3.54827880859375, -3.3162841796875, -3.08428955078125, -2.852294921875, -2.62030029296875, -2.3883056640625, -2.15631103515625, -1.92431640625, -1.69232177734375, -1.4603271484375, -1.22833251953125, -0.996337890625, -0.76434326171875, -0.5323486328125, -0.30035400390625, -0.068359375, 0.16363525390625, 0.3956298828125, 0.62762451171875, 0.859619140625, 1.09161376953125, 1.3236083984375, 1.55560302734375, 1.78759765625, 2.01959228515625, 2.2515869140625, 2.48358154296875, 2.715576171875, 2.94757080078125, 3.1795654296875, 3.41156005859375, 3.6435546875, 3.87554931640625, 4.1075439453125, 4.33953857421875, 4.571533203125, 4.80352783203125, 5.0355224609375, 5.26751708984375, 5.49951171875, 5.73150634765625, 5.9635009765625, 6.19549560546875, 6.427490234375, 6.65948486328125, 6.8914794921875, 7.12347412109375, 7.35546875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 6.0, 10.0, 9.0, 9.0, 9.0, 21.0, 21.0, 28.0, 38.0, 41.0, 59.0, 64.0, 75.0, 77.0, 91.0, 79.0, 68.0, 51.0, 39.0, 25.0, 30.0, 19.0, 18.0, 13.0, 17.0, 16.0, 9.0, 8.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009946823120117188, -0.0009636133909225464, -0.000932544469833374, -0.0009014755487442017, -0.0008704066276550293, -0.0008393377065658569, -0.0008082687854766846, -0.0007771998643875122, -0.0007461309432983398, -0.0007150620222091675, -0.0006839931011199951, -0.0006529241800308228, -0.0006218552589416504, -0.000590786337852478, -0.0005597174167633057, -0.0005286484956741333, -0.0004975795745849609, -0.0004665106534957886, -0.0004354417324066162, -0.00040437281131744385, -0.0003733038902282715, -0.0003422349691390991, -0.00031116604804992676, -0.0002800971269607544, -0.00024902820587158203, -0.00021795928478240967, -0.0001868903636932373, -0.00015582144260406494, -0.00012475252151489258, -9.368360042572021e-05, -6.261467933654785e-05, -3.154575824737549e-05, -4.76837158203125e-07, 3.059208393096924e-05, 6.16610050201416e-05, 9.272992610931396e-05, 0.00012379884719848633, 0.0001548677682876587, 0.00018593668937683105, 0.00021700561046600342, 0.0002480745315551758, 0.00027914345264434814, 0.0003102123737335205, 0.00034128129482269287, 0.00037235021591186523, 0.0004034191370010376, 0.00043448805809020996, 0.0004655569791793823, 0.0004966259002685547, 0.000527694821357727, 0.0005587637424468994, 0.0005898326635360718, 0.0006209015846252441, 0.0006519705057144165, 0.0006830394268035889, 0.0007141083478927612, 0.0007451772689819336, 0.000776246190071106, 0.0008073151111602783, 0.0008383840322494507, 0.000869452953338623, 0.0009005218744277954, 0.0009315907955169678, 0.0009626597166061401, 0.0009937286376953125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 15.0, 12.0, 25.0, 33.0, 47.0, 65.0, 79.0, 154.0, 198.0, 290.0, 414.0, 638.0, 1054.0, 1535.0, 2600.0, 4377.0, 7614.0, 13250.0, 24151.0, 43480.0, 76554.0, 126405.0, 180612.0, 194406.0, 149415.0, 94911.0, 55291.0, 30497.0, 16927.0, 9409.0, 5391.0, 3200.0, 1925.0, 1267.0, 785.0, 463.0, 332.0, 212.0, 143.0, 103.0, 76.0, 58.0, 33.0, 46.0, 26.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.77734375, -3.666900634765625, -3.55645751953125, -3.446014404296875, -3.3355712890625, -3.225128173828125, -3.11468505859375, -3.004241943359375, -2.893798828125, -2.783355712890625, -2.67291259765625, -2.562469482421875, -2.4520263671875, -2.341583251953125, -2.23114013671875, -2.120697021484375, -2.01025390625, -1.899810791015625, -1.78936767578125, -1.678924560546875, -1.5684814453125, -1.458038330078125, -1.34759521484375, -1.237152099609375, -1.126708984375, -1.016265869140625, -0.90582275390625, -0.795379638671875, -0.6849365234375, -0.574493408203125, -0.46405029296875, -0.353607177734375, -0.2431640625, -0.132720947265625, -0.02227783203125, 0.088165283203125, 0.1986083984375, 0.309051513671875, 0.41949462890625, 0.529937744140625, 0.640380859375, 0.750823974609375, 0.86126708984375, 0.971710205078125, 1.0821533203125, 1.192596435546875, 1.30303955078125, 1.413482666015625, 1.52392578125, 1.634368896484375, 1.74481201171875, 1.855255126953125, 1.9656982421875, 2.076141357421875, 2.18658447265625, 2.297027587890625, 2.407470703125, 2.517913818359375, 2.62835693359375, 2.738800048828125, 2.8492431640625, 2.959686279296875, 3.07012939453125, 3.180572509765625, 3.291015625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 7.0, 11.0, 12.0, 11.0, 9.0, 15.0, 25.0, 22.0, 25.0, 45.0, 58.0, 43.0, 64.0, 60.0, 53.0, 80.0, 55.0, 57.0, 61.0, 42.0, 40.0, 37.0, 35.0, 28.0, 24.0, 13.0, 10.0, 6.0, 6.0, 8.0, 13.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.41015625, -1.371368408203125, -1.33258056640625, -1.293792724609375, -1.2550048828125, -1.216217041015625, -1.17742919921875, -1.138641357421875, -1.099853515625, -1.061065673828125, -1.02227783203125, -0.983489990234375, -0.9447021484375, -0.905914306640625, -0.86712646484375, -0.828338623046875, -0.78955078125, -0.750762939453125, -0.71197509765625, -0.673187255859375, -0.6343994140625, -0.595611572265625, -0.55682373046875, -0.518035888671875, -0.479248046875, -0.440460205078125, -0.40167236328125, -0.362884521484375, -0.3240966796875, -0.285308837890625, -0.24652099609375, -0.207733154296875, -0.1689453125, -0.130157470703125, -0.09136962890625, -0.052581787109375, -0.0137939453125, 0.024993896484375, 0.06378173828125, 0.102569580078125, 0.141357421875, 0.180145263671875, 0.21893310546875, 0.257720947265625, 0.2965087890625, 0.335296630859375, 0.37408447265625, 0.412872314453125, 0.45166015625, 0.490447998046875, 0.52923583984375, 0.568023681640625, 0.6068115234375, 0.645599365234375, 0.68438720703125, 0.723175048828125, 0.761962890625, 0.800750732421875, 0.83953857421875, 0.878326416015625, 0.9171142578125, 0.955902099609375, 0.99468994140625, 1.033477783203125, 1.072265625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 13.0, 12.0, 23.0, 22.0, 21.0, 23.0, 31.0, 33.0, 35.0, 47.0, 45.0, 41.0, 44.0, 55.0, 58.0, 58.0, 50.0, 57.0, 52.0, 48.0, 33.0, 35.0, 25.0, 28.0, 28.0, 14.0, 11.0, 8.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.869583129882812, -23.966888427734375, -23.064193725585938, -22.1614990234375, -21.258804321289062, -20.356109619140625, -19.453414916992188, -18.55072021484375, -17.648025512695312, -16.745330810546875, -15.842636108398438, -14.93994140625, -14.037246704101562, -13.134552001953125, -12.231856346130371, -11.329161643981934, -10.42646598815918, -9.523771286010742, -8.621076583862305, -7.718381404876709, -6.8156867027282715, -5.912992000579834, -5.010296821594238, -4.107602119445801, -3.2049074172973633, -2.302212715148926, -1.3995177745819092, -0.4968228340148926, 0.4058718681335449, 1.3085665702819824, 2.211261749267578, 3.1139564514160156, 4.016651153564453, 4.919345855712891, 5.822040557861328, 6.724735736846924, 7.627430438995361, 8.53012466430664, 9.432820320129395, 10.335515022277832, 11.23820972442627, 12.140904426574707, 13.043599128723145, 13.946294784545898, 14.848989486694336, 15.751684188842773, 16.65437889099121, 17.55707359313965, 18.459768295288086, 19.362462997436523, 20.26515769958496, 21.1678524017334, 22.070547103881836, 22.973241806030273, 23.875938415527344, 24.77863311767578, 25.68132781982422, 26.584022521972656, 27.486717224121094, 28.38941192626953, 29.29210662841797, 30.194801330566406, 31.097496032714844, 32.00019073486328, 32.90288543701172]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 16.0, 9.0, 16.0, 19.0, 20.0, 17.0, 25.0, 26.0, 28.0, 37.0, 38.0, 37.0, 38.0, 51.0, 28.0, 45.0, 54.0, 42.0, 35.0, 42.0, 28.0, 34.0, 30.0, 32.0, 30.0, 27.0, 28.0, 31.0, 20.0, 13.0, 15.0, 27.0, 9.0, 6.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.204423904418945, -22.469974517822266, -21.735523223876953, -21.001073837280273, -20.26662254333496, -19.53217315673828, -18.79772186279297, -18.06327247619629, -17.32882308959961, -16.59437370300293, -15.859922409057617, -15.125473022460938, -14.391021728515625, -13.656572341918945, -12.92212200164795, -12.187671661376953, -11.45322036743164, -10.718770027160645, -9.984319686889648, -9.249870300292969, -8.515419006347656, -7.780969142913818, -7.0465192794799805, -6.312068939208984, -5.577618598937988, -4.843168258666992, -4.108717918395996, -3.374268054962158, -2.639817714691162, -1.905367374420166, -1.1709175109863281, -0.43646717071533203, 0.29798126220703125, 1.0324314832687378, 1.7668817043304443, 2.5013318061828613, 3.2357821464538574, 3.9702324867248535, 4.704682350158691, 5.4391326904296875, 6.173583030700684, 6.90803337097168, 7.642483711242676, 8.376934051513672, 9.111383438110352, 9.845834732055664, 10.580284118652344, 11.31473445892334, 12.049184799194336, 12.783635139465332, 13.518085479736328, 14.252534866333008, 14.98698616027832, 15.721435546875, 16.455886840820312, 17.190336227416992, 17.924785614013672, 18.65923500061035, 19.393686294555664, 20.128135681152344, 20.862586975097656, 21.597036361694336, 22.331485748291016, 23.065937042236328, 23.80038833618164]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 11.0, 11.0, 29.0, 37.0, 55.0, 95.0, 143.0, 237.0, 337.0, 530.0, 878.0, 1337.0, 1948.0, 3210.0, 4837.0, 7632.0, 11890.0, 18504.0, 27989.0, 41775.0, 59828.0, 82951.0, 106070.0, 122432.0, 126501.0, 115354.0, 94807.0, 70614.0, 50169.0, 33781.0, 22892.0, 14855.0, 9762.0, 5968.0, 3870.0, 2534.0, 1672.0, 1084.0, 669.0, 425.0, 291.0, 188.0, 118.0, 74.0, 49.0, 37.0, 29.0, 10.0, 9.0, 4.0, 8.0, 4.0, 1.0, 3.0, 3.0], "bins": [-28.765625, -27.900390625, -27.03515625, -26.169921875, -25.3046875, -24.439453125, -23.57421875, -22.708984375, -21.84375, -20.978515625, -20.11328125, -19.248046875, -18.3828125, -17.517578125, -16.65234375, -15.787109375, -14.921875, -14.056640625, -13.19140625, -12.326171875, -11.4609375, -10.595703125, -9.73046875, -8.865234375, -8.0, -7.134765625, -6.26953125, -5.404296875, -4.5390625, -3.673828125, -2.80859375, -1.943359375, -1.078125, -0.212890625, 0.65234375, 1.517578125, 2.3828125, 3.248046875, 4.11328125, 4.978515625, 5.84375, 6.708984375, 7.57421875, 8.439453125, 9.3046875, 10.169921875, 11.03515625, 11.900390625, 12.765625, 13.630859375, 14.49609375, 15.361328125, 16.2265625, 17.091796875, 17.95703125, 18.822265625, 19.6875, 20.552734375, 21.41796875, 22.283203125, 23.1484375, 24.013671875, 24.87890625, 25.744140625, 26.609375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 8.0, 10.0, 18.0, 7.0, 14.0, 19.0, 24.0, 20.0, 20.0, 38.0, 31.0, 33.0, 28.0, 38.0, 33.0, 46.0, 50.0, 28.0, 47.0, 31.0, 32.0, 43.0, 42.0, 43.0, 36.0, 27.0, 32.0, 19.0, 23.0, 27.0, 21.0, 15.0, 20.0, 17.0, 9.0, 10.0, 8.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.796875, -21.098876953125, -20.40087890625, -19.702880859375, -19.0048828125, -18.306884765625, -17.60888671875, -16.910888671875, -16.212890625, -15.514892578125, -14.81689453125, -14.118896484375, -13.4208984375, -12.722900390625, -12.02490234375, -11.326904296875, -10.62890625, -9.930908203125, -9.23291015625, -8.534912109375, -7.8369140625, -7.138916015625, -6.44091796875, -5.742919921875, -5.044921875, -4.346923828125, -3.64892578125, -2.950927734375, -2.2529296875, -1.554931640625, -0.85693359375, -0.158935546875, 0.5390625, 1.237060546875, 1.93505859375, 2.633056640625, 3.3310546875, 4.029052734375, 4.72705078125, 5.425048828125, 6.123046875, 6.821044921875, 7.51904296875, 8.217041015625, 8.9150390625, 9.613037109375, 10.31103515625, 11.009033203125, 11.70703125, 12.405029296875, 13.10302734375, 13.801025390625, 14.4990234375, 15.197021484375, 15.89501953125, 16.593017578125, 17.291015625, 17.989013671875, 18.68701171875, 19.385009765625, 20.0830078125, 20.781005859375, 21.47900390625, 22.177001953125, 22.875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 20.0, 14.0, 23.0, 28.0, 53.0, 82.0, 136.0, 217.0, 325.0, 487.0, 781.0, 1177.0, 1777.0, 2847.0, 4137.0, 6166.0, 9528.0, 13520.0, 19323.0, 27671.0, 38352.0, 50891.0, 65814.0, 80844.0, 93688.0, 101429.0, 102982.0, 94082.0, 82344.0, 66949.0, 52426.0, 39184.0, 28400.0, 20232.0, 14013.0, 9541.0, 6513.0, 4295.0, 2852.0, 1847.0, 1222.0, 848.0, 544.0, 329.0, 211.0, 149.0, 81.0, 76.0, 42.0, 29.0, 17.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-22.859375, -22.14599609375, -21.4326171875, -20.71923828125, -20.005859375, -19.29248046875, -18.5791015625, -17.86572265625, -17.15234375, -16.43896484375, -15.7255859375, -15.01220703125, -14.298828125, -13.58544921875, -12.8720703125, -12.15869140625, -11.4453125, -10.73193359375, -10.0185546875, -9.30517578125, -8.591796875, -7.87841796875, -7.1650390625, -6.45166015625, -5.73828125, -5.02490234375, -4.3115234375, -3.59814453125, -2.884765625, -2.17138671875, -1.4580078125, -0.74462890625, -0.03125, 0.68212890625, 1.3955078125, 2.10888671875, 2.822265625, 3.53564453125, 4.2490234375, 4.96240234375, 5.67578125, 6.38916015625, 7.1025390625, 7.81591796875, 8.529296875, 9.24267578125, 9.9560546875, 10.66943359375, 11.3828125, 12.09619140625, 12.8095703125, 13.52294921875, 14.236328125, 14.94970703125, 15.6630859375, 16.37646484375, 17.08984375, 17.80322265625, 18.5166015625, 19.22998046875, 19.943359375, 20.65673828125, 21.3701171875, 22.08349609375, 22.796875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 8.0, 16.0, 13.0, 17.0, 19.0, 25.0, 26.0, 22.0, 32.0, 31.0, 30.0, 33.0, 31.0, 35.0, 37.0, 47.0, 47.0, 30.0, 43.0, 41.0, 31.0, 35.0, 45.0, 32.0, 32.0, 34.0, 37.0, 32.0, 30.0, 16.0, 9.0, 16.0, 15.0, 9.0, 7.0, 7.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.0625, -16.593505859375, -16.12451171875, -15.655517578125, -15.1865234375, -14.717529296875, -14.24853515625, -13.779541015625, -13.310546875, -12.841552734375, -12.37255859375, -11.903564453125, -11.4345703125, -10.965576171875, -10.49658203125, -10.027587890625, -9.55859375, -9.089599609375, -8.62060546875, -8.151611328125, -7.6826171875, -7.213623046875, -6.74462890625, -6.275634765625, -5.806640625, -5.337646484375, -4.86865234375, -4.399658203125, -3.9306640625, -3.461669921875, -2.99267578125, -2.523681640625, -2.0546875, -1.585693359375, -1.11669921875, -0.647705078125, -0.1787109375, 0.290283203125, 0.75927734375, 1.228271484375, 1.697265625, 2.166259765625, 2.63525390625, 3.104248046875, 3.5732421875, 4.042236328125, 4.51123046875, 4.980224609375, 5.44921875, 5.918212890625, 6.38720703125, 6.856201171875, 7.3251953125, 7.794189453125, 8.26318359375, 8.732177734375, 9.201171875, 9.670166015625, 10.13916015625, 10.608154296875, 11.0771484375, 11.546142578125, 12.01513671875, 12.484130859375, 12.953125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 7.0, 10.0, 18.0, 20.0, 35.0, 53.0, 81.0, 109.0, 199.0, 256.0, 436.0, 651.0, 1161.0, 2046.0, 3313.0, 5582.0, 9923.0, 17664.0, 31659.0, 56208.0, 95968.0, 149091.0, 189343.0, 176799.0, 127086.0, 77757.0, 44498.0, 25192.0, 14065.0, 7982.0, 4674.0, 2666.0, 1576.0, 896.0, 547.0, 373.0, 204.0, 133.0, 87.0, 56.0, 35.0, 35.0, 19.0, 17.0, 11.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-13.640625, -13.2247314453125, -12.808837890625, -12.3929443359375, -11.97705078125, -11.5611572265625, -11.145263671875, -10.7293701171875, -10.3134765625, -9.8975830078125, -9.481689453125, -9.0657958984375, -8.64990234375, -8.2340087890625, -7.818115234375, -7.4022216796875, -6.986328125, -6.5704345703125, -6.154541015625, -5.7386474609375, -5.32275390625, -4.9068603515625, -4.490966796875, -4.0750732421875, -3.6591796875, -3.2432861328125, -2.827392578125, -2.4114990234375, -1.99560546875, -1.5797119140625, -1.163818359375, -0.7479248046875, -0.33203125, 0.0838623046875, 0.499755859375, 0.9156494140625, 1.33154296875, 1.7474365234375, 2.163330078125, 2.5792236328125, 2.9951171875, 3.4110107421875, 3.826904296875, 4.2427978515625, 4.65869140625, 5.0745849609375, 5.490478515625, 5.9063720703125, 6.322265625, 6.7381591796875, 7.154052734375, 7.5699462890625, 7.98583984375, 8.4017333984375, 8.817626953125, 9.2335205078125, 9.6494140625, 10.0653076171875, 10.481201171875, 10.8970947265625, 11.31298828125, 11.7288818359375, 12.144775390625, 12.5606689453125, 12.9765625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 4.0, 8.0, 12.0, 10.0, 22.0, 25.0, 18.0, 43.0, 42.0, 48.0, 58.0, 71.0, 82.0, 87.0, 63.0, 80.0, 60.0, 62.0, 34.0, 39.0, 21.0, 31.0, 15.0, 10.0, 9.0, 7.0, 8.0, 5.0, 6.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00180816650390625, -0.0017583668231964111, -0.0017085671424865723, -0.0016587674617767334, -0.0016089677810668945, -0.0015591681003570557, -0.0015093684196472168, -0.001459568738937378, -0.001409769058227539, -0.0013599693775177002, -0.0013101696968078613, -0.0012603700160980225, -0.0012105703353881836, -0.0011607706546783447, -0.0011109709739685059, -0.001061171293258667, -0.0010113716125488281, -0.0009615719318389893, -0.0009117722511291504, -0.0008619725704193115, -0.0008121728897094727, -0.0007623732089996338, -0.0007125735282897949, -0.0006627738475799561, -0.0006129741668701172, -0.0005631744861602783, -0.0005133748054504395, -0.0004635751247406006, -0.0004137754440307617, -0.00036397576332092285, -0.000314176082611084, -0.0002643764019012451, -0.00021457672119140625, -0.00016477704048156738, -0.00011497735977172852, -6.517767906188965e-05, -1.537799835205078e-05, 3.4421682357788086e-05, 8.422136306762695e-05, 0.00013402104377746582, 0.0001838207244873047, 0.00023362040519714355, 0.0002834200859069824, 0.0003332197666168213, 0.00038301944732666016, 0.000432819128036499, 0.0004826188087463379, 0.0005324184894561768, 0.0005822181701660156, 0.0006320178508758545, 0.0006818175315856934, 0.0007316172122955322, 0.0007814168930053711, 0.00083121657371521, 0.0008810162544250488, 0.0009308159351348877, 0.0009806156158447266, 0.0010304152965545654, 0.0010802149772644043, 0.0011300146579742432, 0.001179814338684082, 0.001229614019393921, 0.0012794137001037598, 0.0013292133808135986, 0.0013790130615234375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 11.0, 11.0, 22.0, 19.0, 38.0, 54.0, 88.0, 121.0, 197.0, 305.0, 521.0, 856.0, 1473.0, 2468.0, 4160.0, 7301.0, 12294.0, 21399.0, 36063.0, 59802.0, 94490.0, 133180.0, 161283.0, 158612.0, 127981.0, 88716.0, 56004.0, 33810.0, 19544.0, 11599.0, 6604.0, 3877.0, 2228.0, 1337.0, 824.0, 477.0, 269.0, 183.0, 125.0, 60.0, 39.0, 32.0, 26.0, 13.0, 17.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.2578125, -9.9365234375, -9.615234375, -9.2939453125, -8.97265625, -8.6513671875, -8.330078125, -8.0087890625, -7.6875, -7.3662109375, -7.044921875, -6.7236328125, -6.40234375, -6.0810546875, -5.759765625, -5.4384765625, -5.1171875, -4.7958984375, -4.474609375, -4.1533203125, -3.83203125, -3.5107421875, -3.189453125, -2.8681640625, -2.546875, -2.2255859375, -1.904296875, -1.5830078125, -1.26171875, -0.9404296875, -0.619140625, -0.2978515625, 0.0234375, 0.3447265625, 0.666015625, 0.9873046875, 1.30859375, 1.6298828125, 1.951171875, 2.2724609375, 2.59375, 2.9150390625, 3.236328125, 3.5576171875, 3.87890625, 4.2001953125, 4.521484375, 4.8427734375, 5.1640625, 5.4853515625, 5.806640625, 6.1279296875, 6.44921875, 6.7705078125, 7.091796875, 7.4130859375, 7.734375, 8.0556640625, 8.376953125, 8.6982421875, 9.01953125, 9.3408203125, 9.662109375, 9.9833984375, 10.3046875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 4.0, 12.0, 9.0, 11.0, 17.0, 18.0, 26.0, 18.0, 41.0, 45.0, 52.0, 66.0, 63.0, 75.0, 57.0, 65.0, 56.0, 74.0, 63.0, 44.0, 32.0, 35.0, 22.0, 24.0, 13.0, 16.0, 14.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.74700927734375, -3.6112060546875, -3.47540283203125, -3.339599609375, -3.20379638671875, -3.0679931640625, -2.93218994140625, -2.79638671875, -2.66058349609375, -2.5247802734375, -2.38897705078125, -2.253173828125, -2.11737060546875, -1.9815673828125, -1.84576416015625, -1.7099609375, -1.57415771484375, -1.4383544921875, -1.30255126953125, -1.166748046875, -1.03094482421875, -0.8951416015625, -0.75933837890625, -0.62353515625, -0.48773193359375, -0.3519287109375, -0.21612548828125, -0.080322265625, 0.05548095703125, 0.1912841796875, 0.32708740234375, 0.462890625, 0.59869384765625, 0.7344970703125, 0.87030029296875, 1.006103515625, 1.14190673828125, 1.2777099609375, 1.41351318359375, 1.54931640625, 1.68511962890625, 1.8209228515625, 1.95672607421875, 2.092529296875, 2.22833251953125, 2.3641357421875, 2.49993896484375, 2.6357421875, 2.77154541015625, 2.9073486328125, 3.04315185546875, 3.178955078125, 3.31475830078125, 3.4505615234375, 3.58636474609375, 3.72216796875, 3.85797119140625, 3.9937744140625, 4.12957763671875, 4.265380859375, 4.40118408203125, 4.5369873046875, 4.67279052734375, 4.80859375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 7.0, 13.0, 3.0, 12.0, 16.0, 29.0, 30.0, 30.0, 37.0, 56.0, 44.0, 39.0, 63.0, 57.0, 67.0, 43.0, 37.0, 50.0, 53.0, 44.0, 45.0, 40.0, 38.0, 39.0, 23.0, 12.0, 16.0, 14.0, 5.0, 4.0, 8.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.73617935180664, -25.854040145874023, -24.971899032592773, -24.089759826660156, -23.20762062072754, -22.325481414794922, -21.443340301513672, -20.561201095581055, -19.679061889648438, -18.79692268371582, -17.91478157043457, -17.032642364501953, -16.150503158569336, -15.268362998962402, -14.386222839355469, -13.504083633422852, -12.621942520141602, -11.739802360534668, -10.85766315460205, -9.975522994995117, -9.0933837890625, -8.211243629455566, -7.329103469848633, -6.446963787078857, -5.564824104309082, -4.682684421539307, -3.800544500350952, -2.9184045791625977, -2.0362648963928223, -1.1541252136230469, -0.2719850540161133, 0.6101546287536621, 1.4922924041748047, 2.37443208694458, 3.2565720081329346, 4.138711929321289, 5.0208516120910645, 5.90299129486084, 6.785131454467773, 7.667271137237549, 8.549410820007324, 9.431550979614258, 10.313690185546875, 11.195830345153809, 12.077970504760742, 12.96010971069336, 13.842249870300293, 14.724390029907227, 15.606529235839844, 16.48866844177246, 17.37080955505371, 18.252948760986328, 19.135087966918945, 20.017227172851562, 20.899368286132812, 21.78150749206543, 22.663646697998047, 23.545785903930664, 24.427927017211914, 25.31006622314453, 26.19220542907715, 27.074344635009766, 27.956485748291016, 28.838624954223633, 29.720766067504883]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 0.0, 5.0, 5.0, 2.0, 11.0, 8.0, 8.0, 11.0, 10.0, 14.0, 7.0, 17.0, 18.0, 25.0, 19.0, 31.0, 22.0, 38.0, 36.0, 40.0, 38.0, 32.0, 51.0, 37.0, 34.0, 38.0, 48.0, 42.0, 32.0, 35.0, 33.0, 21.0, 32.0, 29.0, 23.0, 16.0, 23.0, 14.0, 15.0, 12.0, 13.0, 8.0, 15.0, 11.0, 5.0, 9.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-24.233980178833008, -23.551773071289062, -22.869565963745117, -22.187358856201172, -21.505151748657227, -20.82294464111328, -20.14073944091797, -19.45853042602539, -18.776325225830078, -18.094118118286133, -17.411911010742188, -16.729703903198242, -16.047496795654297, -15.365289688110352, -14.683083534240723, -14.000876426696777, -13.318668365478516, -12.63646125793457, -11.954254150390625, -11.27204704284668, -10.589839935302734, -9.907632827758789, -9.22542667388916, -8.543219566345215, -7.8610124588012695, -7.178805351257324, -6.496598243713379, -5.814391613006592, -5.1321845054626465, -4.449977397918701, -3.767770767211914, -3.0855636596679688, -2.4033584594726562, -1.7211514711380005, -1.0389444828033447, -0.3567376136779785, 0.3254694938659668, 1.007676601409912, 1.6898832321166992, 2.3720903396606445, 3.05429744720459, 3.736504554748535, 4.4187116622924805, 5.100918292999268, 5.783125400543213, 6.465332508087158, 7.147539138793945, 7.829746246337891, 8.511953353881836, 9.194160461425781, 9.876367568969727, 10.558574676513672, 11.240781784057617, 11.922988891601562, 12.605195045471191, 13.287402153015137, 13.969609260559082, 14.651816368103027, 15.334023475646973, 16.0162296295166, 16.698436737060547, 17.380643844604492, 18.062850952148438, 18.745058059692383, 19.427265167236328]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 10.0, 16.0, 20.0, 39.0, 60.0, 95.0, 133.0, 200.0, 294.0, 509.0, 811.0, 1348.0, 2261.0, 3855.0, 6811.0, 11720.0, 21053.0, 39053.0, 73023.0, 141012.0, 273685.0, 518285.0, 843565.0, 919731.0, 625401.0, 338054.0, 174321.0, 91071.0, 47567.0, 25884.0, 14245.0, 8200.0, 4815.0, 2782.0, 1713.0, 1011.0, 617.0, 371.0, 243.0, 140.0, 107.0, 58.0, 35.0, 17.0, 16.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-27.390625, -26.482421875, -25.57421875, -24.666015625, -23.7578125, -22.849609375, -21.94140625, -21.033203125, -20.125, -19.216796875, -18.30859375, -17.400390625, -16.4921875, -15.583984375, -14.67578125, -13.767578125, -12.859375, -11.951171875, -11.04296875, -10.134765625, -9.2265625, -8.318359375, -7.41015625, -6.501953125, -5.59375, -4.685546875, -3.77734375, -2.869140625, -1.9609375, -1.052734375, -0.14453125, 0.763671875, 1.671875, 2.580078125, 3.48828125, 4.396484375, 5.3046875, 6.212890625, 7.12109375, 8.029296875, 8.9375, 9.845703125, 10.75390625, 11.662109375, 12.5703125, 13.478515625, 14.38671875, 15.294921875, 16.203125, 17.111328125, 18.01953125, 18.927734375, 19.8359375, 20.744140625, 21.65234375, 22.560546875, 23.46875, 24.376953125, 25.28515625, 26.193359375, 27.1015625, 28.009765625, 28.91796875, 29.826171875, 30.734375]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 3.0, 5.0, 9.0, 7.0, 9.0, 10.0, 9.0, 13.0, 11.0, 14.0, 17.0, 21.0, 21.0, 28.0, 37.0, 42.0, 32.0, 21.0, 35.0, 46.0, 41.0, 42.0, 35.0, 44.0, 39.0, 38.0, 36.0, 42.0, 31.0, 26.0, 26.0, 32.0, 24.0, 23.0, 12.0, 13.0, 15.0, 21.0, 11.0, 11.0, 10.0, 6.0, 6.0, 12.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.984375, -16.462158203125, -15.93994140625, -15.417724609375, -14.8955078125, -14.373291015625, -13.85107421875, -13.328857421875, -12.806640625, -12.284423828125, -11.76220703125, -11.239990234375, -10.7177734375, -10.195556640625, -9.67333984375, -9.151123046875, -8.62890625, -8.106689453125, -7.58447265625, -7.062255859375, -6.5400390625, -6.017822265625, -5.49560546875, -4.973388671875, -4.451171875, -3.928955078125, -3.40673828125, -2.884521484375, -2.3623046875, -1.840087890625, -1.31787109375, -0.795654296875, -0.2734375, 0.248779296875, 0.77099609375, 1.293212890625, 1.8154296875, 2.337646484375, 2.85986328125, 3.382080078125, 3.904296875, 4.426513671875, 4.94873046875, 5.470947265625, 5.9931640625, 6.515380859375, 7.03759765625, 7.559814453125, 8.08203125, 8.604248046875, 9.12646484375, 9.648681640625, 10.1708984375, 10.693115234375, 11.21533203125, 11.737548828125, 12.259765625, 12.781982421875, 13.30419921875, 13.826416015625, 14.3486328125, 14.870849609375, 15.39306640625, 15.915283203125, 16.4375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 9.0, 22.0, 35.0, 63.0, 99.0, 146.0, 227.0, 345.0, 562.0, 889.0, 1380.0, 2238.0, 3472.0, 5520.0, 8517.0, 13684.0, 21011.0, 33408.0, 52339.0, 82529.0, 127678.0, 196691.0, 295586.0, 423378.0, 556947.0, 618748.0, 542010.0, 405500.0, 280182.0, 186211.0, 121175.0, 78030.0, 49481.0, 31531.0, 20051.0, 12467.0, 7966.0, 4983.0, 3329.0, 2165.0, 1281.0, 878.0, 566.0, 349.0, 225.0, 137.0, 88.0, 62.0, 29.0, 30.0, 16.0, 11.0, 4.0, 0.0, 3.0, 1.0, 1.0], "bins": [-18.046875, -17.490478515625, -16.93408203125, -16.377685546875, -15.8212890625, -15.264892578125, -14.70849609375, -14.152099609375, -13.595703125, -13.039306640625, -12.48291015625, -11.926513671875, -11.3701171875, -10.813720703125, -10.25732421875, -9.700927734375, -9.14453125, -8.588134765625, -8.03173828125, -7.475341796875, -6.9189453125, -6.362548828125, -5.80615234375, -5.249755859375, -4.693359375, -4.136962890625, -3.58056640625, -3.024169921875, -2.4677734375, -1.911376953125, -1.35498046875, -0.798583984375, -0.2421875, 0.314208984375, 0.87060546875, 1.427001953125, 1.9833984375, 2.539794921875, 3.09619140625, 3.652587890625, 4.208984375, 4.765380859375, 5.32177734375, 5.878173828125, 6.4345703125, 6.990966796875, 7.54736328125, 8.103759765625, 8.66015625, 9.216552734375, 9.77294921875, 10.329345703125, 10.8857421875, 11.442138671875, 11.99853515625, 12.554931640625, 13.111328125, 13.667724609375, 14.22412109375, 14.780517578125, 15.3369140625, 15.893310546875, 16.44970703125, 17.006103515625, 17.5625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 11.0, 5.0, 13.0, 5.0, 18.0, 19.0, 22.0, 33.0, 39.0, 34.0, 55.0, 69.0, 69.0, 110.0, 133.0, 157.0, 158.0, 207.0, 238.0, 240.0, 277.0, 263.0, 258.0, 241.0, 224.0, 222.0, 150.0, 138.0, 114.0, 93.0, 89.0, 86.0, 65.0, 58.0, 40.0, 31.0, 25.0, 17.0, 8.0, 16.0, 4.0, 4.0, 1.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.078125, -8.80615234375, -8.5341796875, -8.26220703125, -7.990234375, -7.71826171875, -7.4462890625, -7.17431640625, -6.90234375, -6.63037109375, -6.3583984375, -6.08642578125, -5.814453125, -5.54248046875, -5.2705078125, -4.99853515625, -4.7265625, -4.45458984375, -4.1826171875, -3.91064453125, -3.638671875, -3.36669921875, -3.0947265625, -2.82275390625, -2.55078125, -2.27880859375, -2.0068359375, -1.73486328125, -1.462890625, -1.19091796875, -0.9189453125, -0.64697265625, -0.375, -0.10302734375, 0.1689453125, 0.44091796875, 0.712890625, 0.98486328125, 1.2568359375, 1.52880859375, 1.80078125, 2.07275390625, 2.3447265625, 2.61669921875, 2.888671875, 3.16064453125, 3.4326171875, 3.70458984375, 3.9765625, 4.24853515625, 4.5205078125, 4.79248046875, 5.064453125, 5.33642578125, 5.6083984375, 5.88037109375, 6.15234375, 6.42431640625, 6.6962890625, 6.96826171875, 7.240234375, 7.51220703125, 7.7841796875, 8.05615234375, 8.328125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 10.0, 9.0, 17.0, 10.0, 13.0, 17.0, 24.0, 32.0, 38.0, 36.0, 46.0, 36.0, 50.0, 44.0, 63.0, 46.0, 45.0, 55.0, 54.0, 59.0, 42.0, 26.0, 40.0, 29.0, 35.0, 19.0, 14.0, 16.0, 15.0, 13.0, 7.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.473526000976562, -24.72777557373047, -23.982027053833008, -23.236276626586914, -22.490528106689453, -21.74477767944336, -20.999027252197266, -20.253278732299805, -19.50752830505371, -18.761777877807617, -18.016029357910156, -17.270278930664062, -16.5245304107666, -15.778779983520508, -15.03303050994873, -14.287281036376953, -13.541531562805176, -12.795782089233398, -12.050032615661621, -11.304283142089844, -10.55853271484375, -9.812783241271973, -9.067033767700195, -8.321283340454102, -7.575534343719482, -6.829784870147705, -6.0840349197387695, -5.338285446166992, -4.592535972595215, -3.8467860221862793, -3.101036548614502, -2.3552865982055664, -1.609537124633789, -0.8637874722480774, -0.11803781986236572, 0.6277117729187012, 1.3734614849090576, 2.119211196899414, 2.8649606704711914, 3.610710620880127, 4.356460094451904, 5.102209568023682, 5.847959518432617, 6.5937089920043945, 7.339458465576172, 8.085208892822266, 8.830957412719727, 9.57670783996582, 10.322457313537598, 11.068206787109375, 11.813956260681152, 12.55970573425293, 13.305456161499023, 14.0512056350708, 14.796955108642578, 15.542705535888672, 16.288454055786133, 17.034204483032227, 17.779953002929688, 18.52570343017578, 19.271451950073242, 20.017202377319336, 20.762950897216797, 21.50870132446289, 22.254451751708984]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 6.0, 2.0, 7.0, 3.0, 10.0, 4.0, 6.0, 9.0, 8.0, 10.0, 13.0, 20.0, 18.0, 20.0, 28.0, 30.0, 41.0, 25.0, 39.0, 31.0, 37.0, 48.0, 46.0, 34.0, 37.0, 43.0, 35.0, 35.0, 48.0, 20.0, 42.0, 31.0, 29.0, 32.0, 20.0, 21.0, 25.0, 18.0, 19.0, 18.0, 13.0, 5.0, 4.0, 5.0, 7.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.582006454467773, -20.952877044677734, -20.323745727539062, -19.694616317749023, -19.065486907958984, -18.436357498168945, -17.807228088378906, -17.178096771240234, -16.548967361450195, -15.919837951660156, -15.2907075881958, -14.661577224731445, -14.032447814941406, -13.403318405151367, -12.774188041687012, -12.145057678222656, -11.515928268432617, -10.886798858642578, -10.257668495178223, -9.628538131713867, -8.999408721923828, -8.370279312133789, -7.741148948669434, -7.112019062042236, -6.482889175415039, -5.853759288787842, -5.2246294021606445, -4.595499515533447, -3.96636962890625, -3.3372397422790527, -2.7081098556518555, -2.078979969024658, -1.449850082397461, -0.8207201957702637, -0.1915903091430664, 0.43753957748413086, 1.0666694641113281, 1.6957993507385254, 2.3249292373657227, 2.95405912399292, 3.583189010620117, 4.2123188972473145, 4.841448783874512, 5.470578670501709, 6.099708557128906, 6.7288384437561035, 7.357968330383301, 7.987098217010498, 8.616228103637695, 9.245357513427734, 9.87448787689209, 10.503618240356445, 11.132747650146484, 11.761877059936523, 12.391007423400879, 13.020137786865234, 13.649267196655273, 14.278396606445312, 14.907526969909668, 15.536657333374023, 16.165786743164062, 16.7949161529541, 17.42404556274414, 18.053176879882812, 18.68230628967285]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 11.0, 15.0, 21.0, 37.0, 55.0, 88.0, 157.0, 234.0, 379.0, 650.0, 999.0, 1725.0, 2692.0, 4180.0, 6711.0, 10472.0, 15782.0, 23705.0, 34523.0, 48728.0, 65560.0, 84325.0, 101317.0, 112252.0, 112471.0, 103065.0, 87416.0, 69400.0, 51491.0, 36936.0, 25459.0, 17051.0, 11179.0, 7119.0, 4619.0, 2935.0, 1861.0, 1104.0, 682.0, 405.0, 265.0, 180.0, 131.0, 64.0, 47.0, 25.0, 12.0, 7.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-13.0546875, -12.6717529296875, -12.288818359375, -11.9058837890625, -11.52294921875, -11.1400146484375, -10.757080078125, -10.3741455078125, -9.9912109375, -9.6082763671875, -9.225341796875, -8.8424072265625, -8.45947265625, -8.0765380859375, -7.693603515625, -7.3106689453125, -6.927734375, -6.5447998046875, -6.161865234375, -5.7789306640625, -5.39599609375, -5.0130615234375, -4.630126953125, -4.2471923828125, -3.8642578125, -3.4813232421875, -3.098388671875, -2.7154541015625, -2.33251953125, -1.9495849609375, -1.566650390625, -1.1837158203125, -0.80078125, -0.4178466796875, -0.034912109375, 0.3480224609375, 0.73095703125, 1.1138916015625, 1.496826171875, 1.8797607421875, 2.2626953125, 2.6456298828125, 3.028564453125, 3.4114990234375, 3.79443359375, 4.1773681640625, 4.560302734375, 4.9432373046875, 5.326171875, 5.7091064453125, 6.092041015625, 6.4749755859375, 6.85791015625, 7.2408447265625, 7.623779296875, 8.0067138671875, 8.3896484375, 8.7725830078125, 9.155517578125, 9.5384521484375, 9.92138671875, 10.3043212890625, 10.687255859375, 11.0701904296875, 11.453125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 5.0, 3.0, 11.0, 10.0, 14.0, 15.0, 11.0, 24.0, 24.0, 35.0, 18.0, 32.0, 37.0, 32.0, 60.0, 41.0, 37.0, 41.0, 41.0, 44.0, 42.0, 41.0, 32.0, 36.0, 38.0, 30.0, 27.0, 27.0, 28.0, 33.0, 27.0, 16.0, 13.0, 17.0, 11.0, 10.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.09375, -17.55517578125, -17.0166015625, -16.47802734375, -15.939453125, -15.40087890625, -14.8623046875, -14.32373046875, -13.78515625, -13.24658203125, -12.7080078125, -12.16943359375, -11.630859375, -11.09228515625, -10.5537109375, -10.01513671875, -9.4765625, -8.93798828125, -8.3994140625, -7.86083984375, -7.322265625, -6.78369140625, -6.2451171875, -5.70654296875, -5.16796875, -4.62939453125, -4.0908203125, -3.55224609375, -3.013671875, -2.47509765625, -1.9365234375, -1.39794921875, -0.859375, -0.32080078125, 0.2177734375, 0.75634765625, 1.294921875, 1.83349609375, 2.3720703125, 2.91064453125, 3.44921875, 3.98779296875, 4.5263671875, 5.06494140625, 5.603515625, 6.14208984375, 6.6806640625, 7.21923828125, 7.7578125, 8.29638671875, 8.8349609375, 9.37353515625, 9.912109375, 10.45068359375, 10.9892578125, 11.52783203125, 12.06640625, 12.60498046875, 13.1435546875, 13.68212890625, 14.220703125, 14.75927734375, 15.2978515625, 15.83642578125, 16.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 2.0, 4.0, 5.0, 6.0, 9.0, 17.0, 15.0, 22.0, 41.0, 47.0, 50.0, 81.0, 120.0, 178.0, 205.0, 302.0, 413.0, 627.0, 833.0, 1233.0, 1712.0, 2520.0, 3452.0, 5218.0, 7937.0, 12790.0, 21520.0, 63395.0, 808992.0, 58145.0, 20983.0, 12579.0, 7964.0, 5200.0, 3692.0, 2421.0, 1728.0, 1133.0, 819.0, 619.0, 440.0, 287.0, 211.0, 161.0, 115.0, 81.0, 61.0, 46.0, 37.0, 27.0, 14.0, 17.0, 12.0, 5.0, 7.0, 6.0, 3.0, 2.0, 3.0, 1.0], "bins": [-36.75, -35.61865234375, -34.4873046875, -33.35595703125, -32.224609375, -31.09326171875, -29.9619140625, -28.83056640625, -27.69921875, -26.56787109375, -25.4365234375, -24.30517578125, -23.173828125, -22.04248046875, -20.9111328125, -19.77978515625, -18.6484375, -17.51708984375, -16.3857421875, -15.25439453125, -14.123046875, -12.99169921875, -11.8603515625, -10.72900390625, -9.59765625, -8.46630859375, -7.3349609375, -6.20361328125, -5.072265625, -3.94091796875, -2.8095703125, -1.67822265625, -0.546875, 0.58447265625, 1.7158203125, 2.84716796875, 3.978515625, 5.10986328125, 6.2412109375, 7.37255859375, 8.50390625, 9.63525390625, 10.7666015625, 11.89794921875, 13.029296875, 14.16064453125, 15.2919921875, 16.42333984375, 17.5546875, 18.68603515625, 19.8173828125, 20.94873046875, 22.080078125, 23.21142578125, 24.3427734375, 25.47412109375, 26.60546875, 27.73681640625, 28.8681640625, 29.99951171875, 31.130859375, 32.26220703125, 33.3935546875, 34.52490234375, 35.65625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 4.0, 1.0, 4.0, 6.0, 8.0, 10.0, 7.0, 8.0, 15.0, 17.0, 14.0, 20.0, 30.0, 29.0, 35.0, 37.0, 30.0, 39.0, 48.0, 40.0, 66.0, 42.0, 51.0, 46.0, 36.0, 39.0, 41.0, 30.0, 30.0, 30.0, 39.0, 15.0, 19.0, 13.0, 17.0, 15.0, 16.0, 11.0, 13.0, 9.0, 8.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-26.359375, -25.589599609375, -24.81982421875, -24.050048828125, -23.2802734375, -22.510498046875, -21.74072265625, -20.970947265625, -20.201171875, -19.431396484375, -18.66162109375, -17.891845703125, -17.1220703125, -16.352294921875, -15.58251953125, -14.812744140625, -14.04296875, -13.273193359375, -12.50341796875, -11.733642578125, -10.9638671875, -10.194091796875, -9.42431640625, -8.654541015625, -7.884765625, -7.114990234375, -6.34521484375, -5.575439453125, -4.8056640625, -4.035888671875, -3.26611328125, -2.496337890625, -1.7265625, -0.956787109375, -0.18701171875, 0.582763671875, 1.3525390625, 2.122314453125, 2.89208984375, 3.661865234375, 4.431640625, 5.201416015625, 5.97119140625, 6.740966796875, 7.5107421875, 8.280517578125, 9.05029296875, 9.820068359375, 10.58984375, 11.359619140625, 12.12939453125, 12.899169921875, 13.6689453125, 14.438720703125, 15.20849609375, 15.978271484375, 16.748046875, 17.517822265625, 18.28759765625, 19.057373046875, 19.8271484375, 20.596923828125, 21.36669921875, 22.136474609375, 22.90625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 8.0, 15.0, 13.0, 20.0, 34.0, 51.0, 64.0, 92.0, 129.0, 190.0, 324.0, 454.0, 732.0, 1098.0, 1798.0, 2981.0, 5001.0, 8918.0, 17335.0, 48044.0, 801814.0, 110534.0, 22512.0, 11001.0, 5982.0, 3533.0, 2141.0, 1307.0, 831.0, 540.0, 314.0, 220.0, 140.0, 119.0, 83.0, 37.0, 31.0, 35.0, 15.0, 19.0, 12.0, 10.0, 5.0, 4.0, 7.0, 3.0, 3.0, 4.0], "bins": [-14.96875, -14.560546875, -14.15234375, -13.744140625, -13.3359375, -12.927734375, -12.51953125, -12.111328125, -11.703125, -11.294921875, -10.88671875, -10.478515625, -10.0703125, -9.662109375, -9.25390625, -8.845703125, -8.4375, -8.029296875, -7.62109375, -7.212890625, -6.8046875, -6.396484375, -5.98828125, -5.580078125, -5.171875, -4.763671875, -4.35546875, -3.947265625, -3.5390625, -3.130859375, -2.72265625, -2.314453125, -1.90625, -1.498046875, -1.08984375, -0.681640625, -0.2734375, 0.134765625, 0.54296875, 0.951171875, 1.359375, 1.767578125, 2.17578125, 2.583984375, 2.9921875, 3.400390625, 3.80859375, 4.216796875, 4.625, 5.033203125, 5.44140625, 5.849609375, 6.2578125, 6.666015625, 7.07421875, 7.482421875, 7.890625, 8.298828125, 8.70703125, 9.115234375, 9.5234375, 9.931640625, 10.33984375, 10.748046875, 11.15625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 6.0, 7.0, 21.0, 18.0, 19.0, 28.0, 38.0, 49.0, 58.0, 79.0, 91.0, 126.0, 95.0, 88.0, 63.0, 43.0, 28.0, 30.0, 15.0, 19.0, 17.0, 14.0, 9.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039005279541015625, -0.0037538111209869385, -0.0036070942878723145, -0.0034603774547576904, -0.0033136606216430664, -0.0031669437885284424, -0.0030202269554138184, -0.0028735101222991943, -0.0027267932891845703, -0.0025800764560699463, -0.0024333596229553223, -0.0022866427898406982, -0.0021399259567260742, -0.00199320912361145, -0.0018464922904968262, -0.0016997754573822021, -0.0015530586242675781, -0.001406341791152954, -0.00125962495803833, -0.001112908124923706, -0.000966191291809082, -0.000819474458694458, -0.000672757625579834, -0.00052604079246521, -0.00037932395935058594, -0.00023260712623596191, -8.589029312133789e-05, 6.082653999328613e-05, 0.00020754337310791016, 0.0003542602062225342, 0.0005009770393371582, 0.0006476938724517822, 0.0007944107055664062, 0.0009411275386810303, 0.0010878443717956543, 0.0012345612049102783, 0.0013812780380249023, 0.0015279948711395264, 0.0016747117042541504, 0.0018214285373687744, 0.0019681453704833984, 0.0021148622035980225, 0.0022615790367126465, 0.0024082958698272705, 0.0025550127029418945, 0.0027017295360565186, 0.0028484463691711426, 0.0029951632022857666, 0.0031418800354003906, 0.0032885968685150146, 0.0034353137016296387, 0.0035820305347442627, 0.0037287473678588867, 0.0038754642009735107, 0.004022181034088135, 0.004168897867202759, 0.004315614700317383, 0.004462331533432007, 0.004609048366546631, 0.004755765199661255, 0.004902482032775879, 0.005049198865890503, 0.005195915699005127, 0.005342632532119751, 0.005489349365234375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 8.0, 6.0, 22.0, 27.0, 36.0, 49.0, 67.0, 101.0, 126.0, 189.0, 300.0, 416.0, 616.0, 863.0, 1360.0, 2110.0, 3421.0, 5813.0, 10800.0, 21068.0, 42745.0, 89204.0, 181858.0, 274714.0, 205526.0, 104385.0, 49360.0, 23876.0, 12290.0, 6516.0, 3879.0, 2318.0, 1422.0, 873.0, 640.0, 477.0, 311.0, 239.0, 170.0, 101.0, 82.0, 53.0, 36.0, 30.0, 18.0, 12.0, 5.0, 7.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.8203125, -3.70989990234375, -3.5994873046875, -3.48907470703125, -3.378662109375, -3.26824951171875, -3.1578369140625, -3.04742431640625, -2.93701171875, -2.82659912109375, -2.7161865234375, -2.60577392578125, -2.495361328125, -2.38494873046875, -2.2745361328125, -2.16412353515625, -2.0537109375, -1.94329833984375, -1.8328857421875, -1.72247314453125, -1.612060546875, -1.50164794921875, -1.3912353515625, -1.28082275390625, -1.17041015625, -1.05999755859375, -0.9495849609375, -0.83917236328125, -0.728759765625, -0.61834716796875, -0.5079345703125, -0.39752197265625, -0.287109375, -0.17669677734375, -0.0662841796875, 0.04412841796875, 0.154541015625, 0.26495361328125, 0.3753662109375, 0.48577880859375, 0.59619140625, 0.70660400390625, 0.8170166015625, 0.92742919921875, 1.037841796875, 1.14825439453125, 1.2586669921875, 1.36907958984375, 1.4794921875, 1.58990478515625, 1.7003173828125, 1.81072998046875, 1.921142578125, 2.03155517578125, 2.1419677734375, 2.25238037109375, 2.36279296875, 2.47320556640625, 2.5836181640625, 2.69403076171875, 2.804443359375, 2.91485595703125, 3.0252685546875, 3.13568115234375, 3.24609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 4.0, 10.0, 6.0, 12.0, 8.0, 13.0, 17.0, 25.0, 27.0, 27.0, 45.0, 50.0, 59.0, 61.0, 72.0, 79.0, 69.0, 72.0, 73.0, 55.0, 46.0, 36.0, 23.0, 20.0, 22.0, 8.0, 10.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.079315185546875, -1.04534912109375, -1.011383056640625, -0.9774169921875, -0.943450927734375, -0.90948486328125, -0.875518798828125, -0.841552734375, -0.807586669921875, -0.77362060546875, -0.739654541015625, -0.7056884765625, -0.671722412109375, -0.63775634765625, -0.603790283203125, -0.56982421875, -0.535858154296875, -0.50189208984375, -0.467926025390625, -0.4339599609375, -0.399993896484375, -0.36602783203125, -0.332061767578125, -0.298095703125, -0.264129638671875, -0.23016357421875, -0.196197509765625, -0.1622314453125, -0.128265380859375, -0.09429931640625, -0.060333251953125, -0.0263671875, 0.007598876953125, 0.04156494140625, 0.075531005859375, 0.1094970703125, 0.143463134765625, 0.17742919921875, 0.211395263671875, 0.245361328125, 0.279327392578125, 0.31329345703125, 0.347259521484375, 0.3812255859375, 0.415191650390625, 0.44915771484375, 0.483123779296875, 0.51708984375, 0.551055908203125, 0.58502197265625, 0.618988037109375, 0.6529541015625, 0.686920166015625, 0.72088623046875, 0.754852294921875, 0.788818359375, 0.822784423828125, 0.85675048828125, 0.890716552734375, 0.9246826171875, 0.958648681640625, 0.99261474609375, 1.026580810546875, 1.060546875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 2.0, 5.0, 6.0, 16.0, 9.0, 16.0, 19.0, 29.0, 24.0, 32.0, 33.0, 39.0, 32.0, 52.0, 51.0, 50.0, 41.0, 45.0, 55.0, 54.0, 46.0, 48.0, 33.0, 43.0, 33.0, 12.0, 21.0, 31.0, 19.0, 17.0, 19.0, 16.0, 9.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.877809524536133, -16.325790405273438, -15.773771286010742, -15.221752166748047, -14.669733047485352, -14.117713928222656, -13.565695762634277, -13.013676643371582, -12.461657524108887, -11.909638404846191, -11.357619285583496, -10.8056001663208, -10.253582000732422, -9.701562881469727, -9.149543762207031, -8.597524642944336, -8.04550552368164, -7.493486404418945, -6.94146728515625, -6.389448642730713, -5.837429523468018, -5.285410404205322, -4.733391761779785, -4.18137264251709, -3.6293535232543945, -3.077334403991699, -2.525315523147583, -1.9732965230941772, -1.4212775230407715, -0.8692584037780762, -0.31723952293395996, 0.23477935791015625, 0.7867965698242188, 1.3388155698776245, 1.8908345699310303, 2.4428534507751465, 2.994872570037842, 3.546891689300537, 4.098910331726074, 4.6509294509887695, 5.202948570251465, 5.75496768951416, 6.3069868087768555, 6.859005451202393, 7.411024570465088, 7.963043689727783, 8.51506233215332, 9.067081451416016, 9.619100570678711, 10.171119689941406, 10.723138809204102, 11.275157928466797, 11.827177047729492, 12.379196166992188, 12.931214332580566, 13.483233451843262, 14.035252571105957, 14.587271690368652, 15.139290809631348, 15.691309928894043, 16.243328094482422, 16.795347213745117, 17.347366333007812, 17.899385452270508, 18.451404571533203]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 5.0, 7.0, 12.0, 12.0, 10.0, 22.0, 11.0, 30.0, 24.0, 34.0, 34.0, 34.0, 28.0, 32.0, 49.0, 43.0, 37.0, 39.0, 38.0, 42.0, 33.0, 31.0, 41.0, 42.0, 26.0, 32.0, 26.0, 32.0, 25.0, 26.0, 21.0, 22.0, 17.0, 17.0, 15.0, 3.0, 10.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.759028434753418, -15.257232666015625, -14.755436897277832, -14.253641128540039, -13.751845359802246, -13.250049591064453, -12.748252868652344, -12.246458053588867, -11.744661331176758, -11.242865562438965, -10.741069793701172, -10.239274024963379, -9.737478256225586, -9.235682487487793, -8.73388671875, -8.23208999633789, -7.730295181274414, -7.228499412536621, -6.726703643798828, -6.224907875061035, -5.723112106323242, -5.221316337585449, -4.719520092010498, -4.217724323272705, -3.715928554534912, -3.214132785797119, -2.712337017059326, -2.210541009902954, -1.7087452411651611, -1.2069494724273682, -0.7051534652709961, -0.20335769653320312, 0.29843711853027344, 0.8002329468727112, 1.302028775215149, 1.8038246631622314, 2.3056204319000244, 2.8074162006378174, 3.3092122077941895, 3.8110079765319824, 4.312803745269775, 4.814599514007568, 5.316395282745361, 5.8181915283203125, 6.3199872970581055, 6.821783065795898, 7.323578834533691, 7.825374603271484, 8.327170372009277, 8.82896614074707, 9.330761909484863, 9.832557678222656, 10.33435344696045, 10.836149215698242, 11.337945938110352, 11.839740753173828, 12.341537475585938, 12.84333324432373, 13.345129013061523, 13.846924781799316, 14.34872055053711, 14.850516319274902, 15.352312088012695, 15.854108810424805, 16.35590362548828]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 17.0, 27.0, 26.0, 42.0, 59.0, 86.0, 119.0, 146.0, 223.0, 364.0, 520.0, 770.0, 1149.0, 1731.0, 2532.0, 3850.0, 5555.0, 8478.0, 12935.0, 19579.0, 29929.0, 44356.0, 64463.0, 89643.0, 114716.0, 131570.0, 129702.0, 111891.0, 86845.0, 61476.0, 42058.0, 28344.0, 18646.0, 12229.0, 8184.0, 5334.0, 3569.0, 2355.0, 1603.0, 1098.0, 743.0, 516.0, 315.0, 229.0, 145.0, 113.0, 74.0, 53.0, 45.0, 32.0, 21.0, 15.0, 11.0, 7.0, 4.0, 2.0, 4.0, 3.0], "bins": [-13.7890625, -13.3572998046875, -12.925537109375, -12.4937744140625, -12.06201171875, -11.6302490234375, -11.198486328125, -10.7667236328125, -10.3349609375, -9.9031982421875, -9.471435546875, -9.0396728515625, -8.60791015625, -8.1761474609375, -7.744384765625, -7.3126220703125, -6.880859375, -6.4490966796875, -6.017333984375, -5.5855712890625, -5.15380859375, -4.7220458984375, -4.290283203125, -3.8585205078125, -3.4267578125, -2.9949951171875, -2.563232421875, -2.1314697265625, -1.69970703125, -1.2679443359375, -0.836181640625, -0.4044189453125, 0.02734375, 0.4591064453125, 0.890869140625, 1.3226318359375, 1.75439453125, 2.1861572265625, 2.617919921875, 3.0496826171875, 3.4814453125, 3.9132080078125, 4.344970703125, 4.7767333984375, 5.20849609375, 5.6402587890625, 6.072021484375, 6.5037841796875, 6.935546875, 7.3673095703125, 7.799072265625, 8.2308349609375, 8.66259765625, 9.0943603515625, 9.526123046875, 9.9578857421875, 10.3896484375, 10.8214111328125, 11.253173828125, 11.6849365234375, 12.11669921875, 12.5484619140625, 12.980224609375, 13.4119873046875, 13.84375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 6.0, 4.0, 9.0, 4.0, 2.0, 6.0, 11.0, 9.0, 8.0, 15.0, 14.0, 28.0, 19.0, 20.0, 28.0, 27.0, 31.0, 40.0, 32.0, 36.0, 45.0, 41.0, 34.0, 38.0, 31.0, 44.0, 30.0, 36.0, 30.0, 35.0, 23.0, 24.0, 26.0, 41.0, 28.0, 25.0, 19.0, 22.0, 21.0, 6.0, 11.0, 14.0, 7.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.203125, -12.791259765625, -12.37939453125, -11.967529296875, -11.5556640625, -11.143798828125, -10.73193359375, -10.320068359375, -9.908203125, -9.496337890625, -9.08447265625, -8.672607421875, -8.2607421875, -7.848876953125, -7.43701171875, -7.025146484375, -6.61328125, -6.201416015625, -5.78955078125, -5.377685546875, -4.9658203125, -4.553955078125, -4.14208984375, -3.730224609375, -3.318359375, -2.906494140625, -2.49462890625, -2.082763671875, -1.6708984375, -1.259033203125, -0.84716796875, -0.435302734375, -0.0234375, 0.388427734375, 0.80029296875, 1.212158203125, 1.6240234375, 2.035888671875, 2.44775390625, 2.859619140625, 3.271484375, 3.683349609375, 4.09521484375, 4.507080078125, 4.9189453125, 5.330810546875, 5.74267578125, 6.154541015625, 6.56640625, 6.978271484375, 7.39013671875, 7.802001953125, 8.2138671875, 8.625732421875, 9.03759765625, 9.449462890625, 9.861328125, 10.273193359375, 10.68505859375, 11.096923828125, 11.5087890625, 11.920654296875, 12.33251953125, 12.744384765625, 13.15625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 14.0, 24.0, 34.0, 60.0, 65.0, 118.0, 151.0, 235.0, 353.0, 520.0, 880.0, 1317.0, 1979.0, 2983.0, 4770.0, 7389.0, 11925.0, 19533.0, 30922.0, 48142.0, 74336.0, 105223.0, 134385.0, 147656.0, 135934.0, 108035.0, 75723.0, 49742.0, 32398.0, 19807.0, 12305.0, 7850.0, 4939.0, 3029.0, 2016.0, 1275.0, 824.0, 559.0, 380.0, 234.0, 138.0, 98.0, 73.0, 56.0, 45.0, 32.0, 17.0, 8.0, 7.0, 1.0, 7.0, 3.0, 0.0, 1.0], "bins": [-15.8046875, -15.3333740234375, -14.862060546875, -14.3907470703125, -13.91943359375, -13.4481201171875, -12.976806640625, -12.5054931640625, -12.0341796875, -11.5628662109375, -11.091552734375, -10.6202392578125, -10.14892578125, -9.6776123046875, -9.206298828125, -8.7349853515625, -8.263671875, -7.7923583984375, -7.321044921875, -6.8497314453125, -6.37841796875, -5.9071044921875, -5.435791015625, -4.9644775390625, -4.4931640625, -4.0218505859375, -3.550537109375, -3.0792236328125, -2.60791015625, -2.1365966796875, -1.665283203125, -1.1939697265625, -0.72265625, -0.2513427734375, 0.219970703125, 0.6912841796875, 1.16259765625, 1.6339111328125, 2.105224609375, 2.5765380859375, 3.0478515625, 3.5191650390625, 3.990478515625, 4.4617919921875, 4.93310546875, 5.4044189453125, 5.875732421875, 6.3470458984375, 6.818359375, 7.2896728515625, 7.760986328125, 8.2322998046875, 8.70361328125, 9.1749267578125, 9.646240234375, 10.1175537109375, 10.5888671875, 11.0601806640625, 11.531494140625, 12.0028076171875, 12.47412109375, 12.9454345703125, 13.416748046875, 13.8880615234375, 14.359375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 4.0, 4.0, 8.0, 4.0, 8.0, 10.0, 9.0, 12.0, 19.0, 15.0, 18.0, 16.0, 27.0, 28.0, 42.0, 32.0, 37.0, 37.0, 43.0, 33.0, 43.0, 35.0, 31.0, 40.0, 42.0, 45.0, 27.0, 44.0, 27.0, 44.0, 30.0, 27.0, 27.0, 14.0, 20.0, 12.0, 18.0, 12.0, 6.0, 11.0, 7.0, 11.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.86328125, -7.59539794921875, -7.3275146484375, -7.05963134765625, -6.791748046875, -6.52386474609375, -6.2559814453125, -5.98809814453125, -5.72021484375, -5.45233154296875, -5.1844482421875, -4.91656494140625, -4.648681640625, -4.38079833984375, -4.1129150390625, -3.84503173828125, -3.5771484375, -3.30926513671875, -3.0413818359375, -2.77349853515625, -2.505615234375, -2.23773193359375, -1.9698486328125, -1.70196533203125, -1.43408203125, -1.16619873046875, -0.8983154296875, -0.63043212890625, -0.362548828125, -0.09466552734375, 0.1732177734375, 0.44110107421875, 0.708984375, 0.97686767578125, 1.2447509765625, 1.51263427734375, 1.780517578125, 2.04840087890625, 2.3162841796875, 2.58416748046875, 2.85205078125, 3.11993408203125, 3.3878173828125, 3.65570068359375, 3.923583984375, 4.19146728515625, 4.4593505859375, 4.72723388671875, 4.9951171875, 5.26300048828125, 5.5308837890625, 5.79876708984375, 6.066650390625, 6.33453369140625, 6.6024169921875, 6.87030029296875, 7.13818359375, 7.40606689453125, 7.6739501953125, 7.94183349609375, 8.209716796875, 8.47760009765625, 8.7454833984375, 9.01336669921875, 9.28125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 9.0, 4.0, 18.0, 24.0, 42.0, 60.0, 83.0, 111.0, 160.0, 233.0, 370.0, 561.0, 812.0, 1238.0, 1915.0, 3074.0, 4732.0, 7811.0, 12400.0, 20174.0, 33030.0, 53879.0, 84073.0, 124766.0, 158954.0, 163212.0, 131269.0, 91133.0, 58864.0, 36226.0, 22419.0, 13711.0, 8408.0, 5330.0, 3386.0, 2091.0, 1362.0, 826.0, 592.0, 394.0, 259.0, 184.0, 110.0, 83.0, 54.0, 39.0, 25.0, 19.0, 5.0, 6.0, 11.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.953125, -7.705322265625, -7.45751953125, -7.209716796875, -6.9619140625, -6.714111328125, -6.46630859375, -6.218505859375, -5.970703125, -5.722900390625, -5.47509765625, -5.227294921875, -4.9794921875, -4.731689453125, -4.48388671875, -4.236083984375, -3.98828125, -3.740478515625, -3.49267578125, -3.244873046875, -2.9970703125, -2.749267578125, -2.50146484375, -2.253662109375, -2.005859375, -1.758056640625, -1.51025390625, -1.262451171875, -1.0146484375, -0.766845703125, -0.51904296875, -0.271240234375, -0.0234375, 0.224365234375, 0.47216796875, 0.719970703125, 0.9677734375, 1.215576171875, 1.46337890625, 1.711181640625, 1.958984375, 2.206787109375, 2.45458984375, 2.702392578125, 2.9501953125, 3.197998046875, 3.44580078125, 3.693603515625, 3.94140625, 4.189208984375, 4.43701171875, 4.684814453125, 4.9326171875, 5.180419921875, 5.42822265625, 5.676025390625, 5.923828125, 6.171630859375, 6.41943359375, 6.667236328125, 6.9150390625, 7.162841796875, 7.41064453125, 7.658447265625, 7.90625]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 9.0, 10.0, 14.0, 20.0, 29.0, 39.0, 55.0, 74.0, 94.0, 98.0, 101.0, 108.0, 103.0, 58.0, 51.0, 36.0, 27.0, 23.0, 17.0, 10.0, 6.0, 6.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00140380859375, -0.0013559907674789429, -0.0013081729412078857, -0.0012603551149368286, -0.0012125372886657715, -0.0011647194623947144, -0.0011169016361236572, -0.0010690838098526, -0.001021265983581543, -0.0009734481573104858, -0.0009256303310394287, -0.0008778125047683716, -0.0008299946784973145, -0.0007821768522262573, -0.0007343590259552002, -0.0006865411996841431, -0.0006387233734130859, -0.0005909055471420288, -0.0005430877208709717, -0.0004952698945999146, -0.0004474520683288574, -0.0003996342420578003, -0.00035181641578674316, -0.00030399858951568604, -0.0002561807632446289, -0.00020836293697357178, -0.00016054511070251465, -0.00011272728443145752, -6.490945816040039e-05, -1.7091631889343262e-05, 3.072619438171387e-05, 7.8544020652771e-05, 0.00012636184692382812, 0.00017417967319488525, 0.00022199749946594238, 0.0002698153257369995, 0.00031763315200805664, 0.00036545097827911377, 0.0004132688045501709, 0.00046108663082122803, 0.0005089044570922852, 0.0005567222833633423, 0.0006045401096343994, 0.0006523579359054565, 0.0007001757621765137, 0.0007479935884475708, 0.0007958114147186279, 0.0008436292409896851, 0.0008914470672607422, 0.0009392648935317993, 0.0009870827198028564, 0.0010349005460739136, 0.0010827183723449707, 0.0011305361986160278, 0.001178354024887085, 0.001226171851158142, 0.0012739896774291992, 0.0013218075037002563, 0.0013696253299713135, 0.0014174431562423706, 0.0014652609825134277, 0.0015130788087844849, 0.001560896635055542, 0.0016087144613265991, 0.0016565322875976562]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 11.0, 17.0, 36.0, 32.0, 69.0, 86.0, 153.0, 210.0, 297.0, 442.0, 694.0, 1053.0, 1673.0, 2687.0, 4275.0, 6731.0, 10606.0, 17240.0, 27443.0, 44538.0, 68329.0, 101748.0, 137975.0, 156612.0, 144188.0, 111441.0, 76816.0, 49277.0, 31262.0, 19679.0, 12131.0, 7588.0, 4834.0, 2981.0, 1903.0, 1170.0, 776.0, 525.0, 339.0, 214.0, 155.0, 127.0, 64.0, 45.0, 28.0, 17.0, 10.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.0234375, -7.791748046875, -7.56005859375, -7.328369140625, -7.0966796875, -6.864990234375, -6.63330078125, -6.401611328125, -6.169921875, -5.938232421875, -5.70654296875, -5.474853515625, -5.2431640625, -5.011474609375, -4.77978515625, -4.548095703125, -4.31640625, -4.084716796875, -3.85302734375, -3.621337890625, -3.3896484375, -3.157958984375, -2.92626953125, -2.694580078125, -2.462890625, -2.231201171875, -1.99951171875, -1.767822265625, -1.5361328125, -1.304443359375, -1.07275390625, -0.841064453125, -0.609375, -0.377685546875, -0.14599609375, 0.085693359375, 0.3173828125, 0.549072265625, 0.78076171875, 1.012451171875, 1.244140625, 1.475830078125, 1.70751953125, 1.939208984375, 2.1708984375, 2.402587890625, 2.63427734375, 2.865966796875, 3.09765625, 3.329345703125, 3.56103515625, 3.792724609375, 4.0244140625, 4.256103515625, 4.48779296875, 4.719482421875, 4.951171875, 5.182861328125, 5.41455078125, 5.646240234375, 5.8779296875, 6.109619140625, 6.34130859375, 6.572998046875, 6.8046875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 7.0, 8.0, 15.0, 14.0, 13.0, 20.0, 19.0, 32.0, 42.0, 40.0, 48.0, 60.0, 61.0, 54.0, 64.0, 58.0, 61.0, 48.0, 53.0, 50.0, 33.0, 39.0, 26.0, 28.0, 21.0, 17.0, 13.0, 20.0, 7.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.1484375, -3.058135986328125, -2.96783447265625, -2.877532958984375, -2.7872314453125, -2.696929931640625, -2.60662841796875, -2.516326904296875, -2.426025390625, -2.335723876953125, -2.24542236328125, -2.155120849609375, -2.0648193359375, -1.974517822265625, -1.88421630859375, -1.793914794921875, -1.70361328125, -1.613311767578125, -1.52301025390625, -1.432708740234375, -1.3424072265625, -1.252105712890625, -1.16180419921875, -1.071502685546875, -0.981201171875, -0.890899658203125, -0.80059814453125, -0.710296630859375, -0.6199951171875, -0.529693603515625, -0.43939208984375, -0.349090576171875, -0.2587890625, -0.168487548828125, -0.07818603515625, 0.012115478515625, 0.1024169921875, 0.192718505859375, 0.28302001953125, 0.373321533203125, 0.463623046875, 0.553924560546875, 0.64422607421875, 0.734527587890625, 0.8248291015625, 0.915130615234375, 1.00543212890625, 1.095733642578125, 1.18603515625, 1.276336669921875, 1.36663818359375, 1.456939697265625, 1.5472412109375, 1.637542724609375, 1.72784423828125, 1.818145751953125, 1.908447265625, 1.998748779296875, 2.08905029296875, 2.179351806640625, 2.2696533203125, 2.359954833984375, 2.45025634765625, 2.540557861328125, 2.630859375]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 8.0, 16.0, 7.0, 19.0, 24.0, 26.0, 27.0, 36.0, 36.0, 29.0, 47.0, 46.0, 42.0, 51.0, 49.0, 47.0, 49.0, 45.0, 50.0, 39.0, 41.0, 44.0, 21.0, 22.0, 33.0, 24.0, 18.0, 18.0, 8.0, 12.0, 7.0, 14.0, 6.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.070353507995605, -12.58980941772461, -12.10926628112793, -11.62872314453125, -11.148179054260254, -10.667634963989258, -10.187091827392578, -9.706548690795898, -9.226004600524902, -8.745460510253906, -8.264917373657227, -7.784373760223389, -7.303830146789551, -6.823286533355713, -6.342742919921875, -5.862199306488037, -5.381655693054199, -4.901112079620361, -4.420568466186523, -3.9400248527526855, -3.4594812393188477, -2.9789376258850098, -2.498394012451172, -2.017850399017334, -1.537306785583496, -1.0567631721496582, -0.5762195587158203, -0.09567594528198242, 0.38486766815185547, 0.8654112815856934, 1.3459548950195312, 1.8264985084533691, 2.3070430755615234, 2.7875866889953613, 3.268130302429199, 3.748673915863037, 4.229217529296875, 4.709761142730713, 5.190304756164551, 5.670848369598389, 6.151391983032227, 6.6319355964660645, 7.112479209899902, 7.59302282333374, 8.073566436767578, 8.554109573364258, 9.034653663635254, 9.51519775390625, 9.99574089050293, 10.47628402709961, 10.956828117370605, 11.437372207641602, 11.917915344238281, 12.398458480834961, 12.879002571105957, 13.359546661376953, 13.840089797973633, 14.320632934570312, 14.801177024841309, 15.281721115112305, 15.762264251708984, 16.242807388305664, 16.723350524902344, 17.203895568847656, 17.684438705444336]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 3.0, 8.0, 10.0, 7.0, 11.0, 15.0, 12.0, 14.0, 15.0, 24.0, 20.0, 23.0, 30.0, 34.0, 37.0, 33.0, 38.0, 41.0, 30.0, 46.0, 42.0, 35.0, 36.0, 39.0, 35.0, 41.0, 22.0, 38.0, 25.0, 33.0, 25.0, 30.0, 21.0, 20.0, 13.0, 15.0, 17.0, 9.0, 4.0, 13.0, 4.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.401455879211426, -12.971198081970215, -12.54094123840332, -12.11068344116211, -11.680426597595215, -11.250168800354004, -10.81991195678711, -10.389654159545898, -9.959396362304688, -9.529138565063477, -9.098881721496582, -8.668623924255371, -8.238367080688477, -7.808109283447266, -7.377851963043213, -6.94759464263916, -6.517337799072266, -6.087080478668213, -5.65682315826416, -5.226565361022949, -4.796308517456055, -4.366050720214844, -3.935793399810791, -3.5055360794067383, -3.0752787590026855, -2.645021438598633, -2.21476411819458, -1.7845065593719482, -1.3542492389678955, -0.9239919185638428, -0.49373435974121094, -0.0634770393371582, 0.3667793273925781, 0.7970367074012756, 1.2272940874099731, 1.6575515270233154, 2.087808847427368, 2.518066167831421, 2.9483237266540527, 3.3785810470581055, 3.808838367462158, 4.239095687866211, 4.669353008270264, 5.099610328674316, 5.529868125915527, 5.960124969482422, 6.390382766723633, 6.8206400871276855, 7.250897407531738, 7.681154727935791, 8.111412048339844, 8.541669845581055, 8.97192668914795, 9.40218448638916, 9.832441329956055, 10.262699127197266, 10.692956924438477, 11.123214721679688, 11.553471565246582, 11.983729362487793, 12.413986206054688, 12.844244003295898, 13.27450180053711, 13.704758644104004, 14.135015487670898]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 5.0, 9.0, 12.0, 30.0, 21.0, 36.0, 69.0, 87.0, 151.0, 228.0, 365.0, 568.0, 823.0, 1370.0, 2249.0, 3897.0, 6593.0, 11070.0, 19241.0, 33479.0, 58808.0, 106326.0, 195172.0, 353077.0, 578851.0, 763508.0, 754805.0, 555891.0, 332187.0, 182270.0, 99563.0, 55394.0, 31746.0, 18627.0, 10909.0, 6605.0, 3929.0, 2335.0, 1459.0, 903.0, 542.0, 378.0, 239.0, 142.0, 103.0, 69.0, 45.0, 34.0, 24.0, 15.0, 12.0, 5.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.3515625, -10.0059814453125, -9.660400390625, -9.3148193359375, -8.96923828125, -8.6236572265625, -8.278076171875, -7.9324951171875, -7.5869140625, -7.2413330078125, -6.895751953125, -6.5501708984375, -6.20458984375, -5.8590087890625, -5.513427734375, -5.1678466796875, -4.822265625, -4.4766845703125, -4.131103515625, -3.7855224609375, -3.43994140625, -3.0943603515625, -2.748779296875, -2.4031982421875, -2.0576171875, -1.7120361328125, -1.366455078125, -1.0208740234375, -0.67529296875, -0.3297119140625, 0.015869140625, 0.3614501953125, 0.70703125, 1.0526123046875, 1.398193359375, 1.7437744140625, 2.08935546875, 2.4349365234375, 2.780517578125, 3.1260986328125, 3.4716796875, 3.8172607421875, 4.162841796875, 4.5084228515625, 4.85400390625, 5.1995849609375, 5.545166015625, 5.8907470703125, 6.236328125, 6.5819091796875, 6.927490234375, 7.2730712890625, 7.61865234375, 7.9642333984375, 8.309814453125, 8.6553955078125, 9.0009765625, 9.3465576171875, 9.692138671875, 10.0377197265625, 10.38330078125, 10.7288818359375, 11.074462890625, 11.4200439453125, 11.765625]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 7.0, 9.0, 14.0, 14.0, 9.0, 9.0, 24.0, 18.0, 26.0, 16.0, 16.0, 29.0, 29.0, 29.0, 25.0, 29.0, 33.0, 49.0, 35.0, 43.0, 37.0, 36.0, 36.0, 26.0, 31.0, 36.0, 31.0, 25.0, 33.0, 24.0, 31.0, 19.0, 18.0, 28.0, 24.0, 11.0, 16.0, 14.0, 9.0, 7.0, 10.0, 7.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0], "bins": [-9.484375, -9.186279296875, -8.88818359375, -8.590087890625, -8.2919921875, -7.993896484375, -7.69580078125, -7.397705078125, -7.099609375, -6.801513671875, -6.50341796875, -6.205322265625, -5.9072265625, -5.609130859375, -5.31103515625, -5.012939453125, -4.71484375, -4.416748046875, -4.11865234375, -3.820556640625, -3.5224609375, -3.224365234375, -2.92626953125, -2.628173828125, -2.330078125, -2.031982421875, -1.73388671875, -1.435791015625, -1.1376953125, -0.839599609375, -0.54150390625, -0.243408203125, 0.0546875, 0.352783203125, 0.65087890625, 0.948974609375, 1.2470703125, 1.545166015625, 1.84326171875, 2.141357421875, 2.439453125, 2.737548828125, 3.03564453125, 3.333740234375, 3.6318359375, 3.929931640625, 4.22802734375, 4.526123046875, 4.82421875, 5.122314453125, 5.42041015625, 5.718505859375, 6.0166015625, 6.314697265625, 6.61279296875, 6.910888671875, 7.208984375, 7.507080078125, 7.80517578125, 8.103271484375, 8.4013671875, 8.699462890625, 8.99755859375, 9.295654296875, 9.59375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 15.0, 25.0, 42.0, 72.0, 95.0, 156.0, 228.0, 366.0, 586.0, 988.0, 1595.0, 2553.0, 3923.0, 6484.0, 10316.0, 17017.0, 27505.0, 45216.0, 72991.0, 117722.0, 187316.0, 290765.0, 427893.0, 573515.0, 640538.0, 568463.0, 422230.0, 287066.0, 184353.0, 115971.0, 72278.0, 44714.0, 27241.0, 16885.0, 10286.0, 6394.0, 3946.0, 2416.0, 1538.0, 941.0, 623.0, 360.0, 231.0, 159.0, 96.0, 54.0, 42.0, 23.0, 20.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0], "bins": [-10.8359375, -10.5123291015625, -10.188720703125, -9.8651123046875, -9.54150390625, -9.2178955078125, -8.894287109375, -8.5706787109375, -8.2470703125, -7.9234619140625, -7.599853515625, -7.2762451171875, -6.95263671875, -6.6290283203125, -6.305419921875, -5.9818115234375, -5.658203125, -5.3345947265625, -5.010986328125, -4.6873779296875, -4.36376953125, -4.0401611328125, -3.716552734375, -3.3929443359375, -3.0693359375, -2.7457275390625, -2.422119140625, -2.0985107421875, -1.77490234375, -1.4512939453125, -1.127685546875, -0.8040771484375, -0.48046875, -0.1568603515625, 0.166748046875, 0.4903564453125, 0.81396484375, 1.1375732421875, 1.461181640625, 1.7847900390625, 2.1083984375, 2.4320068359375, 2.755615234375, 3.0792236328125, 3.40283203125, 3.7264404296875, 4.050048828125, 4.3736572265625, 4.697265625, 5.0208740234375, 5.344482421875, 5.6680908203125, 5.99169921875, 6.3153076171875, 6.638916015625, 6.9625244140625, 7.2861328125, 7.6097412109375, 7.933349609375, 8.2569580078125, 8.58056640625, 8.9041748046875, 9.227783203125, 9.5513916015625, 9.875]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 13.0, 12.0, 18.0, 17.0, 25.0, 44.0, 43.0, 65.0, 71.0, 95.0, 98.0, 123.0, 135.0, 165.0, 193.0, 227.0, 223.0, 244.0, 265.0, 262.0, 257.0, 221.0, 221.0, 197.0, 150.0, 149.0, 109.0, 96.0, 88.0, 44.0, 46.0, 39.0, 23.0, 25.0, 21.0, 15.0, 8.0, 8.0, 5.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-5.76953125, -5.6160888671875, -5.462646484375, -5.3092041015625, -5.15576171875, -5.0023193359375, -4.848876953125, -4.6954345703125, -4.5419921875, -4.3885498046875, -4.235107421875, -4.0816650390625, -3.92822265625, -3.7747802734375, -3.621337890625, -3.4678955078125, -3.314453125, -3.1610107421875, -3.007568359375, -2.8541259765625, -2.70068359375, -2.5472412109375, -2.393798828125, -2.2403564453125, -2.0869140625, -1.9334716796875, -1.780029296875, -1.6265869140625, -1.47314453125, -1.3197021484375, -1.166259765625, -1.0128173828125, -0.859375, -0.7059326171875, -0.552490234375, -0.3990478515625, -0.24560546875, -0.0921630859375, 0.061279296875, 0.2147216796875, 0.3681640625, 0.5216064453125, 0.675048828125, 0.8284912109375, 0.98193359375, 1.1353759765625, 1.288818359375, 1.4422607421875, 1.595703125, 1.7491455078125, 1.902587890625, 2.0560302734375, 2.20947265625, 2.3629150390625, 2.516357421875, 2.6697998046875, 2.8232421875, 2.9766845703125, 3.130126953125, 3.2835693359375, 3.43701171875, 3.5904541015625, 3.743896484375, 3.8973388671875, 4.05078125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 7.0, 6.0, 4.0, 4.0, 8.0, 14.0, 17.0, 19.0, 25.0, 34.0, 41.0, 41.0, 45.0, 37.0, 48.0, 57.0, 57.0, 66.0, 46.0, 55.0, 53.0, 52.0, 52.0, 40.0, 32.0, 22.0, 22.0, 15.0, 14.0, 11.0, 8.0, 9.0, 14.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.228116989135742, -13.775860786437988, -13.323604583740234, -12.871347427368164, -12.41909122467041, -11.966835021972656, -11.514578819274902, -11.062322616577148, -10.610065460205078, -10.157809257507324, -9.70555305480957, -9.2532958984375, -8.801039695739746, -8.348783493041992, -7.896527290344238, -7.444271087646484, -6.9920148849487305, -6.539758682250977, -6.0875020027160645, -5.6352458000183105, -5.182989120483398, -4.7307329177856445, -4.278476715087891, -3.8262202739715576, -3.3739638328552246, -2.9217073917388916, -2.4694509506225586, -2.0171947479248047, -1.5649383068084717, -1.1126818656921387, -0.6604256629943848, -0.20816922187805176, 0.24408817291259766, 0.6963445544242859, 1.1486009359359741, 1.6008572578430176, 2.0531136989593506, 2.5053701400756836, 2.9576263427734375, 3.4098827838897705, 3.8621392250061035, 4.314395427703857, 4.7666521072387695, 5.218908309936523, 5.671164512634277, 6.1234211921691895, 6.575677394866943, 7.0279340744018555, 7.480190277099609, 7.932446479797363, 8.384702682495117, 8.836959838867188, 9.289216041564941, 9.741472244262695, 10.19372844696045, 10.645984649658203, 11.098241806030273, 11.550498008728027, 12.002754211425781, 12.455011367797852, 12.907267570495605, 13.35952377319336, 13.811779975891113, 14.264036178588867, 14.716292381286621]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 5.0, 5.0, 13.0, 11.0, 12.0, 10.0, 14.0, 16.0, 22.0, 19.0, 20.0, 27.0, 26.0, 24.0, 33.0, 52.0, 40.0, 35.0, 41.0, 30.0, 44.0, 35.0, 41.0, 35.0, 40.0, 34.0, 30.0, 38.0, 28.0, 27.0, 28.0, 19.0, 21.0, 19.0, 18.0, 22.0, 13.0, 11.0, 10.0, 4.0, 4.0, 7.0, 5.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.525537490844727, -10.185063362121582, -9.844590187072754, -9.50411605834961, -9.163642883300781, -8.823168754577637, -8.482694625854492, -8.142221450805664, -7.801747798919678, -7.461274147033691, -7.120800495147705, -6.780326843261719, -6.439852714538574, -6.099379539489746, -5.758905410766602, -5.418431758880615, -5.077958106994629, -4.737484455108643, -4.397010803222656, -4.056536674499512, -3.7160632610321045, -3.375589609146118, -3.0351157188415527, -2.6946420669555664, -2.35416841506958, -2.0136947631835938, -1.6732209920883179, -1.332747220993042, -0.9922735691070557, -0.6517999172210693, -0.3113260269165039, 0.029147624969482422, 0.36962223052978516, 0.7100959420204163, 1.0505696535110474, 1.3910434246063232, 1.7315170764923096, 2.071990728378296, 2.4124646186828613, 2.7529382705688477, 3.093411922454834, 3.4338855743408203, 3.7743592262268066, 4.114832878112793, 4.4553070068359375, 4.795780181884766, 5.13625431060791, 5.4767279624938965, 5.817201614379883, 6.157675266265869, 6.4981489181518555, 6.838623046875, 7.179096221923828, 7.519570350646973, 7.860044002532959, 8.200517654418945, 8.540990829467773, 8.881464958190918, 9.221938133239746, 9.56241226196289, 9.902885437011719, 10.243359565734863, 10.583833694458008, 10.924306869506836, 11.26478099822998]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 8.0, 15.0, 25.0, 40.0, 53.0, 76.0, 129.0, 167.0, 269.0, 410.0, 627.0, 962.0, 1504.0, 2238.0, 3293.0, 4812.0, 7283.0, 10814.0, 15949.0, 23721.0, 35060.0, 51081.0, 74672.0, 104481.0, 135839.0, 147348.0, 127751.0, 94001.0, 66203.0, 44949.0, 30923.0, 20660.0, 14231.0, 9551.0, 6479.0, 4356.0, 2888.0, 1980.0, 1249.0, 829.0, 556.0, 355.0, 245.0, 148.0, 108.0, 66.0, 50.0, 37.0, 16.0, 15.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0], "bins": [-9.0390625, -8.7679443359375, -8.496826171875, -8.2257080078125, -7.95458984375, -7.6834716796875, -7.412353515625, -7.1412353515625, -6.8701171875, -6.5989990234375, -6.327880859375, -6.0567626953125, -5.78564453125, -5.5145263671875, -5.243408203125, -4.9722900390625, -4.701171875, -4.4300537109375, -4.158935546875, -3.8878173828125, -3.61669921875, -3.3455810546875, -3.074462890625, -2.8033447265625, -2.5322265625, -2.2611083984375, -1.989990234375, -1.7188720703125, -1.44775390625, -1.1766357421875, -0.905517578125, -0.6343994140625, -0.36328125, -0.0921630859375, 0.178955078125, 0.4500732421875, 0.72119140625, 0.9923095703125, 1.263427734375, 1.5345458984375, 1.8056640625, 2.0767822265625, 2.347900390625, 2.6190185546875, 2.89013671875, 3.1612548828125, 3.432373046875, 3.7034912109375, 3.974609375, 4.2457275390625, 4.516845703125, 4.7879638671875, 5.05908203125, 5.3302001953125, 5.601318359375, 5.8724365234375, 6.1435546875, 6.4146728515625, 6.685791015625, 6.9569091796875, 7.22802734375, 7.4991455078125, 7.770263671875, 8.0413818359375, 8.3125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 10.0, 9.0, 8.0, 8.0, 18.0, 11.0, 17.0, 14.0, 25.0, 20.0, 21.0, 25.0, 28.0, 31.0, 20.0, 36.0, 29.0, 40.0, 43.0, 36.0, 42.0, 33.0, 37.0, 32.0, 41.0, 38.0, 29.0, 27.0, 30.0, 24.0, 31.0, 21.0, 23.0, 20.0, 15.0, 11.0, 10.0, 13.0, 16.0, 14.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.640625, -9.3333740234375, -9.026123046875, -8.7188720703125, -8.41162109375, -8.1043701171875, -7.797119140625, -7.4898681640625, -7.1826171875, -6.8753662109375, -6.568115234375, -6.2608642578125, -5.95361328125, -5.6463623046875, -5.339111328125, -5.0318603515625, -4.724609375, -4.4173583984375, -4.110107421875, -3.8028564453125, -3.49560546875, -3.1883544921875, -2.881103515625, -2.5738525390625, -2.2666015625, -1.9593505859375, -1.652099609375, -1.3448486328125, -1.03759765625, -0.7303466796875, -0.423095703125, -0.1158447265625, 0.19140625, 0.4986572265625, 0.805908203125, 1.1131591796875, 1.42041015625, 1.7276611328125, 2.034912109375, 2.3421630859375, 2.6494140625, 2.9566650390625, 3.263916015625, 3.5711669921875, 3.87841796875, 4.1856689453125, 4.492919921875, 4.8001708984375, 5.107421875, 5.4146728515625, 5.721923828125, 6.0291748046875, 6.33642578125, 6.6436767578125, 6.950927734375, 7.2581787109375, 7.5654296875, 7.8726806640625, 8.179931640625, 8.4871826171875, 8.79443359375, 9.1016845703125, 9.408935546875, 9.7161865234375, 10.0234375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 12.0, 18.0, 25.0, 29.0, 57.0, 55.0, 84.0, 145.0, 157.0, 205.0, 294.0, 452.0, 609.0, 851.0, 1287.0, 1793.0, 2717.0, 3863.0, 5919.0, 9275.0, 15152.0, 28784.0, 396290.0, 506438.0, 30269.0, 15679.0, 9420.0, 5863.0, 3813.0, 2723.0, 1873.0, 1226.0, 936.0, 609.0, 435.0, 352.0, 231.0, 175.0, 127.0, 84.0, 59.0, 43.0, 25.0, 26.0, 21.0, 12.0, 8.0, 7.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0], "bins": [-14.9765625, -14.5089111328125, -14.041259765625, -13.5736083984375, -13.10595703125, -12.6383056640625, -12.170654296875, -11.7030029296875, -11.2353515625, -10.7677001953125, -10.300048828125, -9.8323974609375, -9.36474609375, -8.8970947265625, -8.429443359375, -7.9617919921875, -7.494140625, -7.0264892578125, -6.558837890625, -6.0911865234375, -5.62353515625, -5.1558837890625, -4.688232421875, -4.2205810546875, -3.7529296875, -3.2852783203125, -2.817626953125, -2.3499755859375, -1.88232421875, -1.4146728515625, -0.947021484375, -0.4793701171875, -0.01171875, 0.4559326171875, 0.923583984375, 1.3912353515625, 1.85888671875, 2.3265380859375, 2.794189453125, 3.2618408203125, 3.7294921875, 4.1971435546875, 4.664794921875, 5.1324462890625, 5.60009765625, 6.0677490234375, 6.535400390625, 7.0030517578125, 7.470703125, 7.9383544921875, 8.406005859375, 8.8736572265625, 9.34130859375, 9.8089599609375, 10.276611328125, 10.7442626953125, 11.2119140625, 11.6795654296875, 12.147216796875, 12.6148681640625, 13.08251953125, 13.5501708984375, 14.017822265625, 14.4854736328125, 14.953125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 11.0, 10.0, 16.0, 13.0, 14.0, 16.0, 25.0, 30.0, 34.0, 38.0, 38.0, 36.0, 47.0, 46.0, 41.0, 40.0, 57.0, 36.0, 46.0, 56.0, 39.0, 38.0, 31.0, 33.0, 25.0, 31.0, 25.0, 28.0, 19.0, 10.0, 10.0, 10.0, 8.0, 5.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.5859375, -10.2733154296875, -9.960693359375, -9.6480712890625, -9.33544921875, -9.0228271484375, -8.710205078125, -8.3975830078125, -8.0849609375, -7.7723388671875, -7.459716796875, -7.1470947265625, -6.83447265625, -6.5218505859375, -6.209228515625, -5.8966064453125, -5.583984375, -5.2713623046875, -4.958740234375, -4.6461181640625, -4.33349609375, -4.0208740234375, -3.708251953125, -3.3956298828125, -3.0830078125, -2.7703857421875, -2.457763671875, -2.1451416015625, -1.83251953125, -1.5198974609375, -1.207275390625, -0.8946533203125, -0.58203125, -0.2694091796875, 0.043212890625, 0.3558349609375, 0.66845703125, 0.9810791015625, 1.293701171875, 1.6063232421875, 1.9189453125, 2.2315673828125, 2.544189453125, 2.8568115234375, 3.16943359375, 3.4820556640625, 3.794677734375, 4.1072998046875, 4.419921875, 4.7325439453125, 5.045166015625, 5.3577880859375, 5.67041015625, 5.9830322265625, 6.295654296875, 6.6082763671875, 6.9208984375, 7.2335205078125, 7.546142578125, 7.8587646484375, 8.17138671875, 8.4840087890625, 8.796630859375, 9.1092529296875, 9.421875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 19.0, 21.0, 25.0, 18.0, 41.0, 62.0, 91.0, 120.0, 134.0, 225.0, 284.0, 440.0, 697.0, 1014.0, 1618.0, 2767.0, 4744.0, 8478.0, 17236.0, 49938.0, 843003.0, 73936.0, 20300.0, 9616.0, 5299.0, 3085.0, 1802.0, 1135.0, 698.0, 497.0, 314.0, 223.0, 161.0, 122.0, 84.0, 80.0, 47.0, 37.0, 35.0, 19.0, 18.0, 13.0, 5.0, 7.0, 9.0, 6.0, 2.0, 3.0, 3.0], "bins": [-8.3515625, -8.116943359375, -7.88232421875, -7.647705078125, -7.4130859375, -7.178466796875, -6.94384765625, -6.709228515625, -6.474609375, -6.239990234375, -6.00537109375, -5.770751953125, -5.5361328125, -5.301513671875, -5.06689453125, -4.832275390625, -4.59765625, -4.363037109375, -4.12841796875, -3.893798828125, -3.6591796875, -3.424560546875, -3.18994140625, -2.955322265625, -2.720703125, -2.486083984375, -2.25146484375, -2.016845703125, -1.7822265625, -1.547607421875, -1.31298828125, -1.078369140625, -0.84375, -0.609130859375, -0.37451171875, -0.139892578125, 0.0947265625, 0.329345703125, 0.56396484375, 0.798583984375, 1.033203125, 1.267822265625, 1.50244140625, 1.737060546875, 1.9716796875, 2.206298828125, 2.44091796875, 2.675537109375, 2.91015625, 3.144775390625, 3.37939453125, 3.614013671875, 3.8486328125, 4.083251953125, 4.31787109375, 4.552490234375, 4.787109375, 5.021728515625, 5.25634765625, 5.490966796875, 5.7255859375, 5.960205078125, 6.19482421875, 6.429443359375, 6.6640625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 4.0, 7.0, 5.0, 7.0, 7.0, 13.0, 8.0, 9.0, 17.0, 22.0, 29.0, 35.0, 67.0, 88.0, 151.0, 156.0, 119.0, 62.0, 46.0, 31.0, 27.0, 20.0, 15.0, 10.0, 8.0, 10.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010576248168945312, -0.0010138154029846191, -0.000970005989074707, -0.0009261965751647949, -0.0008823871612548828, -0.0008385777473449707, -0.0007947683334350586, -0.0007509589195251465, -0.0007071495056152344, -0.0006633400917053223, -0.0006195306777954102, -0.000575721263885498, -0.0005319118499755859, -0.00048810243606567383, -0.0004442930221557617, -0.0004004836082458496, -0.0003566741943359375, -0.0003128647804260254, -0.0002690553665161133, -0.00022524595260620117, -0.00018143653869628906, -0.00013762712478637695, -9.381771087646484e-05, -5.0008296966552734e-05, -6.198883056640625e-06, 3.7610530853271484e-05, 8.14199447631836e-05, 0.0001252293586730957, 0.0001690387725830078, 0.00021284818649291992, 0.00025665760040283203, 0.00030046701431274414, 0.00034427642822265625, 0.00038808584213256836, 0.00043189525604248047, 0.0004757046699523926, 0.0005195140838623047, 0.0005633234977722168, 0.0006071329116821289, 0.000650942325592041, 0.0006947517395019531, 0.0007385611534118652, 0.0007823705673217773, 0.0008261799812316895, 0.0008699893951416016, 0.0009137988090515137, 0.0009576082229614258, 0.0010014176368713379, 0.00104522705078125, 0.0010890364646911621, 0.0011328458786010742, 0.0011766552925109863, 0.0012204647064208984, 0.0012642741203308105, 0.0013080835342407227, 0.0013518929481506348, 0.0013957023620605469, 0.001439511775970459, 0.001483321189880371, 0.0015271306037902832, 0.0015709400177001953, 0.0016147494316101074, 0.0016585588455200195, 0.0017023682594299316, 0.0017461776733398438]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 7.0, 10.0, 17.0, 12.0, 17.0, 25.0, 33.0, 48.0, 68.0, 81.0, 134.0, 158.0, 257.0, 392.0, 614.0, 981.0, 1658.0, 2742.0, 4794.0, 8730.0, 17221.0, 38524.0, 94946.0, 230141.0, 326906.0, 184924.0, 72890.0, 30321.0, 14060.0, 7190.0, 4092.0, 2389.0, 1513.0, 905.0, 551.0, 382.0, 256.0, 171.0, 125.0, 79.0, 41.0, 46.0, 29.0, 24.0, 11.0, 13.0, 7.0, 11.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.232421875, -3.132537841796875, -3.03265380859375, -2.932769775390625, -2.8328857421875, -2.733001708984375, -2.63311767578125, -2.533233642578125, -2.433349609375, -2.333465576171875, -2.23358154296875, -2.133697509765625, -2.0338134765625, -1.933929443359375, -1.83404541015625, -1.734161376953125, -1.63427734375, -1.534393310546875, -1.43450927734375, -1.334625244140625, -1.2347412109375, -1.134857177734375, -1.03497314453125, -0.935089111328125, -0.835205078125, -0.735321044921875, -0.63543701171875, -0.535552978515625, -0.4356689453125, -0.335784912109375, -0.23590087890625, -0.136016845703125, -0.0361328125, 0.063751220703125, 0.16363525390625, 0.263519287109375, 0.3634033203125, 0.463287353515625, 0.56317138671875, 0.663055419921875, 0.762939453125, 0.862823486328125, 0.96270751953125, 1.062591552734375, 1.1624755859375, 1.262359619140625, 1.36224365234375, 1.462127685546875, 1.56201171875, 1.661895751953125, 1.76177978515625, 1.861663818359375, 1.9615478515625, 2.061431884765625, 2.16131591796875, 2.261199951171875, 2.361083984375, 2.460968017578125, 2.56085205078125, 2.660736083984375, 2.7606201171875, 2.860504150390625, 2.96038818359375, 3.060272216796875, 3.16015625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 10.0, 5.0, 8.0, 10.0, 12.0, 14.0, 22.0, 21.0, 21.0, 30.0, 36.0, 40.0, 65.0, 53.0, 78.0, 65.0, 67.0, 80.0, 53.0, 60.0, 46.0, 41.0, 26.0, 21.0, 25.0, 8.0, 6.0, 13.0, 9.0, 6.0, 5.0, 3.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.53369140625, -0.5145263671875, -0.495361328125, -0.4761962890625, -0.45703125, -0.4378662109375, -0.418701171875, -0.3995361328125, -0.38037109375, -0.3612060546875, -0.342041015625, -0.3228759765625, -0.3037109375, -0.2845458984375, -0.265380859375, -0.2462158203125, -0.22705078125, -0.2078857421875, -0.188720703125, -0.1695556640625, -0.150390625, -0.1312255859375, -0.112060546875, -0.0928955078125, -0.07373046875, -0.0545654296875, -0.035400390625, -0.0162353515625, 0.0029296875, 0.0220947265625, 0.041259765625, 0.0604248046875, 0.07958984375, 0.0987548828125, 0.117919921875, 0.1370849609375, 0.15625, 0.1754150390625, 0.194580078125, 0.2137451171875, 0.23291015625, 0.2520751953125, 0.271240234375, 0.2904052734375, 0.3095703125, 0.3287353515625, 0.347900390625, 0.3670654296875, 0.38623046875, 0.4053955078125, 0.424560546875, 0.4437255859375, 0.462890625, 0.4820556640625, 0.501220703125, 0.5203857421875, 0.53955078125, 0.5587158203125, 0.577880859375, 0.5970458984375, 0.6162109375, 0.6353759765625, 0.654541015625, 0.6737060546875, 0.69287109375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 15.0, 6.0, 14.0, 11.0, 10.0, 18.0, 18.0, 30.0, 34.0, 42.0, 55.0, 49.0, 53.0, 48.0, 55.0, 45.0, 66.0, 50.0, 51.0, 56.0, 52.0, 37.0, 39.0, 19.0, 28.0, 10.0, 15.0, 16.0, 14.0, 5.0, 6.0, 11.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.213982582092285, -13.781763076782227, -13.349544525146484, -12.917325019836426, -12.485105514526367, -12.052886009216309, -11.62066650390625, -11.188447952270508, -10.75622844696045, -10.32400894165039, -9.891790390014648, -9.45957088470459, -9.027351379394531, -8.595131874084473, -8.162912368774414, -7.730693817138672, -7.298474311828613, -6.866254806518555, -6.434035778045654, -6.001816749572754, -5.569597244262695, -5.137377738952637, -4.705158710479736, -4.272939682006836, -3.8407201766967773, -3.408500909805298, -2.9762816429138184, -2.544062376022339, -2.1118431091308594, -1.6796238422393799, -1.2474045753479004, -0.8151853084564209, -0.3829669952392578, 0.04925227165222168, 0.48147153854370117, 0.9136908054351807, 1.3459100723266602, 1.7781293392181396, 2.210348606109619, 2.6425678730010986, 3.074787139892578, 3.5070064067840576, 3.939225673675537, 4.3714447021484375, 4.803664207458496, 5.235883712768555, 5.668102741241455, 6.1003217697143555, 6.532541275024414, 6.964760780334473, 7.396979808807373, 7.829198837280273, 8.261418342590332, 8.69363784790039, 9.125856399536133, 9.558075904846191, 9.99029541015625, 10.422514915466309, 10.854734420776367, 11.28695297241211, 11.719172477722168, 12.151391983032227, 12.583610534667969, 13.015830039978027, 13.448049545288086]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 15.0, 11.0, 13.0, 15.0, 19.0, 24.0, 24.0, 20.0, 26.0, 31.0, 41.0, 42.0, 32.0, 36.0, 41.0, 40.0, 39.0, 40.0, 36.0, 41.0, 41.0, 29.0, 34.0, 28.0, 27.0, 29.0, 29.0, 18.0, 19.0, 20.0, 25.0, 14.0, 8.0, 18.0, 7.0, 6.0, 5.0, 6.0, 1.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.732009887695312, -9.416609764099121, -9.101210594177246, -8.785810470581055, -8.47041130065918, -8.155011177062988, -7.839611530303955, -7.524211883544922, -7.208812236785889, -6.8934125900268555, -6.578012943267822, -6.262613296508789, -5.947213172912598, -5.631814002990723, -5.316413879394531, -5.001014232635498, -4.685614585876465, -4.370214939117432, -4.054815292358398, -3.739415407180786, -3.424015760421753, -3.1086161136627197, -2.7932162284851074, -2.477816581726074, -2.162416934967041, -1.8470172882080078, -1.531617522239685, -1.2162177562713623, -0.9008181095123291, -0.5854184627532959, -0.27001869678497314, 0.04538106918334961, 0.3607816696166992, 0.6761813759803772, 0.9915810823440552, 1.306980848312378, 1.6223804950714111, 1.9377801418304443, 2.2531800270080566, 2.56857967376709, 2.883979320526123, 3.1993789672851562, 3.5147786140441895, 3.8301784992218018, 4.145578384399414, 4.460977554321289, 4.7763776779174805, 5.091777324676514, 5.407176971435547, 5.72257661819458, 6.037976264953613, 6.3533759117126465, 6.66877555847168, 6.984175682067871, 7.299575328826904, 7.6149749755859375, 7.930374622344971, 8.245774269104004, 8.561174392700195, 8.87657356262207, 9.191973686218262, 9.507372856140137, 9.822772979736328, 10.138172149658203, 10.453572273254395]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 18.0, 30.0, 47.0, 79.0, 154.0, 268.0, 515.0, 876.0, 1592.0, 3057.0, 5713.0, 10713.0, 19830.0, 36602.0, 64949.0, 106147.0, 152297.0, 179042.0, 165238.0, 123306.0, 78149.0, 45754.0, 25138.0, 13640.0, 7211.0, 3730.0, 1978.0, 1090.0, 605.0, 336.0, 149.0, 94.0, 80.0, 30.0, 31.0, 15.0, 15.0, 2.0, 1.0, 3.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.5703125, -14.1619873046875, -13.753662109375, -13.3453369140625, -12.93701171875, -12.5286865234375, -12.120361328125, -11.7120361328125, -11.3037109375, -10.8953857421875, -10.487060546875, -10.0787353515625, -9.67041015625, -9.2620849609375, -8.853759765625, -8.4454345703125, -8.037109375, -7.6287841796875, -7.220458984375, -6.8121337890625, -6.40380859375, -5.9954833984375, -5.587158203125, -5.1788330078125, -4.7705078125, -4.3621826171875, -3.953857421875, -3.5455322265625, -3.13720703125, -2.7288818359375, -2.320556640625, -1.9122314453125, -1.50390625, -1.0955810546875, -0.687255859375, -0.2789306640625, 0.12939453125, 0.5377197265625, 0.946044921875, 1.3543701171875, 1.7626953125, 2.1710205078125, 2.579345703125, 2.9876708984375, 3.39599609375, 3.8043212890625, 4.212646484375, 4.6209716796875, 5.029296875, 5.4376220703125, 5.845947265625, 6.2542724609375, 6.66259765625, 7.0709228515625, 7.479248046875, 7.8875732421875, 8.2958984375, 8.7042236328125, 9.112548828125, 9.5208740234375, 9.92919921875, 10.3375244140625, 10.745849609375, 11.1541748046875, 11.5625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 6.0, 9.0, 12.0, 12.0, 22.0, 22.0, 16.0, 25.0, 21.0, 22.0, 14.0, 32.0, 36.0, 32.0, 48.0, 45.0, 57.0, 37.0, 47.0, 50.0, 34.0, 41.0, 41.0, 44.0, 38.0, 32.0, 28.0, 34.0, 26.0, 15.0, 15.0, 18.0, 21.0, 15.0, 9.0, 9.0, 1.0, 5.0, 9.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.3125, -9.988525390625, -9.66455078125, -9.340576171875, -9.0166015625, -8.692626953125, -8.36865234375, -8.044677734375, -7.720703125, -7.396728515625, -7.07275390625, -6.748779296875, -6.4248046875, -6.100830078125, -5.77685546875, -5.452880859375, -5.12890625, -4.804931640625, -4.48095703125, -4.156982421875, -3.8330078125, -3.509033203125, -3.18505859375, -2.861083984375, -2.537109375, -2.213134765625, -1.88916015625, -1.565185546875, -1.2412109375, -0.917236328125, -0.59326171875, -0.269287109375, 0.0546875, 0.378662109375, 0.70263671875, 1.026611328125, 1.3505859375, 1.674560546875, 1.99853515625, 2.322509765625, 2.646484375, 2.970458984375, 3.29443359375, 3.618408203125, 3.9423828125, 4.266357421875, 4.59033203125, 4.914306640625, 5.23828125, 5.562255859375, 5.88623046875, 6.210205078125, 6.5341796875, 6.858154296875, 7.18212890625, 7.506103515625, 7.830078125, 8.154052734375, 8.47802734375, 8.802001953125, 9.1259765625, 9.449951171875, 9.77392578125, 10.097900390625, 10.421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 6.0, 11.0, 21.0, 33.0, 50.0, 78.0, 135.0, 173.0, 267.0, 425.0, 748.0, 1246.0, 2127.0, 3528.0, 6155.0, 10332.0, 17578.0, 28821.0, 46972.0, 73088.0, 104807.0, 136400.0, 151487.0, 141885.0, 112424.0, 79260.0, 51377.0, 31819.0, 19121.0, 11491.0, 6712.0, 3992.0, 2427.0, 1375.0, 862.0, 510.0, 318.0, 183.0, 120.0, 70.0, 47.0, 31.0, 15.0, 8.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.8671875, -9.554931640625, -9.24267578125, -8.930419921875, -8.6181640625, -8.305908203125, -7.99365234375, -7.681396484375, -7.369140625, -7.056884765625, -6.74462890625, -6.432373046875, -6.1201171875, -5.807861328125, -5.49560546875, -5.183349609375, -4.87109375, -4.558837890625, -4.24658203125, -3.934326171875, -3.6220703125, -3.309814453125, -2.99755859375, -2.685302734375, -2.373046875, -2.060791015625, -1.74853515625, -1.436279296875, -1.1240234375, -0.811767578125, -0.49951171875, -0.187255859375, 0.125, 0.437255859375, 0.74951171875, 1.061767578125, 1.3740234375, 1.686279296875, 1.99853515625, 2.310791015625, 2.623046875, 2.935302734375, 3.24755859375, 3.559814453125, 3.8720703125, 4.184326171875, 4.49658203125, 4.808837890625, 5.12109375, 5.433349609375, 5.74560546875, 6.057861328125, 6.3701171875, 6.682373046875, 6.99462890625, 7.306884765625, 7.619140625, 7.931396484375, 8.24365234375, 8.555908203125, 8.8681640625, 9.180419921875, 9.49267578125, 9.804931640625, 10.1171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 6.0, 11.0, 5.0, 17.0, 18.0, 24.0, 28.0, 29.0, 33.0, 28.0, 26.0, 38.0, 46.0, 32.0, 39.0, 47.0, 63.0, 40.0, 48.0, 50.0, 31.0, 40.0, 36.0, 38.0, 33.0, 20.0, 33.0, 21.0, 15.0, 15.0, 21.0, 13.0, 10.0, 13.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.145751953125, -5.93603515625, -5.726318359375, -5.5166015625, -5.306884765625, -5.09716796875, -4.887451171875, -4.677734375, -4.468017578125, -4.25830078125, -4.048583984375, -3.8388671875, -3.629150390625, -3.41943359375, -3.209716796875, -3.0, -2.790283203125, -2.58056640625, -2.370849609375, -2.1611328125, -1.951416015625, -1.74169921875, -1.531982421875, -1.322265625, -1.112548828125, -0.90283203125, -0.693115234375, -0.4833984375, -0.273681640625, -0.06396484375, 0.145751953125, 0.35546875, 0.565185546875, 0.77490234375, 0.984619140625, 1.1943359375, 1.404052734375, 1.61376953125, 1.823486328125, 2.033203125, 2.242919921875, 2.45263671875, 2.662353515625, 2.8720703125, 3.081787109375, 3.29150390625, 3.501220703125, 3.7109375, 3.920654296875, 4.13037109375, 4.340087890625, 4.5498046875, 4.759521484375, 4.96923828125, 5.178955078125, 5.388671875, 5.598388671875, 5.80810546875, 6.017822265625, 6.2275390625, 6.437255859375, 6.64697265625, 6.856689453125, 7.06640625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 4.0, 5.0, 12.0, 11.0, 16.0, 25.0, 37.0, 50.0, 89.0, 180.0, 286.0, 492.0, 1047.0, 2105.0, 4813.0, 11940.0, 31999.0, 91204.0, 242333.0, 354366.0, 195095.0, 70508.0, 24867.0, 9466.0, 3923.0, 1781.0, 834.0, 446.0, 238.0, 154.0, 82.0, 52.0, 28.0, 17.0, 25.0, 8.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9609375, -13.5013427734375, -13.041748046875, -12.5821533203125, -12.12255859375, -11.6629638671875, -11.203369140625, -10.7437744140625, -10.2841796875, -9.8245849609375, -9.364990234375, -8.9053955078125, -8.44580078125, -7.9862060546875, -7.526611328125, -7.0670166015625, -6.607421875, -6.1478271484375, -5.688232421875, -5.2286376953125, -4.76904296875, -4.3094482421875, -3.849853515625, -3.3902587890625, -2.9306640625, -2.4710693359375, -2.011474609375, -1.5518798828125, -1.09228515625, -0.6326904296875, -0.173095703125, 0.2864990234375, 0.74609375, 1.2056884765625, 1.665283203125, 2.1248779296875, 2.58447265625, 3.0440673828125, 3.503662109375, 3.9632568359375, 4.4228515625, 4.8824462890625, 5.342041015625, 5.8016357421875, 6.26123046875, 6.7208251953125, 7.180419921875, 7.6400146484375, 8.099609375, 8.5592041015625, 9.018798828125, 9.4783935546875, 9.93798828125, 10.3975830078125, 10.857177734375, 11.3167724609375, 11.7763671875, 12.2359619140625, 12.695556640625, 13.1551513671875, 13.61474609375, 14.0743408203125, 14.533935546875, 14.9935302734375, 15.453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 4.0, 4.0, 2.0, 5.0, 11.0, 12.0, 13.0, 18.0, 32.0, 32.0, 36.0, 51.0, 71.0, 77.0, 89.0, 82.0, 83.0, 65.0, 60.0, 60.0, 28.0, 34.0, 29.0, 22.0, 20.0, 9.0, 12.0, 9.0, 8.0, 3.0, 8.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008578747510910034, -0.0008278787136077881, -0.0007978826761245728, -0.0007678866386413574, -0.0007378906011581421, -0.0007078945636749268, -0.0006778985261917114, -0.0006479024887084961, -0.0006179064512252808, -0.0005879104137420654, -0.0005579143762588501, -0.0005279183387756348, -0.0004979223012924194, -0.0004679262638092041, -0.00043793022632598877, -0.00040793418884277344, -0.0003779381513595581, -0.0003479421138763428, -0.00031794607639312744, -0.0002879500389099121, -0.0002579540014266968, -0.00022795796394348145, -0.0001979619264602661, -0.00016796588897705078, -0.00013796985149383545, -0.00010797381401062012, -7.797777652740479e-05, -4.798173904418945e-05, -1.798570156097412e-05, 1.2010335922241211e-05, 4.200637340545654e-05, 7.200241088867188e-05, 0.00010199844837188721, 0.00013199448585510254, 0.00016199052333831787, 0.0001919865608215332, 0.00022198259830474854, 0.00025197863578796387, 0.0002819746732711792, 0.00031197071075439453, 0.00034196674823760986, 0.0003719627857208252, 0.00040195882320404053, 0.00043195486068725586, 0.0004619508981704712, 0.0004919469356536865, 0.0005219429731369019, 0.0005519390106201172, 0.0005819350481033325, 0.0006119310855865479, 0.0006419271230697632, 0.0006719231605529785, 0.0007019191980361938, 0.0007319152355194092, 0.0007619112730026245, 0.0007919073104858398, 0.0008219033479690552, 0.0008518993854522705, 0.0008818954229354858, 0.0009118914604187012, 0.0009418874979019165, 0.0009718835353851318, 0.0010018795728683472, 0.0010318756103515625]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 30.0, 23.0, 32.0, 48.0, 59.0, 92.0, 137.0, 192.0, 335.0, 450.0, 840.0, 1352.0, 2395.0, 4413.0, 8617.0, 17424.0, 37035.0, 78320.0, 155757.0, 238713.0, 228306.0, 139716.0, 69449.0, 32429.0, 15288.0, 7760.0, 3930.0, 2242.0, 1173.0, 729.0, 403.0, 238.0, 179.0, 127.0, 90.0, 53.0, 53.0, 28.0, 17.0, 15.0, 15.0, 8.0, 12.0, 8.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.8001708984375, -9.483154296875, -9.1661376953125, -8.84912109375, -8.5321044921875, -8.215087890625, -7.8980712890625, -7.5810546875, -7.2640380859375, -6.947021484375, -6.6300048828125, -6.31298828125, -5.9959716796875, -5.678955078125, -5.3619384765625, -5.044921875, -4.7279052734375, -4.410888671875, -4.0938720703125, -3.77685546875, -3.4598388671875, -3.142822265625, -2.8258056640625, -2.5087890625, -2.1917724609375, -1.874755859375, -1.5577392578125, -1.24072265625, -0.9237060546875, -0.606689453125, -0.2896728515625, 0.02734375, 0.3443603515625, 0.661376953125, 0.9783935546875, 1.29541015625, 1.6124267578125, 1.929443359375, 2.2464599609375, 2.5634765625, 2.8804931640625, 3.197509765625, 3.5145263671875, 3.83154296875, 4.1485595703125, 4.465576171875, 4.7825927734375, 5.099609375, 5.4166259765625, 5.733642578125, 6.0506591796875, 6.36767578125, 6.6846923828125, 7.001708984375, 7.3187255859375, 7.6357421875, 7.9527587890625, 8.269775390625, 8.5867919921875, 8.90380859375, 9.2208251953125, 9.537841796875, 9.8548583984375, 10.171875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 6.0, 6.0, 14.0, 18.0, 16.0, 20.0, 19.0, 33.0, 46.0, 43.0, 53.0, 53.0, 67.0, 63.0, 64.0, 77.0, 60.0, 64.0, 65.0, 44.0, 30.0, 25.0, 17.0, 19.0, 14.0, 8.0, 11.0, 1.0, 10.0, 4.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.5179443359375, -2.434326171875, -2.3507080078125, -2.26708984375, -2.1834716796875, -2.099853515625, -2.0162353515625, -1.9326171875, -1.8489990234375, -1.765380859375, -1.6817626953125, -1.59814453125, -1.5145263671875, -1.430908203125, -1.3472900390625, -1.263671875, -1.1800537109375, -1.096435546875, -1.0128173828125, -0.92919921875, -0.8455810546875, -0.761962890625, -0.6783447265625, -0.5947265625, -0.5111083984375, -0.427490234375, -0.3438720703125, -0.26025390625, -0.1766357421875, -0.093017578125, -0.0093994140625, 0.07421875, 0.1578369140625, 0.241455078125, 0.3250732421875, 0.40869140625, 0.4923095703125, 0.575927734375, 0.6595458984375, 0.7431640625, 0.8267822265625, 0.910400390625, 0.9940185546875, 1.07763671875, 1.1612548828125, 1.244873046875, 1.3284912109375, 1.412109375, 1.4957275390625, 1.579345703125, 1.6629638671875, 1.74658203125, 1.8302001953125, 1.913818359375, 1.9974365234375, 2.0810546875, 2.1646728515625, 2.248291015625, 2.3319091796875, 2.41552734375, 2.4991455078125, 2.582763671875, 2.6663818359375, 2.75]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 12.0, 8.0, 8.0, 12.0, 15.0, 9.0, 19.0, 33.0, 25.0, 33.0, 36.0, 37.0, 34.0, 37.0, 60.0, 43.0, 39.0, 43.0, 35.0, 56.0, 45.0, 50.0, 45.0, 38.0, 25.0, 26.0, 19.0, 18.0, 17.0, 14.0, 14.0, 17.0, 9.0, 12.0, 4.0, 6.0, 7.0, 5.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.719067573547363, -9.397351264953613, -9.07563591003418, -8.75391960144043, -8.43220329284668, -8.11048698425293, -7.788771152496338, -7.467055320739746, -7.145339012145996, -6.823622703552246, -6.501906871795654, -6.1801910400390625, -5.8584747314453125, -5.5367584228515625, -5.215042591094971, -4.893326759338379, -4.571610450744629, -4.249894142150879, -3.928178310394287, -3.606462240219116, -3.2847461700439453, -2.9630300998687744, -2.6413140296936035, -2.3195979595184326, -1.9978818893432617, -1.6761658191680908, -1.35444974899292, -1.032733678817749, -0.7110176086425781, -0.3893015384674072, -0.06758546829223633, 0.25413060188293457, 0.5758476257324219, 0.8975636959075928, 1.2192797660827637, 1.5409958362579346, 1.8627119064331055, 2.1844279766082764, 2.5061440467834473, 2.827860116958618, 3.149576187133789, 3.47129225730896, 3.793008327484131, 4.114724159240723, 4.436440467834473, 4.758156776428223, 5.0798726081848145, 5.401588439941406, 5.723304748535156, 6.045021057128906, 6.366736888885498, 6.68845272064209, 7.01016902923584, 7.33188533782959, 7.653601169586182, 7.975317001342773, 8.297033309936523, 8.618749618530273, 8.940465927124023, 9.262181282043457, 9.583897590637207, 9.905613899230957, 10.22732925415039, 10.54904556274414, 10.87076187133789]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 6.0, 6.0, 3.0, 17.0, 15.0, 19.0, 16.0, 20.0, 12.0, 27.0, 35.0, 27.0, 35.0, 34.0, 29.0, 49.0, 39.0, 44.0, 41.0, 40.0, 44.0, 36.0, 38.0, 44.0, 38.0, 33.0, 36.0, 24.0, 21.0, 24.0, 20.0, 22.0, 21.0, 20.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-10.343703269958496, -10.032953262329102, -9.722203254699707, -9.411454200744629, -9.100704193115234, -8.78995418548584, -8.479204177856445, -8.16845417022705, -7.8577046394348145, -7.54695463180542, -7.236205101013184, -6.925455093383789, -6.6147050857543945, -6.303955554962158, -5.993205547332764, -5.682456016540527, -5.371706008911133, -5.060956001281738, -4.750206470489502, -4.439456462860107, -4.128706932067871, -3.8179569244384766, -3.507206916809082, -3.1964571475982666, -2.885707378387451, -2.5749576091766357, -2.2642078399658203, -1.9534578323364258, -1.6427080631256104, -1.331958293914795, -1.02120840549469, -0.710458517074585, -0.39970970153808594, -0.08895987272262573, 0.22178995609283447, 0.5325397849082947, 0.8432896137237549, 1.1540393829345703, 1.4647892713546753, 1.7755391597747803, 2.0862889289855957, 2.397038698196411, 2.7077884674072266, 3.018538475036621, 3.3292882442474365, 3.640038013458252, 3.9507880210876465, 4.261537551879883, 4.572287559509277, 4.883037567138672, 5.193787097930908, 5.504537105560303, 5.815286636352539, 6.126036643981934, 6.436786651611328, 6.747536659240723, 7.058286190032959, 7.3690361976623535, 7.67978572845459, 7.990535736083984, 8.301285743713379, 8.612035751342773, 8.922784805297852, 9.233534812927246, 9.54428482055664]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 17.0, 24.0, 44.0, 53.0, 70.0, 121.0, 180.0, 290.0, 477.0, 692.0, 1167.0, 1808.0, 2929.0, 4538.0, 7566.0, 12299.0, 20815.0, 35748.0, 62829.0, 112185.0, 203305.0, 370422.0, 610841.0, 800621.0, 751076.0, 518889.0, 298203.0, 162118.0, 88962.0, 50514.0, 29569.0, 17444.0, 10642.0, 6377.0, 4108.0, 2582.0, 1609.0, 1039.0, 712.0, 479.0, 318.0, 196.0, 119.0, 85.0, 66.0, 47.0, 19.0, 18.0, 14.0, 15.0, 4.0, 9.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.234375, -7.9755859375, -7.716796875, -7.4580078125, -7.19921875, -6.9404296875, -6.681640625, -6.4228515625, -6.1640625, -5.9052734375, -5.646484375, -5.3876953125, -5.12890625, -4.8701171875, -4.611328125, -4.3525390625, -4.09375, -3.8349609375, -3.576171875, -3.3173828125, -3.05859375, -2.7998046875, -2.541015625, -2.2822265625, -2.0234375, -1.7646484375, -1.505859375, -1.2470703125, -0.98828125, -0.7294921875, -0.470703125, -0.2119140625, 0.046875, 0.3056640625, 0.564453125, 0.8232421875, 1.08203125, 1.3408203125, 1.599609375, 1.8583984375, 2.1171875, 2.3759765625, 2.634765625, 2.8935546875, 3.15234375, 3.4111328125, 3.669921875, 3.9287109375, 4.1875, 4.4462890625, 4.705078125, 4.9638671875, 5.22265625, 5.4814453125, 5.740234375, 5.9990234375, 6.2578125, 6.5166015625, 6.775390625, 7.0341796875, 7.29296875, 7.5517578125, 7.810546875, 8.0693359375, 8.328125]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 7.0, 6.0, 6.0, 8.0, 8.0, 8.0, 9.0, 11.0, 18.0, 17.0, 24.0, 15.0, 30.0, 25.0, 30.0, 30.0, 31.0, 29.0, 34.0, 51.0, 28.0, 43.0, 49.0, 38.0, 42.0, 36.0, 25.0, 43.0, 46.0, 30.0, 30.0, 33.0, 19.0, 14.0, 17.0, 21.0, 16.0, 20.0, 10.0, 9.0, 14.0, 5.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.015625, -6.80096435546875, -6.5863037109375, -6.37164306640625, -6.156982421875, -5.94232177734375, -5.7276611328125, -5.51300048828125, -5.29833984375, -5.08367919921875, -4.8690185546875, -4.65435791015625, -4.439697265625, -4.22503662109375, -4.0103759765625, -3.79571533203125, -3.5810546875, -3.36639404296875, -3.1517333984375, -2.93707275390625, -2.722412109375, -2.50775146484375, -2.2930908203125, -2.07843017578125, -1.86376953125, -1.64910888671875, -1.4344482421875, -1.21978759765625, -1.005126953125, -0.79046630859375, -0.5758056640625, -0.36114501953125, -0.146484375, 0.06817626953125, 0.2828369140625, 0.49749755859375, 0.712158203125, 0.92681884765625, 1.1414794921875, 1.35614013671875, 1.57080078125, 1.78546142578125, 2.0001220703125, 2.21478271484375, 2.429443359375, 2.64410400390625, 2.8587646484375, 3.07342529296875, 3.2880859375, 3.50274658203125, 3.7174072265625, 3.93206787109375, 4.146728515625, 4.36138916015625, 4.5760498046875, 4.79071044921875, 5.00537109375, 5.22003173828125, 5.4346923828125, 5.64935302734375, 5.864013671875, 6.07867431640625, 6.2933349609375, 6.50799560546875, 6.72265625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 10.0, 18.0, 21.0, 26.0, 41.0, 82.0, 122.0, 178.0, 306.0, 454.0, 785.0, 1216.0, 2084.0, 3358.0, 5603.0, 9921.0, 17056.0, 29552.0, 52403.0, 93519.0, 167999.0, 296895.0, 495000.0, 721810.0, 788104.0, 611985.0, 386256.0, 222038.0, 125412.0, 69962.0, 39324.0, 21911.0, 12688.0, 7206.0, 4317.0, 2609.0, 1491.0, 919.0, 607.0, 381.0, 240.0, 123.0, 93.0, 68.0, 27.0, 25.0, 17.0, 8.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.2734375, -8.98583984375, -8.6982421875, -8.41064453125, -8.123046875, -7.83544921875, -7.5478515625, -7.26025390625, -6.97265625, -6.68505859375, -6.3974609375, -6.10986328125, -5.822265625, -5.53466796875, -5.2470703125, -4.95947265625, -4.671875, -4.38427734375, -4.0966796875, -3.80908203125, -3.521484375, -3.23388671875, -2.9462890625, -2.65869140625, -2.37109375, -2.08349609375, -1.7958984375, -1.50830078125, -1.220703125, -0.93310546875, -0.6455078125, -0.35791015625, -0.0703125, 0.21728515625, 0.5048828125, 0.79248046875, 1.080078125, 1.36767578125, 1.6552734375, 1.94287109375, 2.23046875, 2.51806640625, 2.8056640625, 3.09326171875, 3.380859375, 3.66845703125, 3.9560546875, 4.24365234375, 4.53125, 4.81884765625, 5.1064453125, 5.39404296875, 5.681640625, 5.96923828125, 6.2568359375, 6.54443359375, 6.83203125, 7.11962890625, 7.4072265625, 7.69482421875, 7.982421875, 8.27001953125, 8.5576171875, 8.84521484375, 9.1328125]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 10.0, 11.0, 12.0, 18.0, 20.0, 39.0, 36.0, 54.0, 66.0, 92.0, 113.0, 150.0, 162.0, 212.0, 234.0, 253.0, 265.0, 278.0, 281.0, 259.0, 245.0, 222.0, 224.0, 164.0, 147.0, 108.0, 112.0, 80.0, 61.0, 44.0, 29.0, 19.0, 9.0, 8.0, 11.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.089874267578125, -3.96881103515625, -3.847747802734375, -3.7266845703125, -3.605621337890625, -3.48455810546875, -3.363494873046875, -3.242431640625, -3.121368408203125, -3.00030517578125, -2.879241943359375, -2.7581787109375, -2.637115478515625, -2.51605224609375, -2.394989013671875, -2.27392578125, -2.152862548828125, -2.03179931640625, -1.910736083984375, -1.7896728515625, -1.668609619140625, -1.54754638671875, -1.426483154296875, -1.305419921875, -1.184356689453125, -1.06329345703125, -0.942230224609375, -0.8211669921875, -0.700103759765625, -0.57904052734375, -0.457977294921875, -0.3369140625, -0.215850830078125, -0.09478759765625, 0.026275634765625, 0.1473388671875, 0.268402099609375, 0.38946533203125, 0.510528564453125, 0.631591796875, 0.752655029296875, 0.87371826171875, 0.994781494140625, 1.1158447265625, 1.236907958984375, 1.35797119140625, 1.479034423828125, 1.60009765625, 1.721160888671875, 1.84222412109375, 1.963287353515625, 2.0843505859375, 2.205413818359375, 2.32647705078125, 2.447540283203125, 2.568603515625, 2.689666748046875, 2.81072998046875, 2.931793212890625, 3.0528564453125, 3.173919677734375, 3.29498291015625, 3.416046142578125, 3.537109375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 1.0, 1.0, 9.0, 8.0, 5.0, 8.0, 15.0, 8.0, 15.0, 26.0, 18.0, 21.0, 23.0, 17.0, 36.0, 38.0, 44.0, 58.0, 44.0, 53.0, 53.0, 46.0, 43.0, 47.0, 55.0, 36.0, 38.0, 33.0, 42.0, 19.0, 25.0, 18.0, 20.0, 13.0, 10.0, 14.0, 4.0, 12.0, 9.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.56761646270752, -9.275262832641602, -8.982908248901367, -8.69055461883545, -8.398200035095215, -8.105846405029297, -7.813492298126221, -7.5211381912231445, -7.228784561157227, -6.93643045425415, -6.644076347351074, -6.351722717285156, -6.05936861038208, -5.767014503479004, -5.474660396575928, -5.182306289672852, -4.889952182769775, -4.597598075866699, -4.305243968963623, -4.012889862060547, -3.720536231994629, -3.4281821250915527, -3.1358280181884766, -2.8434741497039795, -2.5511200428009033, -2.258765935897827, -1.96641206741333, -1.674057960510254, -1.3817039728164673, -1.0893499851226807, -0.7969958782196045, -0.5046420097351074, -0.21228790283203125, 0.08006611466407776, 0.37242013216018677, 0.6647741794586182, 0.9571281671524048, 1.2494821548461914, 1.5418362617492676, 1.8341901302337646, 2.126544237136841, 2.418898344039917, 2.711252212524414, 3.0036063194274902, 3.2959604263305664, 3.5883142948150635, 3.8806684017181396, 4.173022270202637, 4.465376377105713, 4.757730484008789, 5.050084590911865, 5.342438697814941, 5.634792327880859, 5.9271464347839355, 6.219500541687012, 6.51185417175293, 6.804208755493164, 7.09656286239624, 7.388916969299316, 7.681270599365234, 7.9736247062683105, 8.265978813171387, 8.558332443237305, 8.850687026977539, 9.143040657043457]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 4.0, 11.0, 2.0, 6.0, 16.0, 12.0, 8.0, 15.0, 20.0, 14.0, 25.0, 30.0, 34.0, 27.0, 43.0, 42.0, 36.0, 42.0, 45.0, 45.0, 41.0, 39.0, 45.0, 44.0, 29.0, 42.0, 39.0, 36.0, 26.0, 21.0, 25.0, 23.0, 16.0, 12.0, 20.0, 10.0, 10.0, 13.0, 10.0, 6.0, 1.0, 2.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.662756443023682, -7.401858806610107, -7.140961647033691, -6.880064010620117, -6.619166851043701, -6.358269214630127, -6.097372055053711, -5.836474418640137, -5.5755767822265625, -5.314679145812988, -5.053781986236572, -4.792884349822998, -4.531987190246582, -4.271089553833008, -4.010191917419434, -3.7492947578430176, -3.4883975982666016, -3.2275002002716064, -2.9666028022766113, -2.705705165863037, -2.444808006286621, -2.183910369873047, -1.9230129718780518, -1.6621155738830566, -1.4012181758880615, -1.1403207778930664, -0.8794233202934265, -0.6185258626937866, -0.3576284646987915, -0.09673106670379639, 0.16416645050048828, 0.4250638484954834, 0.6859617233276367, 0.9468591213226318, 1.207756519317627, 1.4686540365219116, 1.7295514345169067, 1.9904488325119019, 2.2513463497161865, 2.5122437477111816, 2.7731411457061768, 3.034038543701172, 3.294935941696167, 3.555833339691162, 3.8167309761047363, 4.077628135681152, 4.338525772094727, 4.599423408508301, 4.860320568084717, 5.121218204498291, 5.382115364074707, 5.643013000488281, 5.903910160064697, 6.1648077964782715, 6.4257049560546875, 6.686602592468262, 6.947500228881836, 7.20839786529541, 7.469295024871826, 7.7301926612854, 7.991089820861816, 8.25198745727539, 8.512885093688965, 8.773782730102539, 9.034679412841797]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 5.0, 8.0, 12.0, 5.0, 13.0, 29.0, 53.0, 83.0, 130.0, 157.0, 259.0, 388.0, 647.0, 922.0, 1470.0, 2454.0, 3909.0, 6557.0, 12383.0, 24185.0, 49598.0, 105272.0, 205733.0, 270700.0, 183630.0, 90225.0, 42556.0, 20627.0, 10956.0, 6044.0, 3522.0, 2118.0, 1384.0, 895.0, 559.0, 366.0, 230.0, 161.0, 106.0, 81.0, 37.0, 28.0, 20.0, 15.0, 15.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.2890625, -8.033203125, -7.77734375, -7.521484375, -7.265625, -7.009765625, -6.75390625, -6.498046875, -6.2421875, -5.986328125, -5.73046875, -5.474609375, -5.21875, -4.962890625, -4.70703125, -4.451171875, -4.1953125, -3.939453125, -3.68359375, -3.427734375, -3.171875, -2.916015625, -2.66015625, -2.404296875, -2.1484375, -1.892578125, -1.63671875, -1.380859375, -1.125, -0.869140625, -0.61328125, -0.357421875, -0.1015625, 0.154296875, 0.41015625, 0.666015625, 0.921875, 1.177734375, 1.43359375, 1.689453125, 1.9453125, 2.201171875, 2.45703125, 2.712890625, 2.96875, 3.224609375, 3.48046875, 3.736328125, 3.9921875, 4.248046875, 4.50390625, 4.759765625, 5.015625, 5.271484375, 5.52734375, 5.783203125, 6.0390625, 6.294921875, 6.55078125, 6.806640625, 7.0625, 7.318359375, 7.57421875, 7.830078125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 4.0, 5.0, 2.0, 7.0, 6.0, 8.0, 7.0, 8.0, 12.0, 16.0, 13.0, 15.0, 11.0, 18.0, 22.0, 16.0, 29.0, 32.0, 41.0, 32.0, 42.0, 51.0, 42.0, 30.0, 41.0, 38.0, 40.0, 49.0, 34.0, 38.0, 37.0, 29.0, 27.0, 32.0, 32.0, 12.0, 14.0, 17.0, 17.0, 11.0, 16.0, 14.0, 6.0, 8.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.14453125, -6.89788818359375, -6.6512451171875, -6.40460205078125, -6.157958984375, -5.91131591796875, -5.6646728515625, -5.41802978515625, -5.17138671875, -4.92474365234375, -4.6781005859375, -4.43145751953125, -4.184814453125, -3.93817138671875, -3.6915283203125, -3.44488525390625, -3.1982421875, -2.95159912109375, -2.7049560546875, -2.45831298828125, -2.211669921875, -1.96502685546875, -1.7183837890625, -1.47174072265625, -1.22509765625, -0.97845458984375, -0.7318115234375, -0.48516845703125, -0.238525390625, 0.00811767578125, 0.2547607421875, 0.50140380859375, 0.748046875, 0.99468994140625, 1.2413330078125, 1.48797607421875, 1.734619140625, 1.98126220703125, 2.2279052734375, 2.47454833984375, 2.72119140625, 2.96783447265625, 3.2144775390625, 3.46112060546875, 3.707763671875, 3.95440673828125, 4.2010498046875, 4.44769287109375, 4.6943359375, 4.94097900390625, 5.1876220703125, 5.43426513671875, 5.680908203125, 5.92755126953125, 6.1741943359375, 6.42083740234375, 6.66748046875, 6.91412353515625, 7.1607666015625, 7.40740966796875, 7.654052734375, 7.90069580078125, 8.1473388671875, 8.39398193359375, 8.640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 15.0, 13.0, 23.0, 31.0, 51.0, 47.0, 88.0, 135.0, 193.0, 272.0, 431.0, 625.0, 1057.0, 1512.0, 2485.0, 4049.0, 6672.0, 11366.0, 21519.0, 64316.0, 843820.0, 44243.0, 18870.0, 10463.0, 5959.0, 3735.0, 2368.0, 1402.0, 910.0, 635.0, 400.0, 252.0, 201.0, 128.0, 83.0, 47.0, 33.0, 29.0, 23.0, 25.0, 7.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.28125, -9.9908447265625, -9.700439453125, -9.4100341796875, -9.11962890625, -8.8292236328125, -8.538818359375, -8.2484130859375, -7.9580078125, -7.6676025390625, -7.377197265625, -7.0867919921875, -6.79638671875, -6.5059814453125, -6.215576171875, -5.9251708984375, -5.634765625, -5.3443603515625, -5.053955078125, -4.7635498046875, -4.47314453125, -4.1827392578125, -3.892333984375, -3.6019287109375, -3.3115234375, -3.0211181640625, -2.730712890625, -2.4403076171875, -2.14990234375, -1.8594970703125, -1.569091796875, -1.2786865234375, -0.98828125, -0.6978759765625, -0.407470703125, -0.1170654296875, 0.17333984375, 0.4637451171875, 0.754150390625, 1.0445556640625, 1.3349609375, 1.6253662109375, 1.915771484375, 2.2061767578125, 2.49658203125, 2.7869873046875, 3.077392578125, 3.3677978515625, 3.658203125, 3.9486083984375, 4.239013671875, 4.5294189453125, 4.81982421875, 5.1102294921875, 5.400634765625, 5.6910400390625, 5.9814453125, 6.2718505859375, 6.562255859375, 6.8526611328125, 7.14306640625, 7.4334716796875, 7.723876953125, 8.0142822265625, 8.3046875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 11.0, 8.0, 19.0, 13.0, 14.0, 22.0, 20.0, 17.0, 29.0, 36.0, 24.0, 31.0, 43.0, 36.0, 31.0, 50.0, 34.0, 42.0, 39.0, 43.0, 36.0, 41.0, 40.0, 34.0, 33.0, 22.0, 28.0, 24.0, 24.0, 19.0, 22.0, 10.0, 12.0, 14.0, 8.0, 6.0, 8.0, 12.0, 4.0, 4.0, 10.0, 2.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.984375, -5.78448486328125, -5.5845947265625, -5.38470458984375, -5.184814453125, -4.98492431640625, -4.7850341796875, -4.58514404296875, -4.38525390625, -4.18536376953125, -3.9854736328125, -3.78558349609375, -3.585693359375, -3.38580322265625, -3.1859130859375, -2.98602294921875, -2.7861328125, -2.58624267578125, -2.3863525390625, -2.18646240234375, -1.986572265625, -1.78668212890625, -1.5867919921875, -1.38690185546875, -1.18701171875, -0.98712158203125, -0.7872314453125, -0.58734130859375, -0.387451171875, -0.18756103515625, 0.0123291015625, 0.21221923828125, 0.412109375, 0.61199951171875, 0.8118896484375, 1.01177978515625, 1.211669921875, 1.41156005859375, 1.6114501953125, 1.81134033203125, 2.01123046875, 2.21112060546875, 2.4110107421875, 2.61090087890625, 2.810791015625, 3.01068115234375, 3.2105712890625, 3.41046142578125, 3.6103515625, 3.81024169921875, 4.0101318359375, 4.21002197265625, 4.409912109375, 4.60980224609375, 4.8096923828125, 5.00958251953125, 5.20947265625, 5.40936279296875, 5.6092529296875, 5.80914306640625, 6.009033203125, 6.20892333984375, 6.4088134765625, 6.60870361328125, 6.80859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 5.0, 5.0, 9.0, 7.0, 11.0, 25.0, 29.0, 41.0, 59.0, 104.0, 144.0, 219.0, 329.0, 557.0, 896.0, 1604.0, 2985.0, 5978.0, 13948.0, 44478.0, 903255.0, 45795.0, 14525.0, 6409.0, 3140.0, 1557.0, 979.0, 506.0, 354.0, 190.0, 130.0, 87.0, 63.0, 27.0, 30.0, 17.0, 13.0, 12.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.546875, -6.32501220703125, -6.1031494140625, -5.88128662109375, -5.659423828125, -5.43756103515625, -5.2156982421875, -4.99383544921875, -4.77197265625, -4.55010986328125, -4.3282470703125, -4.10638427734375, -3.884521484375, -3.66265869140625, -3.4407958984375, -3.21893310546875, -2.9970703125, -2.77520751953125, -2.5533447265625, -2.33148193359375, -2.109619140625, -1.88775634765625, -1.6658935546875, -1.44403076171875, -1.22216796875, -1.00030517578125, -0.7784423828125, -0.55657958984375, -0.334716796875, -0.11285400390625, 0.1090087890625, 0.33087158203125, 0.552734375, 0.77459716796875, 0.9964599609375, 1.21832275390625, 1.440185546875, 1.66204833984375, 1.8839111328125, 2.10577392578125, 2.32763671875, 2.54949951171875, 2.7713623046875, 2.99322509765625, 3.215087890625, 3.43695068359375, 3.6588134765625, 3.88067626953125, 4.1025390625, 4.32440185546875, 4.5462646484375, 4.76812744140625, 4.989990234375, 5.21185302734375, 5.4337158203125, 5.65557861328125, 5.87744140625, 6.09930419921875, 6.3211669921875, 6.54302978515625, 6.764892578125, 6.98675537109375, 7.2086181640625, 7.43048095703125, 7.65234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 8.0, 10.0, 10.0, 21.0, 23.0, 26.0, 55.0, 69.0, 85.0, 126.0, 132.0, 115.0, 81.0, 60.0, 45.0, 16.0, 21.0, 19.0, 8.0, 15.0, 15.0, 5.0, 5.0, 6.0, 3.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005664825439453125, -0.0005449503660202026, -0.0005234181880950928, -0.0005018860101699829, -0.00048035383224487305, -0.0004588216543197632, -0.0004372894763946533, -0.00041575729846954346, -0.0003942251205444336, -0.00037269294261932373, -0.00035116076469421387, -0.000329628586769104, -0.00030809640884399414, -0.0002865642309188843, -0.0002650320529937744, -0.00024349987506866455, -0.0002219676971435547, -0.00020043551921844482, -0.00017890334129333496, -0.0001573711633682251, -0.00013583898544311523, -0.00011430680751800537, -9.277462959289551e-05, -7.124245166778564e-05, -4.971027374267578e-05, -2.8178095817565918e-05, -6.645917892456055e-06, 1.4886260032653809e-05, 3.641843795776367e-05, 5.7950615882873535e-05, 7.94827938079834e-05, 0.00010101497173309326, 0.00012254714965820312, 0.000144079327583313, 0.00016561150550842285, 0.00018714368343353271, 0.00020867586135864258, 0.00023020803928375244, 0.0002517402172088623, 0.00027327239513397217, 0.00029480457305908203, 0.0003163367509841919, 0.00033786892890930176, 0.0003594011068344116, 0.0003809332847595215, 0.00040246546268463135, 0.0004239976406097412, 0.0004455298185348511, 0.00046706199645996094, 0.0004885941743850708, 0.0005101263523101807, 0.0005316585302352905, 0.0005531907081604004, 0.0005747228860855103, 0.0005962550640106201, 0.00061778724193573, 0.0006393194198608398, 0.0006608515977859497, 0.0006823837757110596, 0.0007039159536361694, 0.0007254481315612793, 0.0007469803094863892, 0.000768512487411499, 0.0007900446653366089, 0.0008115768432617188]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 11.0, 22.0, 33.0, 47.0, 59.0, 78.0, 105.0, 199.0, 286.0, 400.0, 640.0, 1040.0, 1559.0, 2497.0, 3764.0, 6036.0, 9585.0, 15677.0, 26419.0, 45234.0, 80064.0, 139462.0, 212095.0, 201431.0, 126590.0, 71734.0, 40948.0, 23863.0, 14519.0, 8981.0, 5420.0, 3468.0, 2239.0, 1375.0, 894.0, 583.0, 411.0, 252.0, 181.0, 118.0, 81.0, 43.0, 35.0, 32.0, 13.0, 9.0, 6.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.9306640625, -1.8719940185546875, -1.813323974609375, -1.7546539306640625, -1.69598388671875, -1.6373138427734375, -1.578643798828125, -1.5199737548828125, -1.4613037109375, -1.4026336669921875, -1.343963623046875, -1.2852935791015625, -1.22662353515625, -1.1679534912109375, -1.109283447265625, -1.0506134033203125, -0.991943359375, -0.9332733154296875, -0.874603271484375, -0.8159332275390625, -0.75726318359375, -0.6985931396484375, -0.639923095703125, -0.5812530517578125, -0.5225830078125, -0.4639129638671875, -0.405242919921875, -0.3465728759765625, -0.28790283203125, -0.2292327880859375, -0.170562744140625, -0.1118927001953125, -0.05322265625, 0.0054473876953125, 0.064117431640625, 0.1227874755859375, 0.18145751953125, 0.2401275634765625, 0.298797607421875, 0.3574676513671875, 0.4161376953125, 0.4748077392578125, 0.533477783203125, 0.5921478271484375, 0.65081787109375, 0.7094879150390625, 0.768157958984375, 0.8268280029296875, 0.885498046875, 0.9441680908203125, 1.002838134765625, 1.0615081787109375, 1.12017822265625, 1.1788482666015625, 1.237518310546875, 1.2961883544921875, 1.3548583984375, 1.4135284423828125, 1.472198486328125, 1.5308685302734375, 1.58953857421875, 1.6482086181640625, 1.706878662109375, 1.7655487060546875, 1.82421875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 10.0, 12.0, 7.0, 18.0, 26.0, 20.0, 12.0, 28.0, 25.0, 31.0, 30.0, 43.0, 35.0, 53.0, 46.0, 51.0, 51.0, 63.0, 54.0, 43.0, 42.0, 36.0, 32.0, 32.0, 25.0, 22.0, 26.0, 19.0, 18.0, 13.0, 9.0, 8.0, 12.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.580078125, -0.563812255859375, -0.54754638671875, -0.531280517578125, -0.5150146484375, -0.498748779296875, -0.48248291015625, -0.466217041015625, -0.449951171875, -0.433685302734375, -0.41741943359375, -0.401153564453125, -0.3848876953125, -0.368621826171875, -0.35235595703125, -0.336090087890625, -0.31982421875, -0.303558349609375, -0.28729248046875, -0.271026611328125, -0.2547607421875, -0.238494873046875, -0.22222900390625, -0.205963134765625, -0.189697265625, -0.173431396484375, -0.15716552734375, -0.140899658203125, -0.1246337890625, -0.108367919921875, -0.09210205078125, -0.075836181640625, -0.0595703125, -0.043304443359375, -0.02703857421875, -0.010772705078125, 0.0054931640625, 0.021759033203125, 0.03802490234375, 0.054290771484375, 0.070556640625, 0.086822509765625, 0.10308837890625, 0.119354248046875, 0.1356201171875, 0.151885986328125, 0.16815185546875, 0.184417724609375, 0.20068359375, 0.216949462890625, 0.23321533203125, 0.249481201171875, 0.2657470703125, 0.282012939453125, 0.29827880859375, 0.314544677734375, 0.330810546875, 0.347076416015625, 0.36334228515625, 0.379608154296875, 0.3958740234375, 0.412139892578125, 0.42840576171875, 0.444671630859375, 0.4609375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 2.0, 8.0, 5.0, 12.0, 13.0, 12.0, 21.0, 10.0, 31.0, 21.0, 24.0, 18.0, 37.0, 40.0, 48.0, 42.0, 48.0, 46.0, 54.0, 44.0, 51.0, 37.0, 47.0, 52.0, 50.0, 32.0, 32.0, 34.0, 16.0, 10.0, 15.0, 13.0, 17.0, 11.0, 6.0, 6.0, 6.0, 4.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-10.060894012451172, -9.771018028259277, -9.4811429977417, -9.191267013549805, -8.901391983032227, -8.611515998840332, -8.321640968322754, -8.03176498413086, -7.741889476776123, -7.452013969421387, -7.16213846206665, -6.872262954711914, -6.5823869705200195, -6.292511940002441, -6.002635955810547, -5.7127604484558105, -5.422884941101074, -5.133009433746338, -4.843133926391602, -4.553258419036865, -4.263382911682129, -3.9735071659088135, -3.683631420135498, -3.3937559127807617, -3.1038804054260254, -2.814004898071289, -2.5241293907165527, -2.2342536449432373, -1.944378137588501, -1.6545026302337646, -1.3646270036697388, -1.074751377105713, -0.7848758697509766, -0.49500030279159546, -0.20512473583221436, 0.08475083112716675, 0.37462639808654785, 0.6645019054412842, 0.9543775320053101, 1.244253158569336, 1.5341286659240723, 1.8240041732788086, 2.113879680633545, 2.4037554264068604, 2.6936309337615967, 2.983506441116333, 3.2733821868896484, 3.5632576942443848, 3.853133201599121, 4.143008708953857, 4.432884216308594, 4.72275972366333, 5.012635231018066, 5.302511215209961, 5.592386722564697, 5.882262229919434, 6.17213773727417, 6.462013244628906, 6.751888751983643, 7.041764259338379, 7.331640243530273, 7.621515274047852, 7.911391258239746, 8.20126724243164, 8.491142272949219]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 8.0, 14.0, 5.0, 16.0, 9.0, 13.0, 17.0, 24.0, 22.0, 26.0, 30.0, 45.0, 37.0, 38.0, 46.0, 38.0, 40.0, 50.0, 43.0, 43.0, 49.0, 35.0, 33.0, 39.0, 35.0, 34.0, 31.0, 18.0, 22.0, 19.0, 26.0, 12.0, 11.0, 13.0, 11.0, 7.0, 9.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.855771541595459, -7.594684600830078, -7.3335981369018555, -7.072511196136475, -6.811424255371094, -6.550337791442871, -6.28925085067749, -6.028163909912109, -5.767077445983887, -5.505990505218506, -5.244904041290283, -4.983817100524902, -4.72273063659668, -4.461643695831299, -4.200556755065918, -3.939470052719116, -3.6783833503723145, -3.4172966480255127, -3.156209945678711, -2.89512300491333, -2.6340363025665283, -2.3729496002197266, -2.1118626594543457, -1.850775957107544, -1.5896892547607422, -1.3286025524139404, -1.0675157308578491, -0.8064289689064026, -0.545342206954956, -0.2842555046081543, -0.02316868305206299, 0.23791813850402832, 0.4990043640136719, 0.7600911259651184, 1.021177887916565, 1.2822647094726562, 1.543351411819458, 1.8044381141662598, 2.0655250549316406, 2.3266117572784424, 2.587698459625244, 2.848785161972046, 3.1098718643188477, 3.3709588050842285, 3.6320455074310303, 3.893132209777832, 4.154219150543213, 4.415306091308594, 4.676392555236816, 4.937479496002197, 5.19856595993042, 5.459652900695801, 5.720739364624023, 5.981826305389404, 6.242913246154785, 6.503999710083008, 6.765086650848389, 7.0261735916137695, 7.287260055541992, 7.548346996307373, 7.809433937072754, 8.070520401000977, 8.3316068649292, 8.592694282531738, 8.853780746459961]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 11.0, 11.0, 22.0, 31.0, 54.0, 83.0, 137.0, 178.0, 315.0, 464.0, 862.0, 1225.0, 1957.0, 3137.0, 4978.0, 7774.0, 12057.0, 18977.0, 29103.0, 43546.0, 63881.0, 88546.0, 113429.0, 129365.0, 129841.0, 114158.0, 90403.0, 65683.0, 44813.0, 29899.0, 19306.0, 12518.0, 8036.0, 5036.0, 3167.0, 2001.0, 1315.0, 780.0, 529.0, 329.0, 242.0, 140.0, 75.0, 41.0, 36.0, 22.0, 15.0, 12.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0], "bins": [-9.7421875, -9.4559326171875, -9.169677734375, -8.8834228515625, -8.59716796875, -8.3109130859375, -8.024658203125, -7.7384033203125, -7.4521484375, -7.1658935546875, -6.879638671875, -6.5933837890625, -6.30712890625, -6.0208740234375, -5.734619140625, -5.4483642578125, -5.162109375, -4.8758544921875, -4.589599609375, -4.3033447265625, -4.01708984375, -3.7308349609375, -3.444580078125, -3.1583251953125, -2.8720703125, -2.5858154296875, -2.299560546875, -2.0133056640625, -1.72705078125, -1.4407958984375, -1.154541015625, -0.8682861328125, -0.58203125, -0.2957763671875, -0.009521484375, 0.2767333984375, 0.56298828125, 0.8492431640625, 1.135498046875, 1.4217529296875, 1.7080078125, 1.9942626953125, 2.280517578125, 2.5667724609375, 2.85302734375, 3.1392822265625, 3.425537109375, 3.7117919921875, 3.998046875, 4.2843017578125, 4.570556640625, 4.8568115234375, 5.14306640625, 5.4293212890625, 5.715576171875, 6.0018310546875, 6.2880859375, 6.5743408203125, 6.860595703125, 7.1468505859375, 7.43310546875, 7.7193603515625, 8.005615234375, 8.2918701171875, 8.578125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 5.0, 5.0, 10.0, 6.0, 15.0, 13.0, 13.0, 10.0, 12.0, 16.0, 23.0, 25.0, 13.0, 27.0, 38.0, 40.0, 30.0, 41.0, 33.0, 37.0, 41.0, 43.0, 44.0, 39.0, 37.0, 27.0, 37.0, 34.0, 25.0, 33.0, 32.0, 31.0, 28.0, 10.0, 16.0, 7.0, 16.0, 15.0, 15.0, 11.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-7.0625, -6.8468017578125, -6.631103515625, -6.4154052734375, -6.19970703125, -5.9840087890625, -5.768310546875, -5.5526123046875, -5.3369140625, -5.1212158203125, -4.905517578125, -4.6898193359375, -4.47412109375, -4.2584228515625, -4.042724609375, -3.8270263671875, -3.611328125, -3.3956298828125, -3.179931640625, -2.9642333984375, -2.74853515625, -2.5328369140625, -2.317138671875, -2.1014404296875, -1.8857421875, -1.6700439453125, -1.454345703125, -1.2386474609375, -1.02294921875, -0.8072509765625, -0.591552734375, -0.3758544921875, -0.16015625, 0.0555419921875, 0.271240234375, 0.4869384765625, 0.70263671875, 0.9183349609375, 1.134033203125, 1.3497314453125, 1.5654296875, 1.7811279296875, 1.996826171875, 2.2125244140625, 2.42822265625, 2.6439208984375, 2.859619140625, 3.0753173828125, 3.291015625, 3.5067138671875, 3.722412109375, 3.9381103515625, 4.15380859375, 4.3695068359375, 4.585205078125, 4.8009033203125, 5.0166015625, 5.2322998046875, 5.447998046875, 5.6636962890625, 5.87939453125, 6.0950927734375, 6.310791015625, 6.5264892578125, 6.7421875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 17.0, 27.0, 34.0, 53.0, 75.0, 135.0, 196.0, 294.0, 426.0, 610.0, 961.0, 1530.0, 2176.0, 3489.0, 4966.0, 7708.0, 11825.0, 17313.0, 25558.0, 36354.0, 50381.0, 68076.0, 87439.0, 104432.0, 113779.0, 112589.0, 100717.0, 82802.0, 63753.0, 46737.0, 33383.0, 23103.0, 15772.0, 10533.0, 7175.0, 4839.0, 3165.0, 2170.0, 1403.0, 858.0, 580.0, 368.0, 252.0, 182.0, 116.0, 67.0, 42.0, 37.0, 21.0, 9.0, 9.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.08203125, -6.85272216796875, -6.6234130859375, -6.39410400390625, -6.164794921875, -5.93548583984375, -5.7061767578125, -5.47686767578125, -5.24755859375, -5.01824951171875, -4.7889404296875, -4.55963134765625, -4.330322265625, -4.10101318359375, -3.8717041015625, -3.64239501953125, -3.4130859375, -3.18377685546875, -2.9544677734375, -2.72515869140625, -2.495849609375, -2.26654052734375, -2.0372314453125, -1.80792236328125, -1.57861328125, -1.34930419921875, -1.1199951171875, -0.89068603515625, -0.661376953125, -0.43206787109375, -0.2027587890625, 0.02655029296875, 0.255859375, 0.48516845703125, 0.7144775390625, 0.94378662109375, 1.173095703125, 1.40240478515625, 1.6317138671875, 1.86102294921875, 2.09033203125, 2.31964111328125, 2.5489501953125, 2.77825927734375, 3.007568359375, 3.23687744140625, 3.4661865234375, 3.69549560546875, 3.9248046875, 4.15411376953125, 4.3834228515625, 4.61273193359375, 4.842041015625, 5.07135009765625, 5.3006591796875, 5.52996826171875, 5.75927734375, 5.98858642578125, 6.2178955078125, 6.44720458984375, 6.676513671875, 6.90582275390625, 7.1351318359375, 7.36444091796875, 7.59375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 9.0, 9.0, 4.0, 11.0, 19.0, 8.0, 11.0, 25.0, 26.0, 30.0, 33.0, 29.0, 42.0, 28.0, 39.0, 38.0, 32.0, 36.0, 38.0, 43.0, 53.0, 47.0, 38.0, 52.0, 37.0, 40.0, 28.0, 23.0, 23.0, 22.0, 21.0, 18.0, 17.0, 17.0, 12.0, 17.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.68511962890625, -4.5225830078125, -4.36004638671875, -4.197509765625, -4.03497314453125, -3.8724365234375, -3.70989990234375, -3.54736328125, -3.38482666015625, -3.2222900390625, -3.05975341796875, -2.897216796875, -2.73468017578125, -2.5721435546875, -2.40960693359375, -2.2470703125, -2.08453369140625, -1.9219970703125, -1.75946044921875, -1.596923828125, -1.43438720703125, -1.2718505859375, -1.10931396484375, -0.94677734375, -0.78424072265625, -0.6217041015625, -0.45916748046875, -0.296630859375, -0.13409423828125, 0.0284423828125, 0.19097900390625, 0.353515625, 0.51605224609375, 0.6785888671875, 0.84112548828125, 1.003662109375, 1.16619873046875, 1.3287353515625, 1.49127197265625, 1.65380859375, 1.81634521484375, 1.9788818359375, 2.14141845703125, 2.303955078125, 2.46649169921875, 2.6290283203125, 2.79156494140625, 2.9541015625, 3.11663818359375, 3.2791748046875, 3.44171142578125, 3.604248046875, 3.76678466796875, 3.9293212890625, 4.09185791015625, 4.25439453125, 4.41693115234375, 4.5794677734375, 4.74200439453125, 4.904541015625, 5.06707763671875, 5.2296142578125, 5.39215087890625, 5.5546875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 16.0, 18.0, 25.0, 38.0, 62.0, 68.0, 122.0, 173.0, 294.0, 509.0, 783.0, 1303.0, 2260.0, 3947.0, 7121.0, 13454.0, 26432.0, 54661.0, 124783.0, 268067.0, 283316.0, 139514.0, 60150.0, 28810.0, 14613.0, 7825.0, 4260.0, 2395.0, 1325.0, 852.0, 503.0, 296.0, 190.0, 134.0, 78.0, 51.0, 34.0, 26.0, 21.0, 9.0, 7.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.807373046875, -11.42724609375, -11.047119140625, -10.6669921875, -10.286865234375, -9.90673828125, -9.526611328125, -9.146484375, -8.766357421875, -8.38623046875, -8.006103515625, -7.6259765625, -7.245849609375, -6.86572265625, -6.485595703125, -6.10546875, -5.725341796875, -5.34521484375, -4.965087890625, -4.5849609375, -4.204833984375, -3.82470703125, -3.444580078125, -3.064453125, -2.684326171875, -2.30419921875, -1.924072265625, -1.5439453125, -1.163818359375, -0.78369140625, -0.403564453125, -0.0234375, 0.356689453125, 0.73681640625, 1.116943359375, 1.4970703125, 1.877197265625, 2.25732421875, 2.637451171875, 3.017578125, 3.397705078125, 3.77783203125, 4.157958984375, 4.5380859375, 4.918212890625, 5.29833984375, 5.678466796875, 6.05859375, 6.438720703125, 6.81884765625, 7.198974609375, 7.5791015625, 7.959228515625, 8.33935546875, 8.719482421875, 9.099609375, 9.479736328125, 9.85986328125, 10.239990234375, 10.6201171875, 11.000244140625, 11.38037109375, 11.760498046875, 12.140625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 1.0, 1.0, 9.0, 10.0, 13.0, 14.0, 14.0, 20.0, 22.0, 17.0, 26.0, 35.0, 48.0, 53.0, 65.0, 71.0, 79.0, 78.0, 75.0, 60.0, 51.0, 43.0, 42.0, 32.0, 24.0, 18.0, 12.0, 7.0, 10.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008878707885742188, -0.0008592531085014343, -0.0008306354284286499, -0.0008020177483558655, -0.0007734000682830811, -0.0007447823882102966, -0.0007161647081375122, -0.0006875470280647278, -0.0006589293479919434, -0.0006303116679191589, -0.0006016939878463745, -0.0005730763077735901, -0.0005444586277008057, -0.0005158409476280212, -0.0004872232675552368, -0.0004586055874824524, -0.00042998790740966797, -0.00040137022733688354, -0.0003727525472640991, -0.0003441348671913147, -0.0003155171871185303, -0.00028689950704574585, -0.0002582818269729614, -0.000229664146900177, -0.00020104646682739258, -0.00017242878675460815, -0.00014381110668182373, -0.0001151934266090393, -8.657574653625488e-05, -5.795806646347046e-05, -2.9340386390686035e-05, -7.227063179016113e-07, 2.7894973754882812e-05, 5.6512653827667236e-05, 8.513033390045166e-05, 0.00011374801397323608, 0.0001423656940460205, 0.00017098337411880493, 0.00019960105419158936, 0.00022821873426437378, 0.0002568364143371582, 0.0002854540944099426, 0.00031407177448272705, 0.0003426894545555115, 0.0003713071346282959, 0.0003999248147010803, 0.00042854249477386475, 0.00045716017484664917, 0.0004857778549194336, 0.000514395534992218, 0.0005430132150650024, 0.0005716308951377869, 0.0006002485752105713, 0.0006288662552833557, 0.0006574839353561401, 0.0006861016154289246, 0.000714719295501709, 0.0007433369755744934, 0.0007719546556472778, 0.0008005723357200623, 0.0008291900157928467, 0.0008578076958656311, 0.0008864253759384155, 0.0009150430560112, 0.0009436607360839844]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 5.0, 3.0, 5.0, 1.0, 10.0, 11.0, 21.0, 32.0, 40.0, 52.0, 75.0, 115.0, 192.0, 240.0, 379.0, 554.0, 797.0, 1303.0, 2050.0, 3091.0, 4856.0, 7722.0, 12611.0, 20275.0, 33985.0, 57398.0, 96471.0, 152021.0, 190058.0, 171335.0, 116294.0, 70379.0, 41409.0, 24411.0, 14709.0, 9266.0, 5786.0, 3638.0, 2368.0, 1565.0, 945.0, 656.0, 463.0, 325.0, 191.0, 139.0, 105.0, 63.0, 45.0, 28.0, 23.0, 15.0, 9.0, 16.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.55859375, -6.35162353515625, -6.1446533203125, -5.93768310546875, -5.730712890625, -5.52374267578125, -5.3167724609375, -5.10980224609375, -4.90283203125, -4.69586181640625, -4.4888916015625, -4.28192138671875, -4.074951171875, -3.86798095703125, -3.6610107421875, -3.45404052734375, -3.2470703125, -3.04010009765625, -2.8331298828125, -2.62615966796875, -2.419189453125, -2.21221923828125, -2.0052490234375, -1.79827880859375, -1.59130859375, -1.38433837890625, -1.1773681640625, -0.97039794921875, -0.763427734375, -0.55645751953125, -0.3494873046875, -0.14251708984375, 0.064453125, 0.27142333984375, 0.4783935546875, 0.68536376953125, 0.892333984375, 1.09930419921875, 1.3062744140625, 1.51324462890625, 1.72021484375, 1.92718505859375, 2.1341552734375, 2.34112548828125, 2.548095703125, 2.75506591796875, 2.9620361328125, 3.16900634765625, 3.3759765625, 3.58294677734375, 3.7899169921875, 3.99688720703125, 4.203857421875, 4.41082763671875, 4.6177978515625, 4.82476806640625, 5.03173828125, 5.23870849609375, 5.4456787109375, 5.65264892578125, 5.859619140625, 6.06658935546875, 6.2735595703125, 6.48052978515625, 6.6875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 8.0, 8.0, 8.0, 9.0, 18.0, 30.0, 29.0, 35.0, 55.0, 50.0, 97.0, 94.0, 89.0, 78.0, 92.0, 55.0, 56.0, 49.0, 23.0, 30.0, 18.0, 11.0, 18.0, 7.0, 3.0, 7.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6953125, -3.585357666015625, -3.47540283203125, -3.365447998046875, -3.2554931640625, -3.145538330078125, -3.03558349609375, -2.925628662109375, -2.815673828125, -2.705718994140625, -2.59576416015625, -2.485809326171875, -2.3758544921875, -2.265899658203125, -2.15594482421875, -2.045989990234375, -1.93603515625, -1.826080322265625, -1.71612548828125, -1.606170654296875, -1.4962158203125, -1.386260986328125, -1.27630615234375, -1.166351318359375, -1.056396484375, -0.946441650390625, -0.83648681640625, -0.726531982421875, -0.6165771484375, -0.506622314453125, -0.39666748046875, -0.286712646484375, -0.1767578125, -0.066802978515625, 0.04315185546875, 0.153106689453125, 0.2630615234375, 0.373016357421875, 0.48297119140625, 0.592926025390625, 0.702880859375, 0.812835693359375, 0.92279052734375, 1.032745361328125, 1.1427001953125, 1.252655029296875, 1.36260986328125, 1.472564697265625, 1.58251953125, 1.692474365234375, 1.80242919921875, 1.912384033203125, 2.0223388671875, 2.132293701171875, 2.24224853515625, 2.352203369140625, 2.462158203125, 2.572113037109375, 2.68206787109375, 2.792022705078125, 2.9019775390625, 3.011932373046875, 3.12188720703125, 3.231842041015625, 3.341796875]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 9.0, 11.0, 13.0, 12.0, 16.0, 23.0, 25.0, 25.0, 33.0, 35.0, 37.0, 47.0, 39.0, 44.0, 50.0, 63.0, 57.0, 58.0, 55.0, 37.0, 37.0, 31.0, 39.0, 37.0, 29.0, 19.0, 17.0, 21.0, 13.0, 14.0, 6.0, 5.0, 7.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 2.0], "bins": [-10.720756530761719, -10.420270919799805, -10.119786262512207, -9.819300651550293, -9.518815994262695, -9.218330383300781, -8.917844772338867, -8.617359161376953, -8.316874504089355, -8.016388893127441, -7.715904235839844, -7.41541862487793, -7.114933490753174, -6.814448356628418, -6.513962745666504, -6.213477611541748, -5.912992477416992, -5.612507343292236, -5.3120222091674805, -5.011536598205566, -4.7110514640808105, -4.410566329956055, -4.110080718994141, -3.8095955848693848, -3.509110450744629, -3.208625316619873, -2.908139944076538, -2.607654571533203, -2.3071694374084473, -2.0066843032836914, -1.7061989307403564, -1.4057135581970215, -1.105229377746582, -0.8047441244125366, -0.5042588710784912, -0.2037736177444458, 0.09671163558959961, 0.397196888923645, 0.6976821422576904, 0.9981675148010254, 1.2986526489257812, 1.5991379022598267, 1.899623155593872, 2.200108528137207, 2.500593662261963, 2.8010787963867188, 3.1015641689300537, 3.4020495414733887, 3.7025346755981445, 4.0030198097229, 4.303504943847656, 4.60399055480957, 4.904475688934326, 5.204960823059082, 5.505446434020996, 5.805931568145752, 6.106416702270508, 6.406901836395264, 6.7073869705200195, 7.007872581481934, 7.3083577156066895, 7.608842849731445, 7.909328460693359, 8.209814071655273, 8.510298728942871]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 7.0, 7.0, 11.0, 12.0, 9.0, 12.0, 11.0, 15.0, 13.0, 16.0, 15.0, 21.0, 24.0, 25.0, 36.0, 38.0, 29.0, 48.0, 34.0, 41.0, 42.0, 28.0, 35.0, 52.0, 39.0, 26.0, 33.0, 33.0, 36.0, 26.0, 26.0, 25.0, 27.0, 18.0, 12.0, 23.0, 10.0, 16.0, 16.0, 10.0, 7.0, 10.0, 5.0, 7.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0], "bins": [-7.543928146362305, -7.321154594421387, -7.098381042480469, -6.875607490539551, -6.652833938598633, -6.430060386657715, -6.207286834716797, -5.984513759613037, -5.761740207672119, -5.538966655731201, -5.316193103790283, -5.093419551849365, -4.870645999908447, -4.6478729248046875, -4.4250993728637695, -4.202325820922852, -3.9795520305633545, -3.7567784786224365, -3.5340049266815186, -3.3112316131591797, -3.0884580612182617, -2.8656845092773438, -2.642910957336426, -2.420137405395508, -2.19736385345459, -1.9745903015136719, -1.7518168687820435, -1.5290433168411255, -1.306269884109497, -1.083496332168579, -0.8607227802276611, -0.6379493474960327, -0.4151759147644043, -0.1924024075269699, 0.030371099710464478, 0.25314462184906006, 0.47591811418533325, 0.6986916065216064, 0.9214651584625244, 1.1442385911941528, 1.3670121431350708, 1.5897856950759888, 1.8125591278076172, 2.035332679748535, 2.258106231689453, 2.480879783630371, 2.703653335571289, 2.926426649093628, 3.149200201034546, 3.371973752975464, 3.594747304916382, 3.8175206184387207, 4.040294170379639, 4.263067722320557, 4.485841274261475, 4.708614826202393, 4.9313883781433105, 5.1541619300842285, 5.3769354820251465, 5.5997090339660645, 5.822482585906982, 6.045255661010742, 6.26802921295166, 6.490802764892578, 6.713576316833496]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 9.0, 17.0, 31.0, 32.0, 56.0, 78.0, 109.0, 168.0, 303.0, 417.0, 651.0, 1078.0, 1719.0, 2944.0, 4770.0, 8296.0, 14328.0, 25254.0, 45626.0, 86464.0, 166599.0, 331000.0, 614813.0, 894592.0, 850681.0, 545320.0, 283812.0, 144057.0, 75290.0, 40789.0, 22880.0, 12857.0, 7482.0, 4476.0, 2689.0, 1700.0, 1025.0, 644.0, 400.0, 266.0, 204.0, 113.0, 93.0, 50.0, 27.0, 27.0, 23.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.3515625, -7.11358642578125, -6.8756103515625, -6.63763427734375, -6.399658203125, -6.16168212890625, -5.9237060546875, -5.68572998046875, -5.44775390625, -5.20977783203125, -4.9718017578125, -4.73382568359375, -4.495849609375, -4.25787353515625, -4.0198974609375, -3.78192138671875, -3.5439453125, -3.30596923828125, -3.0679931640625, -2.83001708984375, -2.592041015625, -2.35406494140625, -2.1160888671875, -1.87811279296875, -1.64013671875, -1.40216064453125, -1.1641845703125, -0.92620849609375, -0.688232421875, -0.45025634765625, -0.2122802734375, 0.02569580078125, 0.263671875, 0.50164794921875, 0.7396240234375, 0.97760009765625, 1.215576171875, 1.45355224609375, 1.6915283203125, 1.92950439453125, 2.16748046875, 2.40545654296875, 2.6434326171875, 2.88140869140625, 3.119384765625, 3.35736083984375, 3.5953369140625, 3.83331298828125, 4.0712890625, 4.30926513671875, 4.5472412109375, 4.78521728515625, 5.023193359375, 5.26116943359375, 5.4991455078125, 5.73712158203125, 5.97509765625, 6.21307373046875, 6.4510498046875, 6.68902587890625, 6.927001953125, 7.16497802734375, 7.4029541015625, 7.64093017578125, 7.87890625]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 10.0, 5.0, 11.0, 15.0, 15.0, 8.0, 18.0, 14.0, 25.0, 19.0, 27.0, 23.0, 24.0, 41.0, 52.0, 33.0, 36.0, 53.0, 42.0, 48.0, 46.0, 33.0, 29.0, 34.0, 33.0, 36.0, 27.0, 22.0, 32.0, 24.0, 22.0, 20.0, 20.0, 17.0, 17.0, 15.0, 6.0, 9.0, 6.0, 5.0, 3.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.4296875, -5.2633056640625, -5.096923828125, -4.9305419921875, -4.76416015625, -4.5977783203125, -4.431396484375, -4.2650146484375, -4.0986328125, -3.9322509765625, -3.765869140625, -3.5994873046875, -3.43310546875, -3.2667236328125, -3.100341796875, -2.9339599609375, -2.767578125, -2.6011962890625, -2.434814453125, -2.2684326171875, -2.10205078125, -1.9356689453125, -1.769287109375, -1.6029052734375, -1.4365234375, -1.2701416015625, -1.103759765625, -0.9373779296875, -0.77099609375, -0.6046142578125, -0.438232421875, -0.2718505859375, -0.10546875, 0.0609130859375, 0.227294921875, 0.3936767578125, 0.56005859375, 0.7264404296875, 0.892822265625, 1.0592041015625, 1.2255859375, 1.3919677734375, 1.558349609375, 1.7247314453125, 1.89111328125, 2.0574951171875, 2.223876953125, 2.3902587890625, 2.556640625, 2.7230224609375, 2.889404296875, 3.0557861328125, 3.22216796875, 3.3885498046875, 3.554931640625, 3.7213134765625, 3.8876953125, 4.0540771484375, 4.220458984375, 4.3868408203125, 4.55322265625, 4.7196044921875, 4.885986328125, 5.0523681640625, 5.21875]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 8.0, 9.0, 12.0, 11.0, 31.0, 54.0, 78.0, 118.0, 204.0, 321.0, 506.0, 877.0, 1415.0, 2497.0, 4007.0, 6859.0, 12094.0, 21487.0, 38404.0, 70958.0, 132556.0, 245837.0, 447001.0, 730841.0, 887211.0, 687002.0, 410612.0, 225317.0, 121236.0, 65149.0, 35214.0, 19747.0, 11207.0, 6421.0, 3602.0, 2090.0, 1287.0, 805.0, 461.0, 277.0, 171.0, 98.0, 60.0, 50.0, 33.0, 21.0, 9.0, 5.0, 4.0, 5.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0], "bins": [-8.171875, -7.91986083984375, -7.6678466796875, -7.41583251953125, -7.163818359375, -6.91180419921875, -6.6597900390625, -6.40777587890625, -6.15576171875, -5.90374755859375, -5.6517333984375, -5.39971923828125, -5.147705078125, -4.89569091796875, -4.6436767578125, -4.39166259765625, -4.1396484375, -3.88763427734375, -3.6356201171875, -3.38360595703125, -3.131591796875, -2.87957763671875, -2.6275634765625, -2.37554931640625, -2.12353515625, -1.87152099609375, -1.6195068359375, -1.36749267578125, -1.115478515625, -0.86346435546875, -0.6114501953125, -0.35943603515625, -0.107421875, 0.14459228515625, 0.3966064453125, 0.64862060546875, 0.900634765625, 1.15264892578125, 1.4046630859375, 1.65667724609375, 1.90869140625, 2.16070556640625, 2.4127197265625, 2.66473388671875, 2.916748046875, 3.16876220703125, 3.4207763671875, 3.67279052734375, 3.9248046875, 4.17681884765625, 4.4288330078125, 4.68084716796875, 4.932861328125, 5.18487548828125, 5.4368896484375, 5.68890380859375, 5.94091796875, 6.19293212890625, 6.4449462890625, 6.69696044921875, 6.948974609375, 7.20098876953125, 7.4530029296875, 7.70501708984375, 7.95703125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 19.0, 23.0, 24.0, 39.0, 50.0, 42.0, 68.0, 81.0, 105.0, 128.0, 133.0, 173.0, 183.0, 204.0, 222.0, 251.0, 240.0, 261.0, 246.0, 210.0, 229.0, 195.0, 197.0, 153.0, 123.0, 94.0, 91.0, 63.0, 33.0, 43.0, 29.0, 27.0, 12.0, 18.0, 7.0, 11.0, 7.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.44921875, -2.365692138671875, -2.28216552734375, -2.198638916015625, -2.1151123046875, -2.031585693359375, -1.94805908203125, -1.864532470703125, -1.781005859375, -1.697479248046875, -1.61395263671875, -1.530426025390625, -1.4468994140625, -1.363372802734375, -1.27984619140625, -1.196319580078125, -1.11279296875, -1.029266357421875, -0.94573974609375, -0.862213134765625, -0.7786865234375, -0.695159912109375, -0.61163330078125, -0.528106689453125, -0.444580078125, -0.361053466796875, -0.27752685546875, -0.194000244140625, -0.1104736328125, -0.026947021484375, 0.05657958984375, 0.140106201171875, 0.2236328125, 0.307159423828125, 0.39068603515625, 0.474212646484375, 0.5577392578125, 0.641265869140625, 0.72479248046875, 0.808319091796875, 0.891845703125, 0.975372314453125, 1.05889892578125, 1.142425537109375, 1.2259521484375, 1.309478759765625, 1.39300537109375, 1.476531982421875, 1.56005859375, 1.643585205078125, 1.72711181640625, 1.810638427734375, 1.8941650390625, 1.977691650390625, 2.06121826171875, 2.144744873046875, 2.228271484375, 2.311798095703125, 2.39532470703125, 2.478851318359375, 2.5623779296875, 2.645904541015625, 2.72943115234375, 2.812957763671875, 2.896484375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 8.0, 8.0, 6.0, 10.0, 10.0, 13.0, 26.0, 28.0, 29.0, 50.0, 30.0, 37.0, 44.0, 69.0, 54.0, 49.0, 64.0, 58.0, 48.0, 47.0, 53.0, 55.0, 32.0, 28.0, 29.0, 26.0, 3.0, 19.0, 14.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.61583137512207, -8.329607009887695, -8.04338264465332, -7.757158279418945, -7.47093391418457, -7.184709548950195, -6.898484706878662, -6.612260341644287, -6.326035976409912, -6.039811611175537, -5.753587245941162, -5.467362880706787, -5.181138038635254, -4.894913673400879, -4.608689308166504, -4.322464942932129, -4.036240577697754, -3.750016212463379, -3.463791847229004, -3.17756724357605, -2.891342878341675, -2.6051185131073, -2.3188939094543457, -2.0326695442199707, -1.7464451789855957, -1.4602208137512207, -1.1739963293075562, -0.8877719044685364, -0.6015474796295166, -0.3153231143951416, -0.02909862995147705, 0.2571258544921875, 0.5433511734008789, 0.8295755982398987, 1.1158000230789185, 1.402024507522583, 1.688248872756958, 1.974473237991333, 2.260697841644287, 2.546922206878662, 2.833146572113037, 3.119370937347412, 3.405595302581787, 3.691819906234741, 3.978044271469116, 4.26426887512207, 4.550493240356445, 4.83671760559082, 5.122941970825195, 5.40916633605957, 5.695390701293945, 5.98161506652832, 6.267839431762695, 6.55406379699707, 6.8402886390686035, 7.1265130043029785, 7.4127373695373535, 7.6989617347717285, 7.9851861000061035, 8.271410942077637, 8.557635307312012, 8.843859672546387, 9.130084037780762, 9.416308403015137, 9.702532768249512]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 10.0, 12.0, 9.0, 10.0, 13.0, 12.0, 18.0, 25.0, 17.0, 26.0, 29.0, 30.0, 30.0, 48.0, 29.0, 34.0, 37.0, 37.0, 40.0, 44.0, 24.0, 42.0, 40.0, 32.0, 35.0, 41.0, 30.0, 32.0, 21.0, 23.0, 21.0, 22.0, 17.0, 11.0, 15.0, 13.0, 13.0, 10.0, 9.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.515998840332031, -5.333995819091797, -5.151993274688721, -4.969990253448486, -4.78798770904541, -4.605984687805176, -4.423981666564941, -4.241978645324707, -4.059976100921631, -3.8779733180999756, -3.6959705352783203, -3.513967514038086, -3.3319647312164307, -3.1499619483947754, -2.967958927154541, -2.7859561443328857, -2.6039533615112305, -2.421950578689575, -2.23994779586792, -2.0579447746276855, -1.8759419918060303, -1.693939208984375, -1.5119363069534302, -1.3299334049224854, -1.14793062210083, -0.96592777967453, -0.78392493724823, -0.6019220948219299, -0.4199192523956299, -0.23791640996932983, -0.055913567543029785, 0.12608933448791504, 0.3080916404724121, 0.49009448289871216, 0.6720973253250122, 0.8541001677513123, 1.0361030101776123, 1.2181057929992676, 1.4001086950302124, 1.5821115970611572, 1.7641143798828125, 1.9461171627044678, 2.128119945526123, 2.3101229667663574, 2.4921257495880127, 2.674128532409668, 2.8561315536499023, 3.0381343364715576, 3.220137119293213, 3.402139902114868, 3.5841426849365234, 3.766145706176758, 3.948148488998413, 4.130151271820068, 4.312154293060303, 4.494156837463379, 4.676159858703613, 4.858162879943848, 5.040165424346924, 5.222168445587158, 5.404170989990234, 5.586174011230469, 5.768177032470703, 5.9501800537109375, 6.132182598114014]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 5.0, 9.0, 11.0, 18.0, 25.0, 42.0, 50.0, 69.0, 101.0, 146.0, 222.0, 308.0, 482.0, 682.0, 978.0, 1488.0, 2288.0, 3346.0, 5112.0, 7630.0, 11771.0, 17443.0, 27202.0, 41491.0, 63116.0, 90782.0, 124535.0, 148296.0, 143223.0, 114674.0, 81227.0, 55246.0, 36433.0, 24295.0, 15561.0, 10003.0, 6655.0, 4499.0, 2857.0, 2060.0, 1370.0, 922.0, 576.0, 414.0, 280.0, 203.0, 115.0, 95.0, 67.0, 47.0, 35.0, 23.0, 22.0, 6.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.3515625, -2.27532958984375, -2.1990966796875, -2.12286376953125, -2.046630859375, -1.97039794921875, -1.8941650390625, -1.81793212890625, -1.74169921875, -1.66546630859375, -1.5892333984375, -1.51300048828125, -1.436767578125, -1.36053466796875, -1.2843017578125, -1.20806884765625, -1.1318359375, -1.05560302734375, -0.9793701171875, -0.90313720703125, -0.826904296875, -0.75067138671875, -0.6744384765625, -0.59820556640625, -0.52197265625, -0.44573974609375, -0.3695068359375, -0.29327392578125, -0.217041015625, -0.14080810546875, -0.0645751953125, 0.01165771484375, 0.087890625, 0.16412353515625, 0.2403564453125, 0.31658935546875, 0.392822265625, 0.46905517578125, 0.5452880859375, 0.62152099609375, 0.69775390625, 0.77398681640625, 0.8502197265625, 0.92645263671875, 1.002685546875, 1.07891845703125, 1.1551513671875, 1.23138427734375, 1.3076171875, 1.38385009765625, 1.4600830078125, 1.53631591796875, 1.612548828125, 1.68878173828125, 1.7650146484375, 1.84124755859375, 1.91748046875, 1.99371337890625, 2.0699462890625, 2.14617919921875, 2.222412109375, 2.29864501953125, 2.3748779296875, 2.45111083984375, 2.52734375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 3.0, 3.0, 3.0, 8.0, 9.0, 7.0, 8.0, 14.0, 14.0, 19.0, 18.0, 14.0, 25.0, 18.0, 38.0, 30.0, 41.0, 39.0, 40.0, 46.0, 37.0, 40.0, 39.0, 33.0, 42.0, 35.0, 39.0, 41.0, 36.0, 24.0, 25.0, 29.0, 27.0, 15.0, 17.0, 21.0, 10.0, 22.0, 9.0, 17.0, 8.0, 10.0, 6.0, 5.0, 10.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.1484375, -5.950439453125, -5.75244140625, -5.554443359375, -5.3564453125, -5.158447265625, -4.96044921875, -4.762451171875, -4.564453125, -4.366455078125, -4.16845703125, -3.970458984375, -3.7724609375, -3.574462890625, -3.37646484375, -3.178466796875, -2.98046875, -2.782470703125, -2.58447265625, -2.386474609375, -2.1884765625, -1.990478515625, -1.79248046875, -1.594482421875, -1.396484375, -1.198486328125, -1.00048828125, -0.802490234375, -0.6044921875, -0.406494140625, -0.20849609375, -0.010498046875, 0.1875, 0.385498046875, 0.58349609375, 0.781494140625, 0.9794921875, 1.177490234375, 1.37548828125, 1.573486328125, 1.771484375, 1.969482421875, 2.16748046875, 2.365478515625, 2.5634765625, 2.761474609375, 2.95947265625, 3.157470703125, 3.35546875, 3.553466796875, 3.75146484375, 3.949462890625, 4.1474609375, 4.345458984375, 4.54345703125, 4.741455078125, 4.939453125, 5.137451171875, 5.33544921875, 5.533447265625, 5.7314453125, 5.929443359375, 6.12744140625, 6.325439453125, 6.5234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 20.0, 24.0, 35.0, 62.0, 87.0, 123.0, 218.0, 324.0, 526.0, 832.0, 1275.0, 2083.0, 3514.0, 6024.0, 10588.0, 20403.0, 56507.0, 858412.0, 44531.0, 18681.0, 9906.0, 5435.0, 3466.0, 1990.0, 1286.0, 736.0, 505.0, 333.0, 193.0, 143.0, 94.0, 68.0, 43.0, 30.0, 15.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 3.0], "bins": [-8.859375, -8.63470458984375, -8.4100341796875, -8.18536376953125, -7.960693359375, -7.73602294921875, -7.5113525390625, -7.28668212890625, -7.06201171875, -6.83734130859375, -6.6126708984375, -6.38800048828125, -6.163330078125, -5.93865966796875, -5.7139892578125, -5.48931884765625, -5.2646484375, -5.03997802734375, -4.8153076171875, -4.59063720703125, -4.365966796875, -4.14129638671875, -3.9166259765625, -3.69195556640625, -3.46728515625, -3.24261474609375, -3.0179443359375, -2.79327392578125, -2.568603515625, -2.34393310546875, -2.1192626953125, -1.89459228515625, -1.669921875, -1.44525146484375, -1.2205810546875, -0.99591064453125, -0.771240234375, -0.54656982421875, -0.3218994140625, -0.09722900390625, 0.12744140625, 0.35211181640625, 0.5767822265625, 0.80145263671875, 1.026123046875, 1.25079345703125, 1.4754638671875, 1.70013427734375, 1.9248046875, 2.14947509765625, 2.3741455078125, 2.59881591796875, 2.823486328125, 3.04815673828125, 3.2728271484375, 3.49749755859375, 3.72216796875, 3.94683837890625, 4.1715087890625, 4.39617919921875, 4.620849609375, 4.84552001953125, 5.0701904296875, 5.29486083984375, 5.51953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 5.0, 10.0, 4.0, 11.0, 13.0, 11.0, 20.0, 18.0, 29.0, 23.0, 24.0, 30.0, 30.0, 29.0, 34.0, 30.0, 35.0, 38.0, 41.0, 41.0, 36.0, 33.0, 36.0, 50.0, 42.0, 30.0, 35.0, 44.0, 26.0, 27.0, 23.0, 18.0, 23.0, 24.0, 14.0, 17.0, 8.0, 7.0, 4.0, 14.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.69732666015625, -4.5430908203125, -4.38885498046875, -4.234619140625, -4.08038330078125, -3.9261474609375, -3.77191162109375, -3.61767578125, -3.46343994140625, -3.3092041015625, -3.15496826171875, -3.000732421875, -2.84649658203125, -2.6922607421875, -2.53802490234375, -2.3837890625, -2.22955322265625, -2.0753173828125, -1.92108154296875, -1.766845703125, -1.61260986328125, -1.4583740234375, -1.30413818359375, -1.14990234375, -0.99566650390625, -0.8414306640625, -0.68719482421875, -0.532958984375, -0.37872314453125, -0.2244873046875, -0.07025146484375, 0.083984375, 0.23822021484375, 0.3924560546875, 0.54669189453125, 0.700927734375, 0.85516357421875, 1.0093994140625, 1.16363525390625, 1.31787109375, 1.47210693359375, 1.6263427734375, 1.78057861328125, 1.934814453125, 2.08905029296875, 2.2432861328125, 2.39752197265625, 2.5517578125, 2.70599365234375, 2.8602294921875, 3.01446533203125, 3.168701171875, 3.32293701171875, 3.4771728515625, 3.63140869140625, 3.78564453125, 3.93988037109375, 4.0941162109375, 4.24835205078125, 4.402587890625, 4.55682373046875, 4.7110595703125, 4.86529541015625, 5.01953125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 9.0, 14.0, 23.0, 41.0, 57.0, 100.0, 158.0, 229.0, 413.0, 720.0, 1285.0, 2416.0, 4514.0, 9502.0, 24101.0, 615508.0, 348575.0, 22511.0, 9077.0, 4207.0, 2184.0, 1217.0, 660.0, 379.0, 196.0, 113.0, 96.0, 59.0, 39.0, 30.0, 19.0, 18.0, 15.0, 11.0, 11.0, 10.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.05078125, -4.8975830078125, -4.744384765625, -4.5911865234375, -4.43798828125, -4.2847900390625, -4.131591796875, -3.9783935546875, -3.8251953125, -3.6719970703125, -3.518798828125, -3.3656005859375, -3.21240234375, -3.0592041015625, -2.906005859375, -2.7528076171875, -2.599609375, -2.4464111328125, -2.293212890625, -2.1400146484375, -1.98681640625, -1.8336181640625, -1.680419921875, -1.5272216796875, -1.3740234375, -1.2208251953125, -1.067626953125, -0.9144287109375, -0.76123046875, -0.6080322265625, -0.454833984375, -0.3016357421875, -0.1484375, 0.0047607421875, 0.157958984375, 0.3111572265625, 0.46435546875, 0.6175537109375, 0.770751953125, 0.9239501953125, 1.0771484375, 1.2303466796875, 1.383544921875, 1.5367431640625, 1.68994140625, 1.8431396484375, 1.996337890625, 2.1495361328125, 2.302734375, 2.4559326171875, 2.609130859375, 2.7623291015625, 2.91552734375, 3.0687255859375, 3.221923828125, 3.3751220703125, 3.5283203125, 3.6815185546875, 3.834716796875, 3.9879150390625, 4.14111328125, 4.2943115234375, 4.447509765625, 4.6007080078125, 4.75390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 16.0, 10.0, 10.0, 12.0, 19.0, 21.0, 18.0, 23.0, 36.0, 41.0, 60.0, 60.0, 59.0, 67.0, 67.0, 64.0, 55.0, 40.0, 41.0, 46.0, 33.0, 35.0, 26.0, 19.0, 10.0, 18.0, 11.0, 19.0, 5.0, 9.0, 10.0, 6.0, 4.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002180337905883789, -0.00021154806017875671, -0.00020506232976913452, -0.00019857659935951233, -0.00019209086894989014, -0.00018560513854026794, -0.00017911940813064575, -0.00017263367772102356, -0.00016614794731140137, -0.00015966221690177917, -0.00015317648649215698, -0.0001466907560825348, -0.0001402050256729126, -0.0001337192952632904, -0.0001272335648536682, -0.00012074783444404602, -0.00011426210403442383, -0.00010777637362480164, -0.00010129064321517944, -9.480491280555725e-05, -8.831918239593506e-05, -8.183345198631287e-05, -7.534772157669067e-05, -6.886199116706848e-05, -6.237626075744629e-05, -5.58905303478241e-05, -4.9404799938201904e-05, -4.291906952857971e-05, -3.643333911895752e-05, -2.9947608709335327e-05, -2.3461878299713135e-05, -1.6976147890090942e-05, -1.049041748046875e-05, -4.004687070846558e-06, 2.4810433387756348e-06, 8.966773748397827e-06, 1.545250415802002e-05, 2.1938234567642212e-05, 2.8423964977264404e-05, 3.49096953868866e-05, 4.139542579650879e-05, 4.788115620613098e-05, 5.4366886615753174e-05, 6.0852617025375366e-05, 6.733834743499756e-05, 7.382407784461975e-05, 8.030980825424194e-05, 8.679553866386414e-05, 9.328126907348633e-05, 9.976699948310852e-05, 0.00010625272989273071, 0.0001127384603023529, 0.0001192241907119751, 0.0001257099211215973, 0.00013219565153121948, 0.00013868138194084167, 0.00014516711235046387, 0.00015165284276008606, 0.00015813857316970825, 0.00016462430357933044, 0.00017111003398895264, 0.00017759576439857483, 0.00018408149480819702, 0.00019056722521781921, 0.0001970529556274414]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 6.0, 14.0, 17.0, 17.0, 37.0, 43.0, 82.0, 131.0, 166.0, 272.0, 421.0, 699.0, 1196.0, 1910.0, 3174.0, 5535.0, 10072.0, 18396.0, 35723.0, 69917.0, 139327.0, 249604.0, 240833.0, 131793.0, 65405.0, 33467.0, 17510.0, 9578.0, 5307.0, 3128.0, 1801.0, 1128.0, 657.0, 396.0, 285.0, 162.0, 116.0, 78.0, 52.0, 39.0, 19.0, 13.0, 6.0, 7.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4912109375, -1.4430389404296875, -1.394866943359375, -1.3466949462890625, -1.29852294921875, -1.2503509521484375, -1.202178955078125, -1.1540069580078125, -1.1058349609375, -1.0576629638671875, -1.009490966796875, -0.9613189697265625, -0.91314697265625, -0.8649749755859375, -0.816802978515625, -0.7686309814453125, -0.720458984375, -0.6722869873046875, -0.624114990234375, -0.5759429931640625, -0.52777099609375, -0.4795989990234375, -0.431427001953125, -0.3832550048828125, -0.3350830078125, -0.2869110107421875, -0.238739013671875, -0.1905670166015625, -0.14239501953125, -0.0942230224609375, -0.046051025390625, 0.0021209716796875, 0.05029296875, 0.0984649658203125, 0.146636962890625, 0.1948089599609375, 0.24298095703125, 0.2911529541015625, 0.339324951171875, 0.3874969482421875, 0.4356689453125, 0.4838409423828125, 0.532012939453125, 0.5801849365234375, 0.62835693359375, 0.6765289306640625, 0.724700927734375, 0.7728729248046875, 0.821044921875, 0.8692169189453125, 0.917388916015625, 0.9655609130859375, 1.01373291015625, 1.0619049072265625, 1.110076904296875, 1.1582489013671875, 1.2064208984375, 1.2545928955078125, 1.302764892578125, 1.3509368896484375, 1.39910888671875, 1.4472808837890625, 1.495452880859375, 1.5436248779296875, 1.591796875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 5.0, 9.0, 11.0, 11.0, 15.0, 14.0, 25.0, 27.0, 33.0, 37.0, 47.0, 45.0, 42.0, 47.0, 54.0, 48.0, 53.0, 60.0, 49.0, 36.0, 30.0, 37.0, 46.0, 41.0, 25.0, 23.0, 15.0, 10.0, 13.0, 13.0, 16.0, 11.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.36554718017578125, -0.3531646728515625, -0.34078216552734375, -0.328399658203125, -0.31601715087890625, -0.3036346435546875, -0.29125213623046875, -0.27886962890625, -0.26648712158203125, -0.2541046142578125, -0.24172210693359375, -0.229339599609375, -0.21695709228515625, -0.2045745849609375, -0.19219207763671875, -0.1798095703125, -0.16742706298828125, -0.1550445556640625, -0.14266204833984375, -0.130279541015625, -0.11789703369140625, -0.1055145263671875, -0.09313201904296875, -0.08074951171875, -0.06836700439453125, -0.0559844970703125, -0.04360198974609375, -0.031219482421875, -0.01883697509765625, -0.0064544677734375, 0.00592803955078125, 0.018310546875, 0.03069305419921875, 0.0430755615234375, 0.05545806884765625, 0.067840576171875, 0.08022308349609375, 0.0926055908203125, 0.10498809814453125, 0.11737060546875, 0.12975311279296875, 0.1421356201171875, 0.15451812744140625, 0.166900634765625, 0.17928314208984375, 0.1916656494140625, 0.20404815673828125, 0.2164306640625, 0.22881317138671875, 0.2411956787109375, 0.25357818603515625, 0.265960693359375, 0.27834320068359375, 0.2907257080078125, 0.30310821533203125, 0.31549072265625, 0.32787322998046875, 0.3402557373046875, 0.35263824462890625, 0.365020751953125, 0.37740325927734375, 0.3897857666015625, 0.40216827392578125, 0.41455078125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 5.0, 9.0, 7.0, 15.0, 13.0, 12.0, 29.0, 33.0, 28.0, 40.0, 38.0, 53.0, 37.0, 46.0, 61.0, 72.0, 56.0, 55.0, 51.0, 48.0, 55.0, 25.0, 44.0, 30.0, 28.0, 17.0, 14.0, 14.0, 14.0, 7.0, 7.0, 9.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.376655578613281, -8.093968391418457, -7.811281204223633, -7.528594493865967, -7.245907306671143, -6.963220119476318, -6.680533409118652, -6.397846221923828, -6.115159034729004, -5.83247184753418, -5.5497846603393555, -5.2670979499816895, -4.984410762786865, -4.701723575592041, -4.419036865234375, -4.136349678039551, -3.8536624908447266, -3.5709753036499023, -3.2882883548736572, -3.005601406097412, -2.722914218902588, -2.4402270317077637, -2.1575400829315186, -1.8748530149459839, -1.5921659469604492, -1.3094788789749146, -1.0267918109893799, -0.7441047430038452, -0.46141767501831055, -0.17873060703277588, 0.10395646095275879, 0.38664352893829346, 0.6693305969238281, 0.9520176649093628, 1.2347047328948975, 1.5173918008804321, 1.8000788688659668, 2.082766056060791, 2.365453004837036, 2.6481399536132812, 2.9308271408081055, 3.2135143280029297, 3.496201276779175, 3.77888822555542, 4.061575412750244, 4.344262599945068, 4.626949310302734, 4.909636497497559, 5.192323684692383, 5.475010871887207, 5.757698059082031, 6.040384769439697, 6.3230719566345215, 6.605759143829346, 6.888445854187012, 7.171133041381836, 7.45382022857666, 7.736507415771484, 8.019194602966309, 8.301881790161133, 8.58456802368164, 8.867255210876465, 9.149942398071289, 9.432629585266113, 9.715316772460938]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 8.0, 8.0, 13.0, 5.0, 16.0, 10.0, 14.0, 16.0, 26.0, 18.0, 34.0, 26.0, 32.0, 34.0, 30.0, 30.0, 48.0, 33.0, 41.0, 34.0, 36.0, 30.0, 47.0, 36.0, 37.0, 45.0, 28.0, 24.0, 27.0, 25.0, 27.0, 20.0, 23.0, 10.0, 19.0, 13.0, 11.0, 14.0, 7.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.696194648742676, -5.513446807861328, -5.3306989669799805, -5.147950649261475, -4.965202808380127, -4.782454967498779, -4.599706649780273, -4.416958808898926, -4.234210968017578, -4.0514631271362305, -3.8687150478363037, -3.685966968536377, -3.5032191276550293, -3.3204712867736816, -3.137723207473755, -2.954975128173828, -2.7722272872924805, -2.589479446411133, -2.406731367111206, -2.2239832878112793, -2.0412354469299316, -1.8584874868392944, -1.6757395267486572, -1.49299156665802, -1.3102436065673828, -1.1274956464767456, -0.9447476863861084, -0.7619997262954712, -0.579251766204834, -0.3965038061141968, -0.21375584602355957, -0.031007885932922363, 0.15174007415771484, 0.33448803424835205, 0.5172359943389893, 0.6999839544296265, 0.8827319145202637, 1.0654798746109009, 1.248227834701538, 1.4309757947921753, 1.6137237548828125, 1.7964717149734497, 1.979219675064087, 2.1619677543640137, 2.3447155952453613, 2.527463436126709, 2.7102115154266357, 2.8929595947265625, 3.07570743560791, 3.258455276489258, 3.4412033557891846, 3.6239514350891113, 3.806699275970459, 3.9894471168518066, 4.1721954345703125, 4.35494327545166, 4.537691116333008, 4.7204389572143555, 4.903186798095703, 5.085935115814209, 5.268682956695557, 5.451430797576904, 5.63417911529541, 5.816926956176758, 5.9996747970581055]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 9.0, 12.0, 29.0, 44.0, 57.0, 95.0, 141.0, 197.0, 327.0, 534.0, 864.0, 1299.0, 2252.0, 3612.0, 6233.0, 10835.0, 19725.0, 35065.0, 62495.0, 105398.0, 158284.0, 191417.0, 169097.0, 116923.0, 70843.0, 39878.0, 22475.0, 12461.0, 7202.0, 4141.0, 2519.0, 1460.0, 950.0, 604.0, 394.0, 247.0, 166.0, 97.0, 68.0, 37.0, 20.0, 20.0, 8.0, 11.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2421875, -7.9638671875, -7.685546875, -7.4072265625, -7.12890625, -6.8505859375, -6.572265625, -6.2939453125, -6.015625, -5.7373046875, -5.458984375, -5.1806640625, -4.90234375, -4.6240234375, -4.345703125, -4.0673828125, -3.7890625, -3.5107421875, -3.232421875, -2.9541015625, -2.67578125, -2.3974609375, -2.119140625, -1.8408203125, -1.5625, -1.2841796875, -1.005859375, -0.7275390625, -0.44921875, -0.1708984375, 0.107421875, 0.3857421875, 0.6640625, 0.9423828125, 1.220703125, 1.4990234375, 1.77734375, 2.0556640625, 2.333984375, 2.6123046875, 2.890625, 3.1689453125, 3.447265625, 3.7255859375, 4.00390625, 4.2822265625, 4.560546875, 4.8388671875, 5.1171875, 5.3955078125, 5.673828125, 5.9521484375, 6.23046875, 6.5087890625, 6.787109375, 7.0654296875, 7.34375, 7.6220703125, 7.900390625, 8.1787109375, 8.45703125, 8.7353515625, 9.013671875, 9.2919921875, 9.5703125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 1.0, 4.0, 5.0, 3.0, 12.0, 7.0, 13.0, 10.0, 8.0, 15.0, 19.0, 23.0, 25.0, 17.0, 36.0, 30.0, 29.0, 40.0, 31.0, 46.0, 49.0, 38.0, 38.0, 36.0, 39.0, 25.0, 41.0, 41.0, 38.0, 37.0, 28.0, 31.0, 26.0, 29.0, 16.0, 22.0, 15.0, 15.0, 11.0, 7.0, 10.0, 4.0, 9.0, 5.0, 5.0, 3.0, 0.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.21771240234375, -5.0369873046875, -4.85626220703125, -4.675537109375, -4.49481201171875, -4.3140869140625, -4.13336181640625, -3.95263671875, -3.77191162109375, -3.5911865234375, -3.41046142578125, -3.229736328125, -3.04901123046875, -2.8682861328125, -2.68756103515625, -2.5068359375, -2.32611083984375, -2.1453857421875, -1.96466064453125, -1.783935546875, -1.60321044921875, -1.4224853515625, -1.24176025390625, -1.06103515625, -0.88031005859375, -0.6995849609375, -0.51885986328125, -0.338134765625, -0.15740966796875, 0.0233154296875, 0.20404052734375, 0.384765625, 0.56549072265625, 0.7462158203125, 0.92694091796875, 1.107666015625, 1.28839111328125, 1.4691162109375, 1.64984130859375, 1.83056640625, 2.01129150390625, 2.1920166015625, 2.37274169921875, 2.553466796875, 2.73419189453125, 2.9149169921875, 3.09564208984375, 3.2763671875, 3.45709228515625, 3.6378173828125, 3.81854248046875, 3.999267578125, 4.17999267578125, 4.3607177734375, 4.54144287109375, 4.72216796875, 4.90289306640625, 5.0836181640625, 5.26434326171875, 5.445068359375, 5.62579345703125, 5.8065185546875, 5.98724365234375, 6.16796875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [8.0, 0.0, 2.0, 6.0, 12.0, 11.0, 15.0, 18.0, 39.0, 46.0, 64.0, 101.0, 153.0, 185.0, 294.0, 420.0, 598.0, 878.0, 1310.0, 1821.0, 2803.0, 4013.0, 6337.0, 9505.0, 14818.0, 22867.0, 36199.0, 55581.0, 83225.0, 115698.0, 142173.0, 147786.0, 126237.0, 93705.0, 63336.0, 41552.0, 26814.0, 17025.0, 11082.0, 7167.0, 4661.0, 3196.0, 2079.0, 1414.0, 1046.0, 663.0, 494.0, 313.0, 242.0, 158.0, 130.0, 65.0, 56.0, 45.0, 37.0, 25.0, 15.0, 8.0, 8.0, 8.0, 3.0, 4.0, 1.0, 1.0], "bins": [-5.828125, -5.64111328125, -5.4541015625, -5.26708984375, -5.080078125, -4.89306640625, -4.7060546875, -4.51904296875, -4.33203125, -4.14501953125, -3.9580078125, -3.77099609375, -3.583984375, -3.39697265625, -3.2099609375, -3.02294921875, -2.8359375, -2.64892578125, -2.4619140625, -2.27490234375, -2.087890625, -1.90087890625, -1.7138671875, -1.52685546875, -1.33984375, -1.15283203125, -0.9658203125, -0.77880859375, -0.591796875, -0.40478515625, -0.2177734375, -0.03076171875, 0.15625, 0.34326171875, 0.5302734375, 0.71728515625, 0.904296875, 1.09130859375, 1.2783203125, 1.46533203125, 1.65234375, 1.83935546875, 2.0263671875, 2.21337890625, 2.400390625, 2.58740234375, 2.7744140625, 2.96142578125, 3.1484375, 3.33544921875, 3.5224609375, 3.70947265625, 3.896484375, 4.08349609375, 4.2705078125, 4.45751953125, 4.64453125, 4.83154296875, 5.0185546875, 5.20556640625, 5.392578125, 5.57958984375, 5.7666015625, 5.95361328125, 6.140625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 4.0, 5.0, 9.0, 9.0, 8.0, 14.0, 12.0, 20.0, 23.0, 23.0, 28.0, 27.0, 36.0, 35.0, 27.0, 40.0, 42.0, 42.0, 39.0, 39.0, 33.0, 37.0, 49.0, 46.0, 22.0, 37.0, 34.0, 38.0, 33.0, 31.0, 25.0, 25.0, 18.0, 16.0, 11.0, 11.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 6.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.765625, -4.63037109375, -4.4951171875, -4.35986328125, -4.224609375, -4.08935546875, -3.9541015625, -3.81884765625, -3.68359375, -3.54833984375, -3.4130859375, -3.27783203125, -3.142578125, -3.00732421875, -2.8720703125, -2.73681640625, -2.6015625, -2.46630859375, -2.3310546875, -2.19580078125, -2.060546875, -1.92529296875, -1.7900390625, -1.65478515625, -1.51953125, -1.38427734375, -1.2490234375, -1.11376953125, -0.978515625, -0.84326171875, -0.7080078125, -0.57275390625, -0.4375, -0.30224609375, -0.1669921875, -0.03173828125, 0.103515625, 0.23876953125, 0.3740234375, 0.50927734375, 0.64453125, 0.77978515625, 0.9150390625, 1.05029296875, 1.185546875, 1.32080078125, 1.4560546875, 1.59130859375, 1.7265625, 1.86181640625, 1.9970703125, 2.13232421875, 2.267578125, 2.40283203125, 2.5380859375, 2.67333984375, 2.80859375, 2.94384765625, 3.0791015625, 3.21435546875, 3.349609375, 3.48486328125, 3.6201171875, 3.75537109375, 3.890625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 7.0, 8.0, 15.0, 19.0, 42.0, 60.0, 55.0, 79.0, 113.0, 193.0, 310.0, 568.0, 957.0, 1871.0, 3903.0, 9381.0, 24283.0, 78425.0, 274249.0, 418800.0, 161109.0, 46024.0, 15751.0, 6096.0, 2835.0, 1412.0, 732.0, 452.0, 266.0, 162.0, 103.0, 80.0, 63.0, 39.0, 25.0, 10.0, 7.0, 10.0, 7.0, 10.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.96875, -19.38623046875, -18.8037109375, -18.22119140625, -17.638671875, -17.05615234375, -16.4736328125, -15.89111328125, -15.30859375, -14.72607421875, -14.1435546875, -13.56103515625, -12.978515625, -12.39599609375, -11.8134765625, -11.23095703125, -10.6484375, -10.06591796875, -9.4833984375, -8.90087890625, -8.318359375, -7.73583984375, -7.1533203125, -6.57080078125, -5.98828125, -5.40576171875, -4.8232421875, -4.24072265625, -3.658203125, -3.07568359375, -2.4931640625, -1.91064453125, -1.328125, -0.74560546875, -0.1630859375, 0.41943359375, 1.001953125, 1.58447265625, 2.1669921875, 2.74951171875, 3.33203125, 3.91455078125, 4.4970703125, 5.07958984375, 5.662109375, 6.24462890625, 6.8271484375, 7.40966796875, 7.9921875, 8.57470703125, 9.1572265625, 9.73974609375, 10.322265625, 10.90478515625, 11.4873046875, 12.06982421875, 12.65234375, 13.23486328125, 13.8173828125, 14.39990234375, 14.982421875, 15.56494140625, 16.1474609375, 16.72998046875, 17.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 13.0, 13.0, 6.0, 17.0, 23.0, 24.0, 51.0, 51.0, 66.0, 91.0, 108.0, 121.0, 100.0, 80.0, 55.0, 38.0, 38.0, 30.0, 19.0, 12.0, 16.0, 5.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009946823120117188, -0.0009517073631286621, -0.0009087324142456055, -0.0008657574653625488, -0.0008227825164794922, -0.0007798075675964355, -0.0007368326187133789, -0.0006938576698303223, -0.0006508827209472656, -0.000607907772064209, -0.0005649328231811523, -0.0005219578742980957, -0.00047898292541503906, -0.0004360079765319824, -0.0003930330276489258, -0.00035005807876586914, -0.0003070831298828125, -0.00026410818099975586, -0.00022113323211669922, -0.00017815828323364258, -0.00013518333435058594, -9.22083854675293e-05, -4.9233436584472656e-05, -6.258487701416016e-06, 3.6716461181640625e-05, 7.969141006469727e-05, 0.0001226663589477539, 0.00016564130783081055, 0.0002086162567138672, 0.00025159120559692383, 0.00029456615447998047, 0.0003375411033630371, 0.00038051605224609375, 0.0004234910011291504, 0.00046646595001220703, 0.0005094408988952637, 0.0005524158477783203, 0.000595390796661377, 0.0006383657455444336, 0.0006813406944274902, 0.0007243156433105469, 0.0007672905921936035, 0.0008102655410766602, 0.0008532404899597168, 0.0008962154388427734, 0.0009391903877258301, 0.0009821653366088867, 0.0010251402854919434, 0.001068115234375, 0.0011110901832580566, 0.0011540651321411133, 0.00119704008102417, 0.0012400150299072266, 0.0012829899787902832, 0.0013259649276733398, 0.0013689398765563965, 0.0014119148254394531, 0.0014548897743225098, 0.0014978647232055664, 0.001540839672088623, 0.0015838146209716797, 0.0016267895698547363, 0.001669764518737793, 0.0017127394676208496, 0.0017557144165039062]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 6.0, 11.0, 9.0, 24.0, 21.0, 38.0, 53.0, 66.0, 85.0, 120.0, 165.0, 249.0, 407.0, 666.0, 1371.0, 3293.0, 9587.0, 36036.0, 156658.0, 447038.0, 292679.0, 72490.0, 17508.0, 5412.0, 2035.0, 966.0, 526.0, 349.0, 170.0, 135.0, 102.0, 54.0, 52.0, 33.0, 34.0, 25.0, 18.0, 13.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.8125, -20.21337890625, -19.6142578125, -19.01513671875, -18.416015625, -17.81689453125, -17.2177734375, -16.61865234375, -16.01953125, -15.42041015625, -14.8212890625, -14.22216796875, -13.623046875, -13.02392578125, -12.4248046875, -11.82568359375, -11.2265625, -10.62744140625, -10.0283203125, -9.42919921875, -8.830078125, -8.23095703125, -7.6318359375, -7.03271484375, -6.43359375, -5.83447265625, -5.2353515625, -4.63623046875, -4.037109375, -3.43798828125, -2.8388671875, -2.23974609375, -1.640625, -1.04150390625, -0.4423828125, 0.15673828125, 0.755859375, 1.35498046875, 1.9541015625, 2.55322265625, 3.15234375, 3.75146484375, 4.3505859375, 4.94970703125, 5.548828125, 6.14794921875, 6.7470703125, 7.34619140625, 7.9453125, 8.54443359375, 9.1435546875, 9.74267578125, 10.341796875, 10.94091796875, 11.5400390625, 12.13916015625, 12.73828125, 13.33740234375, 13.9365234375, 14.53564453125, 15.134765625, 15.73388671875, 16.3330078125, 16.93212890625, 17.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 10.0, 17.0, 25.0, 35.0, 39.0, 71.0, 121.0, 119.0, 128.0, 113.0, 99.0, 65.0, 49.0, 32.0, 20.0, 22.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.949462890625, -4.80517578125, -4.660888671875, -4.5166015625, -4.372314453125, -4.22802734375, -4.083740234375, -3.939453125, -3.795166015625, -3.65087890625, -3.506591796875, -3.3623046875, -3.218017578125, -3.07373046875, -2.929443359375, -2.78515625, -2.640869140625, -2.49658203125, -2.352294921875, -2.2080078125, -2.063720703125, -1.91943359375, -1.775146484375, -1.630859375, -1.486572265625, -1.34228515625, -1.197998046875, -1.0537109375, -0.909423828125, -0.76513671875, -0.620849609375, -0.4765625, -0.332275390625, -0.18798828125, -0.043701171875, 0.1005859375, 0.244873046875, 0.38916015625, 0.533447265625, 0.677734375, 0.822021484375, 0.96630859375, 1.110595703125, 1.2548828125, 1.399169921875, 1.54345703125, 1.687744140625, 1.83203125, 1.976318359375, 2.12060546875, 2.264892578125, 2.4091796875, 2.553466796875, 2.69775390625, 2.842041015625, 2.986328125, 3.130615234375, 3.27490234375, 3.419189453125, 3.5634765625, 3.707763671875, 3.85205078125, 3.996337890625, 4.140625]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 11.0, 11.0, 17.0, 8.0, 14.0, 20.0, 28.0, 45.0, 48.0, 52.0, 49.0, 58.0, 71.0, 65.0, 59.0, 52.0, 50.0, 55.0, 47.0, 38.0, 31.0, 31.0, 33.0, 19.0, 23.0, 12.0, 11.0, 5.0, 3.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.411050796508789, -8.113692283630371, -7.816334247589111, -7.518975734710693, -7.221617698669434, -6.924259185791016, -6.626900672912598, -6.329542636871338, -6.032184600830078, -5.73482608795166, -5.4374680519104, -5.140109539031982, -4.842751502990723, -4.545392990112305, -4.248034477233887, -3.950676441192627, -3.653317928314209, -3.35595965385437, -3.0586013793945312, -2.7612428665161133, -2.4638848304748535, -2.1665263175964355, -1.8691680431365967, -1.5718097686767578, -1.274451494216919, -0.9770932197570801, -0.6797348856925964, -0.3823765516281128, -0.08501827716827393, 0.21233999729156494, 0.5096983909606934, 0.8070566654205322, 1.104414939880371, 1.40177321434021, 1.6991314888000488, 1.9964898824691772, 2.2938480377197266, 2.5912065505981445, 2.8885648250579834, 3.1859230995178223, 3.483281373977661, 3.7806396484375, 4.077998161315918, 4.375356197357178, 4.672714710235596, 4.9700727462768555, 5.267431259155273, 5.564789772033691, 5.862147808074951, 6.159506320953369, 6.456864356994629, 6.754222869873047, 7.051580905914307, 7.348939418792725, 7.646297454833984, 7.943655967712402, 8.24101448059082, 8.538372993469238, 8.835731506347656, 9.133089065551758, 9.430447578430176, 9.727806091308594, 10.025164604187012, 10.32252311706543, 10.619880676269531]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0, 7.0, 5.0, 2.0, 2.0, 9.0, 10.0, 6.0, 14.0, 16.0, 15.0, 18.0, 18.0, 34.0, 29.0, 17.0, 30.0, 27.0, 28.0, 27.0, 36.0, 35.0, 47.0, 38.0, 48.0, 27.0, 47.0, 36.0, 28.0, 22.0, 39.0, 32.0, 30.0, 26.0, 25.0, 28.0, 21.0, 14.0, 20.0, 13.0, 10.0, 19.0, 14.0, 5.0, 7.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.186312198638916, -6.003700256347656, -5.8210883140563965, -5.638476371765137, -5.455864429473877, -5.273252487182617, -5.090640544891357, -4.908028602600098, -4.725416660308838, -4.542804718017578, -4.360192775726318, -4.177580833435059, -3.994968891143799, -3.812356948852539, -3.6297450065612793, -3.4471330642700195, -3.2645208835601807, -3.081908941268921, -2.899296998977661, -2.7166850566864014, -2.5340731143951416, -2.351461172103882, -2.168848991394043, -1.9862371683120728, -1.803625226020813, -1.6210132837295532, -1.4384013414382935, -1.2557892799377441, -1.0731773376464844, -0.8905654549598694, -0.7079534530639648, -0.5253415107727051, -0.3427295684814453, -0.16011761128902435, 0.022494345903396606, 0.20510631799697876, 0.3877182602882385, 0.5703302025794983, 0.7529422044754028, 0.9355541467666626, 1.1181660890579224, 1.3007780313491821, 1.483389973640442, 1.6660020351409912, 1.848613977432251, 2.0312259197235107, 2.2138378620147705, 2.3964498043060303, 2.57906174659729, 2.76167368888855, 2.9442856311798096, 3.1268975734710693, 3.309509515762329, 3.492121458053589, 3.6747336387634277, 3.8573455810546875, 4.039957523345947, 4.222569465637207, 4.405181407928467, 4.587793350219727, 4.770405292510986, 4.953017234802246, 5.135629177093506, 5.318241119384766, 5.500853061676025]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 7.0, 7.0, 7.0, 10.0, 14.0, 31.0, 32.0, 68.0, 70.0, 163.0, 203.0, 274.0, 407.0, 625.0, 1017.0, 1546.0, 2396.0, 3777.0, 5652.0, 9263.0, 15120.0, 25485.0, 44816.0, 79050.0, 145080.0, 273344.0, 506066.0, 790298.0, 860680.0, 628876.0, 359274.0, 192795.0, 104658.0, 58145.0, 33571.0, 19636.0, 11622.0, 7274.0, 4510.0, 2843.0, 1927.0, 1185.0, 808.0, 556.0, 379.0, 214.0, 178.0, 109.0, 96.0, 50.0, 31.0, 19.0, 18.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.140625, -5.94390869140625, -5.7471923828125, -5.55047607421875, -5.353759765625, -5.15704345703125, -4.9603271484375, -4.76361083984375, -4.56689453125, -4.37017822265625, -4.1734619140625, -3.97674560546875, -3.780029296875, -3.58331298828125, -3.3865966796875, -3.18988037109375, -2.9931640625, -2.79644775390625, -2.5997314453125, -2.40301513671875, -2.206298828125, -2.00958251953125, -1.8128662109375, -1.61614990234375, -1.41943359375, -1.22271728515625, -1.0260009765625, -0.82928466796875, -0.632568359375, -0.43585205078125, -0.2391357421875, -0.04241943359375, 0.154296875, 0.35101318359375, 0.5477294921875, 0.74444580078125, 0.941162109375, 1.13787841796875, 1.3345947265625, 1.53131103515625, 1.72802734375, 1.92474365234375, 2.1214599609375, 2.31817626953125, 2.514892578125, 2.71160888671875, 2.9083251953125, 3.10504150390625, 3.3017578125, 3.49847412109375, 3.6951904296875, 3.89190673828125, 4.088623046875, 4.28533935546875, 4.4820556640625, 4.67877197265625, 4.87548828125, 5.07220458984375, 5.2689208984375, 5.46563720703125, 5.662353515625, 5.85906982421875, 6.0557861328125, 6.25250244140625, 6.44921875]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 6.0, 2.0, 3.0, 3.0, 9.0, 5.0, 6.0, 13.0, 5.0, 6.0, 9.0, 16.0, 25.0, 23.0, 29.0, 26.0, 23.0, 36.0, 20.0, 34.0, 19.0, 38.0, 39.0, 41.0, 27.0, 29.0, 49.0, 33.0, 48.0, 31.0, 38.0, 32.0, 32.0, 34.0, 24.0, 20.0, 29.0, 21.0, 21.0, 19.0, 17.0, 14.0, 7.0, 11.0, 6.0, 12.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.724609375, -3.599578857421875, -3.47454833984375, -3.349517822265625, -3.2244873046875, -3.099456787109375, -2.97442626953125, -2.849395751953125, -2.724365234375, -2.599334716796875, -2.47430419921875, -2.349273681640625, -2.2242431640625, -2.099212646484375, -1.97418212890625, -1.849151611328125, -1.72412109375, -1.599090576171875, -1.47406005859375, -1.349029541015625, -1.2239990234375, -1.098968505859375, -0.97393798828125, -0.848907470703125, -0.723876953125, -0.598846435546875, -0.47381591796875, -0.348785400390625, -0.2237548828125, -0.098724365234375, 0.02630615234375, 0.151336669921875, 0.2763671875, 0.401397705078125, 0.52642822265625, 0.651458740234375, 0.7764892578125, 0.901519775390625, 1.02655029296875, 1.151580810546875, 1.276611328125, 1.401641845703125, 1.52667236328125, 1.651702880859375, 1.7767333984375, 1.901763916015625, 2.02679443359375, 2.151824951171875, 2.27685546875, 2.401885986328125, 2.52691650390625, 2.651947021484375, 2.7769775390625, 2.902008056640625, 3.02703857421875, 3.152069091796875, 3.277099609375, 3.402130126953125, 3.52716064453125, 3.652191162109375, 3.7772216796875, 3.902252197265625, 4.02728271484375, 4.152313232421875, 4.27734375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 4.0, 4.0, 7.0, 15.0, 12.0, 23.0, 38.0, 58.0, 100.0, 147.0, 210.0, 293.0, 423.0, 713.0, 1105.0, 1669.0, 2598.0, 4135.0, 6563.0, 10398.0, 17365.0, 28614.0, 48184.0, 82582.0, 142720.0, 241622.0, 402969.0, 608902.0, 753030.0, 672889.0, 465473.0, 288033.0, 169470.0, 99109.0, 57487.0, 34194.0, 20221.0, 12338.0, 7460.0, 4723.0, 3009.0, 1900.0, 1213.0, 802.0, 501.0, 301.0, 225.0, 148.0, 95.0, 81.0, 36.0, 27.0, 20.0, 15.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0], "bins": [-5.67578125, -5.49652099609375, -5.3172607421875, -5.13800048828125, -4.958740234375, -4.77947998046875, -4.6002197265625, -4.42095947265625, -4.24169921875, -4.06243896484375, -3.8831787109375, -3.70391845703125, -3.524658203125, -3.34539794921875, -3.1661376953125, -2.98687744140625, -2.8076171875, -2.62835693359375, -2.4490966796875, -2.26983642578125, -2.090576171875, -1.91131591796875, -1.7320556640625, -1.55279541015625, -1.37353515625, -1.19427490234375, -1.0150146484375, -0.83575439453125, -0.656494140625, -0.47723388671875, -0.2979736328125, -0.11871337890625, 0.060546875, 0.23980712890625, 0.4190673828125, 0.59832763671875, 0.777587890625, 0.95684814453125, 1.1361083984375, 1.31536865234375, 1.49462890625, 1.67388916015625, 1.8531494140625, 2.03240966796875, 2.211669921875, 2.39093017578125, 2.5701904296875, 2.74945068359375, 2.9287109375, 3.10797119140625, 3.2872314453125, 3.46649169921875, 3.645751953125, 3.82501220703125, 4.0042724609375, 4.18353271484375, 4.36279296875, 4.54205322265625, 4.7213134765625, 4.90057373046875, 5.079833984375, 5.25909423828125, 5.4383544921875, 5.61761474609375, 5.796875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 10.0, 2.0, 12.0, 14.0, 20.0, 21.0, 25.0, 26.0, 23.0, 41.0, 55.0, 67.0, 93.0, 102.0, 132.0, 163.0, 182.0, 172.0, 211.0, 246.0, 254.0, 244.0, 258.0, 240.0, 231.0, 186.0, 164.0, 167.0, 138.0, 107.0, 90.0, 74.0, 59.0, 50.0, 36.0, 31.0, 28.0, 18.0, 16.0, 18.0, 14.0, 8.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.041015625, -1.974884033203125, -1.90875244140625, -1.842620849609375, -1.7764892578125, -1.710357666015625, -1.64422607421875, -1.578094482421875, -1.511962890625, -1.445831298828125, -1.37969970703125, -1.313568115234375, -1.2474365234375, -1.181304931640625, -1.11517333984375, -1.049041748046875, -0.98291015625, -0.916778564453125, -0.85064697265625, -0.784515380859375, -0.7183837890625, -0.652252197265625, -0.58612060546875, -0.519989013671875, -0.453857421875, -0.387725830078125, -0.32159423828125, -0.255462646484375, -0.1893310546875, -0.123199462890625, -0.05706787109375, 0.009063720703125, 0.0751953125, 0.141326904296875, 0.20745849609375, 0.273590087890625, 0.3397216796875, 0.405853271484375, 0.47198486328125, 0.538116455078125, 0.604248046875, 0.670379638671875, 0.73651123046875, 0.802642822265625, 0.8687744140625, 0.934906005859375, 1.00103759765625, 1.067169189453125, 1.13330078125, 1.199432373046875, 1.26556396484375, 1.331695556640625, 1.3978271484375, 1.463958740234375, 1.53009033203125, 1.596221923828125, 1.662353515625, 1.728485107421875, 1.79461669921875, 1.860748291015625, 1.9268798828125, 1.993011474609375, 2.05914306640625, 2.125274658203125, 2.19140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 0.0, 5.0, 7.0, 9.0, 11.0, 17.0, 14.0, 33.0, 33.0, 29.0, 38.0, 55.0, 55.0, 55.0, 81.0, 84.0, 67.0, 57.0, 57.0, 55.0, 49.0, 49.0, 25.0, 32.0, 20.0, 17.0, 14.0, 9.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.106962203979492, -7.835235118865967, -7.5635085105896, -7.291781425476074, -7.020054817199707, -6.748327732086182, -6.476600646972656, -6.204874038696289, -5.933146953582764, -5.661419868469238, -5.389693260192871, -5.117966175079346, -4.84623908996582, -4.574512481689453, -4.302785396575928, -4.031058311462402, -3.759331703186035, -3.487604856491089, -3.2158780097961426, -2.944150924682617, -2.672424077987671, -2.4006972312927246, -2.128970146179199, -1.857243299484253, -1.5855164527893066, -1.3137896060943604, -1.0420626401901245, -0.7703357338905334, -0.4986088275909424, -0.2268819808959961, 0.044844985008239746, 0.3165719509124756, 0.5882987976074219, 0.8600257039070129, 1.131752610206604, 1.4034795761108398, 1.6752064228057861, 1.9469332695007324, 2.218660354614258, 2.490387201309204, 2.7621140480041504, 3.0338408946990967, 3.305567741394043, 3.5772948265075684, 3.8490216732025146, 4.120748519897461, 4.392475605010986, 4.664202690124512, 4.935929298400879, 5.207656383514404, 5.4793829917907715, 5.751110076904297, 6.022836685180664, 6.2945637702941895, 6.566290855407715, 6.838017463684082, 7.109744548797607, 7.381471633911133, 7.6531982421875, 7.924925327301025, 8.19665241241455, 8.468379020690918, 8.740105628967285, 9.011833190917969, 9.283559799194336]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 3.0, 9.0, 12.0, 8.0, 7.0, 16.0, 18.0, 18.0, 23.0, 28.0, 26.0, 23.0, 39.0, 36.0, 40.0, 38.0, 38.0, 51.0, 45.0, 38.0, 37.0, 49.0, 41.0, 36.0, 31.0, 30.0, 35.0, 33.0, 21.0, 23.0, 21.0, 26.0, 23.0, 14.0, 14.0, 11.0, 7.0, 8.0, 11.0, 4.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.849778175354004, -5.6817708015441895, -5.513762950897217, -5.345755577087402, -5.17774772644043, -5.009740352630615, -4.841732978820801, -4.673725128173828, -4.5057172775268555, -4.337709903717041, -4.169702053070068, -4.001694679260254, -3.8336868286132812, -3.665679454803467, -3.4976718425750732, -3.3296642303466797, -3.1616568565368652, -2.9936492443084717, -2.825641632080078, -2.6576342582702637, -2.489626407623291, -2.3216190338134766, -2.153611421585083, -1.9856038093566895, -1.817596197128296, -1.6495885848999023, -1.4815809726715088, -1.3135734796524048, -1.1455658674240112, -0.9775582551956177, -0.8095507621765137, -0.6415431499481201, -0.47353506088256836, -0.3055274784564972, -0.13751989603042603, 0.030487656593322754, 0.1984952688217163, 0.36650288105010986, 0.5345103740692139, 0.7025179862976074, 0.870525598526001, 1.0385332107543945, 1.206540822982788, 1.374548316001892, 1.5425559282302856, 1.7105635404586792, 1.8785710334777832, 2.0465786457061768, 2.2145862579345703, 2.382593870162964, 2.5506014823913574, 2.718608856201172, 2.8866167068481445, 3.054624080657959, 3.2226316928863525, 3.390639305114746, 3.5586469173431396, 3.726654529571533, 3.8946621417999268, 4.06266975402832, 4.230677127838135, 4.398684978485107, 4.566692352294922, 4.7347002029418945, 4.902707576751709]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 3.0, 8.0, 9.0, 23.0, 19.0, 30.0, 56.0, 79.0, 121.0, 199.0, 284.0, 429.0, 619.0, 937.0, 1306.0, 2049.0, 3371.0, 5073.0, 7916.0, 12267.0, 19274.0, 30350.0, 47941.0, 75047.0, 111741.0, 151599.0, 165040.0, 138344.0, 97719.0, 63699.0, 40961.0, 25758.0, 16423.0, 10638.0, 6805.0, 4282.0, 2793.0, 1798.0, 1191.0, 814.0, 513.0, 330.0, 231.0, 156.0, 94.0, 69.0, 57.0, 34.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.5595703125, -1.5081329345703125, -1.456695556640625, -1.4052581787109375, -1.35382080078125, -1.3023834228515625, -1.250946044921875, -1.1995086669921875, -1.1480712890625, -1.0966339111328125, -1.045196533203125, -0.9937591552734375, -0.94232177734375, -0.8908843994140625, -0.839447021484375, -0.7880096435546875, -0.736572265625, -0.6851348876953125, -0.633697509765625, -0.5822601318359375, -0.53082275390625, -0.4793853759765625, -0.427947998046875, -0.3765106201171875, -0.3250732421875, -0.2736358642578125, -0.222198486328125, -0.1707611083984375, -0.11932373046875, -0.0678863525390625, -0.016448974609375, 0.0349884033203125, 0.08642578125, 0.1378631591796875, 0.189300537109375, 0.2407379150390625, 0.29217529296875, 0.3436126708984375, 0.395050048828125, 0.4464874267578125, 0.4979248046875, 0.5493621826171875, 0.600799560546875, 0.6522369384765625, 0.70367431640625, 0.7551116943359375, 0.806549072265625, 0.8579864501953125, 0.909423828125, 0.9608612060546875, 1.012298583984375, 1.0637359619140625, 1.11517333984375, 1.1666107177734375, 1.218048095703125, 1.2694854736328125, 1.3209228515625, 1.3723602294921875, 1.423797607421875, 1.4752349853515625, 1.52667236328125, 1.5781097412109375, 1.629547119140625, 1.6809844970703125, 1.732421875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 7.0, 5.0, 13.0, 12.0, 17.0, 26.0, 21.0, 27.0, 30.0, 35.0, 43.0, 31.0, 39.0, 31.0, 53.0, 50.0, 34.0, 40.0, 50.0, 40.0, 47.0, 40.0, 42.0, 24.0, 31.0, 31.0, 22.0, 21.0, 22.0, 16.0, 17.0, 25.0, 7.0, 8.0, 11.0, 12.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.2890625, -6.106201171875, -5.92333984375, -5.740478515625, -5.5576171875, -5.374755859375, -5.19189453125, -5.009033203125, -4.826171875, -4.643310546875, -4.46044921875, -4.277587890625, -4.0947265625, -3.911865234375, -3.72900390625, -3.546142578125, -3.36328125, -3.180419921875, -2.99755859375, -2.814697265625, -2.6318359375, -2.448974609375, -2.26611328125, -2.083251953125, -1.900390625, -1.717529296875, -1.53466796875, -1.351806640625, -1.1689453125, -0.986083984375, -0.80322265625, -0.620361328125, -0.4375, -0.254638671875, -0.07177734375, 0.111083984375, 0.2939453125, 0.476806640625, 0.65966796875, 0.842529296875, 1.025390625, 1.208251953125, 1.39111328125, 1.573974609375, 1.7568359375, 1.939697265625, 2.12255859375, 2.305419921875, 2.48828125, 2.671142578125, 2.85400390625, 3.036865234375, 3.2197265625, 3.402587890625, 3.58544921875, 3.768310546875, 3.951171875, 4.134033203125, 4.31689453125, 4.499755859375, 4.6826171875, 4.865478515625, 5.04833984375, 5.231201171875, 5.4140625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 9.0, 14.0, 18.0, 20.0, 30.0, 34.0, 56.0, 90.0, 111.0, 153.0, 202.0, 316.0, 453.0, 606.0, 916.0, 1330.0, 1950.0, 2878.0, 4533.0, 7138.0, 11989.0, 22749.0, 81009.0, 824131.0, 42079.0, 18066.0, 9979.0, 5996.0, 3784.0, 2440.0, 1703.0, 1193.0, 815.0, 484.0, 360.0, 247.0, 199.0, 128.0, 94.0, 82.0, 30.0, 41.0, 27.0, 16.0, 9.0, 8.0, 11.0, 3.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.078125, -3.947998046875, -3.81787109375, -3.687744140625, -3.5576171875, -3.427490234375, -3.29736328125, -3.167236328125, -3.037109375, -2.906982421875, -2.77685546875, -2.646728515625, -2.5166015625, -2.386474609375, -2.25634765625, -2.126220703125, -1.99609375, -1.865966796875, -1.73583984375, -1.605712890625, -1.4755859375, -1.345458984375, -1.21533203125, -1.085205078125, -0.955078125, -0.824951171875, -0.69482421875, -0.564697265625, -0.4345703125, -0.304443359375, -0.17431640625, -0.044189453125, 0.0859375, 0.216064453125, 0.34619140625, 0.476318359375, 0.6064453125, 0.736572265625, 0.86669921875, 0.996826171875, 1.126953125, 1.257080078125, 1.38720703125, 1.517333984375, 1.6474609375, 1.777587890625, 1.90771484375, 2.037841796875, 2.16796875, 2.298095703125, 2.42822265625, 2.558349609375, 2.6884765625, 2.818603515625, 2.94873046875, 3.078857421875, 3.208984375, 3.339111328125, 3.46923828125, 3.599365234375, 3.7294921875, 3.859619140625, 3.98974609375, 4.119873046875, 4.25]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 20.0, 17.0, 20.0, 23.0, 24.0, 27.0, 34.0, 30.0, 34.0, 43.0, 31.0, 55.0, 54.0, 44.0, 45.0, 36.0, 37.0, 39.0, 44.0, 42.0, 41.0, 33.0, 19.0, 25.0, 16.0, 23.0, 19.0, 11.0, 7.0, 6.0, 13.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9140625, -3.7760009765625, -3.637939453125, -3.4998779296875, -3.36181640625, -3.2237548828125, -3.085693359375, -2.9476318359375, -2.8095703125, -2.6715087890625, -2.533447265625, -2.3953857421875, -2.25732421875, -2.1192626953125, -1.981201171875, -1.8431396484375, -1.705078125, -1.5670166015625, -1.428955078125, -1.2908935546875, -1.15283203125, -1.0147705078125, -0.876708984375, -0.7386474609375, -0.6005859375, -0.4625244140625, -0.324462890625, -0.1864013671875, -0.04833984375, 0.0897216796875, 0.227783203125, 0.3658447265625, 0.50390625, 0.6419677734375, 0.780029296875, 0.9180908203125, 1.05615234375, 1.1942138671875, 1.332275390625, 1.4703369140625, 1.6083984375, 1.7464599609375, 1.884521484375, 2.0225830078125, 2.16064453125, 2.2987060546875, 2.436767578125, 2.5748291015625, 2.712890625, 2.8509521484375, 2.989013671875, 3.1270751953125, 3.26513671875, 3.4031982421875, 3.541259765625, 3.6793212890625, 3.8173828125, 3.9554443359375, 4.093505859375, 4.2315673828125, 4.36962890625, 4.5076904296875, 4.645751953125, 4.7838134765625, 4.921875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 5.0, 19.0, 13.0, 11.0, 28.0, 35.0, 51.0, 68.0, 66.0, 115.0, 158.0, 191.0, 281.0, 447.0, 654.0, 970.0, 1567.0, 2405.0, 3785.0, 6177.0, 10946.0, 20743.0, 73722.0, 851059.0, 35683.0, 16061.0, 8812.0, 5107.0, 3223.0, 2031.0, 1299.0, 867.0, 584.0, 405.0, 260.0, 201.0, 151.0, 91.0, 77.0, 50.0, 33.0, 30.0, 21.0, 21.0, 12.0, 8.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.759765625, -1.706939697265625, -1.65411376953125, -1.601287841796875, -1.5484619140625, -1.495635986328125, -1.44281005859375, -1.389984130859375, -1.337158203125, -1.284332275390625, -1.23150634765625, -1.178680419921875, -1.1258544921875, -1.073028564453125, -1.02020263671875, -0.967376708984375, -0.91455078125, -0.861724853515625, -0.80889892578125, -0.756072998046875, -0.7032470703125, -0.650421142578125, -0.59759521484375, -0.544769287109375, -0.491943359375, -0.439117431640625, -0.38629150390625, -0.333465576171875, -0.2806396484375, -0.227813720703125, -0.17498779296875, -0.122161865234375, -0.0693359375, -0.016510009765625, 0.03631591796875, 0.089141845703125, 0.1419677734375, 0.194793701171875, 0.24761962890625, 0.300445556640625, 0.353271484375, 0.406097412109375, 0.45892333984375, 0.511749267578125, 0.5645751953125, 0.617401123046875, 0.67022705078125, 0.723052978515625, 0.77587890625, 0.828704833984375, 0.88153076171875, 0.934356689453125, 0.9871826171875, 1.040008544921875, 1.09283447265625, 1.145660400390625, 1.198486328125, 1.251312255859375, 1.30413818359375, 1.356964111328125, 1.4097900390625, 1.462615966796875, 1.51544189453125, 1.568267822265625, 1.62109375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 4.0, 8.0, 8.0, 10.0, 19.0, 22.0, 37.0, 57.0, 71.0, 98.0, 113.0, 122.0, 104.0, 78.0, 67.0, 44.0, 32.0, 19.0, 17.0, 17.0, 2.0, 8.0, 7.0, 4.0, 1.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00021076202392578125, -0.00020478293299674988, -0.0001988038420677185, -0.00019282475113868713, -0.00018684566020965576, -0.0001808665692806244, -0.00017488747835159302, -0.00016890838742256165, -0.00016292929649353027, -0.0001569502055644989, -0.00015097111463546753, -0.00014499202370643616, -0.00013901293277740479, -0.0001330338418483734, -0.00012705475091934204, -0.00012107565999031067, -0.0001150965690612793, -0.00010911747813224792, -0.00010313838720321655, -9.715929627418518e-05, -9.118020534515381e-05, -8.520111441612244e-05, -7.922202348709106e-05, -7.324293255805969e-05, -6.726384162902832e-05, -6.128475069999695e-05, -5.5305659770965576e-05, -4.9326568841934204e-05, -4.334747791290283e-05, -3.736838698387146e-05, -3.138929605484009e-05, -2.5410205125808716e-05, -1.9431114196777344e-05, -1.3452023267745972e-05, -7.4729323387146e-06, -1.4938414096832275e-06, 4.4852495193481445e-06, 1.0464340448379517e-05, 1.644343137741089e-05, 2.242252230644226e-05, 2.8401613235473633e-05, 3.4380704164505005e-05, 4.035979509353638e-05, 4.633888602256775e-05, 5.231797695159912e-05, 5.829706788063049e-05, 6.427615880966187e-05, 7.025524973869324e-05, 7.623434066772461e-05, 8.221343159675598e-05, 8.819252252578735e-05, 9.417161345481873e-05, 0.0001001507043838501, 0.00010612979531288147, 0.00011210888624191284, 0.00011808797717094421, 0.00012406706809997559, 0.00013004615902900696, 0.00013602524995803833, 0.0001420043408870697, 0.00014798343181610107, 0.00015396252274513245, 0.00015994161367416382, 0.0001659207046031952, 0.00017189979553222656]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 7.0, 7.0, 13.0, 21.0, 34.0, 42.0, 61.0, 76.0, 116.0, 177.0, 260.0, 402.0, 629.0, 898.0, 1407.0, 2186.0, 3504.0, 5583.0, 9501.0, 15300.0, 25773.0, 43533.0, 73987.0, 126400.0, 198073.0, 206229.0, 135998.0, 80311.0, 47045.0, 27878.0, 16356.0, 10080.0, 6094.0, 3724.0, 2429.0, 1495.0, 985.0, 679.0, 410.0, 266.0, 190.0, 135.0, 87.0, 64.0, 36.0, 19.0, 17.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.736328125, -0.7126312255859375, -0.688934326171875, -0.6652374267578125, -0.64154052734375, -0.6178436279296875, -0.594146728515625, -0.5704498291015625, -0.5467529296875, -0.5230560302734375, -0.499359130859375, -0.4756622314453125, -0.45196533203125, -0.4282684326171875, -0.404571533203125, -0.3808746337890625, -0.357177734375, -0.3334808349609375, -0.309783935546875, -0.2860870361328125, -0.26239013671875, -0.2386932373046875, -0.214996337890625, -0.1912994384765625, -0.1676025390625, -0.1439056396484375, -0.120208740234375, -0.0965118408203125, -0.07281494140625, -0.0491180419921875, -0.025421142578125, -0.0017242431640625, 0.02197265625, 0.0456695556640625, 0.069366455078125, 0.0930633544921875, 0.11676025390625, 0.1404571533203125, 0.164154052734375, 0.1878509521484375, 0.2115478515625, 0.2352447509765625, 0.258941650390625, 0.2826385498046875, 0.30633544921875, 0.3300323486328125, 0.353729248046875, 0.3774261474609375, 0.401123046875, 0.4248199462890625, 0.448516845703125, 0.4722137451171875, 0.49591064453125, 0.5196075439453125, 0.543304443359375, 0.5670013427734375, 0.5906982421875, 0.6143951416015625, 0.638092041015625, 0.6617889404296875, 0.68548583984375, 0.7091827392578125, 0.732879638671875, 0.7565765380859375, 0.7802734375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 8.0, 13.0, 17.0, 19.0, 14.0, 25.0, 27.0, 33.0, 31.0, 40.0, 49.0, 44.0, 51.0, 54.0, 51.0, 53.0, 44.0, 65.0, 50.0, 45.0, 41.0, 27.0, 37.0, 24.0, 22.0, 18.0, 12.0, 12.0, 10.0, 14.0, 9.0, 5.0, 4.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24935150146484375, -0.2411346435546875, -0.23291778564453125, -0.224700927734375, -0.21648406982421875, -0.2082672119140625, -0.20005035400390625, -0.19183349609375, -0.18361663818359375, -0.1753997802734375, -0.16718292236328125, -0.158966064453125, -0.15074920654296875, -0.1425323486328125, -0.13431549072265625, -0.1260986328125, -0.11788177490234375, -0.1096649169921875, -0.10144805908203125, -0.093231201171875, -0.08501434326171875, -0.0767974853515625, -0.06858062744140625, -0.06036376953125, -0.05214691162109375, -0.0439300537109375, -0.03571319580078125, -0.027496337890625, -0.01927947998046875, -0.0110626220703125, -0.00284576416015625, 0.00537109375, 0.01358795166015625, 0.0218048095703125, 0.03002166748046875, 0.038238525390625, 0.04645538330078125, 0.0546722412109375, 0.06288909912109375, 0.07110595703125, 0.07932281494140625, 0.0875396728515625, 0.09575653076171875, 0.103973388671875, 0.11219024658203125, 0.1204071044921875, 0.12862396240234375, 0.1368408203125, 0.14505767822265625, 0.1532745361328125, 0.16149139404296875, 0.169708251953125, 0.17792510986328125, 0.1861419677734375, 0.19435882568359375, 0.20257568359375, 0.21079254150390625, 0.2190093994140625, 0.22722625732421875, 0.235443115234375, 0.24365997314453125, 0.2518768310546875, 0.26009368896484375, 0.268310546875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 7.0, 14.0, 14.0, 16.0, 28.0, 34.0, 38.0, 47.0, 45.0, 58.0, 64.0, 74.0, 84.0, 70.0, 72.0, 46.0, 62.0, 52.0, 29.0, 33.0, 27.0, 15.0, 19.0, 14.0, 8.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.229190826416016, -7.951141834259033, -7.673092842102051, -7.395044326782227, -7.116995334625244, -6.838946342468262, -6.5608978271484375, -6.282848834991455, -6.004799842834473, -5.72675085067749, -5.448701858520508, -5.170653343200684, -4.892604351043701, -4.614555358886719, -4.3365068435668945, -4.058457851409912, -3.7804088592529297, -3.5023598670959473, -3.224311113357544, -2.9462623596191406, -2.668213367462158, -2.390164375305176, -2.1121156215667725, -1.8340667486190796, -1.5560178756713867, -1.2779690027236938, -0.999920129776001, -0.7218712568283081, -0.44382238388061523, -0.16577351093292236, 0.11227536201477051, 0.3903242349624634, 0.6683740615844727, 0.9464229345321655, 1.2244718074798584, 1.5025206804275513, 1.7805695533752441, 2.0586185455322266, 2.33666729927063, 2.614716053009033, 2.8927650451660156, 3.170814037322998, 3.4488627910614014, 3.7269115447998047, 4.004960536956787, 4.2830095291137695, 4.561058044433594, 4.839107036590576, 5.117156028747559, 5.395205020904541, 5.673254013061523, 5.951302528381348, 6.22935152053833, 6.5074005126953125, 6.785449028015137, 7.063498020172119, 7.341547012329102, 7.619596004486084, 7.897644996643066, 8.17569351196289, 8.453742980957031, 8.731791496276855, 9.00984001159668, 9.28788948059082, 9.565937995910645]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 12.0, 9.0, 14.0, 21.0, 22.0, 22.0, 29.0, 28.0, 24.0, 37.0, 39.0, 43.0, 41.0, 43.0, 48.0, 46.0, 32.0, 48.0, 45.0, 46.0, 29.0, 33.0, 39.0, 28.0, 24.0, 28.0, 22.0, 24.0, 19.0, 19.0, 11.0, 15.0, 6.0, 10.0, 11.0, 3.0, 5.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.924797058105469, -5.7518486976623535, -5.578900337219238, -5.405952453613281, -5.233004093170166, -5.060055732727051, -4.887107849121094, -4.7141594886779785, -4.541211128234863, -4.368262767791748, -4.195314407348633, -4.022366523742676, -3.8494181632995605, -3.6764698028564453, -3.503521680831909, -3.330573558807373, -3.157625198364258, -2.9846768379211426, -2.8117287158966064, -2.6387805938720703, -2.465832233428955, -2.29288387298584, -2.1199357509613037, -1.946987509727478, -1.7740392684936523, -1.6010910272598267, -1.428142786026001, -1.2551945447921753, -1.0822463035583496, -0.9092980623245239, -0.7363498210906982, -0.5634015798568726, -0.39045286178588867, -0.217504620552063, -0.044556379318237305, 0.12839186191558838, 0.30134010314941406, 0.47428834438323975, 0.6472365856170654, 0.8201848268508911, 0.9931330680847168, 1.1660813093185425, 1.3390295505523682, 1.5119777917861938, 1.6849260330200195, 1.8578742742538452, 2.030822515487671, 2.203770637512207, 2.3767189979553223, 2.5496673583984375, 2.7226154804229736, 2.8955636024475098, 3.068511962890625, 3.2414603233337402, 3.4144084453582764, 3.5873565673828125, 3.7603049278259277, 3.933253288269043, 4.106201171875, 4.279149532318115, 4.4520978927612305, 4.625046253204346, 4.797994613647461, 4.970942497253418, 5.143890857696533]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 9.0, 16.0, 14.0, 34.0, 35.0, 55.0, 91.0, 116.0, 199.0, 252.0, 397.0, 587.0, 832.0, 1310.0, 1877.0, 2924.0, 4276.0, 6176.0, 9534.0, 14046.0, 20801.0, 30915.0, 45108.0, 64110.0, 87238.0, 111080.0, 126907.0, 126229.0, 109124.0, 85512.0, 62809.0, 44059.0, 30282.0, 20342.0, 13616.0, 9014.0, 6169.0, 4062.0, 2793.0, 1792.0, 1188.0, 859.0, 580.0, 390.0, 258.0, 178.0, 106.0, 86.0, 59.0, 32.0, 23.0, 20.0, 16.0, 6.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-4.5546875, -4.4075927734375, -4.260498046875, -4.1134033203125, -3.96630859375, -3.8192138671875, -3.672119140625, -3.5250244140625, -3.3779296875, -3.2308349609375, -3.083740234375, -2.9366455078125, -2.78955078125, -2.6424560546875, -2.495361328125, -2.3482666015625, -2.201171875, -2.0540771484375, -1.906982421875, -1.7598876953125, -1.61279296875, -1.4656982421875, -1.318603515625, -1.1715087890625, -1.0244140625, -0.8773193359375, -0.730224609375, -0.5831298828125, -0.43603515625, -0.2889404296875, -0.141845703125, 0.0052490234375, 0.15234375, 0.2994384765625, 0.446533203125, 0.5936279296875, 0.74072265625, 0.8878173828125, 1.034912109375, 1.1820068359375, 1.3291015625, 1.4761962890625, 1.623291015625, 1.7703857421875, 1.91748046875, 2.0645751953125, 2.211669921875, 2.3587646484375, 2.505859375, 2.6529541015625, 2.800048828125, 2.9471435546875, 3.09423828125, 3.2413330078125, 3.388427734375, 3.5355224609375, 3.6826171875, 3.8297119140625, 3.976806640625, 4.1239013671875, 4.27099609375, 4.4180908203125, 4.565185546875, 4.7122802734375, 4.859375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 4.0, 6.0, 5.0, 7.0, 24.0, 20.0, 11.0, 24.0, 27.0, 27.0, 33.0, 35.0, 37.0, 44.0, 38.0, 40.0, 50.0, 44.0, 51.0, 41.0, 47.0, 35.0, 29.0, 41.0, 40.0, 30.0, 28.0, 30.0, 26.0, 31.0, 20.0, 22.0, 9.0, 6.0, 6.0, 7.0, 7.0, 5.0, 2.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.43634033203125, -6.2593994140625, -6.08245849609375, -5.905517578125, -5.72857666015625, -5.5516357421875, -5.37469482421875, -5.19775390625, -5.02081298828125, -4.8438720703125, -4.66693115234375, -4.489990234375, -4.31304931640625, -4.1361083984375, -3.95916748046875, -3.7822265625, -3.60528564453125, -3.4283447265625, -3.25140380859375, -3.074462890625, -2.89752197265625, -2.7205810546875, -2.54364013671875, -2.36669921875, -2.18975830078125, -2.0128173828125, -1.83587646484375, -1.658935546875, -1.48199462890625, -1.3050537109375, -1.12811279296875, -0.951171875, -0.77423095703125, -0.5972900390625, -0.42034912109375, -0.243408203125, -0.06646728515625, 0.1104736328125, 0.28741455078125, 0.46435546875, 0.64129638671875, 0.8182373046875, 0.99517822265625, 1.172119140625, 1.34906005859375, 1.5260009765625, 1.70294189453125, 1.8798828125, 2.05682373046875, 2.2337646484375, 2.41070556640625, 2.587646484375, 2.76458740234375, 2.9415283203125, 3.11846923828125, 3.29541015625, 3.47235107421875, 3.6492919921875, 3.82623291015625, 4.003173828125, 4.18011474609375, 4.3570556640625, 4.53399658203125, 4.7109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 7.0, 16.0, 36.0, 37.0, 76.0, 100.0, 173.0, 275.0, 400.0, 691.0, 1173.0, 1905.0, 3180.0, 5298.0, 8996.0, 15324.0, 25724.0, 43032.0, 71236.0, 109577.0, 150350.0, 169462.0, 150723.0, 110458.0, 71969.0, 44098.0, 26385.0, 15316.0, 9062.0, 5428.0, 3205.0, 1856.0, 1160.0, 673.0, 419.0, 281.0, 175.0, 94.0, 72.0, 41.0, 21.0, 20.0, 16.0, 11.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.4305419921875, -4.263427734375, -4.0963134765625, -3.92919921875, -3.7620849609375, -3.594970703125, -3.4278564453125, -3.2607421875, -3.0936279296875, -2.926513671875, -2.7593994140625, -2.59228515625, -2.4251708984375, -2.258056640625, -2.0909423828125, -1.923828125, -1.7567138671875, -1.589599609375, -1.4224853515625, -1.25537109375, -1.0882568359375, -0.921142578125, -0.7540283203125, -0.5869140625, -0.4197998046875, -0.252685546875, -0.0855712890625, 0.08154296875, 0.2486572265625, 0.415771484375, 0.5828857421875, 0.75, 0.9171142578125, 1.084228515625, 1.2513427734375, 1.41845703125, 1.5855712890625, 1.752685546875, 1.9197998046875, 2.0869140625, 2.2540283203125, 2.421142578125, 2.5882568359375, 2.75537109375, 2.9224853515625, 3.089599609375, 3.2567138671875, 3.423828125, 3.5909423828125, 3.758056640625, 3.9251708984375, 4.09228515625, 4.2593994140625, 4.426513671875, 4.5936279296875, 4.7607421875, 4.9278564453125, 5.094970703125, 5.2620849609375, 5.42919921875, 5.5963134765625, 5.763427734375, 5.9305419921875, 6.09765625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 13.0, 5.0, 6.0, 18.0, 6.0, 10.0, 13.0, 21.0, 13.0, 24.0, 24.0, 29.0, 37.0, 28.0, 32.0, 28.0, 47.0, 46.0, 40.0, 49.0, 50.0, 41.0, 40.0, 46.0, 38.0, 23.0, 39.0, 33.0, 21.0, 18.0, 26.0, 22.0, 21.0, 18.0, 14.0, 17.0, 12.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.31640625, -4.18438720703125, -4.0523681640625, -3.92034912109375, -3.788330078125, -3.65631103515625, -3.5242919921875, -3.39227294921875, -3.26025390625, -3.12823486328125, -2.9962158203125, -2.86419677734375, -2.732177734375, -2.60015869140625, -2.4681396484375, -2.33612060546875, -2.2041015625, -2.07208251953125, -1.9400634765625, -1.80804443359375, -1.676025390625, -1.54400634765625, -1.4119873046875, -1.27996826171875, -1.14794921875, -1.01593017578125, -0.8839111328125, -0.75189208984375, -0.619873046875, -0.48785400390625, -0.3558349609375, -0.22381591796875, -0.091796875, 0.04022216796875, 0.1722412109375, 0.30426025390625, 0.436279296875, 0.56829833984375, 0.7003173828125, 0.83233642578125, 0.96435546875, 1.09637451171875, 1.2283935546875, 1.36041259765625, 1.492431640625, 1.62445068359375, 1.7564697265625, 1.88848876953125, 2.0205078125, 2.15252685546875, 2.2845458984375, 2.41656494140625, 2.548583984375, 2.68060302734375, 2.8126220703125, 2.94464111328125, 3.07666015625, 3.20867919921875, 3.3406982421875, 3.47271728515625, 3.604736328125, 3.73675537109375, 3.8687744140625, 4.00079345703125, 4.1328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 9.0, 9.0, 13.0, 22.0, 38.0, 68.0, 95.0, 158.0, 282.0, 499.0, 961.0, 1711.0, 3487.0, 7773.0, 18918.0, 54102.0, 169702.0, 383499.0, 267489.0, 88908.0, 29807.0, 11214.0, 4898.0, 2264.0, 1143.0, 599.0, 315.0, 223.0, 114.0, 68.0, 53.0, 38.0, 23.0, 15.0, 11.0, 6.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.5, -10.1790771484375, -9.858154296875, -9.5372314453125, -9.21630859375, -8.8953857421875, -8.574462890625, -8.2535400390625, -7.9326171875, -7.6116943359375, -7.290771484375, -6.9698486328125, -6.64892578125, -6.3280029296875, -6.007080078125, -5.6861572265625, -5.365234375, -5.0443115234375, -4.723388671875, -4.4024658203125, -4.08154296875, -3.7606201171875, -3.439697265625, -3.1187744140625, -2.7978515625, -2.4769287109375, -2.156005859375, -1.8350830078125, -1.51416015625, -1.1932373046875, -0.872314453125, -0.5513916015625, -0.23046875, 0.0904541015625, 0.411376953125, 0.7322998046875, 1.05322265625, 1.3741455078125, 1.695068359375, 2.0159912109375, 2.3369140625, 2.6578369140625, 2.978759765625, 3.2996826171875, 3.62060546875, 3.9415283203125, 4.262451171875, 4.5833740234375, 4.904296875, 5.2252197265625, 5.546142578125, 5.8670654296875, 6.18798828125, 6.5089111328125, 6.829833984375, 7.1507568359375, 7.4716796875, 7.7926025390625, 8.113525390625, 8.4344482421875, 8.75537109375, 9.0762939453125, 9.397216796875, 9.7181396484375, 10.0390625]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 7.0, 11.0, 12.0, 15.0, 20.0, 31.0, 21.0, 31.0, 40.0, 52.0, 46.0, 35.0, 65.0, 53.0, 68.0, 63.0, 60.0, 50.0, 46.0, 51.0, 47.0, 30.0, 35.0, 19.0, 19.0, 13.0, 10.0, 8.0, 10.0, 8.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00045680999755859375, -0.0004429668188095093, -0.0004291236400604248, -0.00041528046131134033, -0.00040143728256225586, -0.0003875941038131714, -0.0003737509250640869, -0.00035990774631500244, -0.00034606456756591797, -0.0003322213888168335, -0.000318378210067749, -0.00030453503131866455, -0.0002906918525695801, -0.0002768486738204956, -0.00026300549507141113, -0.00024916231632232666, -0.0002353191375732422, -0.00022147595882415771, -0.00020763278007507324, -0.00019378960132598877, -0.0001799464225769043, -0.00016610324382781982, -0.00015226006507873535, -0.00013841688632965088, -0.0001245737075805664, -0.00011073052883148193, -9.688735008239746e-05, -8.304417133331299e-05, -6.920099258422852e-05, -5.535781383514404e-05, -4.151463508605957e-05, -2.7671456336975098e-05, -1.3828277587890625e-05, 1.4901161193847656e-08, 1.385807991027832e-05, 2.7701258659362793e-05, 4.1544437408447266e-05, 5.538761615753174e-05, 6.923079490661621e-05, 8.307397365570068e-05, 9.691715240478516e-05, 0.00011076033115386963, 0.0001246035099029541, 0.00013844668865203857, 0.00015228986740112305, 0.00016613304615020752, 0.000179976224899292, 0.00019381940364837646, 0.00020766258239746094, 0.0002215057611465454, 0.00023534893989562988, 0.00024919211864471436, 0.00026303529739379883, 0.0002768784761428833, 0.0002907216548919678, 0.00030456483364105225, 0.0003184080123901367, 0.0003322511911392212, 0.00034609436988830566, 0.00035993754863739014, 0.0003737807273864746, 0.0003876239061355591, 0.00040146708488464355, 0.00041531026363372803, 0.0004291534423828125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 13.0, 12.0, 21.0, 26.0, 37.0, 52.0, 77.0, 114.0, 204.0, 291.0, 424.0, 697.0, 1135.0, 1982.0, 3497.0, 6604.0, 13414.0, 29688.0, 69528.0, 160943.0, 280028.0, 251471.0, 127685.0, 53854.0, 23125.0, 10841.0, 5467.0, 2824.0, 1731.0, 1003.0, 643.0, 384.0, 238.0, 156.0, 112.0, 64.0, 44.0, 40.0, 18.0, 16.0, 17.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.65972900390625, -6.4366455078125, -6.21356201171875, -5.990478515625, -5.76739501953125, -5.5443115234375, -5.32122802734375, -5.09814453125, -4.87506103515625, -4.6519775390625, -4.42889404296875, -4.205810546875, -3.98272705078125, -3.7596435546875, -3.53656005859375, -3.3134765625, -3.09039306640625, -2.8673095703125, -2.64422607421875, -2.421142578125, -2.19805908203125, -1.9749755859375, -1.75189208984375, -1.52880859375, -1.30572509765625, -1.0826416015625, -0.85955810546875, -0.636474609375, -0.41339111328125, -0.1903076171875, 0.03277587890625, 0.255859375, 0.47894287109375, 0.7020263671875, 0.92510986328125, 1.148193359375, 1.37127685546875, 1.5943603515625, 1.81744384765625, 2.04052734375, 2.26361083984375, 2.4866943359375, 2.70977783203125, 2.932861328125, 3.15594482421875, 3.3790283203125, 3.60211181640625, 3.8251953125, 4.04827880859375, 4.2713623046875, 4.49444580078125, 4.717529296875, 4.94061279296875, 5.1636962890625, 5.38677978515625, 5.60986328125, 5.83294677734375, 6.0560302734375, 6.27911376953125, 6.502197265625, 6.72528076171875, 6.9483642578125, 7.17144775390625, 7.39453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 5.0, 15.0, 10.0, 10.0, 20.0, 23.0, 39.0, 41.0, 81.0, 79.0, 110.0, 110.0, 92.0, 89.0, 50.0, 40.0, 27.0, 35.0, 21.0, 24.0, 9.0, 12.0, 7.0, 5.0, 6.0, 4.0, 6.0, 0.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.4609375, -3.35986328125, -3.2587890625, -3.15771484375, -3.056640625, -2.95556640625, -2.8544921875, -2.75341796875, -2.65234375, -2.55126953125, -2.4501953125, -2.34912109375, -2.248046875, -2.14697265625, -2.0458984375, -1.94482421875, -1.84375, -1.74267578125, -1.6416015625, -1.54052734375, -1.439453125, -1.33837890625, -1.2373046875, -1.13623046875, -1.03515625, -0.93408203125, -0.8330078125, -0.73193359375, -0.630859375, -0.52978515625, -0.4287109375, -0.32763671875, -0.2265625, -0.12548828125, -0.0244140625, 0.07666015625, 0.177734375, 0.27880859375, 0.3798828125, 0.48095703125, 0.58203125, 0.68310546875, 0.7841796875, 0.88525390625, 0.986328125, 1.08740234375, 1.1884765625, 1.28955078125, 1.390625, 1.49169921875, 1.5927734375, 1.69384765625, 1.794921875, 1.89599609375, 1.9970703125, 2.09814453125, 2.19921875, 2.30029296875, 2.4013671875, 2.50244140625, 2.603515625, 2.70458984375, 2.8056640625, 2.90673828125, 3.0078125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 9.0, 4.0, 16.0, 21.0, 25.0, 29.0, 31.0, 45.0, 48.0, 66.0, 65.0, 71.0, 91.0, 73.0, 79.0, 67.0, 53.0, 50.0, 43.0, 20.0, 20.0, 21.0, 12.0, 13.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9293670654296875, -7.647541522979736, -7.365716457366943, -7.083890914916992, -6.802065372467041, -6.52023983001709, -6.238414764404297, -5.956589221954346, -5.6747636795043945, -5.392938137054443, -5.11111307144165, -4.829287528991699, -4.547461986541748, -4.265636444091797, -3.983811378479004, -3.7019858360290527, -3.4201607704162598, -3.1383354663848877, -2.8565099239349365, -2.5746846199035645, -2.2928590774536133, -2.011033773422241, -1.7292084693908691, -1.4473830461502075, -1.165557622909546, -0.8837321996688843, -0.6019068360328674, -0.3200814723968506, -0.038256049156188965, 0.24356937408447266, 0.5253946781158447, 0.8072201013565063, 1.089045524597168, 1.3708709478378296, 1.6526963710784912, 1.9345216751098633, 2.2163472175598145, 2.4981725215911865, 2.7799978256225586, 3.0618233680725098, 3.343648672103882, 3.625473976135254, 3.907299518585205, 4.189125061035156, 4.470950126647949, 4.7527756690979, 5.034601211547852, 5.3164262771606445, 5.598251819610596, 5.880077362060547, 6.16190242767334, 6.443727970123291, 6.725553512573242, 7.007378578186035, 7.289204120635986, 7.5710296630859375, 7.8528547286987305, 8.134679794311523, 8.416505813598633, 8.698330879211426, 8.980155944824219, 9.261981964111328, 9.543807029724121, 9.825632095336914, 10.107458114624023]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 3.0, 3.0, 5.0, 7.0, 4.0, 14.0, 12.0, 17.0, 21.0, 23.0, 24.0, 22.0, 29.0, 45.0, 27.0, 41.0, 33.0, 42.0, 52.0, 37.0, 29.0, 47.0, 39.0, 29.0, 47.0, 48.0, 28.0, 29.0, 24.0, 31.0, 24.0, 28.0, 27.0, 15.0, 19.0, 15.0, 15.0, 15.0, 11.0, 5.0, 6.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.836164951324463, -5.655647277832031, -5.475129127502441, -5.294610977172852, -5.11409330368042, -4.933575630187988, -4.753057479858398, -4.572539329528809, -4.392021656036377, -4.211503982543945, -4.0309858322143555, -3.8504679203033447, -3.669950008392334, -3.4894320964813232, -3.3089141845703125, -3.1283962726593018, -2.947878360748291, -2.7673604488372803, -2.5868425369262695, -2.406324625015259, -2.225806713104248, -2.0452888011932373, -1.8647708892822266, -1.6842529773712158, -1.503735065460205, -1.3232171535491943, -1.1426992416381836, -0.9621813297271729, -0.7816634178161621, -0.6011455059051514, -0.4206275939941406, -0.24010968208312988, -0.05959129333496094, 0.1209266185760498, 0.30144453048706055, 0.4819624423980713, 0.662480354309082, 0.8429982662200928, 1.0235161781311035, 1.2040340900421143, 1.384552001953125, 1.5650699138641357, 1.7455878257751465, 1.9261057376861572, 2.106623649597168, 2.2871415615081787, 2.4676594734191895, 2.6481773853302, 2.828695297241211, 3.0092132091522217, 3.1897311210632324, 3.370249032974243, 3.550766944885254, 3.7312848567962646, 3.9118027687072754, 4.092320442199707, 4.272838592529297, 4.453356742858887, 4.633874416351318, 4.81439208984375, 4.99491024017334, 5.17542839050293, 5.355946063995361, 5.536463737487793, 5.716981887817383]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 7.0, 6.0, 11.0, 12.0, 15.0, 23.0, 39.0, 51.0, 103.0, 131.0, 199.0, 296.0, 463.0, 732.0, 1198.0, 1966.0, 3413.0, 6195.0, 11297.0, 20973.0, 41158.0, 84003.0, 181458.0, 404994.0, 825437.0, 1106660.0, 791045.0, 381939.0, 170126.0, 78954.0, 37907.0, 19182.0, 10273.0, 5636.0, 3266.0, 1970.0, 1161.0, 669.0, 492.0, 286.0, 169.0, 119.0, 86.0, 55.0, 32.0, 27.0, 18.0, 18.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-6.62890625, -6.4246826171875, -6.220458984375, -6.0162353515625, -5.81201171875, -5.6077880859375, -5.403564453125, -5.1993408203125, -4.9951171875, -4.7908935546875, -4.586669921875, -4.3824462890625, -4.17822265625, -3.9739990234375, -3.769775390625, -3.5655517578125, -3.361328125, -3.1571044921875, -2.952880859375, -2.7486572265625, -2.54443359375, -2.3402099609375, -2.135986328125, -1.9317626953125, -1.7275390625, -1.5233154296875, -1.319091796875, -1.1148681640625, -0.91064453125, -0.7064208984375, -0.502197265625, -0.2979736328125, -0.09375, 0.1104736328125, 0.314697265625, 0.5189208984375, 0.72314453125, 0.9273681640625, 1.131591796875, 1.3358154296875, 1.5400390625, 1.7442626953125, 1.948486328125, 2.1527099609375, 2.35693359375, 2.5611572265625, 2.765380859375, 2.9696044921875, 3.173828125, 3.3780517578125, 3.582275390625, 3.7864990234375, 3.99072265625, 4.1949462890625, 4.399169921875, 4.6033935546875, 4.8076171875, 5.0118408203125, 5.216064453125, 5.4202880859375, 5.62451171875, 5.8287353515625, 6.032958984375, 6.2371826171875, 6.44140625]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 11.0, 7.0, 12.0, 22.0, 21.0, 22.0, 22.0, 27.0, 27.0, 37.0, 37.0, 35.0, 52.0, 45.0, 47.0, 33.0, 38.0, 43.0, 37.0, 31.0, 39.0, 22.0, 40.0, 43.0, 38.0, 33.0, 26.0, 24.0, 10.0, 19.0, 15.0, 17.0, 17.0, 10.0, 10.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.79296875, -3.676300048828125, -3.55963134765625, -3.442962646484375, -3.3262939453125, -3.209625244140625, -3.09295654296875, -2.976287841796875, -2.859619140625, -2.742950439453125, -2.62628173828125, -2.509613037109375, -2.3929443359375, -2.276275634765625, -2.15960693359375, -2.042938232421875, -1.92626953125, -1.809600830078125, -1.69293212890625, -1.576263427734375, -1.4595947265625, -1.342926025390625, -1.22625732421875, -1.109588623046875, -0.992919921875, -0.876251220703125, -0.75958251953125, -0.642913818359375, -0.5262451171875, -0.409576416015625, -0.29290771484375, -0.176239013671875, -0.0595703125, 0.057098388671875, 0.17376708984375, 0.290435791015625, 0.4071044921875, 0.523773193359375, 0.64044189453125, 0.757110595703125, 0.873779296875, 0.990447998046875, 1.10711669921875, 1.223785400390625, 1.3404541015625, 1.457122802734375, 1.57379150390625, 1.690460205078125, 1.80712890625, 1.923797607421875, 2.04046630859375, 2.157135009765625, 2.2738037109375, 2.390472412109375, 2.50714111328125, 2.623809814453125, 2.740478515625, 2.857147216796875, 2.97381591796875, 3.090484619140625, 3.2071533203125, 3.323822021484375, 3.44049072265625, 3.557159423828125, 3.673828125]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 8.0, 20.0, 20.0, 31.0, 66.0, 69.0, 108.0, 128.0, 232.0, 373.0, 513.0, 745.0, 1099.0, 1795.0, 2774.0, 4490.0, 7219.0, 12021.0, 19952.0, 34184.0, 59727.0, 106214.0, 188841.0, 329165.0, 541379.0, 756543.0, 766135.0, 558444.0, 341447.0, 197232.0, 111090.0, 62699.0, 35717.0, 21235.0, 12450.0, 7281.0, 4679.0, 2781.0, 1881.0, 1114.0, 740.0, 557.0, 348.0, 230.0, 160.0, 118.0, 79.0, 50.0, 26.0, 25.0, 15.0, 17.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0], "bins": [-4.9921875, -4.83636474609375, -4.6805419921875, -4.52471923828125, -4.368896484375, -4.21307373046875, -4.0572509765625, -3.90142822265625, -3.74560546875, -3.58978271484375, -3.4339599609375, -3.27813720703125, -3.122314453125, -2.96649169921875, -2.8106689453125, -2.65484619140625, -2.4990234375, -2.34320068359375, -2.1873779296875, -2.03155517578125, -1.875732421875, -1.71990966796875, -1.5640869140625, -1.40826416015625, -1.25244140625, -1.09661865234375, -0.9407958984375, -0.78497314453125, -0.629150390625, -0.47332763671875, -0.3175048828125, -0.16168212890625, -0.005859375, 0.14996337890625, 0.3057861328125, 0.46160888671875, 0.617431640625, 0.77325439453125, 0.9290771484375, 1.08489990234375, 1.24072265625, 1.39654541015625, 1.5523681640625, 1.70819091796875, 1.864013671875, 2.01983642578125, 2.1756591796875, 2.33148193359375, 2.4873046875, 2.64312744140625, 2.7989501953125, 2.95477294921875, 3.110595703125, 3.26641845703125, 3.4222412109375, 3.57806396484375, 3.73388671875, 3.88970947265625, 4.0455322265625, 4.20135498046875, 4.357177734375, 4.51300048828125, 4.6688232421875, 4.82464599609375, 4.98046875]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 13.0, 18.0, 25.0, 22.0, 47.0, 51.0, 58.0, 91.0, 94.0, 121.0, 167.0, 171.0, 203.0, 240.0, 288.0, 309.0, 256.0, 268.0, 280.0, 250.0, 209.0, 180.0, 130.0, 125.0, 91.0, 78.0, 66.0, 40.0, 42.0, 29.0, 24.0, 24.0, 15.0, 12.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.23046875, -2.1687164306640625, -2.106964111328125, -2.0452117919921875, -1.98345947265625, -1.9217071533203125, -1.859954833984375, -1.7982025146484375, -1.7364501953125, -1.6746978759765625, -1.612945556640625, -1.5511932373046875, -1.48944091796875, -1.4276885986328125, -1.365936279296875, -1.3041839599609375, -1.242431640625, -1.1806793212890625, -1.118927001953125, -1.0571746826171875, -0.99542236328125, -0.9336700439453125, -0.871917724609375, -0.8101654052734375, -0.7484130859375, -0.6866607666015625, -0.624908447265625, -0.5631561279296875, -0.50140380859375, -0.4396514892578125, -0.377899169921875, -0.3161468505859375, -0.25439453125, -0.1926422119140625, -0.130889892578125, -0.0691375732421875, -0.00738525390625, 0.0543670654296875, 0.116119384765625, 0.1778717041015625, 0.2396240234375, 0.3013763427734375, 0.363128662109375, 0.4248809814453125, 0.48663330078125, 0.5483856201171875, 0.610137939453125, 0.6718902587890625, 0.733642578125, 0.7953948974609375, 0.857147216796875, 0.9188995361328125, 0.98065185546875, 1.0424041748046875, 1.104156494140625, 1.1659088134765625, 1.2276611328125, 1.2894134521484375, 1.351165771484375, 1.4129180908203125, 1.47467041015625, 1.5364227294921875, 1.598175048828125, 1.6599273681640625, 1.7216796875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 7.0, 13.0, 22.0, 22.0, 33.0, 41.0, 39.0, 54.0, 68.0, 81.0, 66.0, 81.0, 53.0, 81.0, 64.0, 70.0, 42.0, 33.0, 26.0, 20.0, 18.0, 15.0, 7.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.195919513702393, -5.962164402008057, -5.728409290313721, -5.494654178619385, -5.260899543762207, -5.027144432067871, -4.793389320373535, -4.559634208679199, -4.325879096984863, -4.092123985290527, -3.8583688735961914, -3.6246140003204346, -3.3908588886260986, -3.1571037769317627, -2.923348903656006, -2.68959379196167, -2.455838680267334, -2.222083568572998, -1.9883285760879517, -1.7545735836029053, -1.5208184719085693, -1.2870633602142334, -1.053308367729187, -0.8195533752441406, -0.5857982635498047, -0.3520432114601135, -0.11828815937042236, 0.1154668927192688, 0.34922194480895996, 0.5829770565032959, 0.8167320489883423, 1.0504870414733887, 1.2842426300048828, 1.5179977416992188, 1.7517527341842651, 1.9855077266693115, 2.2192628383636475, 2.4530179500579834, 2.6867728233337402, 2.920527935028076, 3.154283046722412, 3.388038158416748, 3.621793270111084, 3.855548143386841, 4.089303016662598, 4.323058128356934, 4.5568132400512695, 4.7905683517456055, 5.024323463439941, 5.258078575134277, 5.491833686828613, 5.725588798522949, 5.959343910217285, 6.193099021911621, 6.426853656768799, 6.660608768463135, 6.894363880157471, 7.128118991851807, 7.361874103546143, 7.5956292152404785, 7.829383850097656, 8.063138961791992, 8.296894073486328, 8.530649185180664, 8.764404296875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 7.0, 13.0, 6.0, 19.0, 14.0, 28.0, 25.0, 27.0, 34.0, 36.0, 34.0, 44.0, 51.0, 38.0, 52.0, 44.0, 43.0, 32.0, 46.0, 44.0, 33.0, 35.0, 27.0, 28.0, 30.0, 34.0, 24.0, 29.0, 25.0, 11.0, 13.0, 9.0, 13.0, 12.0, 5.0, 11.0, 8.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.548825263977051, -4.397319316864014, -4.245813369750977, -4.0943074226379395, -3.9428014755249023, -3.7912955284118652, -3.639789581298828, -3.488283634185791, -3.336777687072754, -3.185271739959717, -3.0337657928466797, -2.8822598457336426, -2.7307538986206055, -2.5792479515075684, -2.4277420043945312, -2.276236057281494, -2.124730348587036, -1.973224401473999, -1.821718454360962, -1.6702125072479248, -1.5187065601348877, -1.3672006130218506, -1.215694785118103, -1.064188838005066, -0.9126828908920288, -0.7611769437789917, -0.6096709966659546, -0.45816510915756226, -0.30665916204452515, -0.15515321493148804, -0.003647327423095703, 0.1478586196899414, 0.2993645668029785, 0.4508705139160156, 0.6023764610290527, 0.7538823485374451, 0.9053882956504822, 1.056894302368164, 1.2084001302719116, 1.3599060773849487, 1.5114120244979858, 1.662917971611023, 1.81442391872406, 1.9659297466278076, 2.1174356937408447, 2.268941640853882, 2.420447587966919, 2.571953535079956, 2.723459482192993, 2.8749654293060303, 3.0264713764190674, 3.1779773235321045, 3.3294832706451416, 3.4809892177581787, 3.6324949264526367, 3.784000873565674, 3.935506820678711, 4.087012767791748, 4.238518714904785, 4.390024662017822, 4.541530609130859, 4.6930365562438965, 4.844542503356934, 4.996048450469971, 5.147554397583008]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 9.0, 8.0, 5.0, 11.0, 15.0, 27.0, 26.0, 39.0, 56.0, 81.0, 148.0, 251.0, 434.0, 729.0, 1275.0, 2242.0, 4016.0, 7384.0, 14448.0, 27744.0, 53823.0, 102481.0, 181313.0, 238863.0, 186995.0, 107195.0, 56845.0, 29499.0, 15053.0, 7970.0, 4178.0, 2229.0, 1302.0, 712.0, 398.0, 290.0, 166.0, 86.0, 67.0, 36.0, 30.0, 27.0, 10.0, 17.0, 7.0, 11.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2333984375, -1.186920166015625, -1.14044189453125, -1.093963623046875, -1.0474853515625, -1.001007080078125, -0.95452880859375, -0.908050537109375, -0.861572265625, -0.815093994140625, -0.76861572265625, -0.722137451171875, -0.6756591796875, -0.629180908203125, -0.58270263671875, -0.536224365234375, -0.48974609375, -0.443267822265625, -0.39678955078125, -0.350311279296875, -0.3038330078125, -0.257354736328125, -0.21087646484375, -0.164398193359375, -0.117919921875, -0.071441650390625, -0.02496337890625, 0.021514892578125, 0.0679931640625, 0.114471435546875, 0.16094970703125, 0.207427978515625, 0.25390625, 0.300384521484375, 0.34686279296875, 0.393341064453125, 0.4398193359375, 0.486297607421875, 0.53277587890625, 0.579254150390625, 0.625732421875, 0.672210693359375, 0.71868896484375, 0.765167236328125, 0.8116455078125, 0.858123779296875, 0.90460205078125, 0.951080322265625, 0.99755859375, 1.044036865234375, 1.09051513671875, 1.136993408203125, 1.1834716796875, 1.229949951171875, 1.27642822265625, 1.322906494140625, 1.369384765625, 1.415863037109375, 1.46234130859375, 1.508819580078125, 1.5552978515625, 1.601776123046875, 1.64825439453125, 1.694732666015625, 1.7412109375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 10.0, 6.0, 11.0, 20.0, 12.0, 21.0, 26.0, 25.0, 22.0, 22.0, 30.0, 33.0, 44.0, 53.0, 42.0, 42.0, 44.0, 43.0, 40.0, 43.0, 44.0, 35.0, 39.0, 29.0, 32.0, 21.0, 29.0, 24.0, 28.0, 19.0, 20.0, 16.0, 8.0, 12.0, 14.0, 10.0, 9.0, 13.0, 3.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.12518310546875, -3.9691162109375, -3.81304931640625, -3.656982421875, -3.50091552734375, -3.3448486328125, -3.18878173828125, -3.03271484375, -2.87664794921875, -2.7205810546875, -2.56451416015625, -2.408447265625, -2.25238037109375, -2.0963134765625, -1.94024658203125, -1.7841796875, -1.62811279296875, -1.4720458984375, -1.31597900390625, -1.159912109375, -1.00384521484375, -0.8477783203125, -0.69171142578125, -0.53564453125, -0.37957763671875, -0.2235107421875, -0.06744384765625, 0.088623046875, 0.24468994140625, 0.4007568359375, 0.55682373046875, 0.712890625, 0.86895751953125, 1.0250244140625, 1.18109130859375, 1.337158203125, 1.49322509765625, 1.6492919921875, 1.80535888671875, 1.96142578125, 2.11749267578125, 2.2735595703125, 2.42962646484375, 2.585693359375, 2.74176025390625, 2.8978271484375, 3.05389404296875, 3.2099609375, 3.36602783203125, 3.5220947265625, 3.67816162109375, 3.834228515625, 3.99029541015625, 4.1463623046875, 4.30242919921875, 4.45849609375, 4.61456298828125, 4.7706298828125, 4.92669677734375, 5.082763671875, 5.23883056640625, 5.3948974609375, 5.55096435546875, 5.70703125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 6.0, 1.0, 5.0, 2.0, 10.0, 5.0, 13.0, 12.0, 26.0, 28.0, 41.0, 52.0, 70.0, 109.0, 148.0, 210.0, 320.0, 502.0, 721.0, 1162.0, 1777.0, 3040.0, 5326.0, 9684.0, 20313.0, 66851.0, 844900.0, 52989.0, 18508.0, 9193.0, 4920.0, 2712.0, 1725.0, 1077.0, 700.0, 473.0, 259.0, 200.0, 126.0, 108.0, 64.0, 38.0, 30.0, 25.0, 16.0, 15.0, 10.0, 11.0, 8.0, 10.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.099609375, -2.997802734375, -2.89599609375, -2.794189453125, -2.6923828125, -2.590576171875, -2.48876953125, -2.386962890625, -2.28515625, -2.183349609375, -2.08154296875, -1.979736328125, -1.8779296875, -1.776123046875, -1.67431640625, -1.572509765625, -1.470703125, -1.368896484375, -1.26708984375, -1.165283203125, -1.0634765625, -0.961669921875, -0.85986328125, -0.758056640625, -0.65625, -0.554443359375, -0.45263671875, -0.350830078125, -0.2490234375, -0.147216796875, -0.04541015625, 0.056396484375, 0.158203125, 0.260009765625, 0.36181640625, 0.463623046875, 0.5654296875, 0.667236328125, 0.76904296875, 0.870849609375, 0.97265625, 1.074462890625, 1.17626953125, 1.278076171875, 1.3798828125, 1.481689453125, 1.58349609375, 1.685302734375, 1.787109375, 1.888916015625, 1.99072265625, 2.092529296875, 2.1943359375, 2.296142578125, 2.39794921875, 2.499755859375, 2.6015625, 2.703369140625, 2.80517578125, 2.906982421875, 3.0087890625, 3.110595703125, 3.21240234375, 3.314208984375, 3.416015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 13.0, 15.0, 14.0, 16.0, 27.0, 30.0, 28.0, 28.0, 29.0, 34.0, 38.0, 42.0, 50.0, 53.0, 53.0, 44.0, 54.0, 55.0, 46.0, 41.0, 44.0, 29.0, 35.0, 33.0, 17.0, 29.0, 25.0, 14.0, 9.0, 11.0, 9.0, 7.0, 2.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.0892333984375, -4.897216796875, -4.7052001953125, -4.51318359375, -4.3211669921875, -4.129150390625, -3.9371337890625, -3.7451171875, -3.5531005859375, -3.361083984375, -3.1690673828125, -2.97705078125, -2.7850341796875, -2.593017578125, -2.4010009765625, -2.208984375, -2.0169677734375, -1.824951171875, -1.6329345703125, -1.44091796875, -1.2489013671875, -1.056884765625, -0.8648681640625, -0.6728515625, -0.4808349609375, -0.288818359375, -0.0968017578125, 0.09521484375, 0.2872314453125, 0.479248046875, 0.6712646484375, 0.86328125, 1.0552978515625, 1.247314453125, 1.4393310546875, 1.63134765625, 1.8233642578125, 2.015380859375, 2.2073974609375, 2.3994140625, 2.5914306640625, 2.783447265625, 2.9754638671875, 3.16748046875, 3.3594970703125, 3.551513671875, 3.7435302734375, 3.935546875, 4.1275634765625, 4.319580078125, 4.5115966796875, 4.70361328125, 4.8956298828125, 5.087646484375, 5.2796630859375, 5.4716796875, 5.6636962890625, 5.855712890625, 6.0477294921875, 6.23974609375, 6.4317626953125, 6.623779296875, 6.8157958984375, 7.0078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 6.0, 4.0, 14.0, 16.0, 26.0, 24.0, 43.0, 56.0, 91.0, 129.0, 218.0, 322.0, 539.0, 899.0, 1573.0, 2909.0, 5476.0, 12350.0, 32948.0, 892365.0, 63667.0, 18175.0, 7762.0, 3838.0, 2051.0, 1173.0, 661.0, 405.0, 244.0, 179.0, 131.0, 83.0, 40.0, 37.0, 38.0, 16.0, 12.0, 13.0, 2.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.69140625, -1.6380615234375, -1.584716796875, -1.5313720703125, -1.47802734375, -1.4246826171875, -1.371337890625, -1.3179931640625, -1.2646484375, -1.2113037109375, -1.157958984375, -1.1046142578125, -1.05126953125, -0.9979248046875, -0.944580078125, -0.8912353515625, -0.837890625, -0.7845458984375, -0.731201171875, -0.6778564453125, -0.62451171875, -0.5711669921875, -0.517822265625, -0.4644775390625, -0.4111328125, -0.3577880859375, -0.304443359375, -0.2510986328125, -0.19775390625, -0.1444091796875, -0.091064453125, -0.0377197265625, 0.015625, 0.0689697265625, 0.122314453125, 0.1756591796875, 0.22900390625, 0.2823486328125, 0.335693359375, 0.3890380859375, 0.4423828125, 0.4957275390625, 0.549072265625, 0.6024169921875, 0.65576171875, 0.7091064453125, 0.762451171875, 0.8157958984375, 0.869140625, 0.9224853515625, 0.975830078125, 1.0291748046875, 1.08251953125, 1.1358642578125, 1.189208984375, 1.2425537109375, 1.2958984375, 1.3492431640625, 1.402587890625, 1.4559326171875, 1.50927734375, 1.5626220703125, 1.615966796875, 1.6693115234375, 1.72265625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 14.0, 18.0, 21.0, 29.0, 37.0, 44.0, 47.0, 54.0, 64.0, 59.0, 57.0, 58.0, 78.0, 56.0, 39.0, 47.0, 35.0, 29.0, 26.0, 23.0, 21.0, 12.0, 15.0, 8.0, 7.0, 3.0, 5.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.8041343688964844e-05, -4.650000482797623e-05, -4.495866596698761e-05, -4.341732710599899e-05, -4.1875988245010376e-05, -4.033464938402176e-05, -3.879331052303314e-05, -3.7251971662044525e-05, -3.571063280105591e-05, -3.416929394006729e-05, -3.2627955079078674e-05, -3.108661621809006e-05, -2.954527735710144e-05, -2.8003938496112823e-05, -2.6462599635124207e-05, -2.492126077413559e-05, -2.3379921913146973e-05, -2.1838583052158356e-05, -2.029724419116974e-05, -1.8755905330181122e-05, -1.7214566469192505e-05, -1.5673227608203888e-05, -1.4131888747215271e-05, -1.2590549886226654e-05, -1.1049211025238037e-05, -9.50787216424942e-06, -7.966533303260803e-06, -6.425194442272186e-06, -4.883855581283569e-06, -3.3425167202949524e-06, -1.8011778593063354e-06, -2.598389983177185e-07, 1.2814998626708984e-06, 2.8228387236595154e-06, 4.364177584648132e-06, 5.905516445636749e-06, 7.446855306625366e-06, 8.988194167613983e-06, 1.05295330286026e-05, 1.2070871889591217e-05, 1.3612210750579834e-05, 1.5153549611568451e-05, 1.6694888472557068e-05, 1.8236227333545685e-05, 1.9777566194534302e-05, 2.131890505552292e-05, 2.2860243916511536e-05, 2.4401582777500153e-05, 2.594292163848877e-05, 2.7484260499477386e-05, 2.9025599360466003e-05, 3.056693822145462e-05, 3.210827708244324e-05, 3.3649615943431854e-05, 3.519095480442047e-05, 3.673229366540909e-05, 3.8273632526397705e-05, 3.981497138738632e-05, 4.135631024837494e-05, 4.2897649109363556e-05, 4.443898797035217e-05, 4.598032683134079e-05, 4.752166569232941e-05, 4.9063004553318024e-05, 5.060434341430664e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 2.0, 9.0, 10.0, 17.0, 27.0, 46.0, 40.0, 73.0, 112.0, 149.0, 236.0, 333.0, 491.0, 676.0, 1048.0, 1698.0, 2533.0, 3938.0, 6196.0, 10152.0, 17297.0, 29049.0, 52089.0, 95094.0, 173293.0, 244294.0, 179787.0, 99015.0, 54012.0, 30464.0, 17699.0, 10559.0, 6479.0, 4008.0, 2544.0, 1666.0, 1089.0, 737.0, 506.0, 373.0, 240.0, 141.0, 90.0, 88.0, 43.0, 42.0, 29.0, 20.0, 9.0, 7.0, 3.0, 7.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.53955078125, -0.5234603881835938, -0.5073699951171875, -0.49127960205078125, -0.475189208984375, -0.45909881591796875, -0.4430084228515625, -0.42691802978515625, -0.41082763671875, -0.39473724365234375, -0.3786468505859375, -0.36255645751953125, -0.346466064453125, -0.33037567138671875, -0.3142852783203125, -0.29819488525390625, -0.2821044921875, -0.26601409912109375, -0.2499237060546875, -0.23383331298828125, -0.217742919921875, -0.20165252685546875, -0.1855621337890625, -0.16947174072265625, -0.15338134765625, -0.13729095458984375, -0.1212005615234375, -0.10511016845703125, -0.089019775390625, -0.07292938232421875, -0.0568389892578125, -0.04074859619140625, -0.024658203125, -0.00856781005859375, 0.0075225830078125, 0.02361297607421875, 0.039703369140625, 0.05579376220703125, 0.0718841552734375, 0.08797454833984375, 0.10406494140625, 0.12015533447265625, 0.1362457275390625, 0.15233612060546875, 0.168426513671875, 0.18451690673828125, 0.2006072998046875, 0.21669769287109375, 0.2327880859375, 0.24887847900390625, 0.2649688720703125, 0.28105926513671875, 0.297149658203125, 0.31324005126953125, 0.3293304443359375, 0.34542083740234375, 0.36151123046875, 0.37760162353515625, 0.3936920166015625, 0.40978240966796875, 0.425872802734375, 0.44196319580078125, 0.4580535888671875, 0.47414398193359375, 0.490234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 12.0, 7.0, 19.0, 17.0, 22.0, 30.0, 18.0, 41.0, 37.0, 56.0, 51.0, 54.0, 88.0, 65.0, 73.0, 65.0, 68.0, 44.0, 42.0, 27.0, 28.0, 23.0, 21.0, 11.0, 12.0, 15.0, 7.0, 8.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2783203125, -0.2678680419921875, -0.257415771484375, -0.2469635009765625, -0.23651123046875, -0.2260589599609375, -0.215606689453125, -0.2051544189453125, -0.1947021484375, -0.1842498779296875, -0.173797607421875, -0.1633453369140625, -0.15289306640625, -0.1424407958984375, -0.131988525390625, -0.1215362548828125, -0.111083984375, -0.1006317138671875, -0.090179443359375, -0.0797271728515625, -0.06927490234375, -0.0588226318359375, -0.048370361328125, -0.0379180908203125, -0.0274658203125, -0.0170135498046875, -0.006561279296875, 0.0038909912109375, 0.01434326171875, 0.0247955322265625, 0.035247802734375, 0.0457000732421875, 0.05615234375, 0.0666046142578125, 0.077056884765625, 0.0875091552734375, 0.09796142578125, 0.1084136962890625, 0.118865966796875, 0.1293182373046875, 0.1397705078125, 0.1502227783203125, 0.160675048828125, 0.1711273193359375, 0.18157958984375, 0.1920318603515625, 0.202484130859375, 0.2129364013671875, 0.223388671875, 0.2338409423828125, 0.244293212890625, 0.2547454833984375, 0.26519775390625, 0.2756500244140625, 0.286102294921875, 0.2965545654296875, 0.3070068359375, 0.3174591064453125, 0.327911376953125, 0.3383636474609375, 0.34881591796875, 0.3592681884765625, 0.369720458984375, 0.3801727294921875, 0.390625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 9.0, 7.0, 18.0, 16.0, 26.0, 31.0, 46.0, 49.0, 48.0, 80.0, 70.0, 65.0, 74.0, 72.0, 72.0, 72.0, 52.0, 49.0, 30.0, 30.0, 19.0, 13.0, 16.0, 10.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2333083152771, -5.998308181762695, -5.763307571411133, -5.52830696105957, -5.293306827545166, -5.058306694030762, -4.823306083679199, -4.588305473327637, -4.353305339813232, -4.118305206298828, -3.8833045959472656, -3.6483042240142822, -3.413303852081299, -3.1783034801483154, -2.943303108215332, -2.7083027362823486, -2.4733023643493652, -2.238301992416382, -2.0033016204833984, -1.768301248550415, -1.5333008766174316, -1.2983005046844482, -1.0633001327514648, -0.8282997608184814, -0.593299388885498, -0.35829901695251465, -0.12329864501953125, 0.11170172691345215, 0.34670209884643555, 0.581702470779419, 0.8167028427124023, 1.0517032146453857, 1.286703109741211, 1.5217034816741943, 1.7567038536071777, 1.9917042255401611, 2.2267045974731445, 2.461704969406128, 2.6967053413391113, 2.9317057132720947, 3.166706085205078, 3.4017064571380615, 3.636706829071045, 3.8717072010040283, 4.106707572937012, 4.341708183288574, 4.5767083168029785, 4.811708450317383, 5.046709060668945, 5.281709671020508, 5.516709804534912, 5.751709938049316, 5.986710548400879, 6.221711158752441, 6.456711292266846, 6.69171142578125, 6.9267120361328125, 7.161712646484375, 7.396712779998779, 7.631712913513184, 7.866713523864746, 8.101714134216309, 8.336713790893555, 8.571714401245117, 8.80671501159668]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 13.0, 19.0, 33.0, 29.0, 33.0, 24.0, 41.0, 39.0, 55.0, 38.0, 49.0, 39.0, 47.0, 40.0, 50.0, 29.0, 44.0, 35.0, 35.0, 24.0, 32.0, 32.0, 27.0, 27.0, 17.0, 20.0, 13.0, 8.0, 19.0, 7.0, 12.0, 6.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.304595470428467, -4.1580305099487305, -4.011465072631836, -3.8649001121520996, -3.7183351516723633, -3.571769952774048, -3.4252047538757324, -3.278639793395996, -3.1320745944976807, -2.9855093955993652, -2.838944435119629, -2.6923792362213135, -2.545814037322998, -2.3992490768432617, -2.2526838779449463, -2.106118679046631, -1.9595537185668945, -1.8129886388778687, -1.6664235591888428, -1.5198583602905273, -1.3732932806015015, -1.2267282009124756, -1.0801630020141602, -0.9335979223251343, -0.7870328426361084, -0.6404677629470825, -0.49390262365341187, -0.3473375141620636, -0.20077240467071533, -0.05420732498168945, 0.0923578143119812, 0.23892295360565186, 0.38548755645751953, 0.5320526361465454, 0.6786177754402161, 0.8251829147338867, 0.9717479944229126, 1.1183130741119385, 1.264878273010254, 1.4114433526992798, 1.5580084323883057, 1.7045735120773315, 1.8511385917663574, 1.9977037906646729, 2.1442689895629883, 2.2908339500427246, 2.43739914894104, 2.5839643478393555, 2.730529308319092, 2.8770945072174072, 3.0236594676971436, 3.170224666595459, 3.3167896270751953, 3.4633548259735107, 3.609920024871826, 3.7564849853515625, 3.903050184249878, 4.049615383148193, 4.19618034362793, 4.342745304107666, 4.4893107414245605, 4.635875701904297, 4.782440662384033, 4.929006099700928, 5.075571060180664]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 16.0, 19.0, 31.0, 39.0, 76.0, 99.0, 154.0, 227.0, 352.0, 539.0, 796.0, 1295.0, 1919.0, 2953.0, 4726.0, 7163.0, 11233.0, 17176.0, 26680.0, 40126.0, 58488.0, 82887.0, 108401.0, 127656.0, 131114.0, 118378.0, 94883.0, 69800.0, 48561.0, 32503.0, 21137.0, 13791.0, 8782.0, 5722.0, 3807.0, 2408.0, 1656.0, 1032.0, 687.0, 424.0, 285.0, 173.0, 127.0, 77.0, 62.0, 36.0, 19.0, 15.0, 5.0, 10.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.76171875, -3.65185546875, -3.5419921875, -3.43212890625, -3.322265625, -3.21240234375, -3.1025390625, -2.99267578125, -2.8828125, -2.77294921875, -2.6630859375, -2.55322265625, -2.443359375, -2.33349609375, -2.2236328125, -2.11376953125, -2.00390625, -1.89404296875, -1.7841796875, -1.67431640625, -1.564453125, -1.45458984375, -1.3447265625, -1.23486328125, -1.125, -1.01513671875, -0.9052734375, -0.79541015625, -0.685546875, -0.57568359375, -0.4658203125, -0.35595703125, -0.24609375, -0.13623046875, -0.0263671875, 0.08349609375, 0.193359375, 0.30322265625, 0.4130859375, 0.52294921875, 0.6328125, 0.74267578125, 0.8525390625, 0.96240234375, 1.072265625, 1.18212890625, 1.2919921875, 1.40185546875, 1.51171875, 1.62158203125, 1.7314453125, 1.84130859375, 1.951171875, 2.06103515625, 2.1708984375, 2.28076171875, 2.390625, 2.50048828125, 2.6103515625, 2.72021484375, 2.830078125, 2.93994140625, 3.0498046875, 3.15966796875, 3.26953125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 10.0, 9.0, 17.0, 21.0, 18.0, 25.0, 48.0, 39.0, 34.0, 35.0, 36.0, 42.0, 35.0, 51.0, 53.0, 50.0, 41.0, 45.0, 32.0, 42.0, 32.0, 24.0, 33.0, 39.0, 23.0, 20.0, 19.0, 16.0, 13.0, 12.0, 17.0, 9.0, 7.0, 14.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.2835693359375, -4.137451171875, -3.9913330078125, -3.84521484375, -3.6990966796875, -3.552978515625, -3.4068603515625, -3.2607421875, -3.1146240234375, -2.968505859375, -2.8223876953125, -2.67626953125, -2.5301513671875, -2.384033203125, -2.2379150390625, -2.091796875, -1.9456787109375, -1.799560546875, -1.6534423828125, -1.50732421875, -1.3612060546875, -1.215087890625, -1.0689697265625, -0.9228515625, -0.7767333984375, -0.630615234375, -0.4844970703125, -0.33837890625, -0.1922607421875, -0.046142578125, 0.0999755859375, 0.24609375, 0.3922119140625, 0.538330078125, 0.6844482421875, 0.83056640625, 0.9766845703125, 1.122802734375, 1.2689208984375, 1.4150390625, 1.5611572265625, 1.707275390625, 1.8533935546875, 1.99951171875, 2.1456298828125, 2.291748046875, 2.4378662109375, 2.583984375, 2.7301025390625, 2.876220703125, 3.0223388671875, 3.16845703125, 3.3145751953125, 3.460693359375, 3.6068115234375, 3.7529296875, 3.8990478515625, 4.045166015625, 4.1912841796875, 4.33740234375, 4.4835205078125, 4.629638671875, 4.7757568359375, 4.921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 4.0, 6.0, 7.0, 8.0, 18.0, 26.0, 33.0, 77.0, 99.0, 142.0, 220.0, 307.0, 549.0, 767.0, 1168.0, 2005.0, 3197.0, 5069.0, 8030.0, 13053.0, 21199.0, 34063.0, 54207.0, 80869.0, 113051.0, 140179.0, 147682.0, 131324.0, 100960.0, 69943.0, 45153.0, 28328.0, 17684.0, 11034.0, 6712.0, 4079.0, 2599.0, 1741.0, 1037.0, 676.0, 406.0, 306.0, 176.0, 129.0, 73.0, 54.0, 49.0, 15.0, 14.0, 12.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0], "bins": [-3.83203125, -3.7203369140625, -3.608642578125, -3.4969482421875, -3.38525390625, -3.2735595703125, -3.161865234375, -3.0501708984375, -2.9384765625, -2.8267822265625, -2.715087890625, -2.6033935546875, -2.49169921875, -2.3800048828125, -2.268310546875, -2.1566162109375, -2.044921875, -1.9332275390625, -1.821533203125, -1.7098388671875, -1.59814453125, -1.4864501953125, -1.374755859375, -1.2630615234375, -1.1513671875, -1.0396728515625, -0.927978515625, -0.8162841796875, -0.70458984375, -0.5928955078125, -0.481201171875, -0.3695068359375, -0.2578125, -0.1461181640625, -0.034423828125, 0.0772705078125, 0.18896484375, 0.3006591796875, 0.412353515625, 0.5240478515625, 0.6357421875, 0.7474365234375, 0.859130859375, 0.9708251953125, 1.08251953125, 1.1942138671875, 1.305908203125, 1.4176025390625, 1.529296875, 1.6409912109375, 1.752685546875, 1.8643798828125, 1.97607421875, 2.0877685546875, 2.199462890625, 2.3111572265625, 2.4228515625, 2.5345458984375, 2.646240234375, 2.7579345703125, 2.86962890625, 2.9813232421875, 3.093017578125, 3.2047119140625, 3.31640625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 9.0, 4.0, 6.0, 5.0, 8.0, 9.0, 17.0, 12.0, 8.0, 18.0, 20.0, 32.0, 28.0, 27.0, 45.0, 33.0, 27.0, 29.0, 35.0, 45.0, 43.0, 50.0, 36.0, 41.0, 55.0, 39.0, 44.0, 32.0, 29.0, 26.0, 31.0, 24.0, 24.0, 23.0, 15.0, 10.0, 15.0, 10.0, 7.0, 9.0, 6.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0], "bins": [-4.33203125, -4.212890625, -4.09375, -3.974609375, -3.85546875, -3.736328125, -3.6171875, -3.498046875, -3.37890625, -3.259765625, -3.140625, -3.021484375, -2.90234375, -2.783203125, -2.6640625, -2.544921875, -2.42578125, -2.306640625, -2.1875, -2.068359375, -1.94921875, -1.830078125, -1.7109375, -1.591796875, -1.47265625, -1.353515625, -1.234375, -1.115234375, -0.99609375, -0.876953125, -0.7578125, -0.638671875, -0.51953125, -0.400390625, -0.28125, -0.162109375, -0.04296875, 0.076171875, 0.1953125, 0.314453125, 0.43359375, 0.552734375, 0.671875, 0.791015625, 0.91015625, 1.029296875, 1.1484375, 1.267578125, 1.38671875, 1.505859375, 1.625, 1.744140625, 1.86328125, 1.982421875, 2.1015625, 2.220703125, 2.33984375, 2.458984375, 2.578125, 2.697265625, 2.81640625, 2.935546875, 3.0546875, 3.173828125, 3.29296875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 17.0, 25.0, 27.0, 45.0, 72.0, 115.0, 161.0, 238.0, 433.0, 642.0, 1093.0, 1968.0, 3548.0, 7078.0, 15768.0, 40082.0, 113649.0, 311182.0, 338553.0, 133093.0, 46091.0, 17663.0, 7941.0, 3892.0, 2098.0, 1194.0, 708.0, 431.0, 267.0, 152.0, 112.0, 55.0, 39.0, 34.0, 25.0, 15.0, 11.0, 12.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.0390625, -8.78131103515625, -8.5235595703125, -8.26580810546875, -8.008056640625, -7.75030517578125, -7.4925537109375, -7.23480224609375, -6.97705078125, -6.71929931640625, -6.4615478515625, -6.20379638671875, -5.946044921875, -5.68829345703125, -5.4305419921875, -5.17279052734375, -4.9150390625, -4.65728759765625, -4.3995361328125, -4.14178466796875, -3.884033203125, -3.62628173828125, -3.3685302734375, -3.11077880859375, -2.85302734375, -2.59527587890625, -2.3375244140625, -2.07977294921875, -1.822021484375, -1.56427001953125, -1.3065185546875, -1.04876708984375, -0.791015625, -0.53326416015625, -0.2755126953125, -0.01776123046875, 0.239990234375, 0.49774169921875, 0.7554931640625, 1.01324462890625, 1.27099609375, 1.52874755859375, 1.7864990234375, 2.04425048828125, 2.302001953125, 2.55975341796875, 2.8175048828125, 3.07525634765625, 3.3330078125, 3.59075927734375, 3.8485107421875, 4.10626220703125, 4.364013671875, 4.62176513671875, 4.8795166015625, 5.13726806640625, 5.39501953125, 5.65277099609375, 5.9105224609375, 6.16827392578125, 6.426025390625, 6.68377685546875, 6.9415283203125, 7.19927978515625, 7.45703125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 3.0, 12.0, 8.0, 21.0, 15.0, 26.0, 31.0, 33.0, 47.0, 50.0, 54.0, 61.0, 60.0, 81.0, 68.0, 73.0, 67.0, 71.0, 52.0, 45.0, 28.0, 23.0, 22.0, 14.0, 13.0, 6.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.000514984130859375, -0.0005029588937759399, -0.0004909336566925049, -0.0004789084196090698, -0.00046688318252563477, -0.0004548579454421997, -0.00044283270835876465, -0.0004308074712753296, -0.00041878223419189453, -0.00040675699710845947, -0.0003947317600250244, -0.00038270652294158936, -0.0003706812858581543, -0.00035865604877471924, -0.0003466308116912842, -0.0003346055746078491, -0.00032258033752441406, -0.000310555100440979, -0.00029852986335754395, -0.0002865046262741089, -0.00027447938919067383, -0.00026245415210723877, -0.0002504289150238037, -0.00023840367794036865, -0.0002263784408569336, -0.00021435320377349854, -0.00020232796669006348, -0.00019030272960662842, -0.00017827749252319336, -0.0001662522554397583, -0.00015422701835632324, -0.00014220178127288818, -0.00013017654418945312, -0.00011815130710601807, -0.00010612607002258301, -9.410083293914795e-05, -8.207559585571289e-05, -7.005035877227783e-05, -5.8025121688842773e-05, -4.5999884605407715e-05, -3.3974647521972656e-05, -2.1949410438537598e-05, -9.924173355102539e-06, 2.1010637283325195e-06, 1.4126300811767578e-05, 2.6151537895202637e-05, 3.8176774978637695e-05, 5.0202012062072754e-05, 6.222724914550781e-05, 7.425248622894287e-05, 8.627772331237793e-05, 9.830296039581299e-05, 0.00011032819747924805, 0.0001223534345626831, 0.00013437867164611816, 0.00014640390872955322, 0.00015842914581298828, 0.00017045438289642334, 0.0001824796199798584, 0.00019450485706329346, 0.00020653009414672852, 0.00021855533123016357, 0.00023058056831359863, 0.0002426058053970337, 0.00025463104248046875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 10.0, 17.0, 18.0, 23.0, 41.0, 62.0, 79.0, 117.0, 153.0, 227.0, 392.0, 591.0, 964.0, 1647.0, 3026.0, 6058.0, 13460.0, 34626.0, 99420.0, 255053.0, 342844.0, 181911.0, 64687.0, 23213.0, 9450.0, 4447.0, 2332.0, 1322.0, 811.0, 507.0, 312.0, 208.0, 149.0, 97.0, 84.0, 55.0, 48.0, 29.0, 18.0, 12.0, 10.0, 7.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0], "bins": [-7.71875, -7.506103515625, -7.29345703125, -7.080810546875, -6.8681640625, -6.655517578125, -6.44287109375, -6.230224609375, -6.017578125, -5.804931640625, -5.59228515625, -5.379638671875, -5.1669921875, -4.954345703125, -4.74169921875, -4.529052734375, -4.31640625, -4.103759765625, -3.89111328125, -3.678466796875, -3.4658203125, -3.253173828125, -3.04052734375, -2.827880859375, -2.615234375, -2.402587890625, -2.18994140625, -1.977294921875, -1.7646484375, -1.552001953125, -1.33935546875, -1.126708984375, -0.9140625, -0.701416015625, -0.48876953125, -0.276123046875, -0.0634765625, 0.149169921875, 0.36181640625, 0.574462890625, 0.787109375, 0.999755859375, 1.21240234375, 1.425048828125, 1.6376953125, 1.850341796875, 2.06298828125, 2.275634765625, 2.48828125, 2.700927734375, 2.91357421875, 3.126220703125, 3.3388671875, 3.551513671875, 3.76416015625, 3.976806640625, 4.189453125, 4.402099609375, 4.61474609375, 4.827392578125, 5.0400390625, 5.252685546875, 5.46533203125, 5.677978515625, 5.890625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 9.0, 4.0, 7.0, 4.0, 11.0, 12.0, 18.0, 25.0, 40.0, 61.0, 76.0, 108.0, 124.0, 110.0, 96.0, 82.0, 52.0, 42.0, 31.0, 18.0, 18.0, 7.0, 5.0, 6.0, 9.0, 2.0, 2.0, 1.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -3.99114990234375, -3.8533935546875, -3.71563720703125, -3.577880859375, -3.44012451171875, -3.3023681640625, -3.16461181640625, -3.02685546875, -2.88909912109375, -2.7513427734375, -2.61358642578125, -2.475830078125, -2.33807373046875, -2.2003173828125, -2.06256103515625, -1.9248046875, -1.78704833984375, -1.6492919921875, -1.51153564453125, -1.373779296875, -1.23602294921875, -1.0982666015625, -0.96051025390625, -0.82275390625, -0.68499755859375, -0.5472412109375, -0.40948486328125, -0.271728515625, -0.13397216796875, 0.0037841796875, 0.14154052734375, 0.279296875, 0.41705322265625, 0.5548095703125, 0.69256591796875, 0.830322265625, 0.96807861328125, 1.1058349609375, 1.24359130859375, 1.38134765625, 1.51910400390625, 1.6568603515625, 1.79461669921875, 1.932373046875, 2.07012939453125, 2.2078857421875, 2.34564208984375, 2.4833984375, 2.62115478515625, 2.7589111328125, 2.89666748046875, 3.034423828125, 3.17218017578125, 3.3099365234375, 3.44769287109375, 3.58544921875, 3.72320556640625, 3.8609619140625, 3.99871826171875, 4.136474609375, 4.27423095703125, 4.4119873046875, 4.54974365234375, 4.6875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 15.0, 9.0, 20.0, 21.0, 28.0, 22.0, 44.0, 51.0, 61.0, 61.0, 59.0, 61.0, 68.0, 77.0, 71.0, 60.0, 51.0, 47.0, 34.0, 20.0, 29.0, 17.0, 13.0, 14.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9219207763671875, -5.702857494354248, -5.48379373550415, -5.264730453491211, -5.0456671714782715, -4.826603889465332, -4.607540130615234, -4.388476848602295, -4.1694135665893555, -3.950350046157837, -3.7312867641448975, -3.512223243713379, -3.2931599617004395, -3.074096441268921, -2.8550329208374023, -2.635969638824463, -2.4169058799743652, -2.1978423595428467, -1.9787790775299072, -1.7597155570983887, -1.5406521558761597, -1.3215887546539307, -1.102525234222412, -0.8834618330001831, -0.6643984317779541, -0.4453350007534027, -0.22627156972885132, -0.007208108901977539, 0.21185529232025146, 0.43091869354248047, 0.649982213973999, 0.869045615196228, 1.088109016418457, 1.307172417640686, 1.526235818862915, 1.7452993392944336, 1.9643627405166626, 2.1834261417388916, 2.40248966217041, 2.6215529441833496, 2.840616464614868, 3.0596799850463867, 3.278743267059326, 3.4978067874908447, 3.7168703079223633, 3.9359335899353027, 4.154996871948242, 4.37406063079834, 4.593123912811279, 4.812187194824219, 5.031250953674316, 5.250314235687256, 5.469377517700195, 5.688441276550293, 5.907504558563232, 6.126567840576172, 6.3456315994262695, 6.564694881439209, 6.783758640289307, 7.002821922302246, 7.2218852043151855, 7.440948486328125, 7.660012245178223, 7.879075527191162, 8.098138809204102]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 5.0, 3.0, 7.0, 4.0, 7.0, 6.0, 14.0, 14.0, 12.0, 23.0, 23.0, 23.0, 27.0, 30.0, 25.0, 29.0, 35.0, 29.0, 48.0, 23.0, 58.0, 35.0, 41.0, 46.0, 43.0, 46.0, 34.0, 32.0, 24.0, 31.0, 22.0, 26.0, 26.0, 26.0, 16.0, 16.0, 21.0, 10.0, 11.0, 12.0, 7.0, 8.0, 7.0, 4.0, 4.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.201750755310059, -4.0681376457214355, -3.9345247745513916, -3.8009116649627686, -3.6672987937927246, -3.5336856842041016, -3.4000725746154785, -3.2664594650268555, -3.1328465938568115, -2.9992334842681885, -2.8656206130981445, -2.7320075035095215, -2.5983943939208984, -2.4647815227508545, -2.3311684131622314, -2.1975555419921875, -2.0639424324035645, -1.930329442024231, -1.7967164516448975, -1.6631033420562744, -1.529490351676941, -1.3958773612976074, -1.2622642517089844, -1.1286512613296509, -0.9950382709503174, -0.8614252805709839, -0.7278122305870056, -0.5941991806030273, -0.46058619022369385, -0.32697319984436035, -0.19336014986038208, -0.05974709987640381, 0.07386636734008789, 0.20747938752174377, 0.34109240770339966, 0.47470542788505554, 0.6083184480667114, 0.7419314384460449, 0.8755444884300232, 1.0091575384140015, 1.142770528793335, 1.2763835191726685, 1.409996509552002, 1.543609619140625, 1.6772226095199585, 1.810835599899292, 1.944448709487915, 2.078061580657959, 2.211674690246582, 2.345287799835205, 2.478900671005249, 2.612513780593872, 2.746126651763916, 2.879739761352539, 3.013352870941162, 3.146965980529785, 3.280578851699829, 3.414191961288452, 3.547804832458496, 3.681417942047119, 3.815031051635742, 3.948643922805786, 4.08225679397583, 4.215869903564453, 4.349483013153076]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 10.0, 12.0, 16.0, 22.0, 37.0, 59.0, 89.0, 121.0, 167.0, 238.0, 391.0, 587.0, 908.0, 1377.0, 2223.0, 3708.0, 6034.0, 10597.0, 18808.0, 35303.0, 69897.0, 148690.0, 331050.0, 717269.0, 1103106.0, 897387.0, 449642.0, 200628.0, 94093.0, 45803.0, 24388.0, 13014.0, 7266.0, 4379.0, 2643.0, 1582.0, 974.0, 599.0, 412.0, 275.0, 159.0, 113.0, 70.0, 48.0, 30.0, 18.0, 15.0, 13.0, 5.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.39453125, -5.22430419921875, -5.0540771484375, -4.88385009765625, -4.713623046875, -4.54339599609375, -4.3731689453125, -4.20294189453125, -4.03271484375, -3.86248779296875, -3.6922607421875, -3.52203369140625, -3.351806640625, -3.18157958984375, -3.0113525390625, -2.84112548828125, -2.6708984375, -2.50067138671875, -2.3304443359375, -2.16021728515625, -1.989990234375, -1.81976318359375, -1.6495361328125, -1.47930908203125, -1.30908203125, -1.13885498046875, -0.9686279296875, -0.79840087890625, -0.628173828125, -0.45794677734375, -0.2877197265625, -0.11749267578125, 0.052734375, 0.22296142578125, 0.3931884765625, 0.56341552734375, 0.733642578125, 0.90386962890625, 1.0740966796875, 1.24432373046875, 1.41455078125, 1.58477783203125, 1.7550048828125, 1.92523193359375, 2.095458984375, 2.26568603515625, 2.4359130859375, 2.60614013671875, 2.7763671875, 2.94659423828125, 3.1168212890625, 3.28704833984375, 3.457275390625, 3.62750244140625, 3.7977294921875, 3.96795654296875, 4.13818359375, 4.30841064453125, 4.4786376953125, 4.64886474609375, 4.819091796875, 4.98931884765625, 5.1595458984375, 5.32977294921875, 5.5]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 7.0, 11.0, 10.0, 13.0, 7.0, 14.0, 14.0, 21.0, 28.0, 27.0, 26.0, 31.0, 29.0, 35.0, 36.0, 28.0, 46.0, 29.0, 33.0, 40.0, 37.0, 36.0, 40.0, 33.0, 36.0, 29.0, 22.0, 29.0, 28.0, 30.0, 18.0, 16.0, 20.0, 16.0, 15.0, 23.0, 11.0, 14.0, 8.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.49609375, -2.417938232421875, -2.33978271484375, -2.261627197265625, -2.1834716796875, -2.105316162109375, -2.02716064453125, -1.949005126953125, -1.870849609375, -1.792694091796875, -1.71453857421875, -1.636383056640625, -1.5582275390625, -1.480072021484375, -1.40191650390625, -1.323760986328125, -1.24560546875, -1.167449951171875, -1.08929443359375, -1.011138916015625, -0.9329833984375, -0.854827880859375, -0.77667236328125, -0.698516845703125, -0.620361328125, -0.542205810546875, -0.46405029296875, -0.385894775390625, -0.3077392578125, -0.229583740234375, -0.15142822265625, -0.073272705078125, 0.0048828125, 0.083038330078125, 0.16119384765625, 0.239349365234375, 0.3175048828125, 0.395660400390625, 0.47381591796875, 0.551971435546875, 0.630126953125, 0.708282470703125, 0.78643798828125, 0.864593505859375, 0.9427490234375, 1.020904541015625, 1.09906005859375, 1.177215576171875, 1.25537109375, 1.333526611328125, 1.41168212890625, 1.489837646484375, 1.5679931640625, 1.646148681640625, 1.72430419921875, 1.802459716796875, 1.880615234375, 1.958770751953125, 2.03692626953125, 2.115081787109375, 2.1932373046875, 2.271392822265625, 2.34954833984375, 2.427703857421875, 2.505859375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 5.0, 12.0, 9.0, 20.0, 22.0, 38.0, 46.0, 54.0, 99.0, 161.0, 229.0, 346.0, 554.0, 899.0, 1479.0, 2338.0, 3986.0, 6904.0, 11790.0, 20967.0, 37055.0, 67625.0, 127072.0, 240662.0, 446529.0, 745203.0, 907245.0, 695983.0, 405284.0, 215979.0, 114646.0, 61573.0, 33689.0, 18992.0, 10794.0, 6277.0, 3759.0, 2219.0, 1406.0, 789.0, 553.0, 343.0, 220.0, 113.0, 98.0, 77.0, 48.0, 21.0, 14.0, 16.0, 11.0, 8.0, 9.0, 6.0, 7.0, 1.0, 4.0], "bins": [-5.015625, -4.86553955078125, -4.7154541015625, -4.56536865234375, -4.415283203125, -4.26519775390625, -4.1151123046875, -3.96502685546875, -3.81494140625, -3.66485595703125, -3.5147705078125, -3.36468505859375, -3.214599609375, -3.06451416015625, -2.9144287109375, -2.76434326171875, -2.6142578125, -2.46417236328125, -2.3140869140625, -2.16400146484375, -2.013916015625, -1.86383056640625, -1.7137451171875, -1.56365966796875, -1.41357421875, -1.26348876953125, -1.1134033203125, -0.96331787109375, -0.813232421875, -0.66314697265625, -0.5130615234375, -0.36297607421875, -0.212890625, -0.06280517578125, 0.0872802734375, 0.23736572265625, 0.387451171875, 0.53753662109375, 0.6876220703125, 0.83770751953125, 0.98779296875, 1.13787841796875, 1.2879638671875, 1.43804931640625, 1.588134765625, 1.73822021484375, 1.8883056640625, 2.03839111328125, 2.1884765625, 2.33856201171875, 2.4886474609375, 2.63873291015625, 2.788818359375, 2.93890380859375, 3.0889892578125, 3.23907470703125, 3.38916015625, 3.53924560546875, 3.6893310546875, 3.83941650390625, 3.989501953125, 4.13958740234375, 4.2896728515625, 4.43975830078125, 4.58984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 8.0, 6.0, 4.0, 8.0, 15.0, 18.0, 18.0, 27.0, 50.0, 43.0, 51.0, 65.0, 76.0, 93.0, 90.0, 140.0, 177.0, 189.0, 201.0, 259.0, 242.0, 290.0, 265.0, 240.0, 219.0, 193.0, 201.0, 164.0, 132.0, 123.0, 101.0, 73.0, 74.0, 56.0, 44.0, 31.0, 27.0, 17.0, 18.0, 10.0, 4.0, 5.0, 9.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4921875, -1.444854736328125, -1.39752197265625, -1.350189208984375, -1.3028564453125, -1.255523681640625, -1.20819091796875, -1.160858154296875, -1.113525390625, -1.066192626953125, -1.01885986328125, -0.971527099609375, -0.9241943359375, -0.876861572265625, -0.82952880859375, -0.782196044921875, -0.73486328125, -0.687530517578125, -0.64019775390625, -0.592864990234375, -0.5455322265625, -0.498199462890625, -0.45086669921875, -0.403533935546875, -0.356201171875, -0.308868408203125, -0.26153564453125, -0.214202880859375, -0.1668701171875, -0.119537353515625, -0.07220458984375, -0.024871826171875, 0.0224609375, 0.069793701171875, 0.11712646484375, 0.164459228515625, 0.2117919921875, 0.259124755859375, 0.30645751953125, 0.353790283203125, 0.401123046875, 0.448455810546875, 0.49578857421875, 0.543121337890625, 0.5904541015625, 0.637786865234375, 0.68511962890625, 0.732452392578125, 0.77978515625, 0.827117919921875, 0.87445068359375, 0.921783447265625, 0.9691162109375, 1.016448974609375, 1.06378173828125, 1.111114501953125, 1.158447265625, 1.205780029296875, 1.25311279296875, 1.300445556640625, 1.3477783203125, 1.395111083984375, 1.44244384765625, 1.489776611328125, 1.537109375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 8.0, 14.0, 15.0, 27.0, 36.0, 30.0, 42.0, 55.0, 63.0, 65.0, 84.0, 81.0, 68.0, 54.0, 62.0, 52.0, 38.0, 35.0, 31.0, 29.0, 21.0, 15.0, 16.0, 15.0, 11.0, 3.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.318307876586914, -5.1266021728515625, -4.934896469116211, -4.743190765380859, -4.55148458480835, -4.359778881072998, -4.1680731773376465, -3.976367473602295, -3.7846615314483643, -3.5929558277130127, -3.401249885559082, -3.2095441818237305, -3.017838478088379, -2.8261325359344482, -2.6344268321990967, -2.442720890045166, -2.2510151863098145, -2.059309482574463, -1.8676035404205322, -1.6758978366851807, -1.4841920137405396, -1.2924861907958984, -1.1007804870605469, -0.9090746641159058, -0.7173688411712646, -0.5256630182266235, -0.3339572548866272, -0.14225149154663086, 0.049454331398010254, 0.24116015434265137, 0.43286585807800293, 0.624571681022644, 0.8162775039672852, 1.0079833269119263, 1.1996891498565674, 1.391394853591919, 1.58310067653656, 1.7748064994812012, 1.9665122032165527, 2.1582179069519043, 2.349923849105835, 2.5416295528411865, 2.733335494995117, 2.9250411987304688, 3.1167469024658203, 3.308452844619751, 3.5001585483551025, 3.691864490509033, 3.8835701942443848, 4.075275897979736, 4.266981601715088, 4.458687782287598, 4.650393486022949, 4.842099189758301, 5.033804893493652, 5.225510597229004, 5.4172163009643555, 5.608922004699707, 5.800627708435059, 5.99233341217041, 6.18403959274292, 6.3757452964782715, 6.567451000213623, 6.759156703948975, 6.950862884521484]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 2.0, 8.0, 5.0, 7.0, 19.0, 11.0, 18.0, 12.0, 20.0, 17.0, 32.0, 34.0, 19.0, 28.0, 31.0, 32.0, 42.0, 29.0, 37.0, 24.0, 45.0, 36.0, 24.0, 33.0, 36.0, 37.0, 43.0, 32.0, 34.0, 23.0, 28.0, 20.0, 21.0, 15.0, 24.0, 19.0, 11.0, 15.0, 9.0, 10.0, 12.0, 5.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.2040908336639404, -3.1065220832824707, -3.008953332901001, -2.9113845825195312, -2.8138160705566406, -2.716247320175171, -2.618678569793701, -2.5211098194122314, -2.4235410690307617, -2.325972318649292, -2.2284035682678223, -2.1308350563049316, -2.033266305923462, -1.9356975555419922, -1.8381288051605225, -1.7405600547790527, -1.642991542816162, -1.5454227924346924, -1.4478541612625122, -1.3502854108810425, -1.2527167797088623, -1.1551480293273926, -1.0575792789459229, -0.9600105881690979, -0.862441897392273, -0.764873206615448, -0.667304515838623, -0.5697357654571533, -0.47216707468032837, -0.3745983839035034, -0.2770296335220337, -0.17946094274520874, -0.08189201354980469, 0.015676692128181458, 0.1132453978061676, 0.21081411838531494, 0.3083828091621399, 0.40595149993896484, 0.5035202503204346, 0.6010889410972595, 0.6986576318740845, 0.7962263226509094, 0.8937950134277344, 0.9913637638092041, 1.0889325141906738, 1.186501145362854, 1.2840698957443237, 1.381638526916504, 1.4792072772979736, 1.5767760276794434, 1.6743446588516235, 1.7719134092330933, 1.8694820404052734, 1.9670507907867432, 2.064619541168213, 2.1621882915496826, 2.2597570419311523, 2.357325792312622, 2.454894542694092, 2.5524630546569824, 2.650031805038452, 2.747600555419922, 2.8451693058013916, 2.9427380561828613, 3.040306568145752]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 26.0, 19.0, 39.0, 73.0, 119.0, 184.0, 316.0, 499.0, 846.0, 1528.0, 2853.0, 5200.0, 9820.0, 19282.0, 39256.0, 78906.0, 152554.0, 239338.0, 225355.0, 134413.0, 68508.0, 33800.0, 16820.0, 8670.0, 4400.0, 2448.0, 1355.0, 768.0, 458.0, 257.0, 138.0, 92.0, 68.0, 50.0, 24.0, 18.0, 11.0, 13.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92333984375, -0.8952713012695312, -0.8672027587890625, -0.8391342163085938, -0.811065673828125, -0.7829971313476562, -0.7549285888671875, -0.7268600463867188, -0.69879150390625, -0.6707229614257812, -0.6426544189453125, -0.6145858764648438, -0.586517333984375, -0.5584487915039062, -0.5303802490234375, -0.5023117065429688, -0.4742431640625, -0.44617462158203125, -0.4181060791015625, -0.39003753662109375, -0.361968994140625, -0.33390045166015625, -0.3058319091796875, -0.27776336669921875, -0.24969482421875, -0.22162628173828125, -0.1935577392578125, -0.16548919677734375, -0.137420654296875, -0.10935211181640625, -0.0812835693359375, -0.05321502685546875, -0.025146484375, 0.00292205810546875, 0.0309906005859375, 0.05905914306640625, 0.087127685546875, 0.11519622802734375, 0.1432647705078125, 0.17133331298828125, 0.19940185546875, 0.22747039794921875, 0.2555389404296875, 0.28360748291015625, 0.311676025390625, 0.33974456787109375, 0.3678131103515625, 0.39588165283203125, 0.4239501953125, 0.45201873779296875, 0.4800872802734375, 0.5081558227539062, 0.536224365234375, 0.5642929077148438, 0.5923614501953125, 0.6204299926757812, 0.64849853515625, 0.6765670776367188, 0.7046356201171875, 0.7327041625976562, 0.760772705078125, 0.7888412475585938, 0.8169097900390625, 0.8449783325195312, 0.873046875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 9.0, 9.0, 11.0, 13.0, 17.0, 28.0, 19.0, 10.0, 23.0, 20.0, 20.0, 37.0, 40.0, 31.0, 33.0, 22.0, 32.0, 38.0, 34.0, 34.0, 40.0, 31.0, 40.0, 27.0, 34.0, 36.0, 23.0, 34.0, 23.0, 39.0, 20.0, 30.0, 23.0, 8.0, 14.0, 11.0, 16.0, 5.0, 12.0, 12.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.197265625, -3.09100341796875, -2.9847412109375, -2.87847900390625, -2.772216796875, -2.66595458984375, -2.5596923828125, -2.45343017578125, -2.34716796875, -2.24090576171875, -2.1346435546875, -2.02838134765625, -1.922119140625, -1.81585693359375, -1.7095947265625, -1.60333251953125, -1.4970703125, -1.39080810546875, -1.2845458984375, -1.17828369140625, -1.072021484375, -0.96575927734375, -0.8594970703125, -0.75323486328125, -0.64697265625, -0.54071044921875, -0.4344482421875, -0.32818603515625, -0.221923828125, -0.11566162109375, -0.0093994140625, 0.09686279296875, 0.203125, 0.30938720703125, 0.4156494140625, 0.52191162109375, 0.628173828125, 0.73443603515625, 0.8406982421875, 0.94696044921875, 1.05322265625, 1.15948486328125, 1.2657470703125, 1.37200927734375, 1.478271484375, 1.58453369140625, 1.6907958984375, 1.79705810546875, 1.9033203125, 2.00958251953125, 2.1158447265625, 2.22210693359375, 2.328369140625, 2.43463134765625, 2.5408935546875, 2.64715576171875, 2.75341796875, 2.85968017578125, 2.9659423828125, 3.07220458984375, 3.178466796875, 3.28472900390625, 3.3909912109375, 3.49725341796875, 3.603515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 12.0, 11.0, 13.0, 11.0, 27.0, 27.0, 41.0, 62.0, 87.0, 120.0, 204.0, 284.0, 429.0, 727.0, 1165.0, 2045.0, 4039.0, 8765.0, 21462.0, 107276.0, 835929.0, 39045.0, 13580.0, 6064.0, 2930.0, 1614.0, 955.0, 513.0, 345.0, 222.0, 142.0, 117.0, 80.0, 54.0, 32.0, 34.0, 34.0, 16.0, 11.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-2.708984375, -2.632171630859375, -2.55535888671875, -2.478546142578125, -2.4017333984375, -2.324920654296875, -2.24810791015625, -2.171295166015625, -2.094482421875, -2.017669677734375, -1.94085693359375, -1.864044189453125, -1.7872314453125, -1.710418701171875, -1.63360595703125, -1.556793212890625, -1.47998046875, -1.403167724609375, -1.32635498046875, -1.249542236328125, -1.1727294921875, -1.095916748046875, -1.01910400390625, -0.942291259765625, -0.865478515625, -0.788665771484375, -0.71185302734375, -0.635040283203125, -0.5582275390625, -0.481414794921875, -0.40460205078125, -0.327789306640625, -0.2509765625, -0.174163818359375, -0.09735107421875, -0.020538330078125, 0.0562744140625, 0.133087158203125, 0.20989990234375, 0.286712646484375, 0.363525390625, 0.440338134765625, 0.51715087890625, 0.593963623046875, 0.6707763671875, 0.747589111328125, 0.82440185546875, 0.901214599609375, 0.97802734375, 1.054840087890625, 1.13165283203125, 1.208465576171875, 1.2852783203125, 1.362091064453125, 1.43890380859375, 1.515716552734375, 1.592529296875, 1.669342041015625, 1.74615478515625, 1.822967529296875, 1.8997802734375, 1.976593017578125, 2.05340576171875, 2.130218505859375, 2.20703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 7.0, 6.0, 10.0, 10.0, 8.0, 17.0, 18.0, 20.0, 19.0, 24.0, 32.0, 36.0, 40.0, 42.0, 41.0, 39.0, 55.0, 49.0, 45.0, 47.0, 49.0, 50.0, 40.0, 44.0, 37.0, 36.0, 30.0, 34.0, 13.0, 20.0, 10.0, 16.0, 16.0, 11.0, 4.0, 5.0, 2.0, 9.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.467315673828125, -4.33306884765625, -4.198822021484375, -4.0645751953125, -3.930328369140625, -3.79608154296875, -3.661834716796875, -3.527587890625, -3.393341064453125, -3.25909423828125, -3.124847412109375, -2.9906005859375, -2.856353759765625, -2.72210693359375, -2.587860107421875, -2.45361328125, -2.319366455078125, -2.18511962890625, -2.050872802734375, -1.9166259765625, -1.782379150390625, -1.64813232421875, -1.513885498046875, -1.379638671875, -1.245391845703125, -1.11114501953125, -0.976898193359375, -0.8426513671875, -0.708404541015625, -0.57415771484375, -0.439910888671875, -0.3056640625, -0.171417236328125, -0.03717041015625, 0.097076416015625, 0.2313232421875, 0.365570068359375, 0.49981689453125, 0.634063720703125, 0.768310546875, 0.902557373046875, 1.03680419921875, 1.171051025390625, 1.3052978515625, 1.439544677734375, 1.57379150390625, 1.708038330078125, 1.84228515625, 1.976531982421875, 2.11077880859375, 2.245025634765625, 2.3792724609375, 2.513519287109375, 2.64776611328125, 2.782012939453125, 2.916259765625, 3.050506591796875, 3.18475341796875, 3.319000244140625, 3.4532470703125, 3.587493896484375, 3.72174072265625, 3.855987548828125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 10.0, 9.0, 15.0, 24.0, 29.0, 34.0, 46.0, 76.0, 119.0, 184.0, 270.0, 432.0, 632.0, 942.0, 1477.0, 2401.0, 3956.0, 6728.0, 12622.0, 28406.0, 787769.0, 152518.0, 22975.0, 10927.0, 5982.0, 3704.0, 2201.0, 1322.0, 894.0, 617.0, 397.0, 280.0, 168.0, 117.0, 87.0, 48.0, 35.0, 32.0, 27.0, 14.0, 9.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -1.0016326904296875, -0.968109130859375, -0.9345855712890625, -0.90106201171875, -0.8675384521484375, -0.834014892578125, -0.8004913330078125, -0.7669677734375, -0.7334442138671875, -0.699920654296875, -0.6663970947265625, -0.63287353515625, -0.5993499755859375, -0.565826416015625, -0.5323028564453125, -0.498779296875, -0.4652557373046875, -0.431732177734375, -0.3982086181640625, -0.36468505859375, -0.3311614990234375, -0.297637939453125, -0.2641143798828125, -0.2305908203125, -0.1970672607421875, -0.163543701171875, -0.1300201416015625, -0.09649658203125, -0.0629730224609375, -0.029449462890625, 0.0040740966796875, 0.03759765625, 0.0711212158203125, 0.104644775390625, 0.1381683349609375, 0.17169189453125, 0.2052154541015625, 0.238739013671875, 0.2722625732421875, 0.3057861328125, 0.3393096923828125, 0.372833251953125, 0.4063568115234375, 0.43988037109375, 0.4734039306640625, 0.506927490234375, 0.5404510498046875, 0.573974609375, 0.6074981689453125, 0.641021728515625, 0.6745452880859375, 0.70806884765625, 0.7415924072265625, 0.775115966796875, 0.8086395263671875, 0.8421630859375, 0.8756866455078125, 0.909210205078125, 0.9427337646484375, 0.97625732421875, 1.0097808837890625, 1.043304443359375, 1.0768280029296875, 1.1103515625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 1.0, 4.0, 6.0, 5.0, 6.0, 4.0, 12.0, 15.0, 24.0, 38.0, 66.0, 93.0, 110.0, 115.0, 130.0, 110.0, 95.0, 52.0, 37.0, 24.0, 14.0, 7.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.7738037109375e-05, -8.535012602806091e-05, -8.296221494674683e-05, -8.057430386543274e-05, -7.818639278411865e-05, -7.579848170280457e-05, -7.341057062149048e-05, -7.102265954017639e-05, -6.86347484588623e-05, -6.624683737754822e-05, -6.385892629623413e-05, -6.147101521492004e-05, -5.908310413360596e-05, -5.669519305229187e-05, -5.430728197097778e-05, -5.1919370889663696e-05, -4.953145980834961e-05, -4.714354872703552e-05, -4.4755637645721436e-05, -4.236772656440735e-05, -3.997981548309326e-05, -3.7591904401779175e-05, -3.520399332046509e-05, -3.2816082239151e-05, -3.0428171157836914e-05, -2.8040260076522827e-05, -2.565234899520874e-05, -2.3264437913894653e-05, -2.0876526832580566e-05, -1.848861575126648e-05, -1.6100704669952393e-05, -1.3712793588638306e-05, -1.1324882507324219e-05, -8.936971426010132e-06, -6.549060344696045e-06, -4.161149263381958e-06, -1.773238182067871e-06, 6.146728992462158e-07, 3.0025839805603027e-06, 5.39049506187439e-06, 7.778406143188477e-06, 1.0166317224502563e-05, 1.255422830581665e-05, 1.4942139387130737e-05, 1.7330050468444824e-05, 1.971796154975891e-05, 2.2105872631072998e-05, 2.4493783712387085e-05, 2.6881694793701172e-05, 2.926960587501526e-05, 3.1657516956329346e-05, 3.404542803764343e-05, 3.643333911895752e-05, 3.8821250200271606e-05, 4.120916128158569e-05, 4.359707236289978e-05, 4.598498344421387e-05, 4.8372894525527954e-05, 5.076080560684204e-05, 5.314871668815613e-05, 5.5536627769470215e-05, 5.79245388507843e-05, 6.031244993209839e-05, 6.270036101341248e-05, 6.508827209472656e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 8.0, 9.0, 14.0, 18.0, 19.0, 27.0, 50.0, 61.0, 84.0, 105.0, 184.0, 228.0, 347.0, 530.0, 720.0, 1107.0, 1709.0, 2713.0, 4352.0, 7331.0, 12446.0, 22368.0, 42006.0, 84907.0, 178772.0, 292808.0, 197128.0, 93713.0, 46410.0, 24195.0, 13353.0, 7757.0, 4615.0, 2877.0, 1828.0, 1177.0, 766.0, 532.0, 375.0, 269.0, 177.0, 120.0, 90.0, 74.0, 51.0, 42.0, 28.0, 9.0, 17.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0], "bins": [-0.356689453125, -0.34539031982421875, -0.3340911865234375, -0.32279205322265625, -0.311492919921875, -0.30019378662109375, -0.2888946533203125, -0.27759552001953125, -0.26629638671875, -0.25499725341796875, -0.2436981201171875, -0.23239898681640625, -0.221099853515625, -0.20980072021484375, -0.1985015869140625, -0.18720245361328125, -0.1759033203125, -0.16460418701171875, -0.1533050537109375, -0.14200592041015625, -0.130706787109375, -0.11940765380859375, -0.1081085205078125, -0.09680938720703125, -0.08551025390625, -0.07421112060546875, -0.0629119873046875, -0.05161285400390625, -0.040313720703125, -0.02901458740234375, -0.0177154541015625, -0.00641632080078125, 0.0048828125, 0.01618194580078125, 0.0274810791015625, 0.03878021240234375, 0.050079345703125, 0.06137847900390625, 0.0726776123046875, 0.08397674560546875, 0.09527587890625, 0.10657501220703125, 0.1178741455078125, 0.12917327880859375, 0.140472412109375, 0.15177154541015625, 0.1630706787109375, 0.17436981201171875, 0.1856689453125, 0.19696807861328125, 0.2082672119140625, 0.21956634521484375, 0.230865478515625, 0.24216461181640625, 0.2534637451171875, 0.26476287841796875, 0.27606201171875, 0.28736114501953125, 0.2986602783203125, 0.30995941162109375, 0.321258544921875, 0.33255767822265625, 0.3438568115234375, 0.35515594482421875, 0.366455078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 9.0, 7.0, 12.0, 13.0, 32.0, 21.0, 23.0, 38.0, 30.0, 56.0, 76.0, 85.0, 85.0, 89.0, 64.0, 69.0, 43.0, 34.0, 27.0, 28.0, 26.0, 28.0, 17.0, 13.0, 5.0, 7.0, 8.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24890899658203125, -0.2402496337890625, -0.23159027099609375, -0.222930908203125, -0.21427154541015625, -0.2056121826171875, -0.19695281982421875, -0.18829345703125, -0.17963409423828125, -0.1709747314453125, -0.16231536865234375, -0.153656005859375, -0.14499664306640625, -0.1363372802734375, -0.12767791748046875, -0.1190185546875, -0.11035919189453125, -0.1016998291015625, -0.09304046630859375, -0.084381103515625, -0.07572174072265625, -0.0670623779296875, -0.05840301513671875, -0.04974365234375, -0.04108428955078125, -0.0324249267578125, -0.02376556396484375, -0.015106201171875, -0.00644683837890625, 0.0022125244140625, 0.01087188720703125, 0.01953125, 0.02819061279296875, 0.0368499755859375, 0.04550933837890625, 0.054168701171875, 0.06282806396484375, 0.0714874267578125, 0.08014678955078125, 0.08880615234375, 0.09746551513671875, 0.1061248779296875, 0.11478424072265625, 0.123443603515625, 0.13210296630859375, 0.1407623291015625, 0.14942169189453125, 0.1580810546875, 0.16674041748046875, 0.1753997802734375, 0.18405914306640625, 0.192718505859375, 0.20137786865234375, 0.2100372314453125, 0.21869659423828125, 0.22735595703125, 0.23601531982421875, 0.2446746826171875, 0.25333404541015625, 0.261993408203125, 0.27065277099609375, 0.2793121337890625, 0.28797149658203125, 0.296630859375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 16.0, 14.0, 20.0, 28.0, 37.0, 32.0, 55.0, 52.0, 71.0, 84.0, 64.0, 84.0, 53.0, 65.0, 56.0, 40.0, 37.0, 39.0, 27.0, 21.0, 23.0, 10.0, 17.0, 13.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.360625743865967, -5.171506881713867, -4.982387542724609, -4.79326868057251, -4.60414981842041, -4.4150309562683105, -4.225912094116211, -4.036792755126953, -3.8476738929748535, -3.658555030822754, -3.469435930252075, -3.2803168296813965, -3.091197967529297, -2.9020791053771973, -2.7129600048065186, -2.52384090423584, -2.3347220420837402, -2.1456031799316406, -1.956484079360962, -1.7673650979995728, -1.5782461166381836, -1.3891271352767944, -1.2000081539154053, -1.0108891725540161, -0.821770191192627, -0.6326512098312378, -0.44353222846984863, -0.2544132471084595, -0.06529426574707031, 0.12382471561431885, 0.312943696975708, 0.5020626783370972, 0.6911821365356445, 0.8803011178970337, 1.0694200992584229, 1.258539080619812, 1.4476580619812012, 1.6367770433425903, 1.8258960247039795, 2.015015125274658, 2.204133987426758, 2.3932528495788574, 2.582371950149536, 2.771491050720215, 2.9606099128723145, 3.149728775024414, 3.3388478755950928, 3.5279669761657715, 3.717085838317871, 3.9062047004699707, 4.09532356262207, 4.284442901611328, 4.473561763763428, 4.662680625915527, 4.851799964904785, 5.040918827056885, 5.230037689208984, 5.419156551361084, 5.608275413513184, 5.797394752502441, 5.986513614654541, 6.175632476806641, 6.364751815795898, 6.553870677947998, 6.742989540100098]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 2.0, 8.0, 5.0, 7.0, 10.0, 12.0, 16.0, 11.0, 24.0, 20.0, 27.0, 23.0, 33.0, 31.0, 21.0, 35.0, 31.0, 31.0, 25.0, 35.0, 44.0, 32.0, 35.0, 34.0, 28.0, 37.0, 38.0, 36.0, 36.0, 34.0, 19.0, 24.0, 28.0, 19.0, 21.0, 16.0, 18.0, 12.0, 14.0, 6.0, 14.0, 10.0, 3.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 3.0, 1.0, 2.0], "bins": [-3.0880866050720215, -2.992785692214966, -2.8974850177764893, -2.8021841049194336, -2.706883192062378, -2.6115822792053223, -2.5162816047668457, -2.42098069190979, -2.3256797790527344, -2.2303788661956787, -2.135078191757202, -2.0397772789001465, -1.9444763660430908, -1.8491755723953247, -1.7538747787475586, -1.658573865890503, -1.5632731914520264, -1.4679723978042603, -1.3726714849472046, -1.2773706912994385, -1.1820697784423828, -1.0867689847946167, -0.9914681911468506, -0.8961673378944397, -0.8008664846420288, -0.7055656313896179, -0.610264778137207, -0.5149639844894409, -0.41966313123703003, -0.32436227798461914, -0.22906148433685303, -0.13376063108444214, -0.03845977783203125, 0.056841060519218445, 0.15214189887046814, 0.24744272232055664, 0.34274357557296753, 0.4380444288253784, 0.5333452224731445, 0.6286460757255554, 0.7239469289779663, 0.8192477822303772, 0.9145486354827881, 1.0098494291305542, 1.1051502227783203, 1.200451135635376, 1.295751929283142, 1.3910527229309082, 1.4863536357879639, 1.58165442943573, 1.6769553422927856, 1.7722561359405518, 1.8675570487976074, 1.9628578424453735, 2.0581586360931396, 2.1534595489501953, 2.248760223388672, 2.3440611362457275, 2.439361810684204, 2.5346627235412598, 2.6299636363983154, 2.725264549255371, 2.8205652236938477, 2.9158661365509033, 3.011167049407959]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 6.0, 11.0, 13.0, 22.0, 22.0, 47.0, 81.0, 110.0, 171.0, 302.0, 524.0, 936.0, 1580.0, 3029.0, 5480.0, 10103.0, 19143.0, 35976.0, 65418.0, 112024.0, 165511.0, 192244.0, 169839.0, 116472.0, 68522.0, 37525.0, 19848.0, 10635.0, 5743.0, 3177.0, 1670.0, 959.0, 541.0, 312.0, 188.0, 136.0, 87.0, 47.0, 32.0, 23.0, 13.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.2421875, -4.09857177734375, -3.9549560546875, -3.81134033203125, -3.667724609375, -3.52410888671875, -3.3804931640625, -3.23687744140625, -3.09326171875, -2.94964599609375, -2.8060302734375, -2.66241455078125, -2.518798828125, -2.37518310546875, -2.2315673828125, -2.08795166015625, -1.9443359375, -1.80072021484375, -1.6571044921875, -1.51348876953125, -1.369873046875, -1.22625732421875, -1.0826416015625, -0.93902587890625, -0.79541015625, -0.65179443359375, -0.5081787109375, -0.36456298828125, -0.220947265625, -0.07733154296875, 0.0662841796875, 0.20989990234375, 0.353515625, 0.49713134765625, 0.6407470703125, 0.78436279296875, 0.927978515625, 1.07159423828125, 1.2152099609375, 1.35882568359375, 1.50244140625, 1.64605712890625, 1.7896728515625, 1.93328857421875, 2.076904296875, 2.22052001953125, 2.3641357421875, 2.50775146484375, 2.6513671875, 2.79498291015625, 2.9385986328125, 3.08221435546875, 3.225830078125, 3.36944580078125, 3.5130615234375, 3.65667724609375, 3.80029296875, 3.94390869140625, 4.0875244140625, 4.23114013671875, 4.374755859375, 4.51837158203125, 4.6619873046875, 4.80560302734375, 4.94921875]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 6.0, 12.0, 7.0, 17.0, 12.0, 22.0, 19.0, 22.0, 19.0, 28.0, 37.0, 29.0, 34.0, 47.0, 46.0, 32.0, 40.0, 34.0, 34.0, 40.0, 48.0, 40.0, 42.0, 46.0, 37.0, 41.0, 24.0, 25.0, 22.0, 20.0, 20.0, 19.0, 12.0, 15.0, 9.0, 6.0, 10.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.125, -3.00823974609375, -2.8914794921875, -2.77471923828125, -2.657958984375, -2.54119873046875, -2.4244384765625, -2.30767822265625, -2.19091796875, -2.07415771484375, -1.9573974609375, -1.84063720703125, -1.723876953125, -1.60711669921875, -1.4903564453125, -1.37359619140625, -1.2568359375, -1.14007568359375, -1.0233154296875, -0.90655517578125, -0.789794921875, -0.67303466796875, -0.5562744140625, -0.43951416015625, -0.32275390625, -0.20599365234375, -0.0892333984375, 0.02752685546875, 0.144287109375, 0.26104736328125, 0.3778076171875, 0.49456787109375, 0.611328125, 0.72808837890625, 0.8448486328125, 0.96160888671875, 1.078369140625, 1.19512939453125, 1.3118896484375, 1.42864990234375, 1.54541015625, 1.66217041015625, 1.7789306640625, 1.89569091796875, 2.012451171875, 2.12921142578125, 2.2459716796875, 2.36273193359375, 2.4794921875, 2.59625244140625, 2.7130126953125, 2.82977294921875, 2.946533203125, 3.06329345703125, 3.1800537109375, 3.29681396484375, 3.41357421875, 3.53033447265625, 3.6470947265625, 3.76385498046875, 3.880615234375, 3.99737548828125, 4.1141357421875, 4.23089599609375, 4.34765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 12.0, 13.0, 22.0, 35.0, 35.0, 68.0, 101.0, 170.0, 219.0, 366.0, 573.0, 858.0, 1310.0, 2150.0, 3342.0, 5456.0, 8890.0, 15337.0, 26202.0, 44065.0, 72350.0, 110534.0, 149037.0, 166005.0, 149346.0, 110605.0, 72066.0, 43999.0, 26066.0, 15193.0, 9332.0, 5405.0, 3574.0, 2133.0, 1273.0, 851.0, 529.0, 320.0, 246.0, 146.0, 91.0, 65.0, 40.0, 43.0, 24.0, 15.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.521270751953125, -3.40582275390625, -3.290374755859375, -3.1749267578125, -3.059478759765625, -2.94403076171875, -2.828582763671875, -2.713134765625, -2.597686767578125, -2.48223876953125, -2.366790771484375, -2.2513427734375, -2.135894775390625, -2.02044677734375, -1.904998779296875, -1.78955078125, -1.674102783203125, -1.55865478515625, -1.443206787109375, -1.3277587890625, -1.212310791015625, -1.09686279296875, -0.981414794921875, -0.865966796875, -0.750518798828125, -0.63507080078125, -0.519622802734375, -0.4041748046875, -0.288726806640625, -0.17327880859375, -0.057830810546875, 0.0576171875, 0.173065185546875, 0.28851318359375, 0.403961181640625, 0.5194091796875, 0.634857177734375, 0.75030517578125, 0.865753173828125, 0.981201171875, 1.096649169921875, 1.21209716796875, 1.327545166015625, 1.4429931640625, 1.558441162109375, 1.67388916015625, 1.789337158203125, 1.90478515625, 2.020233154296875, 2.13568115234375, 2.251129150390625, 2.3665771484375, 2.482025146484375, 2.59747314453125, 2.712921142578125, 2.828369140625, 2.943817138671875, 3.05926513671875, 3.174713134765625, 3.2901611328125, 3.405609130859375, 3.52105712890625, 3.636505126953125, 3.751953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 14.0, 13.0, 8.0, 15.0, 16.0, 24.0, 13.0, 26.0, 29.0, 23.0, 25.0, 31.0, 26.0, 36.0, 41.0, 41.0, 37.0, 35.0, 36.0, 47.0, 37.0, 37.0, 38.0, 35.0, 37.0, 37.0, 34.0, 27.0, 26.0, 31.0, 20.0, 16.0, 15.0, 7.0, 16.0, 13.0, 10.0, 3.0, 3.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.383148193359375, -2.30340576171875, -2.223663330078125, -2.1439208984375, -2.064178466796875, -1.98443603515625, -1.904693603515625, -1.824951171875, -1.745208740234375, -1.66546630859375, -1.585723876953125, -1.5059814453125, -1.426239013671875, -1.34649658203125, -1.266754150390625, -1.18701171875, -1.107269287109375, -1.02752685546875, -0.947784423828125, -0.8680419921875, -0.788299560546875, -0.70855712890625, -0.628814697265625, -0.549072265625, -0.469329833984375, -0.38958740234375, -0.309844970703125, -0.2301025390625, -0.150360107421875, -0.07061767578125, 0.009124755859375, 0.0888671875, 0.168609619140625, 0.24835205078125, 0.328094482421875, 0.4078369140625, 0.487579345703125, 0.56732177734375, 0.647064208984375, 0.726806640625, 0.806549072265625, 0.88629150390625, 0.966033935546875, 1.0457763671875, 1.125518798828125, 1.20526123046875, 1.285003662109375, 1.36474609375, 1.444488525390625, 1.52423095703125, 1.603973388671875, 1.6837158203125, 1.763458251953125, 1.84320068359375, 1.922943115234375, 2.002685546875, 2.082427978515625, 2.16217041015625, 2.241912841796875, 2.3216552734375, 2.401397705078125, 2.48114013671875, 2.560882568359375, 2.640625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 10.0, 12.0, 5.0, 16.0, 27.0, 38.0, 49.0, 108.0, 120.0, 193.0, 252.0, 409.0, 656.0, 1085.0, 1909.0, 3168.0, 5830.0, 11121.0, 23458.0, 49758.0, 105314.0, 203392.0, 265370.0, 190279.0, 96457.0, 44835.0, 21162.0, 10466.0, 5481.0, 3107.0, 1652.0, 998.0, 633.0, 388.0, 275.0, 169.0, 120.0, 71.0, 42.0, 33.0, 23.0, 16.0, 12.0, 16.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.748046875, -3.624908447265625, -3.50177001953125, -3.378631591796875, -3.2554931640625, -3.132354736328125, -3.00921630859375, -2.886077880859375, -2.762939453125, -2.639801025390625, -2.51666259765625, -2.393524169921875, -2.2703857421875, -2.147247314453125, -2.02410888671875, -1.900970458984375, -1.77783203125, -1.654693603515625, -1.53155517578125, -1.408416748046875, -1.2852783203125, -1.162139892578125, -1.03900146484375, -0.915863037109375, -0.792724609375, -0.669586181640625, -0.54644775390625, -0.423309326171875, -0.3001708984375, -0.177032470703125, -0.05389404296875, 0.069244384765625, 0.1923828125, 0.315521240234375, 0.43865966796875, 0.561798095703125, 0.6849365234375, 0.808074951171875, 0.93121337890625, 1.054351806640625, 1.177490234375, 1.300628662109375, 1.42376708984375, 1.546905517578125, 1.6700439453125, 1.793182373046875, 1.91632080078125, 2.039459228515625, 2.16259765625, 2.285736083984375, 2.40887451171875, 2.532012939453125, 2.6551513671875, 2.778289794921875, 2.90142822265625, 3.024566650390625, 3.147705078125, 3.270843505859375, 3.39398193359375, 3.517120361328125, 3.6402587890625, 3.763397216796875, 3.88653564453125, 4.009674072265625, 4.1328125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 12.0, 13.0, 12.0, 17.0, 15.0, 26.0, 22.0, 25.0, 34.0, 35.0, 47.0, 36.0, 57.0, 58.0, 52.0, 47.0, 72.0, 48.0, 60.0, 47.0, 33.0, 46.0, 34.0, 23.0, 23.0, 22.0, 12.0, 16.0, 5.0, 11.0, 11.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.000209808349609375, -0.00020260736346244812, -0.00019540637731552124, -0.00018820539116859436, -0.00018100440502166748, -0.0001738034188747406, -0.00016660243272781372, -0.00015940144658088684, -0.00015220046043395996, -0.00014499947428703308, -0.0001377984881401062, -0.00013059750199317932, -0.00012339651584625244, -0.00011619552969932556, -0.00010899454355239868, -0.0001017935574054718, -9.459257125854492e-05, -8.739158511161804e-05, -8.019059896469116e-05, -7.298961281776428e-05, -6.57886266708374e-05, -5.858764052391052e-05, -5.138665437698364e-05, -4.418566823005676e-05, -3.698468208312988e-05, -2.9783695936203003e-05, -2.2582709789276123e-05, -1.5381723642349243e-05, -8.180737495422363e-06, -9.797513484954834e-07, 6.2212347984313965e-06, 1.3422220945358276e-05, 2.0623207092285156e-05, 2.7824193239212036e-05, 3.5025179386138916e-05, 4.2226165533065796e-05, 4.9427151679992676e-05, 5.6628137826919556e-05, 6.382912397384644e-05, 7.103011012077332e-05, 7.82310962677002e-05, 8.543208241462708e-05, 9.263306856155396e-05, 9.983405470848083e-05, 0.00010703504085540771, 0.0001142360270023346, 0.00012143701314926147, 0.00012863799929618835, 0.00013583898544311523, 0.00014303997159004211, 0.000150240957736969, 0.00015744194388389587, 0.00016464293003082275, 0.00017184391617774963, 0.00017904490232467651, 0.0001862458884716034, 0.00019344687461853027, 0.00020064786076545715, 0.00020784884691238403, 0.0002150498330593109, 0.0002222508192062378, 0.00022945180535316467, 0.00023665279150009155, 0.00024385377764701843, 0.0002510547637939453]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 4.0, 3.0, 5.0, 13.0, 14.0, 23.0, 34.0, 46.0, 46.0, 68.0, 98.0, 123.0, 197.0, 267.0, 379.0, 616.0, 872.0, 1345.0, 2105.0, 3591.0, 6139.0, 10970.0, 20373.0, 39507.0, 76686.0, 140605.0, 213647.0, 216364.0, 145298.0, 79573.0, 40885.0, 21268.0, 11206.0, 6129.0, 3663.0, 2136.0, 1379.0, 905.0, 598.0, 435.0, 286.0, 173.0, 127.0, 98.0, 69.0, 56.0, 38.0, 34.0, 20.0, 15.0, 11.0, 12.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.771697998046875, -2.67620849609375, -2.580718994140625, -2.4852294921875, -2.389739990234375, -2.29425048828125, -2.198760986328125, -2.103271484375, -2.007781982421875, -1.91229248046875, -1.816802978515625, -1.7213134765625, -1.625823974609375, -1.53033447265625, -1.434844970703125, -1.33935546875, -1.243865966796875, -1.14837646484375, -1.052886962890625, -0.9573974609375, -0.861907958984375, -0.76641845703125, -0.670928955078125, -0.575439453125, -0.479949951171875, -0.38446044921875, -0.288970947265625, -0.1934814453125, -0.097991943359375, -0.00250244140625, 0.092987060546875, 0.1884765625, 0.283966064453125, 0.37945556640625, 0.474945068359375, 0.5704345703125, 0.665924072265625, 0.76141357421875, 0.856903076171875, 0.952392578125, 1.047882080078125, 1.14337158203125, 1.238861083984375, 1.3343505859375, 1.429840087890625, 1.52532958984375, 1.620819091796875, 1.71630859375, 1.811798095703125, 1.90728759765625, 2.002777099609375, 2.0982666015625, 2.193756103515625, 2.28924560546875, 2.384735107421875, 2.480224609375, 2.575714111328125, 2.67120361328125, 2.766693115234375, 2.8621826171875, 2.957672119140625, 3.05316162109375, 3.148651123046875, 3.244140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 17.0, 16.0, 25.0, 43.0, 41.0, 50.0, 74.0, 85.0, 90.0, 99.0, 94.0, 75.0, 64.0, 61.0, 45.0, 25.0, 18.0, 16.0, 8.0, 9.0, 4.0, 7.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.8076171875, -1.753326416015625, -1.69903564453125, -1.644744873046875, -1.5904541015625, -1.536163330078125, -1.48187255859375, -1.427581787109375, -1.373291015625, -1.319000244140625, -1.26470947265625, -1.210418701171875, -1.1561279296875, -1.101837158203125, -1.04754638671875, -0.993255615234375, -0.93896484375, -0.884674072265625, -0.83038330078125, -0.776092529296875, -0.7218017578125, -0.667510986328125, -0.61322021484375, -0.558929443359375, -0.504638671875, -0.450347900390625, -0.39605712890625, -0.341766357421875, -0.2874755859375, -0.233184814453125, -0.17889404296875, -0.124603271484375, -0.0703125, -0.016021728515625, 0.03826904296875, 0.092559814453125, 0.1468505859375, 0.201141357421875, 0.25543212890625, 0.309722900390625, 0.364013671875, 0.418304443359375, 0.47259521484375, 0.526885986328125, 0.5811767578125, 0.635467529296875, 0.68975830078125, 0.744049072265625, 0.79833984375, 0.852630615234375, 0.90692138671875, 0.961212158203125, 1.0155029296875, 1.069793701171875, 1.12408447265625, 1.178375244140625, 1.232666015625, 1.286956787109375, 1.34124755859375, 1.395538330078125, 1.4498291015625, 1.504119873046875, 1.55841064453125, 1.612701416015625, 1.6669921875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 6.0, 12.0, 8.0, 14.0, 14.0, 21.0, 27.0, 34.0, 46.0, 47.0, 60.0, 64.0, 66.0, 64.0, 76.0, 76.0, 72.0, 48.0, 38.0, 39.0, 39.0, 21.0, 20.0, 18.0, 15.0, 12.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.441328048706055, -5.262688636779785, -5.084048748016357, -4.905409336090088, -4.72676944732666, -4.548130035400391, -4.369490623474121, -4.190850734710693, -4.012210845947266, -3.833571195602417, -3.6549315452575684, -3.476292133331299, -3.297652244567871, -3.1190128326416016, -2.940373182296753, -2.7617335319519043, -2.5830941200256348, -2.404454469680786, -2.2258148193359375, -2.047175407409668, -1.8685356378555298, -1.6898959875106812, -1.511256456375122, -1.3326168060302734, -1.1539771556854248, -0.9753375053405762, -0.7966979146003723, -0.6180583238601685, -0.4394186735153198, -0.2607790231704712, -0.08213949203491211, 0.09650015830993652, 0.27513980865478516, 0.4537794291973114, 0.6324190497398376, 0.8110586404800415, 0.9896982908248901, 1.1683379411697388, 1.3469774723052979, 1.5256171226501465, 1.7042567729949951, 1.8828964233398438, 2.0615360736846924, 2.240175724029541, 2.4188151359558105, 2.5974550247192383, 2.776094436645508, 2.9547340869903564, 3.133373737335205, 3.3120133876800537, 3.4906530380249023, 3.669292449951172, 3.8479323387145996, 4.026571750640869, 4.205211639404297, 4.383851051330566, 4.562490463256836, 4.7411298751831055, 4.919769763946533, 5.098409175872803, 5.2770490646362305, 5.4556884765625, 5.6343278884887695, 5.812967777252197, 5.991607666015625]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 7.0, 7.0, 10.0, 8.0, 15.0, 12.0, 11.0, 20.0, 23.0, 22.0, 17.0, 26.0, 35.0, 29.0, 32.0, 32.0, 40.0, 42.0, 36.0, 40.0, 39.0, 37.0, 45.0, 35.0, 53.0, 26.0, 33.0, 35.0, 27.0, 31.0, 20.0, 21.0, 23.0, 20.0, 12.0, 9.0, 10.0, 14.0, 14.0, 10.0, 3.0, 0.0, 8.0, 1.0, 3.0, 6.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904827833175659, -2.800170660018921, -2.6955134868621826, -2.5908563137054443, -2.486199378967285, -2.381542205810547, -2.2768850326538086, -2.1722278594970703, -2.067570686340332, -1.9629135131835938, -1.8582563400268555, -1.7535992860794067, -1.6489421129226685, -1.5442849397659302, -1.4396278858184814, -1.3349707126617432, -1.2303135395050049, -1.1256563663482666, -1.0209991931915283, -0.9163421392440796, -0.8116849660873413, -0.707027792930603, -0.6023706793785095, -0.497713565826416, -0.39305639266967773, -0.28839924931526184, -0.18374210596084595, -0.07908496260643005, 0.02557218074798584, 0.13022935390472412, 0.23488646745681763, 0.33954358100891113, 0.4442005157470703, 0.5488576889038086, 0.6535148024559021, 0.7581719160079956, 0.8628290891647339, 0.9674862623214722, 1.072143316268921, 1.1768004894256592, 1.2814576625823975, 1.3861148357391357, 1.490772008895874, 1.5954290628433228, 1.700086236000061, 1.8047434091567993, 1.909400463104248, 2.0140576362609863, 2.1187148094177246, 2.223371982574463, 2.328029155731201, 2.4326863288879395, 2.5373435020446777, 2.642000675201416, 2.746657609939575, 2.8513147830963135, 2.9559719562530518, 3.06062912940979, 3.1652863025665283, 3.2699434757232666, 3.374600410461426, 3.479257583618164, 3.5839147567749023, 3.6885719299316406, 3.793229103088379]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 9.0, 6.0, 11.0, 21.0, 31.0, 40.0, 62.0, 97.0, 137.0, 206.0, 341.0, 536.0, 857.0, 1391.0, 2189.0, 3936.0, 6655.0, 11866.0, 21978.0, 42679.0, 89275.0, 207019.0, 517130.0, 1103335.0, 1172823.0, 581934.0, 230019.0, 99202.0, 46537.0, 23532.0, 12924.0, 6989.0, 4121.0, 2376.0, 1473.0, 943.0, 556.0, 351.0, 249.0, 146.0, 94.0, 69.0, 46.0, 36.0, 25.0, 12.0, 10.0, 7.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.3203125, -5.1490478515625, -4.977783203125, -4.8065185546875, -4.63525390625, -4.4639892578125, -4.292724609375, -4.1214599609375, -3.9501953125, -3.7789306640625, -3.607666015625, -3.4364013671875, -3.26513671875, -3.0938720703125, -2.922607421875, -2.7513427734375, -2.580078125, -2.4088134765625, -2.237548828125, -2.0662841796875, -1.89501953125, -1.7237548828125, -1.552490234375, -1.3812255859375, -1.2099609375, -1.0386962890625, -0.867431640625, -0.6961669921875, -0.52490234375, -0.3536376953125, -0.182373046875, -0.0111083984375, 0.16015625, 0.3314208984375, 0.502685546875, 0.6739501953125, 0.84521484375, 1.0164794921875, 1.187744140625, 1.3590087890625, 1.5302734375, 1.7015380859375, 1.872802734375, 2.0440673828125, 2.21533203125, 2.3865966796875, 2.557861328125, 2.7291259765625, 2.900390625, 3.0716552734375, 3.242919921875, 3.4141845703125, 3.58544921875, 3.7567138671875, 3.927978515625, 4.0992431640625, 4.2705078125, 4.4417724609375, 4.613037109375, 4.7843017578125, 4.95556640625, 5.1268310546875, 5.298095703125, 5.4693603515625, 5.640625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 11.0, 9.0, 7.0, 5.0, 14.0, 10.0, 14.0, 15.0, 16.0, 23.0, 20.0, 22.0, 24.0, 21.0, 37.0, 40.0, 40.0, 40.0, 41.0, 38.0, 30.0, 47.0, 33.0, 39.0, 37.0, 28.0, 32.0, 31.0, 36.0, 36.0, 29.0, 22.0, 20.0, 10.0, 15.0, 21.0, 8.0, 15.0, 13.0, 14.0, 7.0, 7.0, 5.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-2.22265625, -2.15447998046875, -2.0863037109375, -2.01812744140625, -1.949951171875, -1.88177490234375, -1.8135986328125, -1.74542236328125, -1.67724609375, -1.60906982421875, -1.5408935546875, -1.47271728515625, -1.404541015625, -1.33636474609375, -1.2681884765625, -1.20001220703125, -1.1318359375, -1.06365966796875, -0.9954833984375, -0.92730712890625, -0.859130859375, -0.79095458984375, -0.7227783203125, -0.65460205078125, -0.58642578125, -0.51824951171875, -0.4500732421875, -0.38189697265625, -0.313720703125, -0.24554443359375, -0.1773681640625, -0.10919189453125, -0.041015625, 0.02716064453125, 0.0953369140625, 0.16351318359375, 0.231689453125, 0.29986572265625, 0.3680419921875, 0.43621826171875, 0.50439453125, 0.57257080078125, 0.6407470703125, 0.70892333984375, 0.777099609375, 0.84527587890625, 0.9134521484375, 0.98162841796875, 1.0498046875, 1.11798095703125, 1.1861572265625, 1.25433349609375, 1.322509765625, 1.39068603515625, 1.4588623046875, 1.52703857421875, 1.59521484375, 1.66339111328125, 1.7315673828125, 1.79974365234375, 1.867919921875, 1.93609619140625, 2.0042724609375, 2.07244873046875, 2.140625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 9.0, 8.0, 18.0, 20.0, 32.0, 51.0, 79.0, 128.0, 211.0, 337.0, 564.0, 1051.0, 1738.0, 3279.0, 5726.0, 10712.0, 20277.0, 39524.0, 79682.0, 166347.0, 351410.0, 713747.0, 1077336.0, 858196.0, 446810.0, 211612.0, 100617.0, 50009.0, 25007.0, 13425.0, 7092.0, 3897.0, 2150.0, 1273.0, 757.0, 438.0, 259.0, 170.0, 112.0, 60.0, 45.0, 24.0, 14.0, 11.0, 5.0, 8.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.734375, -4.57476806640625, -4.4151611328125, -4.25555419921875, -4.095947265625, -3.93634033203125, -3.7767333984375, -3.61712646484375, -3.45751953125, -3.29791259765625, -3.1383056640625, -2.97869873046875, -2.819091796875, -2.65948486328125, -2.4998779296875, -2.34027099609375, -2.1806640625, -2.02105712890625, -1.8614501953125, -1.70184326171875, -1.542236328125, -1.38262939453125, -1.2230224609375, -1.06341552734375, -0.90380859375, -0.74420166015625, -0.5845947265625, -0.42498779296875, -0.265380859375, -0.10577392578125, 0.0538330078125, 0.21343994140625, 0.373046875, 0.53265380859375, 0.6922607421875, 0.85186767578125, 1.011474609375, 1.17108154296875, 1.3306884765625, 1.49029541015625, 1.64990234375, 1.80950927734375, 1.9691162109375, 2.12872314453125, 2.288330078125, 2.44793701171875, 2.6075439453125, 2.76715087890625, 2.9267578125, 3.08636474609375, 3.2459716796875, 3.40557861328125, 3.565185546875, 3.72479248046875, 3.8843994140625, 4.04400634765625, 4.20361328125, 4.36322021484375, 4.5228271484375, 4.68243408203125, 4.842041015625, 5.00164794921875, 5.1612548828125, 5.32086181640625, 5.48046875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 1.0, 4.0, 9.0, 12.0, 14.0, 18.0, 24.0, 38.0, 33.0, 37.0, 61.0, 63.0, 70.0, 79.0, 109.0, 173.0, 156.0, 162.0, 196.0, 217.0, 241.0, 272.0, 247.0, 247.0, 236.0, 214.0, 155.0, 180.0, 138.0, 109.0, 117.0, 91.0, 75.0, 70.0, 49.0, 34.0, 25.0, 28.0, 23.0, 11.0, 9.0, 5.0, 8.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2294921875, -1.189666748046875, -1.14984130859375, -1.110015869140625, -1.0701904296875, -1.030364990234375, -0.99053955078125, -0.950714111328125, -0.910888671875, -0.871063232421875, -0.83123779296875, -0.791412353515625, -0.7515869140625, -0.711761474609375, -0.67193603515625, -0.632110595703125, -0.59228515625, -0.552459716796875, -0.51263427734375, -0.472808837890625, -0.4329833984375, -0.393157958984375, -0.35333251953125, -0.313507080078125, -0.273681640625, -0.233856201171875, -0.19403076171875, -0.154205322265625, -0.1143798828125, -0.074554443359375, -0.03472900390625, 0.005096435546875, 0.044921875, 0.084747314453125, 0.12457275390625, 0.164398193359375, 0.2042236328125, 0.244049072265625, 0.28387451171875, 0.323699951171875, 0.363525390625, 0.403350830078125, 0.44317626953125, 0.483001708984375, 0.5228271484375, 0.562652587890625, 0.60247802734375, 0.642303466796875, 0.68212890625, 0.721954345703125, 0.76177978515625, 0.801605224609375, 0.8414306640625, 0.881256103515625, 0.92108154296875, 0.960906982421875, 1.000732421875, 1.040557861328125, 1.08038330078125, 1.120208740234375, 1.1600341796875, 1.199859619140625, 1.23968505859375, 1.279510498046875, 1.3193359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 11.0, 3.0, 7.0, 9.0, 13.0, 20.0, 10.0, 20.0, 25.0, 37.0, 51.0, 57.0, 63.0, 54.0, 68.0, 65.0, 71.0, 57.0, 64.0, 60.0, 51.0, 33.0, 37.0, 24.0, 23.0, 16.0, 13.0, 7.0, 14.0, 5.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.061370372772217, -4.901939868927002, -4.742508888244629, -4.583078384399414, -4.423647880554199, -4.264216899871826, -4.104786396026611, -3.9453556537628174, -3.7859249114990234, -3.6264941692352295, -3.4670634269714355, -3.3076329231262207, -3.1482021808624268, -2.988771438598633, -2.829340934753418, -2.669910192489624, -2.51047945022583, -2.351048707962036, -2.191617965698242, -2.0321874618530273, -1.8727567195892334, -1.7133259773254395, -1.553895354270935, -1.3944647312164307, -1.2350339889526367, -1.0756032466888428, -0.9161726236343384, -0.7567419409751892, -0.59731125831604, -0.43788057565689087, -0.2784498929977417, -0.1190192699432373, 0.040411949157714844, 0.199842631816864, 0.3592733144760132, 0.5187039971351624, 0.6781346797943115, 0.8375653624534607, 0.9969960451126099, 1.1564266681671143, 1.3158574104309082, 1.4752881526947021, 1.6347187757492065, 1.794149398803711, 1.9535801410675049, 2.113010883331299, 2.2724413871765137, 2.4318721294403076, 2.5913028717041016, 2.7507336139678955, 2.9101643562316895, 3.0695948600769043, 3.2290256023406982, 3.388456344604492, 3.547886848449707, 3.707317590713501, 3.866748332977295, 4.02617883682251, 4.185609817504883, 4.345040321350098, 4.5044708251953125, 4.6639018058776855, 4.8233323097229, 4.982763290405273, 5.142193794250488]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 3.0, 7.0, 10.0, 7.0, 9.0, 12.0, 10.0, 16.0, 16.0, 26.0, 21.0, 22.0, 37.0, 30.0, 38.0, 39.0, 40.0, 37.0, 42.0, 53.0, 47.0, 44.0, 35.0, 43.0, 34.0, 36.0, 27.0, 25.0, 29.0, 24.0, 29.0, 31.0, 18.0, 23.0, 10.0, 11.0, 12.0, 11.0, 5.0, 10.0, 6.0, 1.0, 8.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.797964096069336, -2.7095541954040527, -2.6211440563201904, -2.5327341556549072, -2.444324254989624, -2.3559141159057617, -2.2675042152404785, -2.1790943145751953, -2.090684413909912, -2.002274513244629, -1.9138644933700562, -1.8254544734954834, -1.7370445728302002, -1.6486345529556274, -1.5602245330810547, -1.4718146324157715, -1.3834044933319092, -1.2949944734573364, -1.2065845727920532, -1.1181745529174805, -1.0297646522521973, -0.9413546323776245, -0.8529446125030518, -0.7645346522331238, -0.6761246919631958, -0.5877147316932678, -0.49930474162101746, -0.4108947515487671, -0.3224847912788391, -0.23407483100891113, -0.14566481113433838, -0.0572548508644104, 0.031154870986938477, 0.11956484615802765, 0.20797482132911682, 0.2963848114013672, 0.38479477167129517, 0.47320473194122314, 0.5616147518157959, 0.6500247120857239, 0.7384346723556519, 0.8268446326255798, 0.9152545928955078, 1.0036646127700806, 1.0920746326446533, 1.1804845333099365, 1.2688945531845093, 1.357304573059082, 1.4457144737243652, 1.534124493598938, 1.6225343942642212, 1.710944414138794, 1.7993543148040771, 1.88776433467865, 1.9761743545532227, 2.064584255218506, 2.152994155883789, 2.2414040565490723, 2.3298141956329346, 2.4182240962982178, 2.506633996963501, 2.5950441360473633, 2.6834540367126465, 2.7718639373779297, 2.860274076461792]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 6.0, 15.0, 10.0, 24.0, 33.0, 40.0, 66.0, 110.0, 115.0, 186.0, 304.0, 402.0, 661.0, 1115.0, 1875.0, 3256.0, 5748.0, 10559.0, 19136.0, 36249.0, 67235.0, 120252.0, 187913.0, 214364.0, 164789.0, 97413.0, 53224.0, 28442.0, 15235.0, 8216.0, 4639.0, 2619.0, 1650.0, 906.0, 567.0, 341.0, 240.0, 169.0, 126.0, 68.0, 71.0, 50.0, 26.0, 19.0, 12.0, 15.0, 7.0, 5.0, 2.0, 10.0, 5.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.52783203125, -0.5114974975585938, -0.4951629638671875, -0.47882843017578125, -0.462493896484375, -0.44615936279296875, -0.4298248291015625, -0.41349029541015625, -0.39715576171875, -0.38082122802734375, -0.3644866943359375, -0.34815216064453125, -0.331817626953125, -0.31548309326171875, -0.2991485595703125, -0.28281402587890625, -0.2664794921875, -0.25014495849609375, -0.2338104248046875, -0.21747589111328125, -0.201141357421875, -0.18480682373046875, -0.1684722900390625, -0.15213775634765625, -0.13580322265625, -0.11946868896484375, -0.1031341552734375, -0.08679962158203125, -0.070465087890625, -0.05413055419921875, -0.0377960205078125, -0.02146148681640625, -0.005126953125, 0.01120758056640625, 0.0275421142578125, 0.04387664794921875, 0.060211181640625, 0.07654571533203125, 0.0928802490234375, 0.10921478271484375, 0.12554931640625, 0.14188385009765625, 0.1582183837890625, 0.17455291748046875, 0.190887451171875, 0.20722198486328125, 0.2235565185546875, 0.23989105224609375, 0.2562255859375, 0.27256011962890625, 0.2888946533203125, 0.30522918701171875, 0.321563720703125, 0.33789825439453125, 0.3542327880859375, 0.37056732177734375, 0.38690185546875, 0.40323638916015625, 0.4195709228515625, 0.43590545654296875, 0.452239990234375, 0.46857452392578125, 0.4849090576171875, 0.5012435913085938, 0.517578125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 5.0, 9.0, 9.0, 11.0, 16.0, 13.0, 15.0, 23.0, 23.0, 30.0, 21.0, 35.0, 40.0, 39.0, 41.0, 36.0, 45.0, 54.0, 54.0, 36.0, 42.0, 40.0, 50.0, 29.0, 43.0, 29.0, 39.0, 27.0, 23.0, 16.0, 15.0, 17.0, 16.0, 9.0, 12.0, 11.0, 4.0, 6.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.087890625, -2.9840087890625, -2.880126953125, -2.7762451171875, -2.67236328125, -2.5684814453125, -2.464599609375, -2.3607177734375, -2.2568359375, -2.1529541015625, -2.049072265625, -1.9451904296875, -1.84130859375, -1.7374267578125, -1.633544921875, -1.5296630859375, -1.42578125, -1.3218994140625, -1.218017578125, -1.1141357421875, -1.01025390625, -0.9063720703125, -0.802490234375, -0.6986083984375, -0.5947265625, -0.4908447265625, -0.386962890625, -0.2830810546875, -0.17919921875, -0.0753173828125, 0.028564453125, 0.1324462890625, 0.236328125, 0.3402099609375, 0.444091796875, 0.5479736328125, 0.65185546875, 0.7557373046875, 0.859619140625, 0.9635009765625, 1.0673828125, 1.1712646484375, 1.275146484375, 1.3790283203125, 1.48291015625, 1.5867919921875, 1.690673828125, 1.7945556640625, 1.8984375, 2.0023193359375, 2.106201171875, 2.2100830078125, 2.31396484375, 2.4178466796875, 2.521728515625, 2.6256103515625, 2.7294921875, 2.8333740234375, 2.937255859375, 3.0411376953125, 3.14501953125, 3.2489013671875, 3.352783203125, 3.4566650390625, 3.560546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 12.0, 12.0, 16.0, 24.0, 16.0, 28.0, 40.0, 43.0, 54.0, 82.0, 113.0, 166.0, 216.0, 278.0, 469.0, 607.0, 1061.0, 1622.0, 2751.0, 5235.0, 10357.0, 24288.0, 158943.0, 773983.0, 37615.0, 14354.0, 6792.0, 3570.0, 1983.0, 1236.0, 792.0, 518.0, 362.0, 243.0, 185.0, 115.0, 79.0, 61.0, 58.0, 44.0, 31.0, 23.0, 19.0, 8.0, 9.0, 7.0, 7.0, 14.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0], "bins": [-1.6416015625, -1.5921478271484375, -1.542694091796875, -1.4932403564453125, -1.44378662109375, -1.3943328857421875, -1.344879150390625, -1.2954254150390625, -1.2459716796875, -1.1965179443359375, -1.147064208984375, -1.0976104736328125, -1.04815673828125, -0.9987030029296875, -0.949249267578125, -0.8997955322265625, -0.850341796875, -0.8008880615234375, -0.751434326171875, -0.7019805908203125, -0.65252685546875, -0.6030731201171875, -0.553619384765625, -0.5041656494140625, -0.4547119140625, -0.4052581787109375, -0.355804443359375, -0.3063507080078125, -0.25689697265625, -0.2074432373046875, -0.157989501953125, -0.1085357666015625, -0.05908203125, -0.0096282958984375, 0.039825439453125, 0.0892791748046875, 0.13873291015625, 0.1881866455078125, 0.237640380859375, 0.2870941162109375, 0.3365478515625, 0.3860015869140625, 0.435455322265625, 0.4849090576171875, 0.53436279296875, 0.5838165283203125, 0.633270263671875, 0.6827239990234375, 0.732177734375, 0.7816314697265625, 0.831085205078125, 0.8805389404296875, 0.92999267578125, 0.9794464111328125, 1.028900146484375, 1.0783538818359375, 1.1278076171875, 1.1772613525390625, 1.226715087890625, 1.2761688232421875, 1.32562255859375, 1.3750762939453125, 1.424530029296875, 1.4739837646484375, 1.5234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 4.0, 8.0, 7.0, 13.0, 9.0, 14.0, 16.0, 18.0, 15.0, 22.0, 23.0, 28.0, 25.0, 34.0, 27.0, 46.0, 30.0, 40.0, 38.0, 39.0, 38.0, 48.0, 40.0, 37.0, 38.0, 32.0, 36.0, 32.0, 30.0, 26.0, 13.0, 20.0, 18.0, 18.0, 19.0, 14.0, 16.0, 9.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.541015625, -2.46380615234375, -2.3865966796875, -2.30938720703125, -2.232177734375, -2.15496826171875, -2.0777587890625, -2.00054931640625, -1.92333984375, -1.84613037109375, -1.7689208984375, -1.69171142578125, -1.614501953125, -1.53729248046875, -1.4600830078125, -1.38287353515625, -1.3056640625, -1.22845458984375, -1.1512451171875, -1.07403564453125, -0.996826171875, -0.91961669921875, -0.8424072265625, -0.76519775390625, -0.68798828125, -0.61077880859375, -0.5335693359375, -0.45635986328125, -0.379150390625, -0.30194091796875, -0.2247314453125, -0.14752197265625, -0.0703125, 0.00689697265625, 0.0841064453125, 0.16131591796875, 0.238525390625, 0.31573486328125, 0.3929443359375, 0.47015380859375, 0.54736328125, 0.62457275390625, 0.7017822265625, 0.77899169921875, 0.856201171875, 0.93341064453125, 1.0106201171875, 1.08782958984375, 1.1650390625, 1.24224853515625, 1.3194580078125, 1.39666748046875, 1.473876953125, 1.55108642578125, 1.6282958984375, 1.70550537109375, 1.78271484375, 1.85992431640625, 1.9371337890625, 2.01434326171875, 2.091552734375, 2.16876220703125, 2.2459716796875, 2.32318115234375, 2.400390625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 1.0, 6.0, 10.0, 15.0, 29.0, 36.0, 71.0, 71.0, 116.0, 200.0, 273.0, 450.0, 724.0, 1085.0, 1743.0, 2834.0, 4658.0, 8174.0, 15437.0, 37109.0, 874691.0, 57488.0, 19200.0, 9753.0, 5526.0, 3318.0, 1974.0, 1226.0, 804.0, 519.0, 318.0, 235.0, 150.0, 83.0, 66.0, 54.0, 29.0, 22.0, 19.0, 15.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51123046875, -0.49204254150390625, -0.4728546142578125, -0.45366668701171875, -0.434478759765625, -0.41529083251953125, -0.3961029052734375, -0.37691497802734375, -0.35772705078125, -0.33853912353515625, -0.3193511962890625, -0.30016326904296875, -0.280975341796875, -0.26178741455078125, -0.2425994873046875, -0.22341156005859375, -0.2042236328125, -0.18503570556640625, -0.1658477783203125, -0.14665985107421875, -0.127471923828125, -0.10828399658203125, -0.0890960693359375, -0.06990814208984375, -0.05072021484375, -0.03153228759765625, -0.0123443603515625, 0.00684356689453125, 0.026031494140625, 0.04521942138671875, 0.0644073486328125, 0.08359527587890625, 0.102783203125, 0.12197113037109375, 0.1411590576171875, 0.16034698486328125, 0.179534912109375, 0.19872283935546875, 0.2179107666015625, 0.23709869384765625, 0.25628662109375, 0.27547454833984375, 0.2946624755859375, 0.31385040283203125, 0.333038330078125, 0.35222625732421875, 0.3714141845703125, 0.39060211181640625, 0.4097900390625, 0.42897796630859375, 0.4481658935546875, 0.46735382080078125, 0.486541748046875, 0.5057296752929688, 0.5249176025390625, 0.5441055297851562, 0.56329345703125, 0.5824813842773438, 0.6016693115234375, 0.6208572387695312, 0.640045166015625, 0.6592330932617188, 0.6784210205078125, 0.6976089477539062, 0.716796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 16.0, 13.0, 18.0, 20.0, 17.0, 15.0, 25.0, 30.0, 30.0, 49.0, 31.0, 38.0, 36.0, 39.0, 35.0, 59.0, 30.0, 45.0, 33.0, 38.0, 38.0, 34.0, 39.0, 29.0, 33.0, 20.0, 34.0, 22.0, 15.0, 16.0, 11.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.2782554626464844e-05, -3.183819353580475e-05, -3.089383244514465e-05, -2.9949471354484558e-05, -2.9005110263824463e-05, -2.8060749173164368e-05, -2.7116388082504272e-05, -2.6172026991844177e-05, -2.5227665901184082e-05, -2.4283304810523987e-05, -2.333894371986389e-05, -2.2394582629203796e-05, -2.14502215385437e-05, -2.0505860447883606e-05, -1.956149935722351e-05, -1.8617138266563416e-05, -1.767277717590332e-05, -1.6728416085243225e-05, -1.578405499458313e-05, -1.4839693903923035e-05, -1.389533281326294e-05, -1.2950971722602844e-05, -1.2006610631942749e-05, -1.1062249541282654e-05, -1.0117888450622559e-05, -9.173527359962463e-06, -8.229166269302368e-06, -7.284805178642273e-06, -6.340444087982178e-06, -5.3960829973220825e-06, -4.451721906661987e-06, -3.507360816001892e-06, -2.562999725341797e-06, -1.6186386346817017e-06, -6.742775440216064e-07, 2.7008354663848877e-07, 1.214444637298584e-06, 2.158805727958679e-06, 3.1031668186187744e-06, 4.04752790927887e-06, 4.991888999938965e-06, 5.93625009059906e-06, 6.880611181259155e-06, 7.82497227191925e-06, 8.769333362579346e-06, 9.713694453239441e-06, 1.0658055543899536e-05, 1.1602416634559631e-05, 1.2546777725219727e-05, 1.3491138815879822e-05, 1.4435499906539917e-05, 1.5379860997200012e-05, 1.6324222087860107e-05, 1.7268583178520203e-05, 1.8212944269180298e-05, 1.9157305359840393e-05, 2.0101666450500488e-05, 2.1046027541160583e-05, 2.199038863182068e-05, 2.2934749722480774e-05, 2.387911081314087e-05, 2.4823471903800964e-05, 2.576783299446106e-05, 2.6712194085121155e-05, 2.765655517578125e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 5.0, 7.0, 10.0, 19.0, 19.0, 24.0, 28.0, 48.0, 75.0, 106.0, 141.0, 210.0, 332.0, 486.0, 677.0, 1165.0, 1786.0, 2986.0, 5145.0, 9292.0, 17908.0, 36776.0, 80510.0, 183817.0, 312423.0, 211974.0, 94592.0, 42331.0, 20490.0, 10426.0, 5775.0, 3292.0, 2000.0, 1243.0, 827.0, 511.0, 347.0, 235.0, 158.0, 102.0, 77.0, 48.0, 39.0, 24.0, 21.0, 10.0, 12.0, 7.0, 4.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2139892578125, -0.20699501037597656, -0.20000076293945312, -0.1930065155029297, -0.18601226806640625, -0.1790180206298828, -0.17202377319335938, -0.16502952575683594, -0.1580352783203125, -0.15104103088378906, -0.14404678344726562, -0.1370525360107422, -0.13005828857421875, -0.12306404113769531, -0.11606979370117188, -0.10907554626464844, -0.102081298828125, -0.09508705139160156, -0.08809280395507812, -0.08109855651855469, -0.07410430908203125, -0.06711006164550781, -0.060115814208984375, -0.05312156677246094, -0.0461273193359375, -0.03913307189941406, -0.032138824462890625, -0.025144577026367188, -0.01815032958984375, -0.011156082153320312, -0.004161834716796875, 0.0028324127197265625, 0.00982666015625, 0.016820907592773438, 0.023815155029296875, 0.030809402465820312, 0.03780364990234375, 0.04479789733886719, 0.051792144775390625, 0.05878639221191406, 0.0657806396484375, 0.07277488708496094, 0.07976913452148438, 0.08676338195800781, 0.09375762939453125, 0.10075187683105469, 0.10774612426757812, 0.11474037170410156, 0.121734619140625, 0.12872886657714844, 0.13572311401367188, 0.1427173614501953, 0.14971160888671875, 0.1567058563232422, 0.16370010375976562, 0.17069435119628906, 0.1776885986328125, 0.18468284606933594, 0.19167709350585938, 0.1986713409423828, 0.20566558837890625, 0.2126598358154297, 0.21965408325195312, 0.22664833068847656, 0.233642578125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 10.0, 12.0, 12.0, 13.0, 22.0, 21.0, 30.0, 49.0, 43.0, 61.0, 85.0, 81.0, 93.0, 85.0, 70.0, 62.0, 47.0, 36.0, 15.0, 17.0, 20.0, 22.0, 12.0, 11.0, 9.0, 5.0, 4.0, 5.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1292724609375, -0.12485885620117188, -0.12044525146484375, -0.11603164672851562, -0.1116180419921875, -0.10720443725585938, -0.10279083251953125, -0.09837722778320312, -0.093963623046875, -0.08955001831054688, -0.08513641357421875, -0.08072280883789062, -0.0763092041015625, -0.07189559936523438, -0.06748199462890625, -0.06306838989257812, -0.05865478515625, -0.054241180419921875, -0.04982757568359375, -0.045413970947265625, -0.0410003662109375, -0.036586761474609375, -0.03217315673828125, -0.027759552001953125, -0.023345947265625, -0.018932342529296875, -0.01451873779296875, -0.010105133056640625, -0.0056915283203125, -0.001277923583984375, 0.00313568115234375, 0.007549285888671875, 0.011962890625, 0.016376495361328125, 0.02079010009765625, 0.025203704833984375, 0.0296173095703125, 0.034030914306640625, 0.03844451904296875, 0.042858123779296875, 0.047271728515625, 0.051685333251953125, 0.05609893798828125, 0.060512542724609375, 0.0649261474609375, 0.06933975219726562, 0.07375335693359375, 0.07816696166992188, 0.08258056640625, 0.08699417114257812, 0.09140777587890625, 0.09582138061523438, 0.1002349853515625, 0.10464859008789062, 0.10906219482421875, 0.11347579956054688, 0.117889404296875, 0.12230300903320312, 0.12671661376953125, 0.13113021850585938, 0.1355438232421875, 0.13995742797851562, 0.14437103271484375, 0.14878463745117188, 0.1531982421875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 11.0, 5.0, 7.0, 7.0, 11.0, 14.0, 19.0, 11.0, 22.0, 31.0, 49.0, 42.0, 59.0, 67.0, 62.0, 58.0, 65.0, 70.0, 48.0, 68.0, 67.0, 36.0, 42.0, 27.0, 25.0, 17.0, 16.0, 14.0, 5.0, 13.0, 6.0, 1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.942590713500977, -4.7854461669921875, -4.628301620483398, -4.471157073974609, -4.31401252746582, -4.156867980957031, -3.9997236728668213, -3.8425791263580322, -3.685434579849243, -3.528290033340454, -3.371145486831665, -3.214000940322876, -3.056856632232666, -2.899712085723877, -2.742567539215088, -2.585422992706299, -2.4282784461975098, -2.2711338996887207, -2.1139893531799316, -1.9568449258804321, -1.799700379371643, -1.642555832862854, -1.4854114055633545, -1.3282668590545654, -1.1711223125457764, -1.0139777660369873, -0.856833279132843, -0.6996887922286987, -0.5425442457199097, -0.3853996992111206, -0.22825521230697632, -0.07111072540283203, 0.08603382110595703, 0.2431783378124237, 0.4003228545188904, 0.5574673414230347, 0.7146118879318237, 0.8717564344406128, 1.0289008617401123, 1.1860454082489014, 1.3431899547576904, 1.5003345012664795, 1.6574790477752686, 1.814623475074768, 1.9717680215835571, 2.1289124488830566, 2.2860569953918457, 2.4432015419006348, 2.600346088409424, 2.757490634918213, 2.914635181427002, 3.071779727935791, 3.22892427444458, 3.386068820953369, 3.543213129043579, 3.700357675552368, 3.8575022220611572, 4.014646530151367, 4.171791076660156, 4.328935623168945, 4.486080169677734, 4.643224716186523, 4.8003692626953125, 4.957513809204102, 5.114658355712891]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 6.0, 9.0, 5.0, 10.0, 11.0, 12.0, 15.0, 16.0, 15.0, 26.0, 20.0, 36.0, 29.0, 35.0, 40.0, 39.0, 38.0, 36.0, 54.0, 47.0, 48.0, 40.0, 40.0, 39.0, 29.0, 35.0, 20.0, 35.0, 29.0, 19.0, 29.0, 27.0, 18.0, 15.0, 14.0, 10.0, 13.0, 7.0, 6.0, 9.0, 3.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.8237361907958984, -2.7358651161193848, -2.647994041442871, -2.5601229667663574, -2.4722518920898438, -2.38438081741333, -2.2965097427368164, -2.2086386680603027, -2.120767593383789, -2.0328965187072754, -1.9450254440307617, -1.857154369354248, -1.7692832946777344, -1.6814122200012207, -1.5935412645339966, -1.505670189857483, -1.4177992343902588, -1.3299281597137451, -1.2420570850372314, -1.1541860103607178, -1.066314935684204, -0.9784439206123352, -0.8905729055404663, -0.8027018308639526, -0.714830756187439, -0.6269596815109253, -0.5390886068344116, -0.4512175917625427, -0.36334651708602905, -0.2754754424095154, -0.18760442733764648, -0.09973335266113281, -0.01186227798461914, 0.07600878179073334, 0.16387984156608582, 0.2517508864402771, 0.33962196111679077, 0.42749303579330444, 0.5153640508651733, 0.603235125541687, 0.6911062002182007, 0.7789772748947144, 0.866848349571228, 0.9547193646430969, 1.0425903797149658, 1.1304614543914795, 1.2183325290679932, 1.3062036037445068, 1.3940746784210205, 1.4819457530975342, 1.5698168277740479, 1.6576879024505615, 1.7455589771270752, 1.8334300518035889, 1.921301007270813, 2.009171962738037, 2.097043037414551, 2.1849141120910645, 2.272785186767578, 2.360656261444092, 2.4485273361206055, 2.536398410797119, 2.624269485473633, 2.7121405601501465, 2.80001163482666]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 7.0, 12.0, 9.0, 18.0, 24.0, 38.0, 63.0, 97.0, 143.0, 210.0, 364.0, 531.0, 918.0, 1490.0, 2654.0, 4234.0, 6735.0, 11581.0, 18956.0, 31577.0, 50646.0, 79152.0, 113377.0, 144064.0, 155466.0, 137245.0, 103328.0, 70792.0, 44876.0, 27707.0, 16633.0, 10027.0, 5943.0, 3745.0, 2294.0, 1372.0, 815.0, 498.0, 334.0, 206.0, 124.0, 83.0, 66.0, 27.0, 34.0, 11.0, 8.0, 5.0, 2.0, 9.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-3.341796875, -3.238555908203125, -3.13531494140625, -3.032073974609375, -2.9288330078125, -2.825592041015625, -2.72235107421875, -2.619110107421875, -2.515869140625, -2.412628173828125, -2.30938720703125, -2.206146240234375, -2.1029052734375, -1.999664306640625, -1.89642333984375, -1.793182373046875, -1.68994140625, -1.586700439453125, -1.48345947265625, -1.380218505859375, -1.2769775390625, -1.173736572265625, -1.07049560546875, -0.967254638671875, -0.864013671875, -0.760772705078125, -0.65753173828125, -0.554290771484375, -0.4510498046875, -0.347808837890625, -0.24456787109375, -0.141326904296875, -0.0380859375, 0.065155029296875, 0.16839599609375, 0.271636962890625, 0.3748779296875, 0.478118896484375, 0.58135986328125, 0.684600830078125, 0.787841796875, 0.891082763671875, 0.99432373046875, 1.097564697265625, 1.2008056640625, 1.304046630859375, 1.40728759765625, 1.510528564453125, 1.61376953125, 1.717010498046875, 1.82025146484375, 1.923492431640625, 2.0267333984375, 2.129974365234375, 2.23321533203125, 2.336456298828125, 2.439697265625, 2.542938232421875, 2.64617919921875, 2.749420166015625, 2.8526611328125, 2.955902099609375, 3.05914306640625, 3.162384033203125, 3.265625]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 4.0, 5.0, 10.0, 7.0, 13.0, 13.0, 13.0, 15.0, 21.0, 25.0, 23.0, 23.0, 40.0, 28.0, 31.0, 35.0, 33.0, 32.0, 43.0, 47.0, 51.0, 41.0, 29.0, 37.0, 24.0, 31.0, 35.0, 44.0, 29.0, 29.0, 26.0, 23.0, 19.0, 23.0, 15.0, 12.0, 14.0, 7.0, 12.0, 7.0, 8.0, 4.0, 3.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.543731689453125, -2.45269775390625, -2.361663818359375, -2.2706298828125, -2.179595947265625, -2.08856201171875, -1.997528076171875, -1.906494140625, -1.815460205078125, -1.72442626953125, -1.633392333984375, -1.5423583984375, -1.451324462890625, -1.36029052734375, -1.269256591796875, -1.17822265625, -1.087188720703125, -0.99615478515625, -0.905120849609375, -0.8140869140625, -0.723052978515625, -0.63201904296875, -0.540985107421875, -0.449951171875, -0.358917236328125, -0.26788330078125, -0.176849365234375, -0.0858154296875, 0.005218505859375, 0.09625244140625, 0.187286376953125, 0.2783203125, 0.369354248046875, 0.46038818359375, 0.551422119140625, 0.6424560546875, 0.733489990234375, 0.82452392578125, 0.915557861328125, 1.006591796875, 1.097625732421875, 1.18865966796875, 1.279693603515625, 1.3707275390625, 1.461761474609375, 1.55279541015625, 1.643829345703125, 1.73486328125, 1.825897216796875, 1.91693115234375, 2.007965087890625, 2.0989990234375, 2.190032958984375, 2.28106689453125, 2.372100830078125, 2.463134765625, 2.554168701171875, 2.64520263671875, 2.736236572265625, 2.8272705078125, 2.918304443359375, 3.00933837890625, 3.100372314453125, 3.19140625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 16.0, 19.0, 24.0, 40.0, 67.0, 96.0, 128.0, 195.0, 328.0, 466.0, 806.0, 1352.0, 2200.0, 3675.0, 6014.0, 10167.0, 17248.0, 28438.0, 46243.0, 73195.0, 108372.0, 142850.0, 158204.0, 143943.0, 109824.0, 74986.0, 47144.0, 29193.0, 17271.0, 10243.0, 6267.0, 3635.0, 2197.0, 1341.0, 858.0, 545.0, 355.0, 197.0, 140.0, 95.0, 58.0, 39.0, 23.0, 18.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-3.42578125, -3.323577880859375, -3.22137451171875, -3.119171142578125, -3.0169677734375, -2.914764404296875, -2.81256103515625, -2.710357666015625, -2.608154296875, -2.505950927734375, -2.40374755859375, -2.301544189453125, -2.1993408203125, -2.097137451171875, -1.99493408203125, -1.892730712890625, -1.79052734375, -1.688323974609375, -1.58612060546875, -1.483917236328125, -1.3817138671875, -1.279510498046875, -1.17730712890625, -1.075103759765625, -0.972900390625, -0.870697021484375, -0.76849365234375, -0.666290283203125, -0.5640869140625, -0.461883544921875, -0.35968017578125, -0.257476806640625, -0.1552734375, -0.053070068359375, 0.04913330078125, 0.151336669921875, 0.2535400390625, 0.355743408203125, 0.45794677734375, 0.560150146484375, 0.662353515625, 0.764556884765625, 0.86676025390625, 0.968963623046875, 1.0711669921875, 1.173370361328125, 1.27557373046875, 1.377777099609375, 1.47998046875, 1.582183837890625, 1.68438720703125, 1.786590576171875, 1.8887939453125, 1.990997314453125, 2.09320068359375, 2.195404052734375, 2.297607421875, 2.399810791015625, 2.50201416015625, 2.604217529296875, 2.7064208984375, 2.808624267578125, 2.91082763671875, 3.013031005859375, 3.115234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 14.0, 8.0, 4.0, 9.0, 16.0, 7.0, 13.0, 10.0, 23.0, 17.0, 29.0, 31.0, 39.0, 36.0, 29.0, 37.0, 43.0, 35.0, 40.0, 40.0, 40.0, 45.0, 51.0, 39.0, 32.0, 40.0, 33.0, 36.0, 32.0, 22.0, 29.0, 15.0, 27.0, 15.0, 17.0, 13.0, 8.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.048828125, -1.98492431640625, -1.9210205078125, -1.85711669921875, -1.793212890625, -1.72930908203125, -1.6654052734375, -1.60150146484375, -1.53759765625, -1.47369384765625, -1.4097900390625, -1.34588623046875, -1.281982421875, -1.21807861328125, -1.1541748046875, -1.09027099609375, -1.0263671875, -0.96246337890625, -0.8985595703125, -0.83465576171875, -0.770751953125, -0.70684814453125, -0.6429443359375, -0.57904052734375, -0.51513671875, -0.45123291015625, -0.3873291015625, -0.32342529296875, -0.259521484375, -0.19561767578125, -0.1317138671875, -0.06781005859375, -0.00390625, 0.05999755859375, 0.1239013671875, 0.18780517578125, 0.251708984375, 0.31561279296875, 0.3795166015625, 0.44342041015625, 0.50732421875, 0.57122802734375, 0.6351318359375, 0.69903564453125, 0.762939453125, 0.82684326171875, 0.8907470703125, 0.95465087890625, 1.0185546875, 1.08245849609375, 1.1463623046875, 1.21026611328125, 1.274169921875, 1.33807373046875, 1.4019775390625, 1.46588134765625, 1.52978515625, 1.59368896484375, 1.6575927734375, 1.72149658203125, 1.785400390625, 1.84930419921875, 1.9132080078125, 1.97711181640625, 2.041015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 11.0, 10.0, 19.0, 22.0, 38.0, 55.0, 109.0, 140.0, 223.0, 351.0, 556.0, 938.0, 1460.0, 2576.0, 4235.0, 7382.0, 12941.0, 22366.0, 39416.0, 68510.0, 111793.0, 161641.0, 185020.0, 159659.0, 110126.0, 67156.0, 39376.0, 22187.0, 12566.0, 7168.0, 4202.0, 2453.0, 1448.0, 899.0, 537.0, 346.0, 236.0, 129.0, 100.0, 52.0, 30.0, 20.0, 18.0, 9.0, 12.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.099609375, -2.03497314453125, -1.9703369140625, -1.90570068359375, -1.841064453125, -1.77642822265625, -1.7117919921875, -1.64715576171875, -1.58251953125, -1.51788330078125, -1.4532470703125, -1.38861083984375, -1.323974609375, -1.25933837890625, -1.1947021484375, -1.13006591796875, -1.0654296875, -1.00079345703125, -0.9361572265625, -0.87152099609375, -0.806884765625, -0.74224853515625, -0.6776123046875, -0.61297607421875, -0.54833984375, -0.48370361328125, -0.4190673828125, -0.35443115234375, -0.289794921875, -0.22515869140625, -0.1605224609375, -0.09588623046875, -0.03125, 0.03338623046875, 0.0980224609375, 0.16265869140625, 0.227294921875, 0.29193115234375, 0.3565673828125, 0.42120361328125, 0.48583984375, 0.55047607421875, 0.6151123046875, 0.67974853515625, 0.744384765625, 0.80902099609375, 0.8736572265625, 0.93829345703125, 1.0029296875, 1.06756591796875, 1.1322021484375, 1.19683837890625, 1.261474609375, 1.32611083984375, 1.3907470703125, 1.45538330078125, 1.52001953125, 1.58465576171875, 1.6492919921875, 1.71392822265625, 1.778564453125, 1.84320068359375, 1.9078369140625, 1.97247314453125, 2.037109375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 14.0, 15.0, 17.0, 16.0, 15.0, 24.0, 38.0, 23.0, 32.0, 42.0, 50.0, 48.0, 54.0, 68.0, 74.0, 49.0, 61.0, 44.0, 43.0, 40.0, 42.0, 24.0, 19.0, 27.0, 20.0, 20.0, 13.0, 10.0, 6.0, 6.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00019216537475585938, -0.0001864079385995865, -0.0001806505024433136, -0.0001748930662870407, -0.00016913563013076782, -0.00016337819397449493, -0.00015762075781822205, -0.00015186332166194916, -0.00014610588550567627, -0.00014034844934940338, -0.0001345910131931305, -0.0001288335770368576, -0.00012307614088058472, -0.00011731870472431183, -0.00011156126856803894, -0.00010580383241176605, -0.00010004639625549316, -9.428896009922028e-05, -8.853152394294739e-05, -8.27740877866745e-05, -7.701665163040161e-05, -7.125921547412872e-05, -6.550177931785583e-05, -5.974434316158295e-05, -5.398690700531006e-05, -4.822947084903717e-05, -4.247203469276428e-05, -3.6714598536491394e-05, -3.0957162380218506e-05, -2.5199726223945618e-05, -1.944229006767273e-05, -1.3684853911399841e-05, -7.927417755126953e-06, -2.169981598854065e-06, 3.5874545574188232e-06, 9.344890713691711e-06, 1.51023268699646e-05, 2.0859763026237488e-05, 2.6617199182510376e-05, 3.2374635338783264e-05, 3.813207149505615e-05, 4.388950765132904e-05, 4.964694380760193e-05, 5.540437996387482e-05, 6.11618161201477e-05, 6.69192522764206e-05, 7.267668843269348e-05, 7.843412458896637e-05, 8.419156074523926e-05, 8.994899690151215e-05, 9.570643305778503e-05, 0.00010146386921405792, 0.00010722130537033081, 0.0001129787415266037, 0.00011873617768287659, 0.00012449361383914948, 0.00013025104999542236, 0.00013600848615169525, 0.00014176592230796814, 0.00014752335846424103, 0.00015328079462051392, 0.0001590382307767868, 0.0001647956669330597, 0.00017055310308933258, 0.00017631053924560547]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 12.0, 11.0, 23.0, 37.0, 64.0, 94.0, 145.0, 251.0, 403.0, 651.0, 999.0, 1673.0, 2590.0, 4236.0, 6953.0, 11467.0, 18383.0, 29972.0, 48292.0, 75297.0, 110361.0, 143914.0, 157109.0, 140144.0, 105672.0, 71318.0, 45015.0, 28284.0, 17416.0, 10746.0, 6507.0, 4049.0, 2429.0, 1523.0, 977.0, 553.0, 371.0, 222.0, 141.0, 90.0, 51.0, 47.0, 25.0, 10.0, 14.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.7412109375, -1.6891326904296875, -1.637054443359375, -1.5849761962890625, -1.53289794921875, -1.4808197021484375, -1.428741455078125, -1.3766632080078125, -1.3245849609375, -1.2725067138671875, -1.220428466796875, -1.1683502197265625, -1.11627197265625, -1.0641937255859375, -1.012115478515625, -0.9600372314453125, -0.907958984375, -0.8558807373046875, -0.803802490234375, -0.7517242431640625, -0.69964599609375, -0.6475677490234375, -0.595489501953125, -0.5434112548828125, -0.4913330078125, -0.4392547607421875, -0.387176513671875, -0.3350982666015625, -0.28302001953125, -0.2309417724609375, -0.178863525390625, -0.1267852783203125, -0.07470703125, -0.0226287841796875, 0.029449462890625, 0.0815277099609375, 0.13360595703125, 0.1856842041015625, 0.237762451171875, 0.2898406982421875, 0.3419189453125, 0.3939971923828125, 0.446075439453125, 0.4981536865234375, 0.55023193359375, 0.6023101806640625, 0.654388427734375, 0.7064666748046875, 0.758544921875, 0.8106231689453125, 0.862701416015625, 0.9147796630859375, 0.96685791015625, 1.0189361572265625, 1.071014404296875, 1.1230926513671875, 1.1751708984375, 1.2272491455078125, 1.279327392578125, 1.3314056396484375, 1.38348388671875, 1.4355621337890625, 1.487640380859375, 1.5397186279296875, 1.591796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 4.0, 9.0, 13.0, 15.0, 12.0, 18.0, 16.0, 23.0, 32.0, 30.0, 39.0, 54.0, 59.0, 59.0, 61.0, 57.0, 72.0, 56.0, 64.0, 54.0, 37.0, 23.0, 34.0, 30.0, 29.0, 22.0, 14.0, 12.0, 12.0, 11.0, 6.0, 4.0, 1.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66064453125, -0.6390609741210938, -0.6174774169921875, -0.5958938598632812, -0.574310302734375, -0.5527267456054688, -0.5311431884765625, -0.5095596313476562, -0.48797607421875, -0.46639251708984375, -0.4448089599609375, -0.42322540283203125, -0.401641845703125, -0.38005828857421875, -0.3584747314453125, -0.33689117431640625, -0.3153076171875, -0.29372406005859375, -0.2721405029296875, -0.25055694580078125, -0.228973388671875, -0.20738983154296875, -0.1858062744140625, -0.16422271728515625, -0.14263916015625, -0.12105560302734375, -0.0994720458984375, -0.07788848876953125, -0.056304931640625, -0.03472137451171875, -0.0131378173828125, 0.00844573974609375, 0.030029296875, 0.05161285400390625, 0.0731964111328125, 0.09477996826171875, 0.116363525390625, 0.13794708251953125, 0.1595306396484375, 0.18111419677734375, 0.20269775390625, 0.22428131103515625, 0.2458648681640625, 0.26744842529296875, 0.289031982421875, 0.31061553955078125, 0.3321990966796875, 0.35378265380859375, 0.3753662109375, 0.39694976806640625, 0.4185333251953125, 0.44011688232421875, 0.461700439453125, 0.48328399658203125, 0.5048675537109375, 0.5264511108398438, 0.54803466796875, 0.5696182250976562, 0.5912017822265625, 0.6127853393554688, 0.634368896484375, 0.6559524536132812, 0.6775360107421875, 0.6991195678710938, 0.720703125]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 9.0, 11.0, 12.0, 11.0, 21.0, 29.0, 48.0, 45.0, 48.0, 62.0, 59.0, 66.0, 60.0, 62.0, 59.0, 56.0, 61.0, 46.0, 44.0, 27.0, 34.0, 26.0, 18.0, 9.0, 7.0, 11.0, 10.0, 8.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9030683040618896, -3.753147840499878, -3.6032276153564453, -3.4533071517944336, -3.303386926651001, -3.1534664630889893, -3.0035462379455566, -2.853625774383545, -2.703705310821533, -2.5537848472595215, -2.403864622116089, -2.253944158554077, -2.1040239334106445, -1.9541034698486328, -1.8041831254959106, -1.6542627811431885, -1.5043425559997559, -1.3544222116470337, -1.2045018672943115, -1.0545814037322998, -0.9046611189842224, -0.7547407746315002, -0.6048203706741333, -0.45490002632141113, -0.30497968196868896, -0.1550593227148056, -0.005138963460922241, 0.14478141069412231, 0.2947017550468445, 0.44462209939956665, 0.5945425033569336, 0.7444628477096558, 0.894383430480957, 1.0443037748336792, 1.1942241191864014, 1.344144582748413, 1.4940648078918457, 1.6439852714538574, 1.7939056158065796, 1.9438259601593018, 2.0937461853027344, 2.243666648864746, 2.3935868740081787, 2.5435073375701904, 2.693427562713623, 2.8433480262756348, 2.9932684898376465, 3.143188714981079, 3.293109178543091, 3.4430296421051025, 3.592949867248535, 3.742870330810547, 3.8927905559539795, 4.042710781097412, 4.192631244659424, 4.3425517082214355, 4.492472171783447, 4.642392635345459, 4.792313098907471, 4.942233085632324, 5.092153549194336, 5.242074012756348, 5.391994476318359, 5.541914939880371, 5.691834926605225]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 1.0, 8.0, 1.0, 3.0, 6.0, 12.0, 13.0, 17.0, 12.0, 8.0, 14.0, 24.0, 21.0, 26.0, 35.0, 24.0, 33.0, 38.0, 38.0, 49.0, 44.0, 36.0, 43.0, 38.0, 34.0, 32.0, 31.0, 23.0, 28.0, 34.0, 26.0, 26.0, 32.0, 20.0, 25.0, 27.0, 16.0, 8.0, 11.0, 21.0, 9.0, 6.0, 4.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0], "bins": [-2.761392116546631, -2.680264949798584, -2.599137544631958, -2.518010377883911, -2.4368832111358643, -2.3557558059692383, -2.2746286392211914, -2.1935014724731445, -2.1123740673065186, -2.0312469005584717, -1.9501196146011353, -1.8689923286437988, -1.7878650426864624, -1.706737756729126, -1.625610589981079, -1.5444833040237427, -1.4633561372756958, -1.3822288513183594, -1.3011016845703125, -1.219974398612976, -1.1388471126556396, -1.0577199459075928, -0.9765926599502563, -0.8954653739929199, -0.8143381476402283, -0.7332109212875366, -0.6520836353302002, -0.5709564089775085, -0.4898291528224945, -0.40870189666748047, -0.3275746703147888, -0.2464473843574524, -0.16532015800476074, -0.0841929093003273, -0.00306566059589386, 0.07806158065795898, 0.15918883681297302, 0.24031609296798706, 0.3214433193206787, 0.40257060527801514, 0.4836978316307068, 0.5648250579833984, 0.6459523439407349, 0.7270795702934265, 0.8082067966461182, 0.8893340826034546, 0.9704613089561462, 1.051588535308838, 1.1327158212661743, 1.2138431072235107, 1.2949702739715576, 1.376097559928894, 1.4572248458862305, 1.5383520126342773, 1.6194792985916138, 1.7006065845489502, 1.781733751296997, 1.8628610372543335, 1.9439882040023804, 2.025115489959717, 2.1062426567077637, 2.1873700618743896, 2.2684972286224365, 2.3496246337890625, 2.4307518005371094]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 9.0, 11.0, 23.0, 25.0, 38.0, 52.0, 68.0, 117.0, 212.0, 318.0, 446.0, 691.0, 1043.0, 1769.0, 2851.0, 4684.0, 7814.0, 13949.0, 25472.0, 49713.0, 101316.0, 222267.0, 517864.0, 1031953.0, 1113228.0, 602227.0, 257634.0, 115340.0, 56228.0, 28931.0, 15911.0, 8980.0, 5106.0, 3008.0, 1882.0, 1128.0, 747.0, 439.0, 254.0, 203.0, 132.0, 71.0, 45.0, 43.0, 18.0, 13.0, 7.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-5.203125, -5.0589599609375, -4.914794921875, -4.7706298828125, -4.62646484375, -4.4822998046875, -4.338134765625, -4.1939697265625, -4.0498046875, -3.9056396484375, -3.761474609375, -3.6173095703125, -3.47314453125, -3.3289794921875, -3.184814453125, -3.0406494140625, -2.896484375, -2.7523193359375, -2.608154296875, -2.4639892578125, -2.31982421875, -2.1756591796875, -2.031494140625, -1.8873291015625, -1.7431640625, -1.5989990234375, -1.454833984375, -1.3106689453125, -1.16650390625, -1.0223388671875, -0.878173828125, -0.7340087890625, -0.58984375, -0.4456787109375, -0.301513671875, -0.1573486328125, -0.01318359375, 0.1309814453125, 0.275146484375, 0.4193115234375, 0.5634765625, 0.7076416015625, 0.851806640625, 0.9959716796875, 1.14013671875, 1.2843017578125, 1.428466796875, 1.5726318359375, 1.716796875, 1.8609619140625, 2.005126953125, 2.1492919921875, 2.29345703125, 2.4376220703125, 2.581787109375, 2.7259521484375, 2.8701171875, 3.0142822265625, 3.158447265625, 3.3026123046875, 3.44677734375, 3.5909423828125, 3.735107421875, 3.8792724609375, 4.0234375]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 4.0, 4.0, 5.0, 10.0, 17.0, 14.0, 15.0, 14.0, 17.0, 21.0, 28.0, 19.0, 30.0, 43.0, 29.0, 37.0, 39.0, 40.0, 38.0, 48.0, 47.0, 34.0, 39.0, 32.0, 30.0, 36.0, 41.0, 33.0, 23.0, 21.0, 22.0, 23.0, 25.0, 20.0, 13.0, 10.0, 11.0, 7.0, 14.0, 3.0, 5.0, 4.0, 6.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8919677734375, -1.831787109375, -1.7716064453125, -1.71142578125, -1.6512451171875, -1.591064453125, -1.5308837890625, -1.470703125, -1.4105224609375, -1.350341796875, -1.2901611328125, -1.22998046875, -1.1697998046875, -1.109619140625, -1.0494384765625, -0.9892578125, -0.9290771484375, -0.868896484375, -0.8087158203125, -0.74853515625, -0.6883544921875, -0.628173828125, -0.5679931640625, -0.5078125, -0.4476318359375, -0.387451171875, -0.3272705078125, -0.26708984375, -0.2069091796875, -0.146728515625, -0.0865478515625, -0.0263671875, 0.0338134765625, 0.093994140625, 0.1541748046875, 0.21435546875, 0.2745361328125, 0.334716796875, 0.3948974609375, 0.455078125, 0.5152587890625, 0.575439453125, 0.6356201171875, 0.69580078125, 0.7559814453125, 0.816162109375, 0.8763427734375, 0.9365234375, 0.9967041015625, 1.056884765625, 1.1170654296875, 1.17724609375, 1.2374267578125, 1.297607421875, 1.3577880859375, 1.41796875, 1.4781494140625, 1.538330078125, 1.5985107421875, 1.65869140625, 1.7188720703125, 1.779052734375, 1.8392333984375, 1.8994140625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 11.0, 7.0, 31.0, 29.0, 50.0, 63.0, 117.0, 179.0, 263.0, 385.0, 651.0, 930.0, 1634.0, 2557.0, 4142.0, 6969.0, 12067.0, 20994.0, 38495.0, 73202.0, 143392.0, 285092.0, 562891.0, 936695.0, 936982.0, 567641.0, 289982.0, 144460.0, 73875.0, 38822.0, 21567.0, 12151.0, 6983.0, 4029.0, 2544.0, 1585.0, 1007.0, 597.0, 406.0, 277.0, 191.0, 100.0, 81.0, 49.0, 34.0, 28.0, 16.0, 6.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.05859375, -3.92333984375, -3.7880859375, -3.65283203125, -3.517578125, -3.38232421875, -3.2470703125, -3.11181640625, -2.9765625, -2.84130859375, -2.7060546875, -2.57080078125, -2.435546875, -2.30029296875, -2.1650390625, -2.02978515625, -1.89453125, -1.75927734375, -1.6240234375, -1.48876953125, -1.353515625, -1.21826171875, -1.0830078125, -0.94775390625, -0.8125, -0.67724609375, -0.5419921875, -0.40673828125, -0.271484375, -0.13623046875, -0.0009765625, 0.13427734375, 0.26953125, 0.40478515625, 0.5400390625, 0.67529296875, 0.810546875, 0.94580078125, 1.0810546875, 1.21630859375, 1.3515625, 1.48681640625, 1.6220703125, 1.75732421875, 1.892578125, 2.02783203125, 2.1630859375, 2.29833984375, 2.43359375, 2.56884765625, 2.7041015625, 2.83935546875, 2.974609375, 3.10986328125, 3.2451171875, 3.38037109375, 3.515625, 3.65087890625, 3.7861328125, 3.92138671875, 4.056640625, 4.19189453125, 4.3271484375, 4.46240234375, 4.59765625]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0, 6.0, 3.0, 10.0, 4.0, 10.0, 17.0, 22.0, 20.0, 27.0, 34.0, 55.0, 61.0, 82.0, 86.0, 113.0, 114.0, 148.0, 191.0, 226.0, 230.0, 246.0, 247.0, 246.0, 264.0, 224.0, 224.0, 200.0, 181.0, 147.0, 119.0, 104.0, 85.0, 67.0, 71.0, 44.0, 32.0, 27.0, 30.0, 14.0, 11.0, 8.0, 10.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2470703125, -1.209442138671875, -1.17181396484375, -1.134185791015625, -1.0965576171875, -1.058929443359375, -1.02130126953125, -0.983673095703125, -0.946044921875, -0.908416748046875, -0.87078857421875, -0.833160400390625, -0.7955322265625, -0.757904052734375, -0.72027587890625, -0.682647705078125, -0.64501953125, -0.607391357421875, -0.56976318359375, -0.532135009765625, -0.4945068359375, -0.456878662109375, -0.41925048828125, -0.381622314453125, -0.343994140625, -0.306365966796875, -0.26873779296875, -0.231109619140625, -0.1934814453125, -0.155853271484375, -0.11822509765625, -0.080596923828125, -0.04296875, -0.005340576171875, 0.03228759765625, 0.069915771484375, 0.1075439453125, 0.145172119140625, 0.18280029296875, 0.220428466796875, 0.258056640625, 0.295684814453125, 0.33331298828125, 0.370941162109375, 0.4085693359375, 0.446197509765625, 0.48382568359375, 0.521453857421875, 0.55908203125, 0.596710205078125, 0.63433837890625, 0.671966552734375, 0.7095947265625, 0.747222900390625, 0.78485107421875, 0.822479248046875, 0.860107421875, 0.897735595703125, 0.93536376953125, 0.972991943359375, 1.0106201171875, 1.048248291015625, 1.08587646484375, 1.123504638671875, 1.1611328125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 6.0, 7.0, 10.0, 15.0, 16.0, 14.0, 20.0, 28.0, 32.0, 33.0, 51.0, 43.0, 52.0, 56.0, 46.0, 53.0, 56.0, 61.0, 51.0, 45.0, 34.0, 36.0, 35.0, 33.0, 25.0, 24.0, 23.0, 15.0, 6.0, 20.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2587530612945557, -3.1374149322509766, -3.0160770416259766, -2.8947389125823975, -2.7734007835388184, -2.6520628929138184, -2.5307247638702393, -2.40938663482666, -2.28804874420166, -2.166710615158081, -2.045372724533081, -1.924034595489502, -1.8026965856552124, -1.6813585758209229, -1.5600204467773438, -1.4386824369430542, -1.3173444271087646, -1.196006417274475, -1.0746684074401855, -0.9533302783966064, -0.8319922685623169, -0.7106542587280273, -0.589316189289093, -0.4679781198501587, -0.34664011001586914, -0.2253020703792572, -0.10396403074264526, 0.017374008893966675, 0.1387120485305786, 0.26005005836486816, 0.3813881278038025, 0.5027261972427368, 0.6240639686584473, 0.7454019784927368, 0.8667400479316711, 0.9880781173706055, 1.109416127204895, 1.2307541370391846, 1.3520922660827637, 1.4734302759170532, 1.5947682857513428, 1.7161062955856323, 1.8374443054199219, 1.958782434463501, 2.08012056350708, 2.20145845413208, 2.322796583175659, 2.4441347122192383, 2.5654726028442383, 2.6868107318878174, 2.8081486225128174, 2.9294867515563965, 3.0508246421813965, 3.1721627712249756, 3.2935009002685547, 3.4148387908935547, 3.536176919937134, 3.657515048980713, 3.778852939605713, 3.900191068649292, 4.021529197692871, 4.142867088317871, 4.264204978942871, 4.385543346405029, 4.506881237030029]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 7.0, 12.0, 9.0, 6.0, 11.0, 9.0, 14.0, 15.0, 20.0, 23.0, 15.0, 17.0, 29.0, 34.0, 35.0, 29.0, 26.0, 38.0, 30.0, 46.0, 46.0, 50.0, 43.0, 28.0, 27.0, 29.0, 38.0, 36.0, 31.0, 37.0, 20.0, 22.0, 11.0, 20.0, 24.0, 17.0, 22.0, 13.0, 8.0, 13.0, 7.0, 7.0, 4.0, 9.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-2.0733299255371094, -2.0040252208709717, -1.934720516204834, -1.8654159307479858, -1.7961112260818481, -1.7268065214157104, -1.6575019359588623, -1.5881972312927246, -1.518892526626587, -1.4495878219604492, -1.3802831172943115, -1.3109785318374634, -1.2416738271713257, -1.172369122505188, -1.1030645370483398, -1.0337598323822021, -0.9644551277160645, -0.8951504230499268, -0.8258457779884338, -0.7565411329269409, -0.6872364282608032, -0.6179317235946655, -0.5486270785331726, -0.4793224036693573, -0.410017728805542, -0.3407130539417267, -0.2714083790779114, -0.20210370421409607, -0.13279902935028076, -0.06349435448646545, 0.0058103203773498535, 0.07511499524116516, 0.14441990852355957, 0.21372458338737488, 0.2830292582511902, 0.3523339331150055, 0.4216386079788208, 0.4909432828426361, 0.5602479577064514, 0.6295526027679443, 0.698857307434082, 0.7681620121002197, 0.8374666571617126, 0.9067713022232056, 0.9760760068893433, 1.045380711555481, 1.114685297012329, 1.1839900016784668, 1.2532947063446045, 1.3225994110107422, 1.3919041156768799, 1.461208701133728, 1.5305134057998657, 1.5998181104660034, 1.6691226959228516, 1.7384274005889893, 1.807732105255127, 1.8770368099212646, 1.9463415145874023, 2.01564621925354, 2.0849509239196777, 2.1542553901672363, 2.223560094833374, 2.2928647994995117, 2.3621695041656494]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 13.0, 23.0, 32.0, 56.0, 83.0, 115.0, 169.0, 296.0, 415.0, 628.0, 950.0, 1496.0, 2328.0, 3663.0, 5729.0, 9105.0, 14356.0, 22547.0, 35283.0, 54423.0, 82369.0, 117504.0, 148476.0, 153693.0, 128318.0, 93210.0, 62004.0, 40552.0, 25638.0, 16361.0, 10314.0, 6504.0, 4231.0, 2696.0, 1805.0, 1110.0, 681.0, 446.0, 324.0, 204.0, 121.0, 111.0, 48.0, 32.0, 23.0, 10.0, 15.0, 10.0, 7.0, 7.0, 3.0, 6.0, 2.0], "bins": [-0.315673828125, -0.3064308166503906, -0.29718780517578125, -0.2879447937011719, -0.2787017822265625, -0.2694587707519531, -0.26021575927734375, -0.2509727478027344, -0.241729736328125, -0.23248672485351562, -0.22324371337890625, -0.21400070190429688, -0.2047576904296875, -0.19551467895507812, -0.18627166748046875, -0.17702865600585938, -0.16778564453125, -0.15854263305664062, -0.14929962158203125, -0.14005661010742188, -0.1308135986328125, -0.12157058715820312, -0.11232757568359375, -0.10308456420898438, -0.093841552734375, -0.08459854125976562, -0.07535552978515625, -0.06611251831054688, -0.0568695068359375, -0.047626495361328125, -0.03838348388671875, -0.029140472412109375, -0.0198974609375, -0.010654449462890625, -0.00141143798828125, 0.007831573486328125, 0.0170745849609375, 0.026317596435546875, 0.03556060791015625, 0.044803619384765625, 0.054046630859375, 0.06328964233398438, 0.07253265380859375, 0.08177566528320312, 0.0910186767578125, 0.10026168823242188, 0.10950469970703125, 0.11874771118164062, 0.12799072265625, 0.13723373413085938, 0.14647674560546875, 0.15571975708007812, 0.1649627685546875, 0.17420578002929688, 0.18344879150390625, 0.19269180297851562, 0.201934814453125, 0.21117782592773438, 0.22042083740234375, 0.22966384887695312, 0.2389068603515625, 0.24814987182617188, 0.25739288330078125, 0.2666358947753906, 0.27587890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 7.0, 9.0, 12.0, 10.0, 16.0, 15.0, 23.0, 22.0, 18.0, 20.0, 36.0, 20.0, 26.0, 40.0, 25.0, 41.0, 45.0, 40.0, 44.0, 53.0, 40.0, 38.0, 47.0, 33.0, 30.0, 31.0, 34.0, 25.0, 19.0, 27.0, 19.0, 23.0, 11.0, 19.0, 19.0, 20.0, 14.0, 4.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28125, -2.198883056640625, -2.11651611328125, -2.034149169921875, -1.9517822265625, -1.869415283203125, -1.78704833984375, -1.704681396484375, -1.622314453125, -1.539947509765625, -1.45758056640625, -1.375213623046875, -1.2928466796875, -1.210479736328125, -1.12811279296875, -1.045745849609375, -0.96337890625, -0.881011962890625, -0.79864501953125, -0.716278076171875, -0.6339111328125, -0.551544189453125, -0.46917724609375, -0.386810302734375, -0.304443359375, -0.222076416015625, -0.13970947265625, -0.057342529296875, 0.0250244140625, 0.107391357421875, 0.18975830078125, 0.272125244140625, 0.3544921875, 0.436859130859375, 0.51922607421875, 0.601593017578125, 0.6839599609375, 0.766326904296875, 0.84869384765625, 0.931060791015625, 1.013427734375, 1.095794677734375, 1.17816162109375, 1.260528564453125, 1.3428955078125, 1.425262451171875, 1.50762939453125, 1.589996337890625, 1.67236328125, 1.754730224609375, 1.83709716796875, 1.919464111328125, 2.0018310546875, 2.084197998046875, 2.16656494140625, 2.248931884765625, 2.331298828125, 2.413665771484375, 2.49603271484375, 2.578399658203125, 2.6607666015625, 2.743133544921875, 2.82550048828125, 2.907867431640625, 2.990234375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 7.0, 6.0, 7.0, 11.0, 16.0, 19.0, 25.0, 26.0, 59.0, 57.0, 85.0, 108.0, 148.0, 195.0, 308.0, 451.0, 649.0, 1094.0, 1778.0, 3170.0, 5974.0, 11518.0, 24087.0, 118039.0, 796702.0, 46413.0, 17614.0, 8661.0, 4488.0, 2536.0, 1451.0, 931.0, 610.0, 382.0, 260.0, 184.0, 123.0, 104.0, 59.0, 42.0, 34.0, 25.0, 20.0, 24.0, 11.0, 16.0, 10.0, 10.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9912109375, -0.95849609375, -0.92578125, -0.89306640625, -0.8603515625, -0.82763671875, -0.794921875, -0.76220703125, -0.7294921875, -0.69677734375, -0.6640625, -0.63134765625, -0.5986328125, -0.56591796875, -0.533203125, -0.50048828125, -0.4677734375, -0.43505859375, -0.40234375, -0.36962890625, -0.3369140625, -0.30419921875, -0.271484375, -0.23876953125, -0.2060546875, -0.17333984375, -0.140625, -0.10791015625, -0.0751953125, -0.04248046875, -0.009765625, 0.02294921875, 0.0556640625, 0.08837890625, 0.12109375, 0.15380859375, 0.1865234375, 0.21923828125, 0.251953125, 0.28466796875, 0.3173828125, 0.35009765625, 0.3828125, 0.41552734375, 0.4482421875, 0.48095703125, 0.513671875, 0.54638671875, 0.5791015625, 0.61181640625, 0.64453125, 0.67724609375, 0.7099609375, 0.74267578125, 0.775390625, 0.80810546875, 0.8408203125, 0.87353515625, 0.90625, 0.93896484375, 0.9716796875, 1.00439453125, 1.037109375, 1.06982421875, 1.1025390625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 4.0, 8.0, 5.0, 14.0, 14.0, 13.0, 22.0, 21.0, 15.0, 24.0, 20.0, 30.0, 34.0, 30.0, 30.0, 42.0, 36.0, 34.0, 29.0, 36.0, 43.0, 30.0, 35.0, 34.0, 29.0, 36.0, 35.0, 31.0, 31.0, 34.0, 25.0, 19.0, 15.0, 20.0, 21.0, 13.0, 14.0, 9.0, 9.0, 10.0, 8.0, 10.0, 8.0, 5.0, 3.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.6951446533203125, -1.640289306640625, -1.5854339599609375, -1.53057861328125, -1.4757232666015625, -1.420867919921875, -1.3660125732421875, -1.3111572265625, -1.2563018798828125, -1.201446533203125, -1.1465911865234375, -1.09173583984375, -1.0368804931640625, -0.982025146484375, -0.9271697998046875, -0.872314453125, -0.8174591064453125, -0.762603759765625, -0.7077484130859375, -0.65289306640625, -0.5980377197265625, -0.543182373046875, -0.4883270263671875, -0.4334716796875, -0.3786163330078125, -0.323760986328125, -0.2689056396484375, -0.21405029296875, -0.1591949462890625, -0.104339599609375, -0.0494842529296875, 0.00537109375, 0.0602264404296875, 0.115081787109375, 0.1699371337890625, 0.22479248046875, 0.2796478271484375, 0.334503173828125, 0.3893585205078125, 0.4442138671875, 0.4990692138671875, 0.553924560546875, 0.6087799072265625, 0.66363525390625, 0.7184906005859375, 0.773345947265625, 0.8282012939453125, 0.883056640625, 0.9379119873046875, 0.992767333984375, 1.0476226806640625, 1.10247802734375, 1.1573333740234375, 1.212188720703125, 1.2670440673828125, 1.3218994140625, 1.3767547607421875, 1.431610107421875, 1.4864654541015625, 1.54132080078125, 1.5961761474609375, 1.651031494140625, 1.7058868408203125, 1.7607421875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 5.0, 3.0, 2.0, 5.0, 13.0, 8.0, 17.0, 27.0, 41.0, 45.0, 52.0, 75.0, 95.0, 166.0, 267.0, 347.0, 566.0, 726.0, 1188.0, 1758.0, 2726.0, 4350.0, 7189.0, 12202.0, 22586.0, 81549.0, 834490.0, 35479.0, 16747.0, 9663.0, 5644.0, 3639.0, 2321.0, 1483.0, 988.0, 660.0, 424.0, 305.0, 211.0, 152.0, 95.0, 65.0, 49.0, 35.0, 32.0, 21.0, 13.0, 14.0, 9.0, 6.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.259033203125, -0.24953460693359375, -0.2400360107421875, -0.23053741455078125, -0.221038818359375, -0.21154022216796875, -0.2020416259765625, -0.19254302978515625, -0.18304443359375, -0.17354583740234375, -0.1640472412109375, -0.15454864501953125, -0.145050048828125, -0.13555145263671875, -0.1260528564453125, -0.11655426025390625, -0.1070556640625, -0.09755706787109375, -0.0880584716796875, -0.07855987548828125, -0.069061279296875, -0.05956268310546875, -0.0500640869140625, -0.04056549072265625, -0.03106689453125, -0.02156829833984375, -0.0120697021484375, -0.00257110595703125, 0.006927490234375, 0.01642608642578125, 0.0259246826171875, 0.03542327880859375, 0.044921875, 0.05442047119140625, 0.0639190673828125, 0.07341766357421875, 0.082916259765625, 0.09241485595703125, 0.1019134521484375, 0.11141204833984375, 0.12091064453125, 0.13040924072265625, 0.1399078369140625, 0.14940643310546875, 0.158905029296875, 0.16840362548828125, 0.1779022216796875, 0.18740081787109375, 0.1968994140625, 0.20639801025390625, 0.2158966064453125, 0.22539520263671875, 0.234893798828125, 0.24439239501953125, 0.2538909912109375, 0.26338958740234375, 0.27288818359375, 0.28238677978515625, 0.2918853759765625, 0.30138397216796875, 0.310882568359375, 0.32038116455078125, 0.3298797607421875, 0.33937835693359375, 0.348876953125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 4.0, 12.0, 6.0, 11.0, 17.0, 21.0, 19.0, 25.0, 18.0, 26.0, 19.0, 39.0, 32.0, 43.0, 40.0, 43.0, 35.0, 53.0, 37.0, 56.0, 42.0, 55.0, 40.0, 43.0, 45.0, 34.0, 26.0, 26.0, 24.0, 18.0, 17.0, 6.0, 13.0, 13.0, 14.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.562999725341797e-05, -2.470053732395172e-05, -2.3771077394485474e-05, -2.2841617465019226e-05, -2.191215753555298e-05, -2.098269760608673e-05, -2.0053237676620483e-05, -1.9123777747154236e-05, -1.8194317817687988e-05, -1.726485788822174e-05, -1.6335397958755493e-05, -1.5405938029289246e-05, -1.4476478099822998e-05, -1.354701817035675e-05, -1.2617558240890503e-05, -1.1688098311424255e-05, -1.0758638381958008e-05, -9.82917845249176e-06, -8.899718523025513e-06, -7.970258593559265e-06, -7.040798664093018e-06, -6.11133873462677e-06, -5.1818788051605225e-06, -4.252418875694275e-06, -3.3229589462280273e-06, -2.3934990167617798e-06, -1.4640390872955322e-06, -5.345791578292847e-07, 3.948807716369629e-07, 1.3243407011032104e-06, 2.253800630569458e-06, 3.1832605600357056e-06, 4.112720489501953e-06, 5.042180418968201e-06, 5.971640348434448e-06, 6.901100277900696e-06, 7.830560207366943e-06, 8.760020136833191e-06, 9.689480066299438e-06, 1.0618939995765686e-05, 1.1548399925231934e-05, 1.2477859854698181e-05, 1.3407319784164429e-05, 1.4336779713630676e-05, 1.5266239643096924e-05, 1.619569957256317e-05, 1.712515950202942e-05, 1.8054619431495667e-05, 1.8984079360961914e-05, 1.991353929042816e-05, 2.084299921989441e-05, 2.1772459149360657e-05, 2.2701919078826904e-05, 2.3631379008293152e-05, 2.45608389377594e-05, 2.5490298867225647e-05, 2.6419758796691895e-05, 2.7349218726158142e-05, 2.827867865562439e-05, 2.9208138585090637e-05, 3.0137598514556885e-05, 3.106705844402313e-05, 3.199651837348938e-05, 3.292597830295563e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 12.0, 23.0, 29.0, 40.0, 61.0, 68.0, 111.0, 172.0, 255.0, 422.0, 757.0, 1277.0, 2200.0, 3683.0, 6939.0, 13388.0, 27587.0, 58850.0, 130249.0, 254678.0, 271229.0, 146350.0, 66656.0, 30960.0, 15126.0, 7651.0, 4123.0, 2271.0, 1280.0, 823.0, 473.0, 291.0, 167.0, 126.0, 78.0, 50.0, 25.0, 15.0, 16.0, 5.0, 7.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 5.0, 0.0, 2.0], "bins": [-0.1693115234375, -0.16434288024902344, -0.15937423706054688, -0.1544055938720703, -0.14943695068359375, -0.1444683074951172, -0.13949966430664062, -0.13453102111816406, -0.1295623779296875, -0.12459373474121094, -0.11962509155273438, -0.11465644836425781, -0.10968780517578125, -0.10471916198730469, -0.09975051879882812, -0.09478187561035156, -0.089813232421875, -0.08484458923339844, -0.07987594604492188, -0.07490730285644531, -0.06993865966796875, -0.06497001647949219, -0.060001373291015625, -0.05503273010253906, -0.0500640869140625, -0.04509544372558594, -0.040126800537109375, -0.03515815734863281, -0.03018951416015625, -0.025220870971679688, -0.020252227783203125, -0.015283584594726562, -0.01031494140625, -0.0053462982177734375, -0.000377655029296875, 0.0045909881591796875, 0.00955963134765625, 0.014528274536132812, 0.019496917724609375, 0.024465560913085938, 0.0294342041015625, 0.03440284729003906, 0.039371490478515625, 0.04434013366699219, 0.04930877685546875, 0.05427742004394531, 0.059246063232421875, 0.06421470642089844, 0.069183349609375, 0.07415199279785156, 0.07912063598632812, 0.08408927917480469, 0.08905792236328125, 0.09402656555175781, 0.09899520874023438, 0.10396385192871094, 0.1089324951171875, 0.11390113830566406, 0.11886978149414062, 0.12383842468261719, 0.12880706787109375, 0.1337757110595703, 0.13874435424804688, 0.14371299743652344, 0.148681640625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 6.0, 3.0, 7.0, 16.0, 14.0, 10.0, 15.0, 16.0, 24.0, 29.0, 43.0, 62.0, 54.0, 76.0, 69.0, 85.0, 76.0, 56.0, 58.0, 54.0, 45.0, 22.0, 33.0, 18.0, 25.0, 20.0, 17.0, 10.0, 11.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06414794921875, -0.06186485290527344, -0.059581756591796875, -0.05729866027832031, -0.05501556396484375, -0.05273246765136719, -0.050449371337890625, -0.04816627502441406, -0.0458831787109375, -0.04360008239746094, -0.041316986083984375, -0.03903388977050781, -0.03675079345703125, -0.03446769714355469, -0.032184600830078125, -0.029901504516601562, -0.027618408203125, -0.025335311889648438, -0.023052215576171875, -0.020769119262695312, -0.01848602294921875, -0.016202926635742188, -0.013919830322265625, -0.011636734008789062, -0.0093536376953125, -0.0070705413818359375, -0.004787445068359375, -0.0025043487548828125, -0.00022125244140625, 0.0020618438720703125, 0.004344940185546875, 0.0066280364990234375, 0.0089111328125, 0.011194229125976562, 0.013477325439453125, 0.015760421752929688, 0.01804351806640625, 0.020326614379882812, 0.022609710693359375, 0.024892807006835938, 0.0271759033203125, 0.029458999633789062, 0.031742095947265625, 0.03402519226074219, 0.03630828857421875, 0.03859138488769531, 0.040874481201171875, 0.04315757751464844, 0.045440673828125, 0.04772377014160156, 0.050006866455078125, 0.05228996276855469, 0.05457305908203125, 0.05685615539550781, 0.059139251708984375, 0.06142234802246094, 0.0637054443359375, 0.06598854064941406, 0.06827163696289062, 0.07055473327636719, 0.07283782958984375, 0.07512092590332031, 0.07740402221679688, 0.07968711853027344, 0.08197021484375]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 8.0, 9.0, 6.0, 10.0, 10.0, 11.0, 18.0, 15.0, 25.0, 20.0, 39.0, 35.0, 50.0, 44.0, 51.0, 56.0, 46.0, 60.0, 53.0, 61.0, 44.0, 48.0, 34.0, 34.0, 32.0, 39.0, 18.0, 26.0, 22.0, 14.0, 9.0, 18.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2084171772003174, -3.0880517959594727, -2.967686653137207, -2.8473212718963623, -2.7269558906555176, -2.606590747833252, -2.4862253665924072, -2.3658599853515625, -2.245494842529297, -2.125129461288452, -2.0047643184661865, -1.8843989372253418, -1.764033555984497, -1.643668293952942, -1.5233030319213867, -1.402937650680542, -1.2825722694396973, -1.162207007408142, -1.0418416261672974, -0.9214763641357422, -0.8011110424995422, -0.6807457208633423, -0.5603804588317871, -0.44001513719558716, -0.3196498155593872, -0.19928450882434845, -0.07891920208930969, 0.04144608974456787, 0.16181141138076782, 0.2821767330169678, 0.40254199504852295, 0.5229073166847229, 0.643272876739502, 0.7636381983757019, 0.8840035200119019, 1.004368782043457, 1.1247341632843018, 1.245099425315857, 1.365464687347412, 1.4858300685882568, 1.606195330619812, 1.7265605926513672, 1.846925973892212, 1.967291235923767, 2.0876564979553223, 2.208021879196167, 2.3283872604370117, 2.4487524032592773, 2.569117784500122, 2.689483165740967, 2.8098483085632324, 2.930213689804077, 3.050579071044922, 3.1709442138671875, 3.2913095951080322, 3.411674976348877, 3.5320401191711426, 3.6524055004119873, 3.772770643234253, 3.8931360244750977, 4.013501167297363, 4.133866786956787, 4.254231929779053, 4.374597072601318, 4.494962692260742]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 8.0, 9.0, 12.0, 6.0, 8.0, 10.0, 16.0, 17.0, 14.0, 26.0, 14.0, 19.0, 27.0, 40.0, 33.0, 30.0, 30.0, 29.0, 37.0, 40.0, 49.0, 50.0, 42.0, 26.0, 30.0, 31.0, 39.0, 33.0, 31.0, 36.0, 24.0, 17.0, 14.0, 18.0, 23.0, 22.0, 18.0, 10.0, 12.0, 11.0, 7.0, 6.0, 5.0, 10.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-2.064056634902954, -1.9949069023132324, -1.9257571697235107, -1.856607437133789, -1.7874577045440674, -1.7183079719543457, -1.649158239364624, -1.5800085067749023, -1.5108587741851807, -1.441709041595459, -1.3725593090057373, -1.3034095764160156, -1.234259843826294, -1.1651101112365723, -1.0959603786468506, -1.026810646057129, -0.9576607942581177, -0.888511061668396, -0.8193613290786743, -0.7502115964889526, -0.681061863899231, -0.6119121313095093, -0.5427623391151428, -0.47361260652542114, -0.40446287393569946, -0.3353131413459778, -0.2661634087562561, -0.19701364636421204, -0.12786391377449036, -0.05871418118476868, 0.01043558120727539, 0.07958531379699707, 0.14873504638671875, 0.21788477897644043, 0.2870345115661621, 0.3561842739582062, 0.42533400654792786, 0.49448373913764954, 0.5636335015296936, 0.6327832341194153, 0.701932966709137, 0.7710826992988586, 0.8402324318885803, 0.9093822240829468, 0.9785319566726685, 1.0476816892623901, 1.1168314218521118, 1.1859811544418335, 1.2551308870315552, 1.3242806196212769, 1.3934303522109985, 1.4625800848007202, 1.531729817390442, 1.6008795499801636, 1.6700294017791748, 1.7391791343688965, 1.8083288669586182, 1.8774785995483398, 1.9466283321380615, 2.015778064727783, 2.084927797317505, 2.1540775299072266, 2.2232272624969482, 2.29237699508667, 2.3615267276763916]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 14.0, 19.0, 21.0, 34.0, 57.0, 84.0, 104.0, 166.0, 259.0, 423.0, 609.0, 913.0, 1560.0, 2424.0, 4022.0, 6612.0, 11138.0, 18550.0, 31169.0, 49787.0, 76607.0, 108486.0, 137858.0, 150213.0, 137697.0, 108016.0, 76042.0, 48777.0, 30343.0, 18343.0, 11057.0, 6567.0, 3908.0, 2419.0, 1487.0, 921.0, 591.0, 397.0, 284.0, 189.0, 126.0, 65.0, 73.0, 33.0, 27.0, 16.0, 16.0, 11.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.451171875, -2.373321533203125, -2.29547119140625, -2.217620849609375, -2.1397705078125, -2.061920166015625, -1.98406982421875, -1.906219482421875, -1.828369140625, -1.750518798828125, -1.67266845703125, -1.594818115234375, -1.5169677734375, -1.439117431640625, -1.36126708984375, -1.283416748046875, -1.20556640625, -1.127716064453125, -1.04986572265625, -0.972015380859375, -0.8941650390625, -0.816314697265625, -0.73846435546875, -0.660614013671875, -0.582763671875, -0.504913330078125, -0.42706298828125, -0.349212646484375, -0.2713623046875, -0.193511962890625, -0.11566162109375, -0.037811279296875, 0.0400390625, 0.117889404296875, 0.19573974609375, 0.273590087890625, 0.3514404296875, 0.429290771484375, 0.50714111328125, 0.584991455078125, 0.662841796875, 0.740692138671875, 0.81854248046875, 0.896392822265625, 0.9742431640625, 1.052093505859375, 1.12994384765625, 1.207794189453125, 1.28564453125, 1.363494873046875, 1.44134521484375, 1.519195556640625, 1.5970458984375, 1.674896240234375, 1.75274658203125, 1.830596923828125, 1.908447265625, 1.986297607421875, 2.06414794921875, 2.141998291015625, 2.2198486328125, 2.297698974609375, 2.37554931640625, 2.453399658203125, 2.53125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 4.0, 10.0, 11.0, 10.0, 8.0, 17.0, 24.0, 20.0, 24.0, 22.0, 18.0, 33.0, 19.0, 35.0, 39.0, 26.0, 49.0, 46.0, 50.0, 41.0, 39.0, 29.0, 39.0, 43.0, 32.0, 30.0, 29.0, 28.0, 23.0, 28.0, 27.0, 18.0, 14.0, 19.0, 14.0, 13.0, 11.0, 9.0, 11.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0], "bins": [-2.333984375, -2.254425048828125, -2.17486572265625, -2.095306396484375, -2.0157470703125, -1.936187744140625, -1.85662841796875, -1.777069091796875, -1.697509765625, -1.617950439453125, -1.53839111328125, -1.458831787109375, -1.3792724609375, -1.299713134765625, -1.22015380859375, -1.140594482421875, -1.06103515625, -0.981475830078125, -0.90191650390625, -0.822357177734375, -0.7427978515625, -0.663238525390625, -0.58367919921875, -0.504119873046875, -0.424560546875, -0.345001220703125, -0.26544189453125, -0.185882568359375, -0.1063232421875, -0.026763916015625, 0.05279541015625, 0.132354736328125, 0.2119140625, 0.291473388671875, 0.37103271484375, 0.450592041015625, 0.5301513671875, 0.609710693359375, 0.68927001953125, 0.768829345703125, 0.848388671875, 0.927947998046875, 1.00750732421875, 1.087066650390625, 1.1666259765625, 1.246185302734375, 1.32574462890625, 1.405303955078125, 1.48486328125, 1.564422607421875, 1.64398193359375, 1.723541259765625, 1.8031005859375, 1.882659912109375, 1.96221923828125, 2.041778564453125, 2.121337890625, 2.200897216796875, 2.28045654296875, 2.360015869140625, 2.4395751953125, 2.519134521484375, 2.59869384765625, 2.678253173828125, 2.7578125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 9.0, 9.0, 15.0, 28.0, 41.0, 60.0, 97.0, 127.0, 228.0, 310.0, 407.0, 718.0, 1129.0, 1664.0, 2514.0, 3922.0, 5911.0, 8993.0, 14307.0, 21533.0, 32764.0, 47827.0, 69122.0, 93037.0, 115252.0, 129046.0, 125140.0, 107743.0, 83663.0, 60639.0, 41578.0, 27840.0, 18275.0, 11956.0, 7723.0, 5136.0, 3386.0, 2207.0, 1447.0, 927.0, 562.0, 420.0, 266.0, 175.0, 125.0, 104.0, 63.0, 36.0, 31.0, 13.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0], "bins": [-2.25, -2.181427001953125, -2.11285400390625, -2.044281005859375, -1.9757080078125, -1.907135009765625, -1.83856201171875, -1.769989013671875, -1.701416015625, -1.632843017578125, -1.56427001953125, -1.495697021484375, -1.4271240234375, -1.358551025390625, -1.28997802734375, -1.221405029296875, -1.15283203125, -1.084259033203125, -1.01568603515625, -0.947113037109375, -0.8785400390625, -0.809967041015625, -0.74139404296875, -0.672821044921875, -0.604248046875, -0.535675048828125, -0.46710205078125, -0.398529052734375, -0.3299560546875, -0.261383056640625, -0.19281005859375, -0.124237060546875, -0.0556640625, 0.012908935546875, 0.08148193359375, 0.150054931640625, 0.2186279296875, 0.287200927734375, 0.35577392578125, 0.424346923828125, 0.492919921875, 0.561492919921875, 0.63006591796875, 0.698638916015625, 0.7672119140625, 0.835784912109375, 0.90435791015625, 0.972930908203125, 1.04150390625, 1.110076904296875, 1.17864990234375, 1.247222900390625, 1.3157958984375, 1.384368896484375, 1.45294189453125, 1.521514892578125, 1.590087890625, 1.658660888671875, 1.72723388671875, 1.795806884765625, 1.8643798828125, 1.932952880859375, 2.00152587890625, 2.070098876953125, 2.138671875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 7.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 13.0, 18.0, 16.0, 20.0, 26.0, 29.0, 18.0, 37.0, 40.0, 50.0, 48.0, 31.0, 43.0, 44.0, 37.0, 47.0, 48.0, 41.0, 42.0, 48.0, 35.0, 33.0, 36.0, 18.0, 25.0, 22.0, 22.0, 16.0, 11.0, 8.0, 9.0, 4.0, 8.0, 12.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.828125, -1.770233154296875, -1.71234130859375, -1.654449462890625, -1.5965576171875, -1.538665771484375, -1.48077392578125, -1.422882080078125, -1.364990234375, -1.307098388671875, -1.24920654296875, -1.191314697265625, -1.1334228515625, -1.075531005859375, -1.01763916015625, -0.959747314453125, -0.90185546875, -0.843963623046875, -0.78607177734375, -0.728179931640625, -0.6702880859375, -0.612396240234375, -0.55450439453125, -0.496612548828125, -0.438720703125, -0.380828857421875, -0.32293701171875, -0.265045166015625, -0.2071533203125, -0.149261474609375, -0.09136962890625, -0.033477783203125, 0.0244140625, 0.082305908203125, 0.14019775390625, 0.198089599609375, 0.2559814453125, 0.313873291015625, 0.37176513671875, 0.429656982421875, 0.487548828125, 0.545440673828125, 0.60333251953125, 0.661224365234375, 0.7191162109375, 0.777008056640625, 0.83489990234375, 0.892791748046875, 0.95068359375, 1.008575439453125, 1.06646728515625, 1.124359130859375, 1.1822509765625, 1.240142822265625, 1.29803466796875, 1.355926513671875, 1.413818359375, 1.471710205078125, 1.52960205078125, 1.587493896484375, 1.6453857421875, 1.703277587890625, 1.76116943359375, 1.819061279296875, 1.876953125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 13.0, 14.0, 23.0, 29.0, 43.0, 64.0, 93.0, 154.0, 256.0, 403.0, 656.0, 1166.0, 1897.0, 3336.0, 5876.0, 10222.0, 18268.0, 32339.0, 56490.0, 93837.0, 143808.0, 182255.0, 174814.0, 129306.0, 81618.0, 48177.0, 27264.0, 15309.0, 8828.0, 4834.0, 2949.0, 1652.0, 989.0, 588.0, 362.0, 218.0, 145.0, 81.0, 58.0, 42.0, 19.0, 19.0, 14.0, 3.0, 12.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5177154541015625, -1.465118408203125, -1.4125213623046875, -1.35992431640625, -1.3073272705078125, -1.254730224609375, -1.2021331787109375, -1.1495361328125, -1.0969390869140625, -1.044342041015625, -0.9917449951171875, -0.93914794921875, -0.8865509033203125, -0.833953857421875, -0.7813568115234375, -0.728759765625, -0.6761627197265625, -0.623565673828125, -0.5709686279296875, -0.51837158203125, -0.4657745361328125, -0.413177490234375, -0.3605804443359375, -0.3079833984375, -0.2553863525390625, -0.202789306640625, -0.1501922607421875, -0.09759521484375, -0.0449981689453125, 0.007598876953125, 0.0601959228515625, 0.11279296875, 0.1653900146484375, 0.217987060546875, 0.2705841064453125, 0.32318115234375, 0.3757781982421875, 0.428375244140625, 0.4809722900390625, 0.5335693359375, 0.5861663818359375, 0.638763427734375, 0.6913604736328125, 0.74395751953125, 0.7965545654296875, 0.849151611328125, 0.9017486572265625, 0.954345703125, 1.0069427490234375, 1.059539794921875, 1.1121368408203125, 1.16473388671875, 1.2173309326171875, 1.269927978515625, 1.3225250244140625, 1.3751220703125, 1.4277191162109375, 1.480316162109375, 1.5329132080078125, 1.58551025390625, 1.6381072998046875, 1.690704345703125, 1.7433013916015625, 1.7958984375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 8.0, 3.0, 6.0, 11.0, 14.0, 15.0, 13.0, 22.0, 31.0, 26.0, 36.0, 40.0, 39.0, 48.0, 39.0, 55.0, 41.0, 59.0, 45.0, 49.0, 54.0, 48.0, 41.0, 35.0, 36.0, 26.0, 25.0, 24.0, 16.0, 17.0, 18.0, 12.0, 8.0, 9.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001214146614074707, -0.00011733081191778183, -0.00011324696242809296, -0.00010916311293840408, -0.00010507926344871521, -0.00010099541395902634, -9.691156446933746e-05, -9.282771497964859e-05, -8.874386548995972e-05, -8.466001600027084e-05, -8.057616651058197e-05, -7.64923170208931e-05, -7.240846753120422e-05, -6.832461804151535e-05, -6.424076855182648e-05, -6.0156919062137604e-05, -5.607306957244873e-05, -5.198922008275986e-05, -4.7905370593070984e-05, -4.382152110338211e-05, -3.973767161369324e-05, -3.5653822124004364e-05, -3.156997263431549e-05, -2.7486123144626617e-05, -2.3402273654937744e-05, -1.931842416524887e-05, -1.5234574675559998e-05, -1.1150725185871124e-05, -7.066875696182251e-06, -2.9830262064933777e-06, 1.1008232831954956e-06, 5.184672772884369e-06, 9.268522262573242e-06, 1.3352371752262115e-05, 1.743622124195099e-05, 2.1520070731639862e-05, 2.5603920221328735e-05, 2.968776971101761e-05, 3.377161920070648e-05, 3.7855468690395355e-05, 4.193931818008423e-05, 4.60231676697731e-05, 5.0107017159461975e-05, 5.419086664915085e-05, 5.827471613883972e-05, 6.23585656285286e-05, 6.644241511821747e-05, 7.052626460790634e-05, 7.461011409759521e-05, 7.869396358728409e-05, 8.277781307697296e-05, 8.686166256666183e-05, 9.094551205635071e-05, 9.502936154603958e-05, 9.911321103572845e-05, 0.00010319706052541733, 0.0001072809100151062, 0.00011136475950479507, 0.00011544860899448395, 0.00011953245848417282, 0.0001236163079738617, 0.00012770015746355057, 0.00013178400695323944, 0.00013586785644292831, 0.0001399517059326172]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 11.0, 14.0, 22.0, 42.0, 46.0, 97.0, 139.0, 205.0, 343.0, 547.0, 880.0, 1436.0, 2382.0, 4010.0, 6724.0, 10976.0, 18127.0, 30230.0, 49581.0, 76893.0, 113280.0, 148222.0, 160438.0, 140719.0, 103589.0, 69046.0, 43475.0, 26562.0, 16209.0, 9600.0, 5827.0, 3471.0, 2056.0, 1290.0, 749.0, 459.0, 303.0, 203.0, 134.0, 83.0, 40.0, 44.0, 15.0, 12.0, 13.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4052734375, -1.3618621826171875, -1.318450927734375, -1.2750396728515625, -1.23162841796875, -1.1882171630859375, -1.144805908203125, -1.1013946533203125, -1.0579833984375, -1.0145721435546875, -0.971160888671875, -0.9277496337890625, -0.88433837890625, -0.8409271240234375, -0.797515869140625, -0.7541046142578125, -0.710693359375, -0.6672821044921875, -0.623870849609375, -0.5804595947265625, -0.53704833984375, -0.4936370849609375, -0.450225830078125, -0.4068145751953125, -0.3634033203125, -0.3199920654296875, -0.276580810546875, -0.2331695556640625, -0.18975830078125, -0.1463470458984375, -0.102935791015625, -0.0595245361328125, -0.01611328125, 0.0272979736328125, 0.070709228515625, 0.1141204833984375, 0.15753173828125, 0.2009429931640625, 0.244354248046875, 0.2877655029296875, 0.3311767578125, 0.3745880126953125, 0.417999267578125, 0.4614105224609375, 0.50482177734375, 0.5482330322265625, 0.591644287109375, 0.6350555419921875, 0.678466796875, 0.7218780517578125, 0.765289306640625, 0.8087005615234375, 0.85211181640625, 0.8955230712890625, 0.938934326171875, 0.9823455810546875, 1.0257568359375, 1.0691680908203125, 1.112579345703125, 1.1559906005859375, 1.19940185546875, 1.2428131103515625, 1.286224365234375, 1.3296356201171875, 1.373046875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 3.0, 9.0, 9.0, 5.0, 16.0, 13.0, 17.0, 22.0, 28.0, 23.0, 41.0, 40.0, 33.0, 41.0, 52.0, 41.0, 43.0, 56.0, 47.0, 54.0, 53.0, 47.0, 47.0, 37.0, 34.0, 35.0, 34.0, 22.0, 17.0, 18.0, 9.0, 16.0, 10.0, 9.0, 6.0, 6.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37255859375, -0.359283447265625, -0.34600830078125, -0.332733154296875, -0.3194580078125, -0.306182861328125, -0.29290771484375, -0.279632568359375, -0.266357421875, -0.253082275390625, -0.23980712890625, -0.226531982421875, -0.2132568359375, -0.199981689453125, -0.18670654296875, -0.173431396484375, -0.16015625, -0.146881103515625, -0.13360595703125, -0.120330810546875, -0.1070556640625, -0.093780517578125, -0.08050537109375, -0.067230224609375, -0.053955078125, -0.040679931640625, -0.02740478515625, -0.014129638671875, -0.0008544921875, 0.012420654296875, 0.02569580078125, 0.038970947265625, 0.05224609375, 0.065521240234375, 0.07879638671875, 0.092071533203125, 0.1053466796875, 0.118621826171875, 0.13189697265625, 0.145172119140625, 0.158447265625, 0.171722412109375, 0.18499755859375, 0.198272705078125, 0.2115478515625, 0.224822998046875, 0.23809814453125, 0.251373291015625, 0.2646484375, 0.277923583984375, 0.29119873046875, 0.304473876953125, 0.3177490234375, 0.331024169921875, 0.34429931640625, 0.357574462890625, 0.370849609375, 0.384124755859375, 0.39739990234375, 0.410675048828125, 0.4239501953125, 0.437225341796875, 0.45050048828125, 0.463775634765625, 0.47705078125]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 4.0, 14.0, 11.0, 9.0, 15.0, 18.0, 13.0, 17.0, 31.0, 27.0, 41.0, 43.0, 42.0, 55.0, 63.0, 61.0, 68.0, 61.0, 58.0, 45.0, 61.0, 31.0, 35.0, 25.0, 29.0, 32.0, 27.0, 16.0, 10.0, 7.0, 4.0, 5.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.737412691116333, -3.605987548828125, -3.474562406539917, -3.343137264251709, -3.211712121963501, -3.080286979675293, -2.948861837387085, -2.817436695098877, -2.686011552810669, -2.554586410522461, -2.423161268234253, -2.291736125946045, -2.160310983657837, -2.028885841369629, -1.897460699081421, -1.766035556793213, -1.6346104145050049, -1.5031852722167969, -1.3717601299285889, -1.2403349876403809, -1.1089098453521729, -0.9774847030639648, -0.8460595607757568, -0.7146344184875488, -0.5832092761993408, -0.4517841339111328, -0.3203589916229248, -0.1889338493347168, -0.05750870704650879, 0.07391643524169922, 0.20534157752990723, 0.33676671981811523, 0.46819162368774414, 0.5996167659759521, 0.7310419082641602, 0.8624670505523682, 0.9938921928405762, 1.1253173351287842, 1.2567424774169922, 1.3881676197052002, 1.5195927619934082, 1.6510179042816162, 1.7824430465698242, 1.9138681888580322, 2.0452933311462402, 2.1767184734344482, 2.3081436157226562, 2.4395687580108643, 2.5709939002990723, 2.7024190425872803, 2.8338441848754883, 2.9652693271636963, 3.0966944694519043, 3.2281196117401123, 3.3595447540283203, 3.4909698963165283, 3.6223950386047363, 3.7538201808929443, 3.8852453231811523, 4.016670227050781, 4.148095607757568, 4.2795209884643555, 4.410945892333984, 4.542370796203613, 4.6737961769104]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 9.0, 9.0, 7.0, 9.0, 9.0, 14.0, 12.0, 24.0, 22.0, 30.0, 31.0, 25.0, 35.0, 35.0, 35.0, 40.0, 36.0, 33.0, 30.0, 39.0, 32.0, 44.0, 47.0, 49.0, 44.0, 37.0, 25.0, 27.0, 27.0, 19.0, 27.0, 15.0, 13.0, 17.0, 20.0, 11.0, 14.0, 6.0, 7.0, 4.0, 9.0, 3.0, 2.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.0968737602233887, -2.024630546569824, -1.9523870944976807, -1.8801438808441162, -1.8079005479812622, -1.7356572151184082, -1.6634140014648438, -1.5911706686019897, -1.5189273357391357, -1.4466840028762817, -1.3744406700134277, -1.3021974563598633, -1.2299541234970093, -1.1577107906341553, -1.0854675769805908, -1.0132242441177368, -0.9409809112548828, -0.8687375783920288, -0.7964943051338196, -0.7242510318756104, -0.6520076990127563, -0.5797643661499023, -0.5075210928916931, -0.4352778196334839, -0.3630344867706299, -0.29079118371009827, -0.21854788064956665, -0.14630457758903503, -0.07406127452850342, -0.0018179714679718018, 0.07042533159255981, 0.14266860485076904, 0.21491169929504395, 0.28715500235557556, 0.3593983054161072, 0.4316416084766388, 0.5038849115371704, 0.5761282444000244, 0.6483715176582336, 0.7206147909164429, 0.7928581237792969, 0.8651014566421509, 0.9373447299003601, 1.0095880031585693, 1.0818313360214233, 1.1540746688842773, 1.2263178825378418, 1.2985612154006958, 1.3708045482635498, 1.4430478811264038, 1.5152912139892578, 1.5875344276428223, 1.6597777605056763, 1.7320210933685303, 1.8042643070220947, 1.8765076398849487, 1.9487509727478027, 2.020994186401367, 2.0932376384735107, 2.165480852127075, 2.2377243041992188, 2.309967517852783, 2.3822107315063477, 2.454453945159912, 2.5266973972320557]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 4.0, 5.0, 5.0, 11.0, 15.0, 15.0, 31.0, 53.0, 50.0, 84.0, 107.0, 164.0, 243.0, 360.0, 595.0, 951.0, 1362.0, 2329.0, 3856.0, 6858.0, 12539.0, 23711.0, 47416.0, 100038.0, 229439.0, 552685.0, 1117856.0, 1118593.0, 544901.0, 225033.0, 100026.0, 47521.0, 24514.0, 13433.0, 7620.0, 4376.0, 2776.0, 1663.0, 1092.0, 682.0, 473.0, 284.0, 187.0, 130.0, 73.0, 49.0, 28.0, 19.0, 13.0, 10.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.40234375, -4.26031494140625, -4.1182861328125, -3.97625732421875, -3.834228515625, -3.69219970703125, -3.5501708984375, -3.40814208984375, -3.26611328125, -3.12408447265625, -2.9820556640625, -2.84002685546875, -2.697998046875, -2.55596923828125, -2.4139404296875, -2.27191162109375, -2.1298828125, -1.98785400390625, -1.8458251953125, -1.70379638671875, -1.561767578125, -1.41973876953125, -1.2777099609375, -1.13568115234375, -0.99365234375, -0.85162353515625, -0.7095947265625, -0.56756591796875, -0.425537109375, -0.28350830078125, -0.1414794921875, 0.00054931640625, 0.142578125, 0.28460693359375, 0.4266357421875, 0.56866455078125, 0.710693359375, 0.85272216796875, 0.9947509765625, 1.13677978515625, 1.27880859375, 1.42083740234375, 1.5628662109375, 1.70489501953125, 1.846923828125, 1.98895263671875, 2.1309814453125, 2.27301025390625, 2.4150390625, 2.55706787109375, 2.6990966796875, 2.84112548828125, 2.983154296875, 3.12518310546875, 3.2672119140625, 3.40924072265625, 3.55126953125, 3.69329833984375, 3.8353271484375, 3.97735595703125, 4.119384765625, 4.26141357421875, 4.4034423828125, 4.54547119140625, 4.6875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 5.0, 11.0, 5.0, 7.0, 17.0, 16.0, 10.0, 26.0, 18.0, 17.0, 37.0, 34.0, 29.0, 45.0, 42.0, 34.0, 38.0, 45.0, 40.0, 46.0, 40.0, 46.0, 54.0, 44.0, 22.0, 29.0, 28.0, 27.0, 24.0, 24.0, 25.0, 27.0, 13.0, 16.0, 14.0, 11.0, 10.0, 4.0, 7.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7919921875, -1.734954833984375, -1.67791748046875, -1.620880126953125, -1.5638427734375, -1.506805419921875, -1.44976806640625, -1.392730712890625, -1.335693359375, -1.278656005859375, -1.22161865234375, -1.164581298828125, -1.1075439453125, -1.050506591796875, -0.99346923828125, -0.936431884765625, -0.87939453125, -0.822357177734375, -0.76531982421875, -0.708282470703125, -0.6512451171875, -0.594207763671875, -0.53717041015625, -0.480133056640625, -0.423095703125, -0.366058349609375, -0.30902099609375, -0.251983642578125, -0.1949462890625, -0.137908935546875, -0.08087158203125, -0.023834228515625, 0.033203125, 0.090240478515625, 0.14727783203125, 0.204315185546875, 0.2613525390625, 0.318389892578125, 0.37542724609375, 0.432464599609375, 0.489501953125, 0.546539306640625, 0.60357666015625, 0.660614013671875, 0.7176513671875, 0.774688720703125, 0.83172607421875, 0.888763427734375, 0.94580078125, 1.002838134765625, 1.05987548828125, 1.116912841796875, 1.1739501953125, 1.230987548828125, 1.28802490234375, 1.345062255859375, 1.402099609375, 1.459136962890625, 1.51617431640625, 1.573211669921875, 1.6302490234375, 1.687286376953125, 1.74432373046875, 1.801361083984375, 1.8583984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 6.0, 15.0, 20.0, 32.0, 57.0, 74.0, 131.0, 211.0, 321.0, 518.0, 853.0, 1404.0, 2213.0, 3707.0, 6283.0, 10778.0, 19348.0, 36010.0, 67104.0, 131689.0, 264487.0, 532742.0, 931319.0, 981830.0, 592995.0, 297473.0, 147644.0, 74988.0, 39427.0, 21663.0, 11878.0, 6744.0, 3924.0, 2364.0, 1483.0, 884.0, 566.0, 363.0, 256.0, 134.0, 88.0, 70.0, 49.0, 51.0, 21.0, 15.0, 16.0, 5.0, 7.0, 11.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.9658203125, -3.833984375, -3.7021484375, -3.5703125, -3.4384765625, -3.306640625, -3.1748046875, -3.04296875, -2.9111328125, -2.779296875, -2.6474609375, -2.515625, -2.3837890625, -2.251953125, -2.1201171875, -1.98828125, -1.8564453125, -1.724609375, -1.5927734375, -1.4609375, -1.3291015625, -1.197265625, -1.0654296875, -0.93359375, -0.8017578125, -0.669921875, -0.5380859375, -0.40625, -0.2744140625, -0.142578125, -0.0107421875, 0.12109375, 0.2529296875, 0.384765625, 0.5166015625, 0.6484375, 0.7802734375, 0.912109375, 1.0439453125, 1.17578125, 1.3076171875, 1.439453125, 1.5712890625, 1.703125, 1.8349609375, 1.966796875, 2.0986328125, 2.23046875, 2.3623046875, 2.494140625, 2.6259765625, 2.7578125, 2.8896484375, 3.021484375, 3.1533203125, 3.28515625, 3.4169921875, 3.548828125, 3.6806640625, 3.8125, 3.9443359375, 4.076171875, 4.2080078125, 4.33984375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 13.0, 6.0, 8.0, 21.0, 19.0, 11.0, 22.0, 35.0, 40.0, 39.0, 56.0, 63.0, 78.0, 86.0, 103.0, 143.0, 139.0, 176.0, 192.0, 193.0, 199.0, 215.0, 227.0, 224.0, 231.0, 199.0, 169.0, 151.0, 146.0, 146.0, 113.0, 108.0, 98.0, 80.0, 48.0, 45.0, 44.0, 40.0, 27.0, 26.0, 16.0, 17.0, 8.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-1.0107421875, -0.9813995361328125, -0.952056884765625, -0.9227142333984375, -0.89337158203125, -0.8640289306640625, -0.834686279296875, -0.8053436279296875, -0.7760009765625, -0.7466583251953125, -0.717315673828125, -0.6879730224609375, -0.65863037109375, -0.6292877197265625, -0.599945068359375, -0.5706024169921875, -0.541259765625, -0.5119171142578125, -0.482574462890625, -0.4532318115234375, -0.42388916015625, -0.3945465087890625, -0.365203857421875, -0.3358612060546875, -0.3065185546875, -0.2771759033203125, -0.247833251953125, -0.2184906005859375, -0.18914794921875, -0.1598052978515625, -0.130462646484375, -0.1011199951171875, -0.07177734375, -0.0424346923828125, -0.013092041015625, 0.0162506103515625, 0.04559326171875, 0.0749359130859375, 0.104278564453125, 0.1336212158203125, 0.1629638671875, 0.1923065185546875, 0.221649169921875, 0.2509918212890625, 0.28033447265625, 0.3096771240234375, 0.339019775390625, 0.3683624267578125, 0.397705078125, 0.4270477294921875, 0.456390380859375, 0.4857330322265625, 0.51507568359375, 0.5444183349609375, 0.573760986328125, 0.6031036376953125, 0.6324462890625, 0.6617889404296875, 0.691131591796875, 0.7204742431640625, 0.74981689453125, 0.7791595458984375, 0.808502197265625, 0.8378448486328125, 0.8671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 8.0, 2.0, 10.0, 8.0, 12.0, 11.0, 16.0, 22.0, 34.0, 42.0, 42.0, 38.0, 56.0, 70.0, 49.0, 75.0, 72.0, 64.0, 66.0, 53.0, 52.0, 38.0, 35.0, 21.0, 25.0, 21.0, 18.0, 9.0, 8.0, 3.0, 11.0, 2.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.347010850906372, -3.201976776123047, -3.0569427013397217, -2.9119086265563965, -2.766874313354492, -2.621840476989746, -2.476806163787842, -2.3317720890045166, -2.1867380142211914, -2.041703939437866, -1.896669864654541, -1.7516356706619263, -1.606601595878601, -1.4615675210952759, -1.3165333271026611, -1.171499252319336, -1.0264651775360107, -0.8814311027526855, -0.7363969683647156, -0.5913628339767456, -0.4463287591934204, -0.3012946844100952, -0.15626055002212524, -0.011226415634155273, 0.13380765914916992, 0.2788417637348175, 0.4238758683204651, 0.5689100027084351, 0.7139440774917603, 0.8589781522750854, 1.0040123462677002, 1.1490464210510254, 1.2940807342529297, 1.4391148090362549, 1.58414888381958, 1.7291830778121948, 1.87421715259552, 2.0192513465881348, 2.16428542137146, 2.309319496154785, 2.4543535709381104, 2.5993876457214355, 2.7444217205047607, 2.889455795288086, 3.0344901084899902, 3.1795239448547363, 3.3245582580566406, 3.469592332839966, 3.614626407623291, 3.759660482406616, 3.9046945571899414, 4.049728870391846, 4.194762706756592, 4.339797019958496, 4.484830856323242, 4.6298651695251465, 4.774899482727051, 4.919933795928955, 5.064967632293701, 5.2100019454956055, 5.355035781860352, 5.500070095062256, 5.645103931427002, 5.790138244628906, 5.935172080993652]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 4.0, 3.0, 5.0, 7.0, 14.0, 19.0, 16.0, 16.0, 29.0, 30.0, 28.0, 37.0, 23.0, 40.0, 38.0, 41.0, 53.0, 33.0, 38.0, 45.0, 51.0, 46.0, 43.0, 46.0, 35.0, 33.0, 28.0, 29.0, 25.0, 29.0, 25.0, 17.0, 11.0, 16.0, 9.0, 6.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9165393114089966, -1.8452924489974976, -1.7740455865859985, -1.7027987241744995, -1.6315518617630005, -1.5603049993515015, -1.4890581369400024, -1.4178112745285034, -1.3465644121170044, -1.2753175497055054, -1.2040706872940063, -1.1328238248825073, -1.0615769624710083, -0.9903301000595093, -0.9190832376480103, -0.8478363752365112, -0.7765895128250122, -0.7053426504135132, -0.6340957880020142, -0.5628489255905151, -0.4916020631790161, -0.4203552007675171, -0.34910833835601807, -0.27786147594451904, -0.20661461353302002, -0.135367751121521, -0.06412088871002197, 0.007125973701477051, 0.07837283611297607, 0.1496196985244751, 0.22086656093597412, 0.29211342334747314, 0.3633601665496826, 0.43460702896118164, 0.5058538913726807, 0.5771007537841797, 0.6483476161956787, 0.7195944786071777, 0.7908413410186768, 0.8620882034301758, 0.9333350658416748, 1.0045819282531738, 1.0758287906646729, 1.1470756530761719, 1.218322515487671, 1.28956937789917, 1.360816240310669, 1.432063102722168, 1.503309965133667, 1.574556827545166, 1.645803689956665, 1.717050552368164, 1.788297414779663, 1.859544277191162, 1.9307911396026611, 2.00203800201416, 2.073284864425659, 2.144531726837158, 2.2157785892486572, 2.2870254516601562, 2.3582723140716553, 2.4295191764831543, 2.5007660388946533, 2.5720129013061523, 2.6432597637176514]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 7.0, 14.0, 16.0, 20.0, 28.0, 39.0, 59.0, 66.0, 79.0, 129.0, 180.0, 214.0, 296.0, 422.0, 618.0, 885.0, 1406.0, 2312.0, 3879.0, 6637.0, 11992.0, 23685.0, 47682.0, 98091.0, 186254.0, 254527.0, 195861.0, 104975.0, 51522.0, 25398.0, 13129.0, 6948.0, 4026.0, 2386.0, 1501.0, 923.0, 644.0, 457.0, 336.0, 221.0, 185.0, 120.0, 114.0, 56.0, 60.0, 40.0, 29.0, 31.0, 21.0, 9.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0], "bins": [-0.5419921875, -0.5258369445800781, -0.5096817016601562, -0.4935264587402344, -0.4773712158203125, -0.4612159729003906, -0.44506072998046875, -0.4289054870605469, -0.412750244140625, -0.3965950012207031, -0.38043975830078125, -0.3642845153808594, -0.3481292724609375, -0.3319740295410156, -0.31581878662109375, -0.2996635437011719, -0.28350830078125, -0.2673530578613281, -0.25119781494140625, -0.23504257202148438, -0.2188873291015625, -0.20273208618164062, -0.18657684326171875, -0.17042160034179688, -0.154266357421875, -0.13811111450195312, -0.12195587158203125, -0.10580062866210938, -0.0896453857421875, -0.07349014282226562, -0.05733489990234375, -0.041179656982421875, -0.0250244140625, -0.008869171142578125, 0.00728607177734375, 0.023441314697265625, 0.0395965576171875, 0.055751800537109375, 0.07190704345703125, 0.08806228637695312, 0.104217529296875, 0.12037277221679688, 0.13652801513671875, 0.15268325805664062, 0.1688385009765625, 0.18499374389648438, 0.20114898681640625, 0.21730422973632812, 0.23345947265625, 0.24961471557617188, 0.26576995849609375, 0.2819252014160156, 0.2980804443359375, 0.3142356872558594, 0.33039093017578125, 0.3465461730957031, 0.362701416015625, 0.3788566589355469, 0.39501190185546875, 0.4111671447753906, 0.4273223876953125, 0.4434776306152344, 0.45963287353515625, 0.4757881164550781, 0.491943359375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 9.0, 13.0, 15.0, 18.0, 10.0, 21.0, 23.0, 27.0, 40.0, 34.0, 35.0, 35.0, 44.0, 42.0, 46.0, 45.0, 52.0, 43.0, 46.0, 42.0, 37.0, 37.0, 29.0, 38.0, 38.0, 25.0, 21.0, 23.0, 21.0, 17.0, 15.0, 10.0, 7.0, 5.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.348663330078125, -2.26568603515625, -2.182708740234375, -2.0997314453125, -2.016754150390625, -1.93377685546875, -1.850799560546875, -1.767822265625, -1.684844970703125, -1.60186767578125, -1.518890380859375, -1.4359130859375, -1.352935791015625, -1.26995849609375, -1.186981201171875, -1.10400390625, -1.021026611328125, -0.93804931640625, -0.855072021484375, -0.7720947265625, -0.689117431640625, -0.60614013671875, -0.523162841796875, -0.440185546875, -0.357208251953125, -0.27423095703125, -0.191253662109375, -0.1082763671875, -0.025299072265625, 0.05767822265625, 0.140655517578125, 0.2236328125, 0.306610107421875, 0.38958740234375, 0.472564697265625, 0.5555419921875, 0.638519287109375, 0.72149658203125, 0.804473876953125, 0.887451171875, 0.970428466796875, 1.05340576171875, 1.136383056640625, 1.2193603515625, 1.302337646484375, 1.38531494140625, 1.468292236328125, 1.55126953125, 1.634246826171875, 1.71722412109375, 1.800201416015625, 1.8831787109375, 1.966156005859375, 2.04913330078125, 2.132110595703125, 2.215087890625, 2.298065185546875, 2.38104248046875, 2.464019775390625, 2.5469970703125, 2.629974365234375, 2.71295166015625, 2.795928955078125, 2.87890625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 5.0, 6.0, 9.0, 12.0, 16.0, 24.0, 22.0, 29.0, 62.0, 65.0, 116.0, 172.0, 218.0, 388.0, 608.0, 1143.0, 2225.0, 4933.0, 13626.0, 52366.0, 905642.0, 44735.0, 12511.0, 4720.0, 2129.0, 1059.0, 606.0, 347.0, 247.0, 141.0, 113.0, 64.0, 50.0, 43.0, 23.0, 22.0, 7.0, 15.0, 8.0, 6.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0], "bins": [-1.7724609375, -1.719482421875, -1.66650390625, -1.613525390625, -1.560546875, -1.507568359375, -1.45458984375, -1.401611328125, -1.3486328125, -1.295654296875, -1.24267578125, -1.189697265625, -1.13671875, -1.083740234375, -1.03076171875, -0.977783203125, -0.9248046875, -0.871826171875, -0.81884765625, -0.765869140625, -0.712890625, -0.659912109375, -0.60693359375, -0.553955078125, -0.5009765625, -0.447998046875, -0.39501953125, -0.342041015625, -0.2890625, -0.236083984375, -0.18310546875, -0.130126953125, -0.0771484375, -0.024169921875, 0.02880859375, 0.081787109375, 0.134765625, 0.187744140625, 0.24072265625, 0.293701171875, 0.3466796875, 0.399658203125, 0.45263671875, 0.505615234375, 0.55859375, 0.611572265625, 0.66455078125, 0.717529296875, 0.7705078125, 0.823486328125, 0.87646484375, 0.929443359375, 0.982421875, 1.035400390625, 1.08837890625, 1.141357421875, 1.1943359375, 1.247314453125, 1.30029296875, 1.353271484375, 1.40625, 1.459228515625, 1.51220703125, 1.565185546875, 1.6181640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 2.0, 6.0, 15.0, 10.0, 12.0, 14.0, 18.0, 27.0, 18.0, 31.0, 18.0, 35.0, 26.0, 42.0, 30.0, 36.0, 43.0, 49.0, 49.0, 36.0, 38.0, 41.0, 33.0, 47.0, 27.0, 43.0, 32.0, 22.0, 19.0, 29.0, 24.0, 20.0, 19.0, 14.0, 15.0, 8.0, 9.0, 15.0, 4.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.599609375, -1.5498504638671875, -1.500091552734375, -1.4503326416015625, -1.40057373046875, -1.3508148193359375, -1.301055908203125, -1.2512969970703125, -1.2015380859375, -1.1517791748046875, -1.102020263671875, -1.0522613525390625, -1.00250244140625, -0.9527435302734375, -0.902984619140625, -0.8532257080078125, -0.803466796875, -0.7537078857421875, -0.703948974609375, -0.6541900634765625, -0.60443115234375, -0.5546722412109375, -0.504913330078125, -0.4551544189453125, -0.4053955078125, -0.3556365966796875, -0.305877685546875, -0.2561187744140625, -0.20635986328125, -0.1566009521484375, -0.106842041015625, -0.0570831298828125, -0.00732421875, 0.0424346923828125, 0.092193603515625, 0.1419525146484375, 0.19171142578125, 0.2414703369140625, 0.291229248046875, 0.3409881591796875, 0.3907470703125, 0.4405059814453125, 0.490264892578125, 0.5400238037109375, 0.58978271484375, 0.6395416259765625, 0.689300537109375, 0.7390594482421875, 0.788818359375, 0.8385772705078125, 0.888336181640625, 0.9380950927734375, 0.98785400390625, 1.0376129150390625, 1.087371826171875, 1.1371307373046875, 1.1868896484375, 1.2366485595703125, 1.286407470703125, 1.3361663818359375, 1.38592529296875, 1.4356842041015625, 1.485443115234375, 1.5352020263671875, 1.5849609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 6.0, 13.0, 10.0, 17.0, 18.0, 25.0, 31.0, 41.0, 46.0, 58.0, 80.0, 108.0, 152.0, 179.0, 247.0, 354.0, 475.0, 742.0, 1176.0, 2197.0, 4414.0, 9417.0, 24542.0, 689032.0, 274530.0, 22142.0, 8808.0, 4041.0, 2069.0, 1163.0, 716.0, 464.0, 307.0, 211.0, 150.0, 99.0, 107.0, 95.0, 52.0, 35.0, 43.0, 22.0, 27.0, 16.0, 21.0, 14.0, 8.0, 12.0, 4.0, 4.0, 2.0, 7.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.4404296875, -0.4266471862792969, -0.41286468505859375, -0.3990821838378906, -0.3852996826171875, -0.3715171813964844, -0.35773468017578125, -0.3439521789550781, -0.330169677734375, -0.3163871765136719, -0.30260467529296875, -0.2888221740722656, -0.2750396728515625, -0.2612571716308594, -0.24747467041015625, -0.23369216918945312, -0.21990966796875, -0.20612716674804688, -0.19234466552734375, -0.17856216430664062, -0.1647796630859375, -0.15099716186523438, -0.13721466064453125, -0.12343215942382812, -0.109649658203125, -0.09586715698242188, -0.08208465576171875, -0.06830215454101562, -0.0545196533203125, -0.040737152099609375, -0.02695465087890625, -0.013172149658203125, 0.0006103515625, 0.014392852783203125, 0.02817535400390625, 0.041957855224609375, 0.0557403564453125, 0.06952285766601562, 0.08330535888671875, 0.09708786010742188, 0.110870361328125, 0.12465286254882812, 0.13843536376953125, 0.15221786499023438, 0.1660003662109375, 0.17978286743164062, 0.19356536865234375, 0.20734786987304688, 0.22113037109375, 0.23491287231445312, 0.24869537353515625, 0.2624778747558594, 0.2762603759765625, 0.2900428771972656, 0.30382537841796875, 0.3176078796386719, 0.331390380859375, 0.3451728820800781, 0.35895538330078125, 0.3727378845214844, 0.3865203857421875, 0.4003028869628906, 0.41408538818359375, 0.4278678894042969, 0.441650390625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 6.0, 15.0, 14.0, 18.0, 28.0, 22.0, 46.0, 38.0, 45.0, 54.0, 52.0, 73.0, 72.0, 53.0, 76.0, 70.0, 61.0, 39.0, 43.0, 43.0, 27.0, 21.0, 12.0, 14.0, 12.0, 8.0, 9.0, 6.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0590763092041016e-05, -3.9091333746910095e-05, -3.7591904401779175e-05, -3.6092475056648254e-05, -3.4593045711517334e-05, -3.3093616366386414e-05, -3.159418702125549e-05, -3.0094757676124573e-05, -2.8595328330993652e-05, -2.7095898985862732e-05, -2.559646964073181e-05, -2.409704029560089e-05, -2.259761095046997e-05, -2.109818160533905e-05, -1.959875226020813e-05, -1.809932291507721e-05, -1.659989356994629e-05, -1.5100464224815369e-05, -1.3601034879684448e-05, -1.2101605534553528e-05, -1.0602176189422607e-05, -9.102746844291687e-06, -7.603317499160767e-06, -6.103888154029846e-06, -4.604458808898926e-06, -3.1050294637680054e-06, -1.605600118637085e-06, -1.0617077350616455e-07, 1.3932585716247559e-06, 2.8926879167556763e-06, 4.392117261886597e-06, 5.891546607017517e-06, 7.3909759521484375e-06, 8.890405297279358e-06, 1.0389834642410278e-05, 1.1889263987541199e-05, 1.3388693332672119e-05, 1.488812267780304e-05, 1.638755202293396e-05, 1.788698136806488e-05, 1.93864107131958e-05, 2.088584005832672e-05, 2.238526940345764e-05, 2.3884698748588562e-05, 2.5384128093719482e-05, 2.6883557438850403e-05, 2.8382986783981323e-05, 2.9882416129112244e-05, 3.1381845474243164e-05, 3.2881274819374084e-05, 3.4380704164505005e-05, 3.5880133509635925e-05, 3.7379562854766846e-05, 3.8878992199897766e-05, 4.0378421545028687e-05, 4.187785089015961e-05, 4.337728023529053e-05, 4.487670958042145e-05, 4.637613892555237e-05, 4.787556827068329e-05, 4.937499761581421e-05, 5.087442696094513e-05, 5.237385630607605e-05, 5.387328565120697e-05, 5.537271499633789e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 12.0, 7.0, 10.0, 24.0, 29.0, 42.0, 61.0, 116.0, 178.0, 306.0, 530.0, 976.0, 1740.0, 3001.0, 5905.0, 11581.0, 24480.0, 56927.0, 144132.0, 315218.0, 277357.0, 117032.0, 47187.0, 20606.0, 9945.0, 4983.0, 2687.0, 1460.0, 807.0, 494.0, 263.0, 145.0, 98.0, 64.0, 43.0, 23.0, 19.0, 15.0, 12.0, 12.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.1649169921875, -0.15990257263183594, -0.15488815307617188, -0.1498737335205078, -0.14485931396484375, -0.1398448944091797, -0.13483047485351562, -0.12981605529785156, -0.1248016357421875, -0.11978721618652344, -0.11477279663085938, -0.10975837707519531, -0.10474395751953125, -0.09972953796386719, -0.09471511840820312, -0.08970069885253906, -0.084686279296875, -0.07967185974121094, -0.07465744018554688, -0.06964302062988281, -0.06462860107421875, -0.05961418151855469, -0.054599761962890625, -0.04958534240722656, -0.0445709228515625, -0.03955650329589844, -0.034542083740234375, -0.029527664184570312, -0.02451324462890625, -0.019498825073242188, -0.014484405517578125, -0.009469985961914062, -0.00445556640625, 0.0005588531494140625, 0.005573272705078125, 0.010587692260742188, 0.01560211181640625, 0.020616531372070312, 0.025630950927734375, 0.030645370483398438, 0.0356597900390625, 0.04067420959472656, 0.045688629150390625, 0.05070304870605469, 0.05571746826171875, 0.06073188781738281, 0.06574630737304688, 0.07076072692871094, 0.075775146484375, 0.08078956604003906, 0.08580398559570312, 0.09081840515136719, 0.09583282470703125, 0.10084724426269531, 0.10586166381835938, 0.11087608337402344, 0.1158905029296875, 0.12090492248535156, 0.12591934204101562, 0.1309337615966797, 0.13594818115234375, 0.1409626007080078, 0.14597702026367188, 0.15099143981933594, 0.156005859375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 7.0, 16.0, 7.0, 11.0, 19.0, 26.0, 22.0, 37.0, 38.0, 52.0, 50.0, 75.0, 74.0, 80.0, 82.0, 57.0, 72.0, 52.0, 44.0, 34.0, 29.0, 25.0, 13.0, 11.0, 10.0, 13.0, 3.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037933349609375, -0.036604881286621094, -0.03527641296386719, -0.03394794464111328, -0.032619476318359375, -0.03129100799560547, -0.029962539672851562, -0.028634071350097656, -0.02730560302734375, -0.025977134704589844, -0.024648666381835938, -0.02332019805908203, -0.021991729736328125, -0.02066326141357422, -0.019334793090820312, -0.018006324768066406, -0.0166778564453125, -0.015349388122558594, -0.014020919799804688, -0.012692451477050781, -0.011363983154296875, -0.010035514831542969, -0.008707046508789062, -0.007378578186035156, -0.00605010986328125, -0.004721641540527344, -0.0033931732177734375, -0.0020647048950195312, -0.000736236572265625, 0.0005922317504882812, 0.0019207000732421875, 0.0032491683959960938, 0.00457763671875, 0.005906105041503906, 0.0072345733642578125, 0.008563041687011719, 0.009891510009765625, 0.011219978332519531, 0.012548446655273438, 0.013876914978027344, 0.01520538330078125, 0.016533851623535156, 0.017862319946289062, 0.01919078826904297, 0.020519256591796875, 0.02184772491455078, 0.023176193237304688, 0.024504661560058594, 0.0258331298828125, 0.027161598205566406, 0.028490066528320312, 0.02981853485107422, 0.031147003173828125, 0.03247547149658203, 0.03380393981933594, 0.035132408142089844, 0.03646087646484375, 0.037789344787597656, 0.03911781311035156, 0.04044628143310547, 0.041774749755859375, 0.04310321807861328, 0.04443168640136719, 0.045760154724121094, 0.047088623046875]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 7.0, 9.0, 8.0, 12.0, 14.0, 20.0, 26.0, 34.0, 44.0, 42.0, 44.0, 54.0, 72.0, 49.0, 91.0, 57.0, 68.0, 59.0, 55.0, 44.0, 36.0, 28.0, 24.0, 26.0, 15.0, 15.0, 10.0, 5.0, 11.0, 3.0, 2.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2583179473876953, -3.1144847869873047, -2.970651626586914, -2.8268184661865234, -2.682985544204712, -2.5391523838043213, -2.3953192234039307, -2.251486301422119, -2.1076531410217285, -1.963819980621338, -1.8199869394302368, -1.6761537790298462, -1.5323207378387451, -1.3884875774383545, -1.2446544170379639, -1.1008213758468628, -0.9569880962371826, -0.8131549954414368, -0.6693218946456909, -0.5254887342453003, -0.38165563344955444, -0.2378225326538086, -0.09398937225341797, 0.049843668937683105, 0.19367682933807373, 0.3375099301338196, 0.4813430607318878, 0.625176191329956, 0.7690092921257019, 0.9128423929214478, 1.0566755533218384, 1.2005085945129395, 1.34434175491333, 1.4881749153137207, 1.6320079565048218, 1.7758411169052124, 1.9196741580963135, 2.063507318496704, 2.2073404788970947, 2.3511734008789062, 2.495006561279297, 2.6388397216796875, 2.782672882080078, 2.9265060424804688, 3.0703389644622803, 3.214172124862671, 3.3580052852630615, 3.501838207244873, 3.6456716060638428, 3.7895047664642334, 3.933337926864624, 4.0771708488464355, 4.221004009246826, 4.364837169647217, 4.508670330047607, 4.652503490447998, 4.796336650848389, 4.940169811248779, 5.08400297164917, 5.2278361320495605, 5.371669292449951, 5.515501976013184, 5.659335136413574, 5.803168296813965, 5.9470014572143555]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 0.0, 5.0, 3.0, 3.0, 6.0, 9.0, 12.0, 17.0, 19.0, 14.0, 30.0, 33.0, 26.0, 37.0, 20.0, 45.0, 44.0, 36.0, 48.0, 37.0, 34.0, 53.0, 43.0, 44.0, 50.0, 45.0, 31.0, 33.0, 31.0, 29.0, 25.0, 26.0, 25.0, 17.0, 12.0, 15.0, 9.0, 6.0, 7.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8723468780517578, -1.8014521598815918, -1.7305575609207153, -1.6596628427505493, -1.5887682437896729, -1.5178735256195068, -1.4469788074493408, -1.3760842084884644, -1.305189609527588, -1.2342948913574219, -1.1634002923965454, -1.0925055742263794, -1.021610975265503, -0.9507162570953369, -0.8798215985298157, -0.8089269399642944, -0.7380322217941284, -0.6671375632286072, -0.5962429046630859, -0.5253481864929199, -0.45445355772972107, -0.38355889916419983, -0.3126642107963562, -0.24176955223083496, -0.17087489366531372, -0.09998022764921188, -0.029085561633110046, 0.04180911183357239, 0.11270377039909363, 0.18359842896461487, 0.2544931173324585, 0.32538777589797974, 0.396282434463501, 0.4671770930290222, 0.5380717515945435, 0.6089664697647095, 0.6798610687255859, 0.750755786895752, 0.8216504454612732, 0.8925451040267944, 0.9634397625923157, 1.034334421157837, 1.105229139328003, 1.1761237382888794, 1.2470184564590454, 1.3179130554199219, 1.388807773590088, 1.459702491760254, 1.5305970907211304, 1.6014918088912964, 1.6723864078521729, 1.7432811260223389, 1.8141757249832153, 1.8850704431533813, 1.9559650421142578, 2.026859760284424, 2.09775447845459, 2.168649196624756, 2.239543914794922, 2.310438394546509, 2.381333112716675, 2.452227830886841, 2.523122549057007, 2.5940170288085938, 2.6649117469787598]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 9.0, 11.0, 18.0, 29.0, 46.0, 80.0, 135.0, 152.0, 243.0, 368.0, 544.0, 781.0, 1198.0, 1843.0, 2801.0, 4347.0, 6658.0, 10642.0, 16859.0, 26331.0, 40831.0, 62197.0, 89107.0, 119286.0, 139780.0, 139628.0, 119168.0, 89375.0, 62131.0, 40817.0, 26163.0, 16846.0, 10651.0, 6846.0, 4386.0, 2808.0, 1831.0, 1201.0, 762.0, 545.0, 384.0, 236.0, 146.0, 107.0, 73.0, 53.0, 28.0, 25.0, 20.0, 10.0, 9.0, 0.0, 8.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.267578125, -2.19671630859375, -2.1258544921875, -2.05499267578125, -1.984130859375, -1.91326904296875, -1.8424072265625, -1.77154541015625, -1.70068359375, -1.62982177734375, -1.5589599609375, -1.48809814453125, -1.417236328125, -1.34637451171875, -1.2755126953125, -1.20465087890625, -1.1337890625, -1.06292724609375, -0.9920654296875, -0.92120361328125, -0.850341796875, -0.77947998046875, -0.7086181640625, -0.63775634765625, -0.56689453125, -0.49603271484375, -0.4251708984375, -0.35430908203125, -0.283447265625, -0.21258544921875, -0.1417236328125, -0.07086181640625, 0.0, 0.07086181640625, 0.1417236328125, 0.21258544921875, 0.283447265625, 0.35430908203125, 0.4251708984375, 0.49603271484375, 0.56689453125, 0.63775634765625, 0.7086181640625, 0.77947998046875, 0.850341796875, 0.92120361328125, 0.9920654296875, 1.06292724609375, 1.1337890625, 1.20465087890625, 1.2755126953125, 1.34637451171875, 1.417236328125, 1.48809814453125, 1.5589599609375, 1.62982177734375, 1.70068359375, 1.77154541015625, 1.8424072265625, 1.91326904296875, 1.984130859375, 2.05499267578125, 2.1258544921875, 2.19671630859375, 2.267578125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 8.0, 14.0, 18.0, 14.0, 25.0, 32.0, 28.0, 37.0, 39.0, 41.0, 28.0, 43.0, 38.0, 44.0, 41.0, 36.0, 43.0, 50.0, 42.0, 41.0, 43.0, 35.0, 28.0, 38.0, 22.0, 13.0, 32.0, 20.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.638671875, -2.5579833984375, -2.477294921875, -2.3966064453125, -2.31591796875, -2.2352294921875, -2.154541015625, -2.0738525390625, -1.9931640625, -1.9124755859375, -1.831787109375, -1.7510986328125, -1.67041015625, -1.5897216796875, -1.509033203125, -1.4283447265625, -1.34765625, -1.2669677734375, -1.186279296875, -1.1055908203125, -1.02490234375, -0.9442138671875, -0.863525390625, -0.7828369140625, -0.7021484375, -0.6214599609375, -0.540771484375, -0.4600830078125, -0.37939453125, -0.2987060546875, -0.218017578125, -0.1373291015625, -0.056640625, 0.0240478515625, 0.104736328125, 0.1854248046875, 0.26611328125, 0.3468017578125, 0.427490234375, 0.5081787109375, 0.5888671875, 0.6695556640625, 0.750244140625, 0.8309326171875, 0.91162109375, 0.9923095703125, 1.072998046875, 1.1536865234375, 1.234375, 1.3150634765625, 1.395751953125, 1.4764404296875, 1.55712890625, 1.6378173828125, 1.718505859375, 1.7991943359375, 1.8798828125, 1.9605712890625, 2.041259765625, 2.1219482421875, 2.20263671875, 2.2833251953125, 2.364013671875, 2.4447021484375, 2.525390625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 9.0, 7.0, 7.0, 10.0, 21.0, 31.0, 44.0, 49.0, 70.0, 112.0, 204.0, 315.0, 462.0, 722.0, 1159.0, 1797.0, 2922.0, 4496.0, 7597.0, 12275.0, 20201.0, 33183.0, 52551.0, 78899.0, 110832.0, 138860.0, 149269.0, 133426.0, 103732.0, 71641.0, 46834.0, 29523.0, 18213.0, 11049.0, 6710.0, 4189.0, 2593.0, 1588.0, 1065.0, 662.0, 422.0, 270.0, 181.0, 124.0, 72.0, 51.0, 46.0, 29.0, 13.0, 12.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.138671875, -2.065887451171875, -1.99310302734375, -1.920318603515625, -1.8475341796875, -1.774749755859375, -1.70196533203125, -1.629180908203125, -1.556396484375, -1.483612060546875, -1.41082763671875, -1.338043212890625, -1.2652587890625, -1.192474365234375, -1.11968994140625, -1.046905517578125, -0.97412109375, -0.901336669921875, -0.82855224609375, -0.755767822265625, -0.6829833984375, -0.610198974609375, -0.53741455078125, -0.464630126953125, -0.391845703125, -0.319061279296875, -0.24627685546875, -0.173492431640625, -0.1007080078125, -0.027923583984375, 0.04486083984375, 0.117645263671875, 0.1904296875, 0.263214111328125, 0.33599853515625, 0.408782958984375, 0.4815673828125, 0.554351806640625, 0.62713623046875, 0.699920654296875, 0.772705078125, 0.845489501953125, 0.91827392578125, 0.991058349609375, 1.0638427734375, 1.136627197265625, 1.20941162109375, 1.282196044921875, 1.35498046875, 1.427764892578125, 1.50054931640625, 1.573333740234375, 1.6461181640625, 1.718902587890625, 1.79168701171875, 1.864471435546875, 1.937255859375, 2.010040283203125, 2.08282470703125, 2.155609130859375, 2.2283935546875, 2.301177978515625, 2.37396240234375, 2.446746826171875, 2.51953125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 7.0, 6.0, 2.0, 7.0, 9.0, 21.0, 11.0, 17.0, 23.0, 15.0, 20.0, 25.0, 28.0, 27.0, 22.0, 42.0, 33.0, 42.0, 35.0, 39.0, 49.0, 33.0, 47.0, 39.0, 37.0, 39.0, 35.0, 28.0, 33.0, 35.0, 26.0, 27.0, 22.0, 13.0, 21.0, 14.0, 12.0, 9.0, 13.0, 7.0, 5.0, 5.0, 4.0, 1.0, 7.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.5205078125, -1.47528076171875, -1.4300537109375, -1.38482666015625, -1.339599609375, -1.29437255859375, -1.2491455078125, -1.20391845703125, -1.15869140625, -1.11346435546875, -1.0682373046875, -1.02301025390625, -0.977783203125, -0.93255615234375, -0.8873291015625, -0.84210205078125, -0.796875, -0.75164794921875, -0.7064208984375, -0.66119384765625, -0.615966796875, -0.57073974609375, -0.5255126953125, -0.48028564453125, -0.43505859375, -0.38983154296875, -0.3446044921875, -0.29937744140625, -0.254150390625, -0.20892333984375, -0.1636962890625, -0.11846923828125, -0.0732421875, -0.02801513671875, 0.0172119140625, 0.06243896484375, 0.107666015625, 0.15289306640625, 0.1981201171875, 0.24334716796875, 0.28857421875, 0.33380126953125, 0.3790283203125, 0.42425537109375, 0.469482421875, 0.51470947265625, 0.5599365234375, 0.60516357421875, 0.650390625, 0.69561767578125, 0.7408447265625, 0.78607177734375, 0.831298828125, 0.87652587890625, 0.9217529296875, 0.96697998046875, 1.01220703125, 1.05743408203125, 1.1026611328125, 1.14788818359375, 1.193115234375, 1.23834228515625, 1.2835693359375, 1.32879638671875, 1.3740234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 16.0, 15.0, 33.0, 48.0, 85.0, 135.0, 190.0, 282.0, 479.0, 818.0, 1425.0, 2497.0, 4452.0, 8546.0, 17122.0, 34491.0, 70453.0, 136416.0, 218914.0, 232280.0, 154749.0, 82283.0, 40966.0, 19931.0, 9976.0, 5108.0, 2848.0, 1583.0, 935.0, 556.0, 336.0, 226.0, 119.0, 79.0, 45.0, 31.0, 35.0, 18.0, 5.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.962890625, -1.897705078125, -1.83251953125, -1.767333984375, -1.7021484375, -1.636962890625, -1.57177734375, -1.506591796875, -1.44140625, -1.376220703125, -1.31103515625, -1.245849609375, -1.1806640625, -1.115478515625, -1.05029296875, -0.985107421875, -0.919921875, -0.854736328125, -0.78955078125, -0.724365234375, -0.6591796875, -0.593994140625, -0.52880859375, -0.463623046875, -0.3984375, -0.333251953125, -0.26806640625, -0.202880859375, -0.1376953125, -0.072509765625, -0.00732421875, 0.057861328125, 0.123046875, 0.188232421875, 0.25341796875, 0.318603515625, 0.3837890625, 0.448974609375, 0.51416015625, 0.579345703125, 0.64453125, 0.709716796875, 0.77490234375, 0.840087890625, 0.9052734375, 0.970458984375, 1.03564453125, 1.100830078125, 1.166015625, 1.231201171875, 1.29638671875, 1.361572265625, 1.4267578125, 1.491943359375, 1.55712890625, 1.622314453125, 1.6875, 1.752685546875, 1.81787109375, 1.883056640625, 1.9482421875, 2.013427734375, 2.07861328125, 2.143798828125, 2.208984375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 5.0, 12.0, 14.0, 20.0, 24.0, 33.0, 42.0, 46.0, 50.0, 69.0, 49.0, 76.0, 63.0, 61.0, 55.0, 62.0, 64.0, 44.0, 35.0, 34.0, 31.0, 16.0, 20.0, 10.0, 12.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00016999244689941406, -0.00016469135880470276, -0.00015939027070999146, -0.00015408918261528015, -0.00014878809452056885, -0.00014348700642585754, -0.00013818591833114624, -0.00013288483023643494, -0.00012758374214172363, -0.00012228265404701233, -0.00011698156595230103, -0.00011168047785758972, -0.00010637938976287842, -0.00010107830166816711, -9.577721357345581e-05, -9.047612547874451e-05, -8.51750373840332e-05, -7.98739492893219e-05, -7.45728611946106e-05, -6.927177309989929e-05, -6.397068500518799e-05, -5.8669596910476685e-05, -5.336850881576538e-05, -4.806742072105408e-05, -4.2766332626342773e-05, -3.746524453163147e-05, -3.2164156436920166e-05, -2.6863068342208862e-05, -2.156198024749756e-05, -1.6260892152786255e-05, -1.0959804058074951e-05, -5.6587159633636475e-06, -3.5762786865234375e-07, 4.94346022605896e-06, 1.0244548320770264e-05, 1.5545636415481567e-05, 2.084672451019287e-05, 2.6147812604904175e-05, 3.144890069961548e-05, 3.674998879432678e-05, 4.2051076889038086e-05, 4.735216498374939e-05, 5.265325307846069e-05, 5.7954341173172e-05, 6.32554292678833e-05, 6.85565173625946e-05, 7.385760545730591e-05, 7.915869355201721e-05, 8.445978164672852e-05, 8.976086974143982e-05, 9.506195783615112e-05, 0.00010036304593086243, 0.00010566413402557373, 0.00011096522212028503, 0.00011626631021499634, 0.00012156739830970764, 0.00012686848640441895, 0.00013216957449913025, 0.00013747066259384155, 0.00014277175068855286, 0.00014807283878326416, 0.00015337392687797546, 0.00015867501497268677, 0.00016397610306739807, 0.00016927719116210938]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 10.0, 5.0, 8.0, 12.0, 24.0, 34.0, 40.0, 57.0, 81.0, 109.0, 217.0, 322.0, 523.0, 872.0, 1444.0, 2874.0, 5700.0, 12329.0, 27098.0, 61463.0, 130434.0, 228291.0, 254400.0, 167923.0, 83573.0, 37722.0, 16872.0, 7695.0, 3728.0, 1947.0, 1085.0, 576.0, 363.0, 204.0, 172.0, 115.0, 70.0, 44.0, 39.0, 30.0, 16.0, 11.0, 10.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.310546875, -2.24298095703125, -2.1754150390625, -2.10784912109375, -2.040283203125, -1.97271728515625, -1.9051513671875, -1.83758544921875, -1.77001953125, -1.70245361328125, -1.6348876953125, -1.56732177734375, -1.499755859375, -1.43218994140625, -1.3646240234375, -1.29705810546875, -1.2294921875, -1.16192626953125, -1.0943603515625, -1.02679443359375, -0.959228515625, -0.89166259765625, -0.8240966796875, -0.75653076171875, -0.68896484375, -0.62139892578125, -0.5538330078125, -0.48626708984375, -0.418701171875, -0.35113525390625, -0.2835693359375, -0.21600341796875, -0.1484375, -0.08087158203125, -0.0133056640625, 0.05426025390625, 0.121826171875, 0.18939208984375, 0.2569580078125, 0.32452392578125, 0.39208984375, 0.45965576171875, 0.5272216796875, 0.59478759765625, 0.662353515625, 0.72991943359375, 0.7974853515625, 0.86505126953125, 0.9326171875, 1.00018310546875, 1.0677490234375, 1.13531494140625, 1.202880859375, 1.27044677734375, 1.3380126953125, 1.40557861328125, 1.47314453125, 1.54071044921875, 1.6082763671875, 1.67584228515625, 1.743408203125, 1.81097412109375, 1.8785400390625, 1.94610595703125, 2.013671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 12.0, 6.0, 14.0, 5.0, 15.0, 19.0, 18.0, 34.0, 47.0, 50.0, 67.0, 80.0, 78.0, 85.0, 68.0, 63.0, 78.0, 54.0, 37.0, 39.0, 27.0, 20.0, 24.0, 15.0, 8.0, 10.0, 4.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.48282623291015625, -0.4651641845703125, -0.44750213623046875, -0.429840087890625, -0.41217803955078125, -0.3945159912109375, -0.37685394287109375, -0.35919189453125, -0.34152984619140625, -0.3238677978515625, -0.30620574951171875, -0.288543701171875, -0.27088165283203125, -0.2532196044921875, -0.23555755615234375, -0.2178955078125, -0.20023345947265625, -0.1825714111328125, -0.16490936279296875, -0.147247314453125, -0.12958526611328125, -0.1119232177734375, -0.09426116943359375, -0.07659912109375, -0.05893707275390625, -0.0412750244140625, -0.02361297607421875, -0.005950927734375, 0.01171112060546875, 0.0293731689453125, 0.04703521728515625, 0.064697265625, 0.08235931396484375, 0.1000213623046875, 0.11768341064453125, 0.135345458984375, 0.15300750732421875, 0.1706695556640625, 0.18833160400390625, 0.20599365234375, 0.22365570068359375, 0.2413177490234375, 0.25897979736328125, 0.276641845703125, 0.29430389404296875, 0.3119659423828125, 0.32962799072265625, 0.3472900390625, 0.36495208740234375, 0.3826141357421875, 0.40027618408203125, 0.417938232421875, 0.43560028076171875, 0.4532623291015625, 0.47092437744140625, 0.48858642578125, 0.5062484741210938, 0.5239105224609375, 0.5415725708007812, 0.559234619140625, 0.5768966674804688, 0.5945587158203125, 0.6122207641601562, 0.6298828125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 2.0, 6.0, 6.0, 8.0, 10.0, 25.0, 26.0, 27.0, 30.0, 42.0, 51.0, 36.0, 60.0, 62.0, 66.0, 83.0, 76.0, 68.0, 50.0, 48.0, 51.0, 31.0, 24.0, 29.0, 14.0, 20.0, 11.0, 6.0, 7.0, 6.0, 8.0, 5.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1759355068206787, -3.0269339084625244, -2.877932071685791, -2.7289304733276367, -2.5799286365509033, -2.430927038192749, -2.2819252014160156, -2.1329236030578613, -1.9839218854904175, -1.8349201679229736, -1.6859184503555298, -1.536916732788086, -1.3879151344299316, -1.2389132976531982, -1.089911699295044, -0.9409099817276001, -0.7919082641601562, -0.6429065465927124, -0.49390485882759094, -0.3449031710624695, -0.19590145349502563, -0.04689973592758179, 0.10210192203521729, 0.25110363960266113, 0.400105357170105, 0.5491070747375488, 0.6981087923049927, 0.8471104502677917, 0.9961121678352356, 1.1451139450073242, 1.2941155433654785, 1.4431172609329224, 1.592118740081787, 1.741120457649231, 1.8901221752166748, 2.039123773574829, 2.1881256103515625, 2.337127208709717, 2.486128807067871, 2.6351306438446045, 2.784132480621338, 2.933134078979492, 3.0821359157562256, 3.23113751411438, 3.3801393508911133, 3.5291409492492676, 3.678142547607422, 3.8271443843841553, 3.9761459827423096, 4.125147819519043, 4.274149417877197, 4.423151016235352, 4.572152614593506, 4.721154689788818, 4.870156288146973, 5.019157886505127, 5.168159484863281, 5.3171610832214355, 5.46616268157959, 5.615164756774902, 5.764166355133057, 5.913167953491211, 6.062169551849365, 6.2111711502075195, 6.360173225402832]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 7.0, 11.0, 9.0, 7.0, 13.0, 24.0, 21.0, 32.0, 35.0, 19.0, 31.0, 42.0, 33.0, 36.0, 40.0, 40.0, 34.0, 37.0, 48.0, 43.0, 33.0, 37.0, 28.0, 42.0, 34.0, 36.0, 22.0, 24.0, 25.0, 20.0, 19.0, 13.0, 23.0, 19.0, 14.0, 6.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1072566509246826, -2.0383243560791016, -1.96939218044281, -1.900459885597229, -1.8315277099609375, -1.7625954151153564, -1.6936631202697754, -1.6247308254241943, -1.5557986497879028, -1.4868663549423218, -1.4179341793060303, -1.3490018844604492, -1.2800695896148682, -1.2111374139785767, -1.1422051191329956, -1.073272943496704, -1.004340648651123, -0.9354084134101868, -0.8664761781692505, -0.7975438833236694, -0.7286116480827332, -0.6596794128417969, -0.5907471179962158, -0.5218148827552795, -0.45288264751434326, -0.383950412273407, -0.3150181472301483, -0.24608589708805084, -0.17715364694595337, -0.10822141170501709, -0.03928914666175842, 0.029643118381500244, 0.09857535362243652, 0.167507603764534, 0.23643985390663147, 0.30537211894989014, 0.3743043541908264, 0.4432365894317627, 0.5121688842773438, 0.58110111951828, 0.6500333547592163, 0.7189655900001526, 0.7878978252410889, 0.8568301200866699, 0.9257623553276062, 0.9946945905685425, 1.0636268854141235, 1.132559061050415, 1.201491355895996, 1.2704236507415771, 1.3393558263778687, 1.4082881212234497, 1.4772202968597412, 1.5461525917053223, 1.6150848865509033, 1.6840171813964844, 1.7529493570327759, 1.821881651878357, 1.8908138275146484, 1.9597461223602295, 2.0286784172058105, 2.0976104736328125, 2.1665427684783936, 2.2354750633239746, 2.3044073581695557]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 8.0, 3.0, 6.0, 5.0, 16.0, 18.0, 31.0, 25.0, 43.0, 68.0, 77.0, 119.0, 168.0, 223.0, 339.0, 495.0, 772.0, 1151.0, 1826.0, 2863.0, 4612.0, 7647.0, 12852.0, 22804.0, 41960.0, 81546.0, 167286.0, 372217.0, 809354.0, 1163699.0, 799715.0, 362097.0, 162759.0, 78841.0, 41532.0, 22924.0, 13196.0, 7871.0, 4791.0, 3019.0, 1889.0, 1172.0, 722.0, 508.0, 330.0, 221.0, 166.0, 108.0, 74.0, 45.0, 31.0, 12.0, 10.0, 12.0, 6.0, 4.0, 5.0, 1.0, 2.0, 2.0], "bins": [-4.2265625, -4.100341796875, -3.97412109375, -3.847900390625, -3.7216796875, -3.595458984375, -3.46923828125, -3.343017578125, -3.216796875, -3.090576171875, -2.96435546875, -2.838134765625, -2.7119140625, -2.585693359375, -2.45947265625, -2.333251953125, -2.20703125, -2.080810546875, -1.95458984375, -1.828369140625, -1.7021484375, -1.575927734375, -1.44970703125, -1.323486328125, -1.197265625, -1.071044921875, -0.94482421875, -0.818603515625, -0.6923828125, -0.566162109375, -0.43994140625, -0.313720703125, -0.1875, -0.061279296875, 0.06494140625, 0.191162109375, 0.3173828125, 0.443603515625, 0.56982421875, 0.696044921875, 0.822265625, 0.948486328125, 1.07470703125, 1.200927734375, 1.3271484375, 1.453369140625, 1.57958984375, 1.705810546875, 1.83203125, 1.958251953125, 2.08447265625, 2.210693359375, 2.3369140625, 2.463134765625, 2.58935546875, 2.715576171875, 2.841796875, 2.968017578125, 3.09423828125, 3.220458984375, 3.3466796875, 3.472900390625, 3.59912109375, 3.725341796875, 3.8515625]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 11.0, 11.0, 10.0, 16.0, 20.0, 30.0, 20.0, 42.0, 29.0, 31.0, 31.0, 26.0, 45.0, 30.0, 47.0, 39.0, 33.0, 31.0, 29.0, 39.0, 32.0, 35.0, 45.0, 33.0, 26.0, 28.0, 27.0, 25.0, 22.0, 15.0, 12.0, 13.0, 11.0, 14.0, 10.0, 12.0, 4.0, 11.0, 7.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.6083984375, -1.5599517822265625, -1.511505126953125, -1.4630584716796875, -1.41461181640625, -1.3661651611328125, -1.317718505859375, -1.2692718505859375, -1.2208251953125, -1.1723785400390625, -1.123931884765625, -1.0754852294921875, -1.02703857421875, -0.9785919189453125, -0.930145263671875, -0.8816986083984375, -0.833251953125, -0.7848052978515625, -0.736358642578125, -0.6879119873046875, -0.63946533203125, -0.5910186767578125, -0.542572021484375, -0.4941253662109375, -0.4456787109375, -0.3972320556640625, -0.348785400390625, -0.3003387451171875, -0.25189208984375, -0.2034454345703125, -0.154998779296875, -0.1065521240234375, -0.05810546875, -0.0096588134765625, 0.038787841796875, 0.0872344970703125, 0.13568115234375, 0.1841278076171875, 0.232574462890625, 0.2810211181640625, 0.3294677734375, 0.3779144287109375, 0.426361083984375, 0.4748077392578125, 0.52325439453125, 0.5717010498046875, 0.620147705078125, 0.6685943603515625, 0.717041015625, 0.7654876708984375, 0.813934326171875, 0.8623809814453125, 0.91082763671875, 0.9592742919921875, 1.007720947265625, 1.0561676025390625, 1.1046142578125, 1.1530609130859375, 1.201507568359375, 1.2499542236328125, 1.29840087890625, 1.3468475341796875, 1.395294189453125, 1.4437408447265625, 1.4921875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 6.0, 10.0, 15.0, 15.0, 29.0, 50.0, 64.0, 99.0, 185.0, 266.0, 455.0, 781.0, 1220.0, 2101.0, 3397.0, 5882.0, 10704.0, 19212.0, 36738.0, 70946.0, 148270.0, 320188.0, 685952.0, 1124935.0, 904769.0, 449266.0, 205279.0, 97639.0, 48815.0, 25193.0, 13506.0, 7581.0, 4274.0, 2447.0, 1529.0, 911.0, 554.0, 340.0, 249.0, 138.0, 113.0, 55.0, 29.0, 27.0, 23.0, 11.0, 6.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.20233154296875, -4.0609130859375, -3.91949462890625, -3.778076171875, -3.63665771484375, -3.4952392578125, -3.35382080078125, -3.21240234375, -3.07098388671875, -2.9295654296875, -2.78814697265625, -2.646728515625, -2.50531005859375, -2.3638916015625, -2.22247314453125, -2.0810546875, -1.93963623046875, -1.7982177734375, -1.65679931640625, -1.515380859375, -1.37396240234375, -1.2325439453125, -1.09112548828125, -0.94970703125, -0.80828857421875, -0.6668701171875, -0.52545166015625, -0.384033203125, -0.24261474609375, -0.1011962890625, 0.04022216796875, 0.181640625, 0.32305908203125, 0.4644775390625, 0.60589599609375, 0.747314453125, 0.88873291015625, 1.0301513671875, 1.17156982421875, 1.31298828125, 1.45440673828125, 1.5958251953125, 1.73724365234375, 1.878662109375, 2.02008056640625, 2.1614990234375, 2.30291748046875, 2.4443359375, 2.58575439453125, 2.7271728515625, 2.86859130859375, 3.010009765625, 3.15142822265625, 3.2928466796875, 3.43426513671875, 3.57568359375, 3.71710205078125, 3.8585205078125, 3.99993896484375, 4.141357421875, 4.28277587890625, 4.4241943359375, 4.56561279296875, 4.70703125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 11.0, 15.0, 13.0, 22.0, 17.0, 29.0, 34.0, 51.0, 63.0, 68.0, 77.0, 114.0, 146.0, 152.0, 201.0, 230.0, 259.0, 244.0, 282.0, 281.0, 279.0, 244.0, 233.0, 212.0, 158.0, 150.0, 103.0, 69.0, 67.0, 56.0, 47.0, 34.0, 26.0, 21.0, 19.0, 13.0, 15.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.239715576171875, -1.20306396484375, -1.166412353515625, -1.1297607421875, -1.093109130859375, -1.05645751953125, -1.019805908203125, -0.983154296875, -0.946502685546875, -0.90985107421875, -0.873199462890625, -0.8365478515625, -0.799896240234375, -0.76324462890625, -0.726593017578125, -0.68994140625, -0.653289794921875, -0.61663818359375, -0.579986572265625, -0.5433349609375, -0.506683349609375, -0.47003173828125, -0.433380126953125, -0.396728515625, -0.360076904296875, -0.32342529296875, -0.286773681640625, -0.2501220703125, -0.213470458984375, -0.17681884765625, -0.140167236328125, -0.103515625, -0.066864013671875, -0.03021240234375, 0.006439208984375, 0.0430908203125, 0.079742431640625, 0.11639404296875, 0.153045654296875, 0.189697265625, 0.226348876953125, 0.26300048828125, 0.299652099609375, 0.3363037109375, 0.372955322265625, 0.40960693359375, 0.446258544921875, 0.48291015625, 0.519561767578125, 0.55621337890625, 0.592864990234375, 0.6295166015625, 0.666168212890625, 0.70281982421875, 0.739471435546875, 0.776123046875, 0.812774658203125, 0.84942626953125, 0.886077880859375, 0.9227294921875, 0.959381103515625, 0.99603271484375, 1.032684326171875, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 14.0, 16.0, 15.0, 27.0, 29.0, 30.0, 50.0, 47.0, 56.0, 55.0, 86.0, 78.0, 63.0, 66.0, 60.0, 64.0, 44.0, 40.0, 27.0, 21.0, 17.0, 16.0, 11.0, 12.0, 8.0, 11.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52296781539917, -4.3727850914001465, -4.222602844238281, -4.072420120239258, -3.9222373962402344, -3.772054672241211, -3.6218721866607666, -3.4716897010803223, -3.321506977081299, -3.1713242530822754, -3.021141767501831, -2.8709592819213867, -2.7207765579223633, -2.57059383392334, -2.4204113483428955, -2.270228862762451, -2.1200461387634277, -1.9698635339736938, -1.81968092918396, -1.669498324394226, -1.5193157196044922, -1.3691331148147583, -1.2189505100250244, -1.0687679052352905, -0.9185853004455566, -0.7684026956558228, -0.6182200908660889, -0.468037486076355, -0.3178548812866211, -0.1676722764968872, -0.01748967170715332, 0.13269293308258057, 0.28287506103515625, 0.43305766582489014, 0.583240270614624, 0.7334228754043579, 0.8836054801940918, 1.0337880849838257, 1.1839706897735596, 1.3341532945632935, 1.4843358993530273, 1.6345185041427612, 1.7847011089324951, 1.934883713722229, 2.085066318511963, 2.2352490425109863, 2.3854315280914307, 2.535614013671875, 2.6857967376708984, 2.835979461669922, 2.986161947250366, 3.1363444328308105, 3.286527156829834, 3.4367098808288574, 3.5868923664093018, 3.737074851989746, 3.8872575759887695, 4.037440299987793, 4.187623023986816, 4.337805271148682, 4.487987995147705, 4.6381707191467285, 4.788352966308594, 4.938535690307617, 5.088718414306641]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 5.0, 11.0, 7.0, 16.0, 17.0, 17.0, 15.0, 23.0, 20.0, 26.0, 23.0, 32.0, 27.0, 36.0, 36.0, 25.0, 49.0, 36.0, 44.0, 40.0, 34.0, 27.0, 35.0, 41.0, 34.0, 36.0, 38.0, 24.0, 32.0, 20.0, 16.0, 22.0, 23.0, 20.0, 16.0, 8.0, 15.0, 9.0, 6.0, 6.0, 4.0, 10.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7342405319213867, -1.6759778261184692, -1.6177152395248413, -1.5594525337219238, -1.5011898279190063, -1.4429271221160889, -1.384664535522461, -1.3264018297195435, -1.268139123916626, -1.2098764181137085, -1.1516138315200806, -1.093351125717163, -1.0350884199142456, -0.9768257737159729, -0.9185631275177002, -0.8603004217147827, -0.8020378351211548, -0.7437751889228821, -0.6855124831199646, -0.6272498369216919, -0.5689871311187744, -0.5107244849205017, -0.452461838722229, -0.3941991627216339, -0.3359364867210388, -0.2776738107204437, -0.21941114962100983, -0.16114848852157593, -0.10288581252098083, -0.04462313652038574, 0.013639509677886963, 0.07190218567848206, 0.13016486167907715, 0.18842753767967224, 0.24669019877910614, 0.30495285987854004, 0.36321553587913513, 0.4214782118797302, 0.47974085807800293, 0.5380035638809204, 0.5962662100791931, 0.6545288562774658, 0.7127915620803833, 0.771054208278656, 0.8293168544769287, 0.8875795602798462, 0.9458422064781189, 1.0041048526763916, 1.062367558479309, 1.1206302642822266, 1.1788928508758545, 1.237155556678772, 1.2954182624816895, 1.3536808490753174, 1.4119435548782349, 1.4702062606811523, 1.5284688472747803, 1.5867315530776978, 1.6449941396713257, 1.7032568454742432, 1.7615195512771606, 1.8197822570800781, 1.878044843673706, 1.9363075494766235, 1.994570255279541]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 11.0, 14.0, 29.0, 39.0, 86.0, 164.0, 220.0, 390.0, 604.0, 1095.0, 1785.0, 3161.0, 6031.0, 10358.0, 19464.0, 36833.0, 68971.0, 124869.0, 194771.0, 218822.0, 159262.0, 93230.0, 49961.0, 26749.0, 13998.0, 7681.0, 4259.0, 2444.0, 1315.0, 747.0, 467.0, 295.0, 169.0, 93.0, 52.0, 38.0, 29.0, 9.0, 5.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.4033203125, -0.3921928405761719, -0.38106536865234375, -0.3699378967285156, -0.3588104248046875, -0.3476829528808594, -0.33655548095703125, -0.3254280090332031, -0.314300537109375, -0.3031730651855469, -0.29204559326171875, -0.2809181213378906, -0.2697906494140625, -0.2586631774902344, -0.24753570556640625, -0.23640823364257812, -0.22528076171875, -0.21415328979492188, -0.20302581787109375, -0.19189834594726562, -0.1807708740234375, -0.16964340209960938, -0.15851593017578125, -0.14738845825195312, -0.136260986328125, -0.12513351440429688, -0.11400604248046875, -0.10287857055664062, -0.0917510986328125, -0.08062362670898438, -0.06949615478515625, -0.058368682861328125, -0.0472412109375, -0.036113739013671875, -0.02498626708984375, -0.013858795166015625, -0.0027313232421875, 0.008396148681640625, 0.01952362060546875, 0.030651092529296875, 0.041778564453125, 0.052906036376953125, 0.06403350830078125, 0.07516098022460938, 0.0862884521484375, 0.09741592407226562, 0.10854339599609375, 0.11967086791992188, 0.13079833984375, 0.14192581176757812, 0.15305328369140625, 0.16418075561523438, 0.1753082275390625, 0.18643569946289062, 0.19756317138671875, 0.20869064331054688, 0.219818115234375, 0.23094558715820312, 0.24207305908203125, 0.2532005310058594, 0.2643280029296875, 0.2754554748535156, 0.28658294677734375, 0.2977104187011719, 0.308837890625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 6.0, 15.0, 9.0, 16.0, 12.0, 15.0, 34.0, 25.0, 26.0, 24.0, 29.0, 28.0, 27.0, 34.0, 34.0, 31.0, 30.0, 35.0, 35.0, 34.0, 41.0, 35.0, 27.0, 30.0, 27.0, 33.0, 23.0, 32.0, 21.0, 28.0, 21.0, 24.0, 21.0, 12.0, 23.0, 10.0, 9.0, 8.0, 12.0, 5.0, 6.0, 11.0, 4.0, 2.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8076171875, -1.7475433349609375, -1.687469482421875, -1.6273956298828125, -1.56732177734375, -1.5072479248046875, -1.447174072265625, -1.3871002197265625, -1.3270263671875, -1.2669525146484375, -1.206878662109375, -1.1468048095703125, -1.08673095703125, -1.0266571044921875, -0.966583251953125, -0.9065093994140625, -0.846435546875, -0.7863616943359375, -0.726287841796875, -0.6662139892578125, -0.60614013671875, -0.5460662841796875, -0.485992431640625, -0.4259185791015625, -0.3658447265625, -0.3057708740234375, -0.245697021484375, -0.1856231689453125, -0.12554931640625, -0.0654754638671875, -0.005401611328125, 0.0546722412109375, 0.11474609375, 0.1748199462890625, 0.234893798828125, 0.2949676513671875, 0.35504150390625, 0.4151153564453125, 0.475189208984375, 0.5352630615234375, 0.5953369140625, 0.6554107666015625, 0.715484619140625, 0.7755584716796875, 0.83563232421875, 0.8957061767578125, 0.955780029296875, 1.0158538818359375, 1.075927734375, 1.1360015869140625, 1.196075439453125, 1.2561492919921875, 1.31622314453125, 1.3762969970703125, 1.436370849609375, 1.4964447021484375, 1.5565185546875, 1.6165924072265625, 1.676666259765625, 1.7367401123046875, 1.79681396484375, 1.8568878173828125, 1.916961669921875, 1.9770355224609375, 2.037109375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 13.0, 7.0, 10.0, 9.0, 23.0, 27.0, 35.0, 45.0, 62.0, 86.0, 107.0, 171.0, 212.0, 367.0, 511.0, 798.0, 1344.0, 2176.0, 4090.0, 7837.0, 17034.0, 45426.0, 817685.0, 104685.0, 23152.0, 10193.0, 5227.0, 2753.0, 1623.0, 908.0, 581.0, 401.0, 277.0, 177.0, 142.0, 94.0, 61.0, 55.0, 40.0, 30.0, 19.0, 14.0, 16.0, 11.0, 7.0, 1.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8077774047851562, -0.7796173095703125, -0.7514572143554688, -0.723297119140625, -0.6951370239257812, -0.6669769287109375, -0.6388168334960938, -0.61065673828125, -0.5824966430664062, -0.5543365478515625, -0.5261764526367188, -0.498016357421875, -0.46985626220703125, -0.4416961669921875, -0.41353607177734375, -0.3853759765625, -0.35721588134765625, -0.3290557861328125, -0.30089569091796875, -0.272735595703125, -0.24457550048828125, -0.2164154052734375, -0.18825531005859375, -0.16009521484375, -0.13193511962890625, -0.1037750244140625, -0.07561492919921875, -0.047454833984375, -0.01929473876953125, 0.0088653564453125, 0.03702545166015625, 0.065185546875, 0.09334564208984375, 0.1215057373046875, 0.14966583251953125, 0.177825927734375, 0.20598602294921875, 0.2341461181640625, 0.26230621337890625, 0.29046630859375, 0.31862640380859375, 0.3467864990234375, 0.37494659423828125, 0.403106689453125, 0.43126678466796875, 0.4594268798828125, 0.48758697509765625, 0.5157470703125, 0.5439071655273438, 0.5720672607421875, 0.6002273559570312, 0.628387451171875, 0.6565475463867188, 0.6847076416015625, 0.7128677368164062, 0.74102783203125, 0.7691879272460938, 0.7973480224609375, 0.8255081176757812, 0.853668212890625, 0.8818283081054688, 0.9099884033203125, 0.9381484985351562, 0.96630859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 6.0, 7.0, 7.0, 12.0, 9.0, 14.0, 13.0, 14.0, 9.0, 12.0, 18.0, 28.0, 31.0, 23.0, 37.0, 38.0, 32.0, 36.0, 41.0, 36.0, 31.0, 38.0, 46.0, 41.0, 30.0, 33.0, 34.0, 37.0, 30.0, 31.0, 29.0, 18.0, 20.0, 22.0, 24.0, 12.0, 20.0, 12.0, 12.0, 10.0, 8.0, 8.0, 13.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2724609375, -1.230499267578125, -1.18853759765625, -1.146575927734375, -1.1046142578125, -1.062652587890625, -1.02069091796875, -0.978729248046875, -0.936767578125, -0.894805908203125, -0.85284423828125, -0.810882568359375, -0.7689208984375, -0.726959228515625, -0.68499755859375, -0.643035888671875, -0.60107421875, -0.559112548828125, -0.51715087890625, -0.475189208984375, -0.4332275390625, -0.391265869140625, -0.34930419921875, -0.307342529296875, -0.265380859375, -0.223419189453125, -0.18145751953125, -0.139495849609375, -0.0975341796875, -0.055572509765625, -0.01361083984375, 0.028350830078125, 0.0703125, 0.112274169921875, 0.15423583984375, 0.196197509765625, 0.2381591796875, 0.280120849609375, 0.32208251953125, 0.364044189453125, 0.406005859375, 0.447967529296875, 0.48992919921875, 0.531890869140625, 0.5738525390625, 0.615814208984375, 0.65777587890625, 0.699737548828125, 0.74169921875, 0.783660888671875, 0.82562255859375, 0.867584228515625, 0.9095458984375, 0.951507568359375, 0.99346923828125, 1.035430908203125, 1.077392578125, 1.119354248046875, 1.16131591796875, 1.203277587890625, 1.2452392578125, 1.287200927734375, 1.32916259765625, 1.371124267578125, 1.4130859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 17.0, 19.0, 35.0, 38.0, 65.0, 96.0, 174.0, 268.0, 418.0, 637.0, 1136.0, 1815.0, 3097.0, 5285.0, 9482.0, 18389.0, 41509.0, 872844.0, 49095.0, 19737.0, 10362.0, 5755.0, 3300.0, 1882.0, 1185.0, 667.0, 465.0, 268.0, 182.0, 93.0, 69.0, 46.0, 41.0, 21.0, 20.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2230224609375, -0.21637725830078125, -0.2097320556640625, -0.20308685302734375, -0.196441650390625, -0.18979644775390625, -0.1831512451171875, -0.17650604248046875, -0.16986083984375, -0.16321563720703125, -0.1565704345703125, -0.14992523193359375, -0.143280029296875, -0.13663482666015625, -0.1299896240234375, -0.12334442138671875, -0.11669921875, -0.11005401611328125, -0.1034088134765625, -0.09676361083984375, -0.090118408203125, -0.08347320556640625, -0.0768280029296875, -0.07018280029296875, -0.06353759765625, -0.05689239501953125, -0.0502471923828125, -0.04360198974609375, -0.036956787109375, -0.03031158447265625, -0.0236663818359375, -0.01702117919921875, -0.0103759765625, -0.00373077392578125, 0.0029144287109375, 0.00955963134765625, 0.016204833984375, 0.02285003662109375, 0.0294952392578125, 0.03614044189453125, 0.04278564453125, 0.04943084716796875, 0.0560760498046875, 0.06272125244140625, 0.069366455078125, 0.07601165771484375, 0.0826568603515625, 0.08930206298828125, 0.095947265625, 0.10259246826171875, 0.1092376708984375, 0.11588287353515625, 0.122528076171875, 0.12917327880859375, 0.1358184814453125, 0.14246368408203125, 0.14910888671875, 0.15575408935546875, 0.1623992919921875, 0.16904449462890625, 0.175689697265625, 0.18233489990234375, 0.1889801025390625, 0.19562530517578125, 0.2022705078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 4.0, 9.0, 14.0, 23.0, 29.0, 28.0, 39.0, 49.0, 47.0, 64.0, 71.0, 82.0, 71.0, 65.0, 59.0, 63.0, 62.0, 42.0, 39.0, 31.0, 29.0, 15.0, 13.0, 5.0, 9.0, 2.0, 6.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.7637691497802734e-05, -5.59687614440918e-05, -5.429983139038086e-05, -5.263090133666992e-05, -5.0961971282958984e-05, -4.929304122924805e-05, -4.762411117553711e-05, -4.595518112182617e-05, -4.4286251068115234e-05, -4.26173210144043e-05, -4.094839096069336e-05, -3.927946090698242e-05, -3.7610530853271484e-05, -3.594160079956055e-05, -3.427267074584961e-05, -3.260374069213867e-05, -3.0934810638427734e-05, -2.9265880584716797e-05, -2.759695053100586e-05, -2.5928020477294922e-05, -2.4259090423583984e-05, -2.2590160369873047e-05, -2.092123031616211e-05, -1.9252300262451172e-05, -1.7583370208740234e-05, -1.5914440155029297e-05, -1.424551010131836e-05, -1.2576580047607422e-05, -1.0907649993896484e-05, -9.238719940185547e-06, -7.569789886474609e-06, -5.900859832763672e-06, -4.231929779052734e-06, -2.562999725341797e-06, -8.940696716308594e-07, 7.748603820800781e-07, 2.4437904357910156e-06, 4.112720489501953e-06, 5.781650543212891e-06, 7.450580596923828e-06, 9.119510650634766e-06, 1.0788440704345703e-05, 1.245737075805664e-05, 1.4126300811767578e-05, 1.5795230865478516e-05, 1.7464160919189453e-05, 1.913309097290039e-05, 2.0802021026611328e-05, 2.2470951080322266e-05, 2.4139881134033203e-05, 2.580881118774414e-05, 2.7477741241455078e-05, 2.9146671295166016e-05, 3.081560134887695e-05, 3.248453140258789e-05, 3.415346145629883e-05, 3.5822391510009766e-05, 3.74913215637207e-05, 3.916025161743164e-05, 4.082918167114258e-05, 4.2498111724853516e-05, 4.416704177856445e-05, 4.583597183227539e-05, 4.750490188598633e-05, 4.9173831939697266e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 4.0, 11.0, 13.0, 16.0, 30.0, 50.0, 59.0, 97.0, 153.0, 254.0, 354.0, 548.0, 887.0, 1365.0, 2205.0, 3612.0, 5744.0, 9350.0, 15719.0, 26414.0, 44122.0, 76052.0, 125850.0, 182444.0, 193555.0, 142334.0, 88334.0, 52021.0, 30322.0, 18254.0, 10655.0, 6620.0, 4070.0, 2552.0, 1611.0, 1051.0, 635.0, 443.0, 251.0, 169.0, 117.0, 67.0, 49.0, 38.0, 15.0, 19.0, 9.0, 4.0, 10.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.07196044921875, -0.06985282897949219, -0.06774520874023438, -0.06563758850097656, -0.06352996826171875, -0.06142234802246094, -0.059314727783203125, -0.05720710754394531, -0.0550994873046875, -0.05299186706542969, -0.050884246826171875, -0.04877662658691406, -0.04666900634765625, -0.04456138610839844, -0.042453765869140625, -0.04034614562988281, -0.038238525390625, -0.03613090515136719, -0.034023284912109375, -0.03191566467285156, -0.02980804443359375, -0.027700424194335938, -0.025592803955078125, -0.023485183715820312, -0.0213775634765625, -0.019269943237304688, -0.017162322998046875, -0.015054702758789062, -0.01294708251953125, -0.010839462280273438, -0.008731842041015625, -0.0066242218017578125, -0.0045166015625, -0.0024089813232421875, -0.000301361083984375, 0.0018062591552734375, 0.00391387939453125, 0.0060214996337890625, 0.008129119873046875, 0.010236740112304688, 0.0123443603515625, 0.014451980590820312, 0.016559600830078125, 0.018667221069335938, 0.02077484130859375, 0.022882461547851562, 0.024990081787109375, 0.027097702026367188, 0.029205322265625, 0.03131294250488281, 0.033420562744140625, 0.03552818298339844, 0.03763580322265625, 0.03974342346191406, 0.041851043701171875, 0.04395866394042969, 0.0460662841796875, 0.04817390441894531, 0.050281524658203125, 0.05238914489746094, 0.05449676513671875, 0.05660438537597656, 0.058712005615234375, 0.06081962585449219, 0.06292724609375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 10.0, 5.0, 9.0, 9.0, 9.0, 8.0, 14.0, 16.0, 19.0, 16.0, 22.0, 32.0, 26.0, 34.0, 44.0, 40.0, 57.0, 29.0, 47.0, 56.0, 52.0, 48.0, 51.0, 58.0, 41.0, 47.0, 27.0, 26.0, 27.0, 23.0, 13.0, 16.0, 14.0, 6.0, 9.0, 8.0, 6.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.017547607421875, -0.017049312591552734, -0.01655101776123047, -0.016052722930908203, -0.015554428100585938, -0.015056133270263672, -0.014557838439941406, -0.01405954360961914, -0.013561248779296875, -0.01306295394897461, -0.012564659118652344, -0.012066364288330078, -0.011568069458007812, -0.011069774627685547, -0.010571479797363281, -0.010073184967041016, -0.00957489013671875, -0.009076595306396484, -0.008578300476074219, -0.008080005645751953, -0.0075817108154296875, -0.007083415985107422, -0.006585121154785156, -0.006086826324462891, -0.005588531494140625, -0.005090236663818359, -0.004591941833496094, -0.004093647003173828, -0.0035953521728515625, -0.003097057342529297, -0.0025987625122070312, -0.0021004676818847656, -0.0016021728515625, -0.0011038780212402344, -0.0006055831909179688, -0.00010728836059570312, 0.0003910064697265625, 0.0008893013000488281, 0.0013875961303710938, 0.0018858909606933594, 0.002384185791015625, 0.0028824806213378906, 0.0033807754516601562, 0.003879070281982422, 0.0043773651123046875, 0.004875659942626953, 0.005373954772949219, 0.005872249603271484, 0.00637054443359375, 0.006868839263916016, 0.007367134094238281, 0.007865428924560547, 0.008363723754882812, 0.008862018585205078, 0.009360313415527344, 0.00985860824584961, 0.010356903076171875, 0.01085519790649414, 0.011353492736816406, 0.011851787567138672, 0.012350082397460938, 0.012848377227783203, 0.013346672058105469, 0.013844966888427734, 0.01434326171875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 8.0, 13.0, 19.0, 13.0, 26.0, 28.0, 30.0, 39.0, 63.0, 47.0, 54.0, 86.0, 82.0, 57.0, 67.0, 57.0, 68.0, 50.0, 38.0, 29.0, 21.0, 17.0, 16.0, 14.0, 10.0, 9.0, 11.0, 7.0, 3.0, 4.0, 5.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.529380798339844, -4.3796868324279785, -4.229992866516113, -4.080298900604248, -3.930605173110962, -3.7809112071990967, -3.6312174797058105, -3.4815235137939453, -3.33182954788208, -3.182135581970215, -3.0324416160583496, -2.8827478885650635, -2.7330539226531982, -2.583359956741333, -2.433666229248047, -2.2839722633361816, -2.1342782974243164, -1.9845843315124512, -1.8348904848098755, -1.6851966381072998, -1.5355026721954346, -1.3858087062835693, -1.2361148595809937, -1.086421012878418, -0.9367270469665527, -0.7870331406593323, -0.6373392343521118, -0.48764532804489136, -0.3379514217376709, -0.18825751543045044, -0.03856360912322998, 0.1111302375793457, 0.26082468032836914, 0.4105185866355896, 0.5602124929428101, 0.7099063992500305, 0.859600305557251, 1.0092942714691162, 1.158988118171692, 1.3086819648742676, 1.4583759307861328, 1.608069896697998, 1.7577637434005737, 1.9074575901031494, 2.0571515560150146, 2.20684552192688, 2.356539249420166, 2.5062332153320312, 2.6559271812438965, 2.8056211471557617, 2.955315113067627, 3.105008840560913, 3.2547028064727783, 3.4043967723846436, 3.5540904998779297, 3.703784465789795, 3.85347843170166, 4.003172397613525, 4.152866363525391, 4.302560329437256, 4.452254295349121, 4.601947784423828, 4.751641750335693, 4.901335716247559, 5.051029682159424]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 12.0, 5.0, 16.0, 19.0, 14.0, 17.0, 23.0, 21.0, 25.0, 25.0, 30.0, 26.0, 38.0, 33.0, 28.0, 46.0, 38.0, 43.0, 42.0, 33.0, 26.0, 41.0, 33.0, 33.0, 41.0, 35.0, 27.0, 31.0, 20.0, 16.0, 21.0, 25.0, 19.0, 16.0, 8.0, 15.0, 9.0, 6.0, 6.0, 4.0, 9.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7494254112243652, -1.6914043426513672, -1.6333832740783691, -1.575362205505371, -1.517341136932373, -1.459320068359375, -1.401298999786377, -1.343277931213379, -1.2852568626403809, -1.2272357940673828, -1.1692147254943848, -1.1111936569213867, -1.0531725883483887, -0.9951515197753906, -0.9371304512023926, -0.8791093826293945, -0.8210883140563965, -0.7630672454833984, -0.7050461769104004, -0.6470251083374023, -0.5890040397644043, -0.5309829711914062, -0.4729619026184082, -0.41494083404541016, -0.3569197654724121, -0.29889869689941406, -0.24087762832641602, -0.18285655975341797, -0.12483549118041992, -0.06681442260742188, -0.008793354034423828, 0.04922771453857422, 0.10724878311157227, 0.1652698516845703, 0.22329092025756836, 0.2813119888305664, 0.33933305740356445, 0.3973541259765625, 0.45537519454956055, 0.5133962631225586, 0.5714173316955566, 0.6294384002685547, 0.6874594688415527, 0.7454805374145508, 0.8035016059875488, 0.8615226745605469, 0.9195437431335449, 0.977564811706543, 1.035585880279541, 1.093606948852539, 1.151628017425537, 1.2096490859985352, 1.2676701545715332, 1.3256912231445312, 1.3837122917175293, 1.4417333602905273, 1.4997544288635254, 1.5577754974365234, 1.6157965660095215, 1.6738176345825195, 1.7318387031555176, 1.7898597717285156, 1.8478808403015137, 1.9059019088745117, 1.9639229774475098]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 9.0, 13.0, 12.0, 27.0, 38.0, 57.0, 97.0, 163.0, 211.0, 317.0, 554.0, 809.0, 1272.0, 2022.0, 3350.0, 5101.0, 8424.0, 13640.0, 22573.0, 36626.0, 58771.0, 90041.0, 124956.0, 151061.0, 151670.0, 127535.0, 91557.0, 59864.0, 37578.0, 23229.0, 14002.0, 8603.0, 5253.0, 3255.0, 2146.0, 1289.0, 845.0, 549.0, 372.0, 221.0, 155.0, 93.0, 65.0, 51.0, 32.0, 15.0, 10.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-2.455078125, -2.37841796875, -2.3017578125, -2.22509765625, -2.1484375, -2.07177734375, -1.9951171875, -1.91845703125, -1.841796875, -1.76513671875, -1.6884765625, -1.61181640625, -1.53515625, -1.45849609375, -1.3818359375, -1.30517578125, -1.228515625, -1.15185546875, -1.0751953125, -0.99853515625, -0.921875, -0.84521484375, -0.7685546875, -0.69189453125, -0.615234375, -0.53857421875, -0.4619140625, -0.38525390625, -0.30859375, -0.23193359375, -0.1552734375, -0.07861328125, -0.001953125, 0.07470703125, 0.1513671875, 0.22802734375, 0.3046875, 0.38134765625, 0.4580078125, 0.53466796875, 0.611328125, 0.68798828125, 0.7646484375, 0.84130859375, 0.91796875, 0.99462890625, 1.0712890625, 1.14794921875, 1.224609375, 1.30126953125, 1.3779296875, 1.45458984375, 1.53125, 1.60791015625, 1.6845703125, 1.76123046875, 1.837890625, 1.91455078125, 1.9912109375, 2.06787109375, 2.14453125, 2.22119140625, 2.2978515625, 2.37451171875, 2.451171875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 11.0, 14.0, 18.0, 25.0, 18.0, 22.0, 32.0, 29.0, 27.0, 37.0, 34.0, 23.0, 38.0, 38.0, 51.0, 44.0, 44.0, 40.0, 36.0, 35.0, 36.0, 35.0, 28.0, 29.0, 28.0, 28.0, 25.0, 24.0, 19.0, 14.0, 8.0, 11.0, 15.0, 11.0, 2.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.955596923828125, -1.88775634765625, -1.819915771484375, -1.7520751953125, -1.684234619140625, -1.61639404296875, -1.548553466796875, -1.480712890625, -1.412872314453125, -1.34503173828125, -1.277191162109375, -1.2093505859375, -1.141510009765625, -1.07366943359375, -1.005828857421875, -0.93798828125, -0.870147705078125, -0.80230712890625, -0.734466552734375, -0.6666259765625, -0.598785400390625, -0.53094482421875, -0.463104248046875, -0.395263671875, -0.327423095703125, -0.25958251953125, -0.191741943359375, -0.1239013671875, -0.056060791015625, 0.01177978515625, 0.079620361328125, 0.1474609375, 0.215301513671875, 0.28314208984375, 0.350982666015625, 0.4188232421875, 0.486663818359375, 0.55450439453125, 0.622344970703125, 0.690185546875, 0.758026123046875, 0.82586669921875, 0.893707275390625, 0.9615478515625, 1.029388427734375, 1.09722900390625, 1.165069580078125, 1.23291015625, 1.300750732421875, 1.36859130859375, 1.436431884765625, 1.5042724609375, 1.572113037109375, 1.63995361328125, 1.707794189453125, 1.775634765625, 1.843475341796875, 1.91131591796875, 1.979156494140625, 2.0469970703125, 2.114837646484375, 2.18267822265625, 2.250518798828125, 2.318359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 7.0, 17.0, 19.0, 41.0, 50.0, 76.0, 105.0, 177.0, 287.0, 352.0, 568.0, 844.0, 1387.0, 2294.0, 3789.0, 6142.0, 10569.0, 17988.0, 30935.0, 52496.0, 83792.0, 123336.0, 157414.0, 165512.0, 137665.0, 98118.0, 62314.0, 37769.0, 22045.0, 12906.0, 7640.0, 4486.0, 2709.0, 1716.0, 1047.0, 666.0, 424.0, 265.0, 201.0, 135.0, 85.0, 44.0, 45.0, 17.0, 18.0, 14.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.611328125, -2.527587890625, -2.44384765625, -2.360107421875, -2.2763671875, -2.192626953125, -2.10888671875, -2.025146484375, -1.94140625, -1.857666015625, -1.77392578125, -1.690185546875, -1.6064453125, -1.522705078125, -1.43896484375, -1.355224609375, -1.271484375, -1.187744140625, -1.10400390625, -1.020263671875, -0.9365234375, -0.852783203125, -0.76904296875, -0.685302734375, -0.6015625, -0.517822265625, -0.43408203125, -0.350341796875, -0.2666015625, -0.182861328125, -0.09912109375, -0.015380859375, 0.068359375, 0.152099609375, 0.23583984375, 0.319580078125, 0.4033203125, 0.487060546875, 0.57080078125, 0.654541015625, 0.73828125, 0.822021484375, 0.90576171875, 0.989501953125, 1.0732421875, 1.156982421875, 1.24072265625, 1.324462890625, 1.408203125, 1.491943359375, 1.57568359375, 1.659423828125, 1.7431640625, 1.826904296875, 1.91064453125, 1.994384765625, 2.078125, 2.161865234375, 2.24560546875, 2.329345703125, 2.4130859375, 2.496826171875, 2.58056640625, 2.664306640625, 2.748046875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 6.0, 7.0, 5.0, 9.0, 15.0, 15.0, 5.0, 12.0, 16.0, 19.0, 27.0, 23.0, 24.0, 37.0, 25.0, 30.0, 40.0, 32.0, 36.0, 38.0, 36.0, 52.0, 44.0, 36.0, 47.0, 43.0, 35.0, 38.0, 27.0, 20.0, 24.0, 28.0, 29.0, 14.0, 12.0, 19.0, 7.0, 12.0, 7.0, 8.0, 13.0, 5.0, 2.0, 7.0, 1.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.13092041015625, -1.0899658203125, -1.04901123046875, -1.008056640625, -0.96710205078125, -0.9261474609375, -0.88519287109375, -0.84423828125, -0.80328369140625, -0.7623291015625, -0.72137451171875, -0.680419921875, -0.63946533203125, -0.5985107421875, -0.55755615234375, -0.5166015625, -0.47564697265625, -0.4346923828125, -0.39373779296875, -0.352783203125, -0.31182861328125, -0.2708740234375, -0.22991943359375, -0.18896484375, -0.14801025390625, -0.1070556640625, -0.06610107421875, -0.025146484375, 0.01580810546875, 0.0567626953125, 0.09771728515625, 0.138671875, 0.17962646484375, 0.2205810546875, 0.26153564453125, 0.302490234375, 0.34344482421875, 0.3843994140625, 0.42535400390625, 0.46630859375, 0.50726318359375, 0.5482177734375, 0.58917236328125, 0.630126953125, 0.67108154296875, 0.7120361328125, 0.75299072265625, 0.7939453125, 0.83489990234375, 0.8758544921875, 0.91680908203125, 0.957763671875, 0.99871826171875, 1.0396728515625, 1.08062744140625, 1.12158203125, 1.16253662109375, 1.2034912109375, 1.24444580078125, 1.285400390625, 1.32635498046875, 1.3673095703125, 1.40826416015625, 1.44921875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 12.0, 17.0, 17.0, 36.0, 48.0, 66.0, 123.0, 205.0, 307.0, 504.0, 829.0, 1428.0, 2382.0, 4214.0, 7388.0, 13151.0, 23990.0, 42627.0, 75139.0, 124603.0, 177281.0, 191828.0, 152613.0, 98457.0, 57875.0, 32195.0, 17738.0, 10187.0, 5525.0, 3166.0, 1889.0, 1059.0, 661.0, 383.0, 232.0, 132.0, 91.0, 63.0, 36.0, 32.0, 14.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.525390625, -1.4732513427734375, -1.421112060546875, -1.3689727783203125, -1.31683349609375, -1.2646942138671875, -1.212554931640625, -1.1604156494140625, -1.1082763671875, -1.0561370849609375, -1.003997802734375, -0.9518585205078125, -0.89971923828125, -0.8475799560546875, -0.795440673828125, -0.7433013916015625, -0.691162109375, -0.6390228271484375, -0.586883544921875, -0.5347442626953125, -0.48260498046875, -0.4304656982421875, -0.378326416015625, -0.3261871337890625, -0.2740478515625, -0.2219085693359375, -0.169769287109375, -0.1176300048828125, -0.06549072265625, -0.0133514404296875, 0.038787841796875, 0.0909271240234375, 0.14306640625, 0.1952056884765625, 0.247344970703125, 0.2994842529296875, 0.35162353515625, 0.4037628173828125, 0.455902099609375, 0.5080413818359375, 0.5601806640625, 0.6123199462890625, 0.664459228515625, 0.7165985107421875, 0.76873779296875, 0.8208770751953125, 0.873016357421875, 0.9251556396484375, 0.977294921875, 1.0294342041015625, 1.081573486328125, 1.1337127685546875, 1.18585205078125, 1.2379913330078125, 1.290130615234375, 1.3422698974609375, 1.3944091796875, 1.4465484619140625, 1.498687744140625, 1.5508270263671875, 1.60296630859375, 1.6551055908203125, 1.707244873046875, 1.7593841552734375, 1.8115234375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 6.0, 9.0, 17.0, 17.0, 28.0, 40.0, 45.0, 52.0, 75.0, 106.0, 101.0, 101.0, 90.0, 76.0, 66.0, 37.0, 43.0, 18.0, 27.0, 13.0, 15.0, 9.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019490718841552734, -0.00018788687884807587, -0.0001808665692806244, -0.0001738462597131729, -0.00016682595014572144, -0.00015980564057826996, -0.00015278533101081848, -0.000145765021443367, -0.00013874471187591553, -0.00013172440230846405, -0.00012470409274101257, -0.0001176837831735611, -0.00011066347360610962, -0.00010364316403865814, -9.662285447120667e-05, -8.960254490375519e-05, -8.258223533630371e-05, -7.556192576885223e-05, -6.854161620140076e-05, -6.152130663394928e-05, -5.45009970664978e-05, -4.7480687499046326e-05, -4.046037793159485e-05, -3.344006836414337e-05, -2.6419758796691895e-05, -1.9399449229240417e-05, -1.237913966178894e-05, -5.358830094337463e-06, 1.6614794731140137e-06, 8.68178904056549e-06, 1.5702098608016968e-05, 2.2722408175468445e-05, 2.9742717742919922e-05, 3.67630273103714e-05, 4.3783336877822876e-05, 5.080364644527435e-05, 5.782395601272583e-05, 6.484426558017731e-05, 7.186457514762878e-05, 7.888488471508026e-05, 8.590519428253174e-05, 9.292550384998322e-05, 9.994581341743469e-05, 0.00010696612298488617, 0.00011398643255233765, 0.00012100674211978912, 0.0001280270516872406, 0.00013504736125469208, 0.00014206767082214355, 0.00014908798038959503, 0.0001561082899570465, 0.00016312859952449799, 0.00017014890909194946, 0.00017716921865940094, 0.00018418952822685242, 0.0001912098377943039, 0.00019823014736175537, 0.00020525045692920685, 0.00021227076649665833, 0.0002192910760641098, 0.00022631138563156128, 0.00023333169519901276, 0.00024035200476646423, 0.0002473723143339157, 0.0002543926239013672]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 1.0, 7.0, 4.0, 5.0, 13.0, 16.0, 19.0, 38.0, 43.0, 58.0, 124.0, 151.0, 239.0, 352.0, 537.0, 829.0, 1228.0, 1876.0, 2971.0, 4544.0, 7138.0, 11260.0, 17251.0, 27439.0, 42794.0, 65154.0, 94782.0, 127091.0, 147868.0, 142009.0, 115157.0, 82496.0, 55309.0, 36010.0, 22997.0, 14392.0, 9351.0, 6029.0, 3758.0, 2494.0, 1615.0, 1050.0, 699.0, 462.0, 313.0, 183.0, 146.0, 83.0, 52.0, 49.0, 20.0, 15.0, 12.0, 11.0, 6.0, 9.0, 6.0, 0.0, 3.0, 0.0, 1.0], "bins": [-1.177734375, -1.1407012939453125, -1.103668212890625, -1.0666351318359375, -1.02960205078125, -0.9925689697265625, -0.955535888671875, -0.9185028076171875, -0.8814697265625, -0.8444366455078125, -0.807403564453125, -0.7703704833984375, -0.73333740234375, -0.6963043212890625, -0.659271240234375, -0.6222381591796875, -0.585205078125, -0.5481719970703125, -0.511138916015625, -0.4741058349609375, -0.43707275390625, -0.4000396728515625, -0.363006591796875, -0.3259735107421875, -0.2889404296875, -0.2519073486328125, -0.214874267578125, -0.1778411865234375, -0.14080810546875, -0.1037750244140625, -0.066741943359375, -0.0297088623046875, 0.00732421875, 0.0443572998046875, 0.081390380859375, 0.1184234619140625, 0.15545654296875, 0.1924896240234375, 0.229522705078125, 0.2665557861328125, 0.3035888671875, 0.3406219482421875, 0.377655029296875, 0.4146881103515625, 0.45172119140625, 0.4887542724609375, 0.525787353515625, 0.5628204345703125, 0.599853515625, 0.6368865966796875, 0.673919677734375, 0.7109527587890625, 0.74798583984375, 0.7850189208984375, 0.822052001953125, 0.8590850830078125, 0.8961181640625, 0.9331512451171875, 0.970184326171875, 1.0072174072265625, 1.04425048828125, 1.0812835693359375, 1.118316650390625, 1.1553497314453125, 1.1923828125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 6.0, 4.0, 5.0, 10.0, 12.0, 20.0, 16.0, 18.0, 22.0, 23.0, 35.0, 38.0, 41.0, 41.0, 39.0, 48.0, 63.0, 48.0, 49.0, 36.0, 52.0, 42.0, 28.0, 41.0, 34.0, 31.0, 26.0, 24.0, 26.0, 22.0, 13.0, 15.0, 9.0, 8.0, 12.0, 11.0, 1.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.30908203125, -0.2984199523925781, -0.28775787353515625, -0.2770957946777344, -0.2664337158203125, -0.2557716369628906, -0.24510955810546875, -0.23444747924804688, -0.223785400390625, -0.21312332153320312, -0.20246124267578125, -0.19179916381835938, -0.1811370849609375, -0.17047500610351562, -0.15981292724609375, -0.14915084838867188, -0.13848876953125, -0.12782669067382812, -0.11716461181640625, -0.10650253295898438, -0.0958404541015625, -0.08517837524414062, -0.07451629638671875, -0.06385421752929688, -0.053192138671875, -0.042530059814453125, -0.03186798095703125, -0.021205902099609375, -0.0105438232421875, 0.000118255615234375, 0.01078033447265625, 0.021442413330078125, 0.0321044921875, 0.042766571044921875, 0.05342864990234375, 0.06409072875976562, 0.0747528076171875, 0.08541488647460938, 0.09607696533203125, 0.10673904418945312, 0.117401123046875, 0.12806320190429688, 0.13872528076171875, 0.14938735961914062, 0.1600494384765625, 0.17071151733398438, 0.18137359619140625, 0.19203567504882812, 0.20269775390625, 0.21335983276367188, 0.22402191162109375, 0.23468399047851562, 0.2453460693359375, 0.2560081481933594, 0.26667022705078125, 0.2773323059082031, 0.287994384765625, 0.2986564636230469, 0.30931854248046875, 0.3199806213378906, 0.3306427001953125, 0.3413047790527344, 0.35196685791015625, 0.3626289367675781, 0.373291015625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 15.0, 12.0, 17.0, 15.0, 14.0, 30.0, 39.0, 53.0, 56.0, 61.0, 63.0, 66.0, 76.0, 63.0, 77.0, 54.0, 56.0, 47.0, 37.0, 22.0, 17.0, 23.0, 16.0, 14.0, 9.0, 10.0, 3.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.714277267456055, -4.566986083984375, -4.419694900512695, -4.272403717041016, -4.125112533569336, -3.9778213500976562, -3.8305299282073975, -3.6832387447357178, -3.535947561264038, -3.3886563777923584, -3.2413651943206787, -3.094074010848999, -2.9467825889587402, -2.7994914054870605, -2.652200222015381, -2.504909038543701, -2.3576178550720215, -2.210326671600342, -2.063035488128662, -1.9157441854476929, -1.7684530019760132, -1.6211618185043335, -1.4738705158233643, -1.3265793323516846, -1.1792881488800049, -1.0319969654083252, -0.8847057223320007, -0.7374144792556763, -0.5901232957839966, -0.4428321123123169, -0.29554086923599243, -0.14824962615966797, -0.0009589195251464844, 0.1463322937488556, 0.29362350702285767, 0.44091472029685974, 0.5882059335708618, 0.7354971170425415, 0.882788360118866, 1.0300796031951904, 1.1773707866668701, 1.3246619701385498, 1.4719531536102295, 1.6192444562911987, 1.7665356397628784, 1.913826823234558, 2.0611181259155273, 2.208409309387207, 2.3557004928588867, 2.5029916763305664, 2.650282859802246, 2.797574043273926, 2.9448652267456055, 3.092156410217285, 3.239447832107544, 3.3867390155792236, 3.5340301990509033, 3.681321382522583, 3.8286125659942627, 3.9759037494659424, 4.123195171356201, 4.270486354827881, 4.4177775382995605, 4.56506872177124, 4.71235990524292]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 3.0, 3.0, 4.0, 1.0, 8.0, 8.0, 9.0, 9.0, 11.0, 20.0, 15.0, 10.0, 19.0, 19.0, 24.0, 31.0, 26.0, 25.0, 36.0, 30.0, 28.0, 37.0, 44.0, 50.0, 38.0, 35.0, 38.0, 32.0, 29.0, 24.0, 28.0, 36.0, 25.0, 34.0, 30.0, 26.0, 19.0, 22.0, 24.0, 11.0, 8.0, 10.0, 14.0, 10.0, 7.0, 7.0, 9.0, 3.0, 7.0, 5.0, 0.0, 3.0, 2.0, 6.0, 0.0, 1.0, 2.0], "bins": [-1.959781289100647, -1.899973750114441, -1.8401663303375244, -1.7803587913513184, -1.7205513715744019, -1.6607438325881958, -1.6009364128112793, -1.5411288738250732, -1.4813213348388672, -1.4215137958526611, -1.3617063760757446, -1.3018988370895386, -1.242091417312622, -1.182283878326416, -1.12247633934021, -1.0626689195632935, -1.002861499786377, -0.9430540204048157, -0.8832465410232544, -0.8234390020370483, -0.7636315822601318, -0.7038240432739258, -0.6440165638923645, -0.5842090845108032, -0.5244016051292419, -0.46459412574768066, -0.4047866463661194, -0.3449791371822357, -0.28517165780067444, -0.22536417841911316, -0.1655566692352295, -0.10574918985366821, -0.045941710472106934, 0.013865776360034943, 0.07367326319217682, 0.1334807574748993, 0.19328823685646057, 0.25309571623802185, 0.3129032254219055, 0.3727107048034668, 0.4325181841850281, 0.49232566356658936, 0.5521331429481506, 0.6119406223297119, 0.671748161315918, 0.7315555810928345, 0.7913631200790405, 0.8511705994606018, 0.9109780788421631, 0.9707855582237244, 1.0305930376052856, 1.0904005765914917, 1.1502079963684082, 1.2100155353546143, 1.2698230743408203, 1.3296304941177368, 1.3894379138946533, 1.4492454528808594, 1.5090528726577759, 1.568860411643982, 1.6286678314208984, 1.6884753704071045, 1.7482829093933105, 1.808090329170227, 1.867897868156433]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 9.0, 8.0, 13.0, 24.0, 31.0, 45.0, 81.0, 96.0, 135.0, 206.0, 328.0, 492.0, 762.0, 1116.0, 1753.0, 2804.0, 4488.0, 7367.0, 11936.0, 20540.0, 36259.0, 67500.0, 133005.0, 278507.0, 600425.0, 1037957.0, 969389.0, 520258.0, 242263.0, 117210.0, 60344.0, 32393.0, 18549.0, 10894.0, 6470.0, 3895.0, 2428.0, 1514.0, 1015.0, 598.0, 393.0, 281.0, 179.0, 118.0, 79.0, 44.0, 30.0, 25.0, 13.0, 9.0, 7.0, 5.0, 2.0, 1.0], "bins": [-4.3046875, -4.184783935546875, -4.06488037109375, -3.944976806640625, -3.8250732421875, -3.705169677734375, -3.58526611328125, -3.465362548828125, -3.345458984375, -3.225555419921875, -3.10565185546875, -2.985748291015625, -2.8658447265625, -2.745941162109375, -2.62603759765625, -2.506134033203125, -2.38623046875, -2.266326904296875, -2.14642333984375, -2.026519775390625, -1.9066162109375, -1.786712646484375, -1.66680908203125, -1.546905517578125, -1.427001953125, -1.307098388671875, -1.18719482421875, -1.067291259765625, -0.9473876953125, -0.827484130859375, -0.70758056640625, -0.587677001953125, -0.4677734375, -0.347869873046875, -0.22796630859375, -0.108062744140625, 0.0118408203125, 0.131744384765625, 0.25164794921875, 0.371551513671875, 0.491455078125, 0.611358642578125, 0.73126220703125, 0.851165771484375, 0.9710693359375, 1.090972900390625, 1.21087646484375, 1.330780029296875, 1.45068359375, 1.570587158203125, 1.69049072265625, 1.810394287109375, 1.9302978515625, 2.050201416015625, 2.17010498046875, 2.290008544921875, 2.409912109375, 2.529815673828125, 2.64971923828125, 2.769622802734375, 2.8895263671875, 3.009429931640625, 3.12933349609375, 3.249237060546875, 3.369140625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 10.0, 14.0, 10.0, 10.0, 10.0, 18.0, 20.0, 20.0, 21.0, 24.0, 31.0, 20.0, 47.0, 35.0, 36.0, 38.0, 31.0, 41.0, 38.0, 47.0, 39.0, 42.0, 48.0, 36.0, 48.0, 28.0, 38.0, 34.0, 29.0, 12.0, 24.0, 7.0, 17.0, 10.0, 19.0, 10.0, 13.0, 6.0, 5.0, 6.0, 1.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-1.87890625, -1.8269805908203125, -1.775054931640625, -1.7231292724609375, -1.67120361328125, -1.6192779541015625, -1.567352294921875, -1.5154266357421875, -1.4635009765625, -1.4115753173828125, -1.359649658203125, -1.3077239990234375, -1.25579833984375, -1.2038726806640625, -1.151947021484375, -1.1000213623046875, -1.048095703125, -0.9961700439453125, -0.944244384765625, -0.8923187255859375, -0.84039306640625, -0.7884674072265625, -0.736541748046875, -0.6846160888671875, -0.6326904296875, -0.5807647705078125, -0.528839111328125, -0.4769134521484375, -0.42498779296875, -0.3730621337890625, -0.321136474609375, -0.2692108154296875, -0.21728515625, -0.1653594970703125, -0.113433837890625, -0.0615081787109375, -0.00958251953125, 0.0423431396484375, 0.094268798828125, 0.1461944580078125, 0.1981201171875, 0.2500457763671875, 0.301971435546875, 0.3538970947265625, 0.40582275390625, 0.4577484130859375, 0.509674072265625, 0.5615997314453125, 0.613525390625, 0.6654510498046875, 0.717376708984375, 0.7693023681640625, 0.82122802734375, 0.8731536865234375, 0.925079345703125, 0.9770050048828125, 1.0289306640625, 1.0808563232421875, 1.132781982421875, 1.1847076416015625, 1.23663330078125, 1.2885589599609375, 1.340484619140625, 1.3924102783203125, 1.4443359375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 7.0, 8.0, 8.0, 18.0, 27.0, 45.0, 59.0, 87.0, 145.0, 225.0, 361.0, 564.0, 861.0, 1291.0, 2038.0, 3275.0, 5463.0, 8708.0, 14303.0, 23790.0, 40590.0, 69876.0, 124796.0, 226503.0, 414431.0, 707492.0, 906769.0, 708604.0, 413161.0, 225275.0, 124499.0, 70042.0, 40275.0, 23608.0, 14370.0, 8596.0, 5232.0, 3268.0, 2005.0, 1304.0, 830.0, 520.0, 321.0, 233.0, 120.0, 98.0, 66.0, 50.0, 24.0, 19.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.484375, -3.373748779296875, -3.26312255859375, -3.152496337890625, -3.0418701171875, -2.931243896484375, -2.82061767578125, -2.709991455078125, -2.599365234375, -2.488739013671875, -2.37811279296875, -2.267486572265625, -2.1568603515625, -2.046234130859375, -1.93560791015625, -1.824981689453125, -1.71435546875, -1.603729248046875, -1.49310302734375, -1.382476806640625, -1.2718505859375, -1.161224365234375, -1.05059814453125, -0.939971923828125, -0.829345703125, -0.718719482421875, -0.60809326171875, -0.497467041015625, -0.3868408203125, -0.276214599609375, -0.16558837890625, -0.054962158203125, 0.0556640625, 0.166290283203125, 0.27691650390625, 0.387542724609375, 0.4981689453125, 0.608795166015625, 0.71942138671875, 0.830047607421875, 0.940673828125, 1.051300048828125, 1.16192626953125, 1.272552490234375, 1.3831787109375, 1.493804931640625, 1.60443115234375, 1.715057373046875, 1.82568359375, 1.936309814453125, 2.04693603515625, 2.157562255859375, 2.2681884765625, 2.378814697265625, 2.48944091796875, 2.600067138671875, 2.710693359375, 2.821319580078125, 2.93194580078125, 3.042572021484375, 3.1531982421875, 3.263824462890625, 3.37445068359375, 3.485076904296875, 3.595703125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 9.0, 12.0, 8.0, 14.0, 21.0, 25.0, 39.0, 30.0, 48.0, 45.0, 60.0, 71.0, 86.0, 99.0, 98.0, 136.0, 139.0, 166.0, 185.0, 198.0, 223.0, 236.0, 217.0, 206.0, 216.0, 205.0, 155.0, 182.0, 130.0, 126.0, 124.0, 98.0, 77.0, 69.0, 68.0, 45.0, 38.0, 37.0, 27.0, 21.0, 14.0, 13.0, 14.0, 8.0, 7.0, 10.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8623046875, -0.8345413208007812, -0.8067779541015625, -0.7790145874023438, -0.751251220703125, -0.7234878540039062, -0.6957244873046875, -0.6679611206054688, -0.64019775390625, -0.6124343872070312, -0.5846710205078125, -0.5569076538085938, -0.529144287109375, -0.5013809204101562, -0.4736175537109375, -0.44585418701171875, -0.4180908203125, -0.39032745361328125, -0.3625640869140625, -0.33480072021484375, -0.307037353515625, -0.27927398681640625, -0.2515106201171875, -0.22374725341796875, -0.19598388671875, -0.16822052001953125, -0.1404571533203125, -0.11269378662109375, -0.084930419921875, -0.05716705322265625, -0.0294036865234375, -0.00164031982421875, 0.026123046875, 0.05388641357421875, 0.0816497802734375, 0.10941314697265625, 0.137176513671875, 0.16493988037109375, 0.1927032470703125, 0.22046661376953125, 0.24822998046875, 0.27599334716796875, 0.3037567138671875, 0.33152008056640625, 0.359283447265625, 0.38704681396484375, 0.4148101806640625, 0.44257354736328125, 0.4703369140625, 0.49810028076171875, 0.5258636474609375, 0.5536270141601562, 0.581390380859375, 0.6091537475585938, 0.6369171142578125, 0.6646804809570312, 0.69244384765625, 0.7202072143554688, 0.7479705810546875, 0.7757339477539062, 0.803497314453125, 0.8312606811523438, 0.8590240478515625, 0.8867874145507812, 0.91455078125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 9.0, 4.0, 6.0, 4.0, 6.0, 13.0, 13.0, 20.0, 27.0, 26.0, 34.0, 52.0, 60.0, 64.0, 67.0, 66.0, 64.0, 71.0, 64.0, 58.0, 60.0, 34.0, 27.0, 28.0, 30.0, 16.0, 20.0, 10.0, 6.0, 7.0, 7.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.285930633544922, -4.141051292419434, -3.996171712875366, -3.851292133331299, -3.7064127922058105, -3.561533212661743, -3.416653633117676, -3.2717742919921875, -3.12689471244812, -2.9820151329040527, -2.8371357917785645, -2.692256212234497, -2.5473766326904297, -2.4024972915649414, -2.257617712020874, -2.1127381324768066, -1.9678587913513184, -1.8229793310165405, -1.6780998706817627, -1.5332202911376953, -1.3883408308029175, -1.2434613704681396, -1.0985817909240723, -0.9537023305892944, -0.8088228702545166, -0.6639434099197388, -0.5190638899803162, -0.37418439984321594, -0.22930490970611572, -0.08442544937133789, 0.06045407056808472, 0.20533359050750732, 0.35021352767944336, 0.4950930178165436, 0.6399725079536438, 0.7848520278930664, 0.9297314882278442, 1.074610948562622, 1.2194905281066895, 1.3643699884414673, 1.5092494487762451, 1.654128909111023, 1.7990083694458008, 1.9438879489898682, 2.0887675285339355, 2.233646869659424, 2.378526449203491, 2.5234060287475586, 2.668285369873047, 2.8131649494171143, 2.9580442905426025, 3.10292387008667, 3.247803211212158, 3.3926827907562256, 3.537562370300293, 3.6824417114257812, 3.8273212909698486, 3.972200870513916, 4.117080211639404, 4.261959552764893, 4.406839370727539, 4.551718711853027, 4.696598052978516, 4.841477870941162, 4.98635721206665]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 10.0, 13.0, 12.0, 11.0, 12.0, 11.0, 15.0, 21.0, 25.0, 17.0, 23.0, 26.0, 24.0, 31.0, 36.0, 32.0, 37.0, 29.0, 25.0, 37.0, 52.0, 44.0, 32.0, 37.0, 38.0, 40.0, 34.0, 36.0, 33.0, 26.0, 22.0, 23.0, 18.0, 26.0, 13.0, 18.0, 12.0, 8.0, 7.0, 7.0, 7.0, 5.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7316498756408691, -1.6734554767608643, -1.6152609586715698, -1.557066559791565, -1.4988720417022705, -1.4406776428222656, -1.3824831247329712, -1.3242887258529663, -1.2660942077636719, -1.207899808883667, -1.1497052907943726, -1.0915108919143677, -1.0333163738250732, -0.9751219749450684, -0.9169274568557739, -0.858733057975769, -0.8005385994911194, -0.7423441410064697, -0.6841496825218201, -0.6259552240371704, -0.5677607655525208, -0.5095663070678711, -0.4513718783855438, -0.39317741990089417, -0.3349829614162445, -0.27678850293159485, -0.2185940444469452, -0.16039960086345673, -0.10220514237880707, -0.044010698795318604, 0.014183759689331055, 0.07237821817398071, 0.13057267665863037, 0.18876713514328003, 0.2469615936279297, 0.30515605211257935, 0.363350510597229, 0.4215449392795563, 0.47973939776420593, 0.5379338264465332, 0.5961283445358276, 0.6543228030204773, 0.712517261505127, 0.7707117199897766, 0.8289061784744263, 0.8871005773544312, 0.9452950954437256, 1.0034894943237305, 1.0616838932037354, 1.1198782920837402, 1.1780728101730347, 1.2362672090530396, 1.294461727142334, 1.3526561260223389, 1.4108506441116333, 1.4690450429916382, 1.5272395610809326, 1.5854339599609375, 1.643628478050232, 1.7018228769302368, 1.7600173950195312, 1.8182117938995361, 1.8764063119888306, 1.9346007108688354, 1.9927952289581299]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 9.0, 18.0, 15.0, 23.0, 38.0, 75.0, 123.0, 150.0, 253.0, 431.0, 660.0, 1107.0, 1918.0, 3246.0, 6093.0, 11105.0, 20615.0, 39160.0, 73818.0, 134500.0, 211318.0, 220414.0, 147458.0, 81425.0, 43648.0, 23108.0, 12175.0, 6649.0, 3775.0, 1994.0, 1231.0, 764.0, 483.0, 260.0, 176.0, 113.0, 56.0, 46.0, 33.0, 20.0, 15.0, 12.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.32568359375, -0.3155326843261719, -0.30538177490234375, -0.2952308654785156, -0.2850799560546875, -0.2749290466308594, -0.26477813720703125, -0.2546272277832031, -0.244476318359375, -0.23432540893554688, -0.22417449951171875, -0.21402359008789062, -0.2038726806640625, -0.19372177124023438, -0.18357086181640625, -0.17341995239257812, -0.16326904296875, -0.15311813354492188, -0.14296722412109375, -0.13281631469726562, -0.1226654052734375, -0.11251449584960938, -0.10236358642578125, -0.09221267700195312, -0.082061767578125, -0.07191085815429688, -0.06175994873046875, -0.051609039306640625, -0.0414581298828125, -0.031307220458984375, -0.02115631103515625, -0.011005401611328125, -0.0008544921875, 0.009296417236328125, 0.01944732666015625, 0.029598236083984375, 0.0397491455078125, 0.049900054931640625, 0.06005096435546875, 0.07020187377929688, 0.080352783203125, 0.09050369262695312, 0.10065460205078125, 0.11080551147460938, 0.1209564208984375, 0.13110733032226562, 0.14125823974609375, 0.15140914916992188, 0.16156005859375, 0.17171096801757812, 0.18186187744140625, 0.19201278686523438, 0.2021636962890625, 0.21231460571289062, 0.22246551513671875, 0.23261642456054688, 0.242767333984375, 0.2529182434082031, 0.26306915283203125, 0.2732200622558594, 0.2833709716796875, 0.2935218811035156, 0.30367279052734375, 0.3138236999511719, 0.323974609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 4.0, 17.0, 5.0, 13.0, 9.0, 11.0, 20.0, 22.0, 19.0, 23.0, 30.0, 34.0, 33.0, 30.0, 18.0, 32.0, 33.0, 48.0, 48.0, 42.0, 51.0, 53.0, 37.0, 42.0, 41.0, 41.0, 39.0, 29.0, 32.0, 18.0, 12.0, 20.0, 17.0, 12.0, 15.0, 6.0, 12.0, 7.0, 7.0, 8.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.25, -2.1741943359375, -2.098388671875, -2.0225830078125, -1.94677734375, -1.8709716796875, -1.795166015625, -1.7193603515625, -1.6435546875, -1.5677490234375, -1.491943359375, -1.4161376953125, -1.34033203125, -1.2645263671875, -1.188720703125, -1.1129150390625, -1.037109375, -0.9613037109375, -0.885498046875, -0.8096923828125, -0.73388671875, -0.6580810546875, -0.582275390625, -0.5064697265625, -0.4306640625, -0.3548583984375, -0.279052734375, -0.2032470703125, -0.12744140625, -0.0516357421875, 0.024169921875, 0.0999755859375, 0.17578125, 0.2515869140625, 0.327392578125, 0.4031982421875, 0.47900390625, 0.5548095703125, 0.630615234375, 0.7064208984375, 0.7822265625, 0.8580322265625, 0.933837890625, 1.0096435546875, 1.08544921875, 1.1612548828125, 1.237060546875, 1.3128662109375, 1.388671875, 1.4644775390625, 1.540283203125, 1.6160888671875, 1.69189453125, 1.7677001953125, 1.843505859375, 1.9193115234375, 1.9951171875, 2.0709228515625, 2.146728515625, 2.2225341796875, 2.29833984375, 2.3741455078125, 2.449951171875, 2.5257568359375, 2.6015625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 3.0, 10.0, 9.0, 9.0, 13.0, 24.0, 39.0, 49.0, 61.0, 70.0, 110.0, 151.0, 201.0, 363.0, 497.0, 749.0, 1258.0, 2142.0, 3781.0, 7894.0, 17018.0, 47203.0, 830002.0, 93310.0, 22229.0, 9632.0, 4901.0, 2628.0, 1528.0, 882.0, 560.0, 390.0, 235.0, 169.0, 111.0, 82.0, 63.0, 36.0, 34.0, 24.0, 20.0, 22.0, 11.0, 10.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.8016128540039062, -0.7736358642578125, -0.7456588745117188, -0.717681884765625, -0.6897048950195312, -0.6617279052734375, -0.6337509155273438, -0.60577392578125, -0.5777969360351562, -0.5498199462890625, -0.5218429565429688, -0.493865966796875, -0.46588897705078125, -0.4379119873046875, -0.40993499755859375, -0.3819580078125, -0.35398101806640625, -0.3260040283203125, -0.29802703857421875, -0.270050048828125, -0.24207305908203125, -0.2140960693359375, -0.18611907958984375, -0.15814208984375, -0.13016510009765625, -0.1021881103515625, -0.07421112060546875, -0.046234130859375, -0.01825714111328125, 0.0097198486328125, 0.03769683837890625, 0.065673828125, 0.09365081787109375, 0.1216278076171875, 0.14960479736328125, 0.177581787109375, 0.20555877685546875, 0.2335357666015625, 0.26151275634765625, 0.28948974609375, 0.31746673583984375, 0.3454437255859375, 0.37342071533203125, 0.401397705078125, 0.42937469482421875, 0.4573516845703125, 0.48532867431640625, 0.5133056640625, 0.5412826538085938, 0.5692596435546875, 0.5972366333007812, 0.625213623046875, 0.6531906127929688, 0.6811676025390625, 0.7091445922851562, 0.73712158203125, 0.7650985717773438, 0.7930755615234375, 0.8210525512695312, 0.849029541015625, 0.8770065307617188, 0.9049835205078125, 0.9329605102539062, 0.9609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 9.0, 7.0, 8.0, 5.0, 10.0, 11.0, 12.0, 13.0, 13.0, 17.0, 30.0, 29.0, 16.0, 27.0, 30.0, 32.0, 30.0, 30.0, 37.0, 38.0, 34.0, 34.0, 41.0, 42.0, 48.0, 38.0, 36.0, 34.0, 28.0, 23.0, 23.0, 19.0, 23.0, 23.0, 22.0, 24.0, 15.0, 17.0, 10.0, 16.0, 11.0, 7.0, 8.0, 3.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2685546875, -1.2261810302734375, -1.183807373046875, -1.1414337158203125, -1.09906005859375, -1.0566864013671875, -1.014312744140625, -0.9719390869140625, -0.9295654296875, -0.8871917724609375, -0.844818115234375, -0.8024444580078125, -0.76007080078125, -0.7176971435546875, -0.675323486328125, -0.6329498291015625, -0.590576171875, -0.5482025146484375, -0.505828857421875, -0.4634552001953125, -0.42108154296875, -0.3787078857421875, -0.336334228515625, -0.2939605712890625, -0.2515869140625, -0.2092132568359375, -0.166839599609375, -0.1244659423828125, -0.08209228515625, -0.0397186279296875, 0.002655029296875, 0.0450286865234375, 0.08740234375, 0.1297760009765625, 0.172149658203125, 0.2145233154296875, 0.25689697265625, 0.2992706298828125, 0.341644287109375, 0.3840179443359375, 0.4263916015625, 0.4687652587890625, 0.511138916015625, 0.5535125732421875, 0.59588623046875, 0.6382598876953125, 0.680633544921875, 0.7230072021484375, 0.765380859375, 0.8077545166015625, 0.850128173828125, 0.8925018310546875, 0.93487548828125, 0.9772491455078125, 1.019622802734375, 1.0619964599609375, 1.1043701171875, 1.1467437744140625, 1.189117431640625, 1.2314910888671875, 1.27386474609375, 1.3162384033203125, 1.358612060546875, 1.4009857177734375, 1.443359375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 9.0, 12.0, 24.0, 15.0, 27.0, 46.0, 59.0, 90.0, 109.0, 210.0, 308.0, 516.0, 731.0, 1193.0, 1766.0, 2802.0, 4689.0, 7983.0, 14481.0, 28652.0, 596362.0, 328898.0, 26547.0, 13487.0, 7548.0, 4452.0, 2775.0, 1746.0, 1026.0, 689.0, 425.0, 308.0, 195.0, 127.0, 73.0, 47.0, 36.0, 31.0, 21.0, 14.0, 7.0, 12.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1768798828125, -0.17181968688964844, -0.16675949096679688, -0.1616992950439453, -0.15663909912109375, -0.1515789031982422, -0.14651870727539062, -0.14145851135253906, -0.1363983154296875, -0.13133811950683594, -0.12627792358398438, -0.12121772766113281, -0.11615753173828125, -0.11109733581542969, -0.10603713989257812, -0.10097694396972656, -0.095916748046875, -0.09085655212402344, -0.08579635620117188, -0.08073616027832031, -0.07567596435546875, -0.07061576843261719, -0.06555557250976562, -0.06049537658691406, -0.0554351806640625, -0.05037498474121094, -0.045314788818359375, -0.04025459289550781, -0.03519439697265625, -0.030134201049804688, -0.025074005126953125, -0.020013809204101562, -0.01495361328125, -0.009893417358398438, -0.004833221435546875, 0.0002269744873046875, 0.00528717041015625, 0.010347366333007812, 0.015407562255859375, 0.020467758178710938, 0.0255279541015625, 0.030588150024414062, 0.035648345947265625, 0.04070854187011719, 0.04576873779296875, 0.05082893371582031, 0.055889129638671875, 0.06094932556152344, 0.066009521484375, 0.07106971740722656, 0.07612991333007812, 0.08119010925292969, 0.08625030517578125, 0.09131050109863281, 0.09637069702148438, 0.10143089294433594, 0.1064910888671875, 0.11155128479003906, 0.11661148071289062, 0.12167167663574219, 0.12673187255859375, 0.1317920684814453, 0.13685226440429688, 0.14191246032714844, 0.14697265625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 9.0, 11.0, 17.0, 24.0, 19.0, 38.0, 33.0, 48.0, 46.0, 56.0, 52.0, 67.0, 74.0, 56.0, 63.0, 56.0, 51.0, 43.0, 32.0, 29.0, 38.0, 30.0, 13.0, 17.0, 11.0, 13.0, 0.0, 3.0, 4.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.248453140258789e-05, -3.1313858926296234e-05, -3.0143186450004578e-05, -2.897251397371292e-05, -2.7801841497421265e-05, -2.6631169021129608e-05, -2.546049654483795e-05, -2.4289824068546295e-05, -2.311915159225464e-05, -2.1948479115962982e-05, -2.0777806639671326e-05, -1.960713416337967e-05, -1.8436461687088013e-05, -1.7265789210796356e-05, -1.60951167345047e-05, -1.4924444258213043e-05, -1.3753771781921387e-05, -1.258309930562973e-05, -1.1412426829338074e-05, -1.0241754353046417e-05, -9.07108187675476e-06, -7.900409400463104e-06, -6.729736924171448e-06, -5.559064447879791e-06, -4.388391971588135e-06, -3.2177194952964783e-06, -2.0470470190048218e-06, -8.763745427131653e-07, 2.942979335784912e-07, 1.4649704098701477e-06, 2.635642886161804e-06, 3.8063153624534607e-06, 4.976987838745117e-06, 6.147660315036774e-06, 7.31833279132843e-06, 8.489005267620087e-06, 9.659677743911743e-06, 1.08303502202034e-05, 1.2001022696495056e-05, 1.3171695172786713e-05, 1.4342367649078369e-05, 1.5513040125370026e-05, 1.6683712601661682e-05, 1.785438507795334e-05, 1.9025057554244995e-05, 2.019573003053665e-05, 2.1366402506828308e-05, 2.2537074983119965e-05, 2.370774745941162e-05, 2.4878419935703278e-05, 2.6049092411994934e-05, 2.721976488828659e-05, 2.8390437364578247e-05, 2.9561109840869904e-05, 3.073178231716156e-05, 3.1902454793453217e-05, 3.307312726974487e-05, 3.424379974603653e-05, 3.5414472222328186e-05, 3.658514469861984e-05, 3.77558171749115e-05, 3.8926489651203156e-05, 4.009716212749481e-05, 4.126783460378647e-05, 4.2438507080078125e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 12.0, 29.0, 50.0, 55.0, 88.0, 168.0, 244.0, 338.0, 524.0, 938.0, 1530.0, 2553.0, 4356.0, 7806.0, 14568.0, 27175.0, 51326.0, 97521.0, 170502.0, 231786.0, 192073.0, 113840.0, 60271.0, 31694.0, 17046.0, 9338.0, 5179.0, 3035.0, 1673.0, 1027.0, 678.0, 361.0, 242.0, 156.0, 120.0, 82.0, 50.0, 40.0, 16.0, 18.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058837890625, -0.056708335876464844, -0.05457878112792969, -0.05244922637939453, -0.050319671630859375, -0.04819011688232422, -0.04606056213378906, -0.043931007385253906, -0.04180145263671875, -0.039671897888183594, -0.03754234313964844, -0.03541278839111328, -0.033283233642578125, -0.03115367889404297, -0.029024124145507812, -0.026894569396972656, -0.0247650146484375, -0.022635459899902344, -0.020505905151367188, -0.01837635040283203, -0.016246795654296875, -0.014117240905761719, -0.011987686157226562, -0.009858131408691406, -0.00772857666015625, -0.005599021911621094, -0.0034694671630859375, -0.0013399124145507812, 0.000789642333984375, 0.0029191970825195312, 0.0050487518310546875, 0.007178306579589844, 0.009307861328125, 0.011437416076660156, 0.013566970825195312, 0.01569652557373047, 0.017826080322265625, 0.01995563507080078, 0.022085189819335938, 0.024214744567871094, 0.02634429931640625, 0.028473854064941406, 0.030603408813476562, 0.03273296356201172, 0.034862518310546875, 0.03699207305908203, 0.03912162780761719, 0.041251182556152344, 0.0433807373046875, 0.045510292053222656, 0.04763984680175781, 0.04976940155029297, 0.051898956298828125, 0.05402851104736328, 0.05615806579589844, 0.058287620544433594, 0.06041717529296875, 0.0625467300415039, 0.06467628479003906, 0.06680583953857422, 0.06893539428710938, 0.07106494903564453, 0.07319450378417969, 0.07532405853271484, 0.07745361328125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 3.0, 6.0, 10.0, 9.0, 12.0, 7.0, 18.0, 27.0, 21.0, 32.0, 39.0, 27.0, 48.0, 53.0, 61.0, 61.0, 70.0, 60.0, 54.0, 56.0, 49.0, 39.0, 40.0, 31.0, 37.0, 26.0, 15.0, 13.0, 9.0, 10.0, 12.0, 7.0, 8.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0193328857421875, -0.018761157989501953, -0.018189430236816406, -0.01761770248413086, -0.017045974731445312, -0.016474246978759766, -0.01590251922607422, -0.015330791473388672, -0.014759063720703125, -0.014187335968017578, -0.013615608215332031, -0.013043880462646484, -0.012472152709960938, -0.01190042495727539, -0.011328697204589844, -0.010756969451904297, -0.01018524169921875, -0.009613513946533203, -0.009041786193847656, -0.00847005844116211, -0.007898330688476562, -0.007326602935791016, -0.006754875183105469, -0.006183147430419922, -0.005611419677734375, -0.005039691925048828, -0.004467964172363281, -0.0038962364196777344, -0.0033245086669921875, -0.0027527809143066406, -0.0021810531616210938, -0.0016093254089355469, -0.00103759765625, -0.0004658699035644531, 0.00010585784912109375, 0.0006775856018066406, 0.0012493133544921875, 0.0018210411071777344, 0.0023927688598632812, 0.002964496612548828, 0.003536224365234375, 0.004107952117919922, 0.004679679870605469, 0.005251407623291016, 0.0058231353759765625, 0.006394863128662109, 0.006966590881347656, 0.007538318634033203, 0.00811004638671875, 0.008681774139404297, 0.009253501892089844, 0.00982522964477539, 0.010396957397460938, 0.010968685150146484, 0.011540412902832031, 0.012112140655517578, 0.012683868408203125, 0.013255596160888672, 0.013827323913574219, 0.014399051666259766, 0.014970779418945312, 0.01554250717163086, 0.016114234924316406, 0.016685962677001953, 0.0172576904296875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 7.0, 1.0, 9.0, 3.0, 7.0, 4.0, 4.0, 17.0, 13.0, 21.0, 28.0, 27.0, 34.0, 51.0, 57.0, 70.0, 62.0, 64.0, 70.0, 73.0, 66.0, 61.0, 52.0, 34.0, 27.0, 28.0, 26.0, 20.0, 16.0, 9.0, 8.0, 6.0, 7.0, 8.0, 3.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.278392314910889, -4.133045196533203, -3.9876976013183594, -3.842350482940674, -3.697003126144409, -3.5516557693481445, -3.406308650970459, -3.2609612941741943, -3.1156139373779297, -2.970266580581665, -2.8249192237854004, -2.679572105407715, -2.53422474861145, -2.3888773918151855, -2.2435302734375, -2.0981829166412354, -1.9528355598449707, -1.807488203048706, -1.662140965461731, -1.5167937278747559, -1.3714463710784912, -1.2260990142822266, -1.0807517766952515, -0.9354045391082764, -0.7900571823120117, -0.6447098851203918, -0.499362587928772, -0.3540152907371521, -0.20866799354553223, -0.06332069635391235, 0.08202660083770752, 0.22737383842468262, 0.37272071838378906, 0.5180680155754089, 0.6634153127670288, 0.8087626099586487, 0.9541099071502686, 1.0994572639465332, 1.2448045015335083, 1.3901517391204834, 1.535499095916748, 1.6808464527130127, 1.8261936902999878, 1.971540927886963, 2.1168882846832275, 2.262235641479492, 2.4075827598571777, 2.5529301166534424, 2.698277473449707, 2.8436248302459717, 2.9889721870422363, 3.134319305419922, 3.2796666622161865, 3.425014019012451, 3.5703611373901367, 3.7157084941864014, 3.861055850982666, 4.006402969360352, 4.151750564575195, 4.297097682952881, 4.442444801330566, 4.58779239654541, 4.733139514923096, 4.878486633300781, 5.023834228515625]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 7.0, 10.0, 11.0, 11.0, 16.0, 8.0, 13.0, 17.0, 18.0, 25.0, 22.0, 19.0, 28.0, 26.0, 33.0, 28.0, 33.0, 37.0, 31.0, 27.0, 35.0, 54.0, 41.0, 35.0, 40.0, 30.0, 41.0, 38.0, 34.0, 30.0, 27.0, 23.0, 23.0, 18.0, 24.0, 12.0, 19.0, 11.0, 8.0, 10.0, 4.0, 9.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7050451040267944, -1.6472798585891724, -1.5895144939422607, -1.5317492485046387, -1.473983883857727, -1.416218638420105, -1.3584532737731934, -1.3006880283355713, -1.2429227828979492, -1.1851575374603271, -1.1273921728134155, -1.0696269273757935, -1.0118615627288818, -0.9540963172912598, -0.8963310122489929, -0.8385657072067261, -0.7808003425598145, -0.7230350375175476, -0.6652697324752808, -0.6075044870376587, -0.5497391223907471, -0.4919738471508026, -0.43420857191085815, -0.3764432668685913, -0.31867796182632446, -0.2609126567840576, -0.20314736664295197, -0.1453820765018463, -0.08761677145957947, -0.029851466417312622, 0.027913808822631836, 0.08567911386489868, 0.14344441890716553, 0.20120972394943237, 0.2589750289916992, 0.3167403042316437, 0.3745056092739105, 0.43227091431617737, 0.4900361895561218, 0.5478014945983887, 0.6055667996406555, 0.6633321046829224, 0.7210974097251892, 0.778862714767456, 0.8366279602050781, 0.8943933248519897, 0.9521585702896118, 1.0099239349365234, 1.0676891803741455, 1.1254544258117676, 1.1832197904586792, 1.2409850358963013, 1.298750400543213, 1.356515645980835, 1.414280891418457, 1.4720462560653687, 1.5298116207122803, 1.5875768661499023, 1.645342230796814, 1.703107476234436, 1.7608728408813477, 1.8186380863189697, 1.8764033317565918, 1.9341686964035034, 1.9919339418411255]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 10.0, 11.0, 20.0, 20.0, 42.0, 77.0, 98.0, 128.0, 218.0, 349.0, 585.0, 975.0, 1551.0, 2663.0, 4779.0, 8291.0, 14726.0, 26864.0, 48478.0, 82217.0, 130019.0, 174190.0, 180841.0, 144901.0, 96157.0, 57218.0, 31781.0, 18156.0, 9759.0, 5586.0, 3123.0, 1839.0, 1040.0, 675.0, 428.0, 264.0, 179.0, 106.0, 79.0, 32.0, 18.0, 24.0, 12.0, 10.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.412353515625, -2.32666015625, -2.240966796875, -2.1552734375, -2.069580078125, -1.98388671875, -1.898193359375, -1.8125, -1.726806640625, -1.64111328125, -1.555419921875, -1.4697265625, -1.384033203125, -1.29833984375, -1.212646484375, -1.126953125, -1.041259765625, -0.95556640625, -0.869873046875, -0.7841796875, -0.698486328125, -0.61279296875, -0.527099609375, -0.44140625, -0.355712890625, -0.27001953125, -0.184326171875, -0.0986328125, -0.012939453125, 0.07275390625, 0.158447265625, 0.244140625, 0.329833984375, 0.41552734375, 0.501220703125, 0.5869140625, 0.672607421875, 0.75830078125, 0.843994140625, 0.9296875, 1.015380859375, 1.10107421875, 1.186767578125, 1.2724609375, 1.358154296875, 1.44384765625, 1.529541015625, 1.615234375, 1.700927734375, 1.78662109375, 1.872314453125, 1.9580078125, 2.043701171875, 2.12939453125, 2.215087890625, 2.30078125, 2.386474609375, 2.47216796875, 2.557861328125, 2.6435546875, 2.729248046875, 2.81494140625, 2.900634765625, 2.986328125]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 4.0, 5.0, 13.0, 6.0, 16.0, 13.0, 17.0, 26.0, 24.0, 15.0, 14.0, 27.0, 22.0, 29.0, 26.0, 36.0, 29.0, 39.0, 33.0, 33.0, 33.0, 30.0, 40.0, 45.0, 43.0, 40.0, 37.0, 35.0, 35.0, 31.0, 30.0, 18.0, 27.0, 23.0, 19.0, 17.0, 7.0, 13.0, 15.0, 10.0, 3.0, 4.0, 8.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.09765625, -2.0311279296875, -1.964599609375, -1.8980712890625, -1.83154296875, -1.7650146484375, -1.698486328125, -1.6319580078125, -1.5654296875, -1.4989013671875, -1.432373046875, -1.3658447265625, -1.29931640625, -1.2327880859375, -1.166259765625, -1.0997314453125, -1.033203125, -0.9666748046875, -0.900146484375, -0.8336181640625, -0.76708984375, -0.7005615234375, -0.634033203125, -0.5675048828125, -0.5009765625, -0.4344482421875, -0.367919921875, -0.3013916015625, -0.23486328125, -0.1683349609375, -0.101806640625, -0.0352783203125, 0.03125, 0.0977783203125, 0.164306640625, 0.2308349609375, 0.29736328125, 0.3638916015625, 0.430419921875, 0.4969482421875, 0.5634765625, 0.6300048828125, 0.696533203125, 0.7630615234375, 0.82958984375, 0.8961181640625, 0.962646484375, 1.0291748046875, 1.095703125, 1.1622314453125, 1.228759765625, 1.2952880859375, 1.36181640625, 1.4283447265625, 1.494873046875, 1.5614013671875, 1.6279296875, 1.6944580078125, 1.760986328125, 1.8275146484375, 1.89404296875, 1.9605712890625, 2.027099609375, 2.0936279296875, 2.16015625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 7.0, 8.0, 15.0, 18.0, 46.0, 42.0, 68.0, 98.0, 179.0, 226.0, 350.0, 587.0, 903.0, 1424.0, 2294.0, 3856.0, 6355.0, 10891.0, 18187.0, 30565.0, 49960.0, 79273.0, 115614.0, 149237.0, 159552.0, 139697.0, 103913.0, 68673.0, 42416.0, 25448.0, 15387.0, 8994.0, 5552.0, 3264.0, 1986.0, 1254.0, 737.0, 485.0, 335.0, 210.0, 140.0, 96.0, 62.0, 50.0, 34.0, 18.0, 10.0, 16.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.443359375, -2.365386962890625, -2.28741455078125, -2.209442138671875, -2.1314697265625, -2.053497314453125, -1.97552490234375, -1.897552490234375, -1.819580078125, -1.741607666015625, -1.66363525390625, -1.585662841796875, -1.5076904296875, -1.429718017578125, -1.35174560546875, -1.273773193359375, -1.19580078125, -1.117828369140625, -1.03985595703125, -0.961883544921875, -0.8839111328125, -0.805938720703125, -0.72796630859375, -0.649993896484375, -0.572021484375, -0.494049072265625, -0.41607666015625, -0.338104248046875, -0.2601318359375, -0.182159423828125, -0.10418701171875, -0.026214599609375, 0.0517578125, 0.129730224609375, 0.20770263671875, 0.285675048828125, 0.3636474609375, 0.441619873046875, 0.51959228515625, 0.597564697265625, 0.675537109375, 0.753509521484375, 0.83148193359375, 0.909454345703125, 0.9874267578125, 1.065399169921875, 1.14337158203125, 1.221343994140625, 1.29931640625, 1.377288818359375, 1.45526123046875, 1.533233642578125, 1.6112060546875, 1.689178466796875, 1.76715087890625, 1.845123291015625, 1.923095703125, 2.001068115234375, 2.07904052734375, 2.157012939453125, 2.2349853515625, 2.312957763671875, 2.39093017578125, 2.468902587890625, 2.546875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 6.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 6.0, 13.0, 14.0, 14.0, 19.0, 22.0, 18.0, 22.0, 28.0, 17.0, 16.0, 23.0, 30.0, 30.0, 42.0, 32.0, 45.0, 34.0, 24.0, 37.0, 41.0, 39.0, 45.0, 37.0, 29.0, 51.0, 32.0, 34.0, 21.0, 21.0, 19.0, 17.0, 13.0, 16.0, 13.0, 15.0, 10.0, 7.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2705078125, -1.2288055419921875, -1.187103271484375, -1.1454010009765625, -1.10369873046875, -1.0619964599609375, -1.020294189453125, -0.9785919189453125, -0.9368896484375, -0.8951873779296875, -0.853485107421875, -0.8117828369140625, -0.77008056640625, -0.7283782958984375, -0.686676025390625, -0.6449737548828125, -0.603271484375, -0.5615692138671875, -0.519866943359375, -0.4781646728515625, -0.43646240234375, -0.3947601318359375, -0.353057861328125, -0.3113555908203125, -0.2696533203125, -0.2279510498046875, -0.186248779296875, -0.1445465087890625, -0.10284423828125, -0.0611419677734375, -0.019439697265625, 0.0222625732421875, 0.06396484375, 0.1056671142578125, 0.147369384765625, 0.1890716552734375, 0.23077392578125, 0.2724761962890625, 0.314178466796875, 0.3558807373046875, 0.3975830078125, 0.4392852783203125, 0.480987548828125, 0.5226898193359375, 0.56439208984375, 0.6060943603515625, 0.647796630859375, 0.6894989013671875, 0.731201171875, 0.7729034423828125, 0.814605712890625, 0.8563079833984375, 0.89801025390625, 0.9397125244140625, 0.981414794921875, 1.0231170654296875, 1.0648193359375, 1.1065216064453125, 1.148223876953125, 1.1899261474609375, 1.23162841796875, 1.2733306884765625, 1.315032958984375, 1.3567352294921875, 1.3984375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 6.0, 4.0, 15.0, 12.0, 16.0, 18.0, 34.0, 52.0, 95.0, 112.0, 180.0, 260.0, 425.0, 645.0, 1055.0, 1622.0, 2684.0, 4336.0, 7315.0, 12311.0, 21421.0, 38694.0, 68384.0, 118096.0, 177524.0, 201459.0, 158868.0, 99524.0, 56996.0, 31973.0, 18074.0, 10507.0, 6053.0, 3822.0, 2150.0, 1345.0, 907.0, 549.0, 307.0, 249.0, 162.0, 103.0, 63.0, 35.0, 33.0, 24.0, 14.0, 10.0, 11.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3408203125, -1.2935028076171875, -1.246185302734375, -1.1988677978515625, -1.15155029296875, -1.1042327880859375, -1.056915283203125, -1.0095977783203125, -0.9622802734375, -0.9149627685546875, -0.867645263671875, -0.8203277587890625, -0.77301025390625, -0.7256927490234375, -0.678375244140625, -0.6310577392578125, -0.583740234375, -0.5364227294921875, -0.489105224609375, -0.4417877197265625, -0.39447021484375, -0.3471527099609375, -0.299835205078125, -0.2525177001953125, -0.2052001953125, -0.1578826904296875, -0.110565185546875, -0.0632476806640625, -0.01593017578125, 0.0313873291015625, 0.078704833984375, 0.1260223388671875, 0.17333984375, 0.2206573486328125, 0.267974853515625, 0.3152923583984375, 0.36260986328125, 0.4099273681640625, 0.457244873046875, 0.5045623779296875, 0.5518798828125, 0.5991973876953125, 0.646514892578125, 0.6938323974609375, 0.74114990234375, 0.7884674072265625, 0.835784912109375, 0.8831024169921875, 0.930419921875, 0.9777374267578125, 1.025054931640625, 1.0723724365234375, 1.11968994140625, 1.1670074462890625, 1.214324951171875, 1.2616424560546875, 1.3089599609375, 1.3562774658203125, 1.403594970703125, 1.4509124755859375, 1.49822998046875, 1.5455474853515625, 1.592864990234375, 1.6401824951171875, 1.6875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 10.0, 17.0, 16.0, 20.0, 28.0, 40.0, 36.0, 47.0, 67.0, 83.0, 69.0, 79.0, 76.0, 71.0, 69.0, 49.0, 51.0, 35.0, 27.0, 27.0, 11.0, 18.0, 10.0, 10.0, 5.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017762184143066406, -0.00017231516540050507, -0.00016700848937034607, -0.00016170181334018707, -0.00015639513731002808, -0.00015108846127986908, -0.00014578178524971008, -0.00014047510921955109, -0.0001351684331893921, -0.0001298617571592331, -0.0001245550811290741, -0.0001192484050989151, -0.0001139417290687561, -0.00010863505303859711, -0.00010332837700843811, -9.802170097827911e-05, -9.271502494812012e-05, -8.740834891796112e-05, -8.210167288780212e-05, -7.679499685764313e-05, -7.148832082748413e-05, -6.618164479732513e-05, -6.087496876716614e-05, -5.556829273700714e-05, -5.0261616706848145e-05, -4.495494067668915e-05, -3.964826464653015e-05, -3.4341588616371155e-05, -2.9034912586212158e-05, -2.372823655605316e-05, -1.8421560525894165e-05, -1.3114884495735168e-05, -7.808208465576172e-06, -2.5015324354171753e-06, 2.8051435947418213e-06, 8.111819624900818e-06, 1.3418495655059814e-05, 1.872517168521881e-05, 2.4031847715377808e-05, 2.9338523745536804e-05, 3.46451997756958e-05, 3.99518758058548e-05, 4.5258551836013794e-05, 5.056522786617279e-05, 5.587190389633179e-05, 6.117857992649078e-05, 6.648525595664978e-05, 7.179193198680878e-05, 7.709860801696777e-05, 8.240528404712677e-05, 8.771196007728577e-05, 9.301863610744476e-05, 9.832531213760376e-05, 0.00010363198816776276, 0.00010893866419792175, 0.00011424534022808075, 0.00011955201625823975, 0.00012485869228839874, 0.00013016536831855774, 0.00013547204434871674, 0.00014077872037887573, 0.00014608539640903473, 0.00015139207243919373, 0.00015669874846935272, 0.00016200542449951172]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 5.0, 9.0, 17.0, 30.0, 50.0, 66.0, 84.0, 142.0, 216.0, 305.0, 439.0, 595.0, 956.0, 1435.0, 2398.0, 3601.0, 5798.0, 9505.0, 15782.0, 26081.0, 44170.0, 73606.0, 115551.0, 160099.0, 175035.0, 148360.0, 103196.0, 64003.0, 37971.0, 22636.0, 13627.0, 8365.0, 5224.0, 3295.0, 2029.0, 1322.0, 851.0, 585.0, 334.0, 289.0, 146.0, 115.0, 77.0, 39.0, 28.0, 29.0, 15.0, 13.0, 11.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.3056640625, -1.2665252685546875, -1.227386474609375, -1.1882476806640625, -1.14910888671875, -1.1099700927734375, -1.070831298828125, -1.0316925048828125, -0.9925537109375, -0.9534149169921875, -0.914276123046875, -0.8751373291015625, -0.83599853515625, -0.7968597412109375, -0.757720947265625, -0.7185821533203125, -0.679443359375, -0.6403045654296875, -0.601165771484375, -0.5620269775390625, -0.52288818359375, -0.4837493896484375, -0.444610595703125, -0.4054718017578125, -0.3663330078125, -0.3271942138671875, -0.288055419921875, -0.2489166259765625, -0.20977783203125, -0.1706390380859375, -0.131500244140625, -0.0923614501953125, -0.05322265625, -0.0140838623046875, 0.025054931640625, 0.0641937255859375, 0.10333251953125, 0.1424713134765625, 0.181610107421875, 0.2207489013671875, 0.2598876953125, 0.2990264892578125, 0.338165283203125, 0.3773040771484375, 0.41644287109375, 0.4555816650390625, 0.494720458984375, 0.5338592529296875, 0.572998046875, 0.6121368408203125, 0.651275634765625, 0.6904144287109375, 0.72955322265625, 0.7686920166015625, 0.807830810546875, 0.8469696044921875, 0.8861083984375, 0.9252471923828125, 0.964385986328125, 1.0035247802734375, 1.04266357421875, 1.0818023681640625, 1.120941162109375, 1.1600799560546875, 1.19921875]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 8.0, 3.0, 5.0, 9.0, 16.0, 24.0, 17.0, 20.0, 42.0, 36.0, 49.0, 52.0, 55.0, 57.0, 72.0, 55.0, 66.0, 74.0, 51.0, 50.0, 39.0, 44.0, 26.0, 22.0, 23.0, 25.0, 17.0, 8.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2727622985839844, -0.26061248779296875, -0.24846267700195312, -0.2363128662109375, -0.22416305541992188, -0.21201324462890625, -0.19986343383789062, -0.187713623046875, -0.17556381225585938, -0.16341400146484375, -0.15126419067382812, -0.1391143798828125, -0.12696456909179688, -0.11481475830078125, -0.10266494750976562, -0.09051513671875, -0.07836532592773438, -0.06621551513671875, -0.054065704345703125, -0.0419158935546875, -0.029766082763671875, -0.01761627197265625, -0.005466461181640625, 0.006683349609375, 0.018833160400390625, 0.03098297119140625, 0.043132781982421875, 0.0552825927734375, 0.06743240356445312, 0.07958221435546875, 0.09173202514648438, 0.1038818359375, 0.11603164672851562, 0.12818145751953125, 0.14033126831054688, 0.1524810791015625, 0.16463088989257812, 0.17678070068359375, 0.18893051147460938, 0.201080322265625, 0.21323013305664062, 0.22537994384765625, 0.23752975463867188, 0.2496795654296875, 0.2618293762207031, 0.27397918701171875, 0.2861289978027344, 0.29827880859375, 0.3104286193847656, 0.32257843017578125, 0.3347282409667969, 0.3468780517578125, 0.3590278625488281, 0.37117767333984375, 0.3833274841308594, 0.395477294921875, 0.4076271057128906, 0.41977691650390625, 0.4319267272949219, 0.4440765380859375, 0.4562263488769531, 0.46837615966796875, 0.4805259704589844, 0.49267578125]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 9.0, 9.0, 16.0, 18.0, 29.0, 26.0, 33.0, 43.0, 46.0, 64.0, 60.0, 61.0, 64.0, 71.0, 64.0, 72.0, 57.0, 47.0, 37.0, 28.0, 17.0, 29.0, 24.0, 11.0, 9.0, 4.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-4.868194103240967, -4.724942207336426, -4.581690311431885, -4.438438415527344, -4.2951860427856445, -4.1519341468811035, -4.0086822509765625, -3.8654303550720215, -3.7221784591674805, -3.5789265632629395, -3.4356744289398193, -3.2924225330352783, -3.1491706371307373, -3.005918502807617, -2.862666606903076, -2.719414710998535, -2.576162576675415, -2.432910680770874, -2.289658546447754, -2.146406650543213, -2.003154754638672, -1.8599027395248413, -1.7166507244110107, -1.5733988285064697, -1.4301468133926392, -1.2868947982788086, -1.1436429023742676, -1.000390887260437, -0.8571389317512512, -0.7138869762420654, -0.5706349611282349, -0.42738306522369385, -0.2841310501098633, -0.1408790796995163, 0.0023728907108306885, 0.14562487602233887, 0.28887683153152466, 0.43212878704071045, 0.575380802154541, 0.718632698059082, 0.8618847131729126, 1.0051367282867432, 1.1483886241912842, 1.2916406393051147, 1.4348926544189453, 1.5781445503234863, 1.721396565437317, 1.864648461341858, 2.0079004764556885, 2.1511523723602295, 2.2944045066833496, 2.4376564025878906, 2.5809082984924316, 2.7241601943969727, 2.8674123287200928, 3.010664224624634, 3.153916358947754, 3.297168254852295, 3.440420389175415, 3.583672285079956, 3.726924180984497, 3.870176315307617, 4.013428211212158, 4.156680107116699, 4.29993200302124]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 5.0, 7.0, 6.0, 12.0, 11.0, 12.0, 16.0, 12.0, 18.0, 27.0, 19.0, 14.0, 22.0, 22.0, 36.0, 39.0, 24.0, 26.0, 36.0, 34.0, 46.0, 41.0, 39.0, 47.0, 36.0, 36.0, 38.0, 37.0, 27.0, 31.0, 37.0, 25.0, 26.0, 24.0, 21.0, 16.0, 10.0, 14.0, 7.0, 8.0, 13.0, 5.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.992197871208191, -1.9318187236785889, -1.8714396953582764, -1.8110605478286743, -1.7506814002990723, -1.6903023719787598, -1.6299232244491577, -1.5695440769195557, -1.5091650485992432, -1.4487859010696411, -1.3884068727493286, -1.3280277252197266, -1.2676485776901245, -1.2072694301605225, -1.14689040184021, -1.086511254310608, -1.0261321067810059, -0.9657530188560486, -0.9053738713264465, -0.8449947834014893, -0.7846156358718872, -0.7242365479469299, -0.6638574600219727, -0.6034783124923706, -0.5430992245674133, -0.48272010684013367, -0.422340989112854, -0.36196190118789673, -0.30158278346061707, -0.2412036657333374, -0.18082457780838013, -0.12044546008110046, -0.06006622314453125, 0.00031288713216781616, 0.06069199740886688, 0.12107110023498535, 0.18145021796226501, 0.24182933568954468, 0.30220842361450195, 0.3625875413417816, 0.4229666590690613, 0.48334577679634094, 0.5437248945236206, 0.6041039824485779, 0.6644830703735352, 0.7248622179031372, 0.7852413058280945, 0.8456203937530518, 0.9059995412826538, 0.9663786292076111, 1.0267577171325684, 1.0871368646621704, 1.1475160121917725, 1.207895040512085, 1.268274188041687, 1.328653335571289, 1.3890323638916016, 1.4494115114212036, 1.5097905397415161, 1.5701696872711182, 1.6305488348007202, 1.6909279823303223, 1.7513070106506348, 1.8116861581802368, 1.8720653057098389]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 12.0, 17.0, 18.0, 22.0, 43.0, 74.0, 133.0, 199.0, 298.0, 498.0, 832.0, 1419.0, 2618.0, 4620.0, 8675.0, 16585.0, 34867.0, 79247.0, 198938.0, 562609.0, 1347464.0, 1192420.0, 452143.0, 162392.0, 66632.0, 30030.0, 14683.0, 7471.0, 3989.0, 2204.0, 1272.0, 765.0, 438.0, 247.0, 158.0, 101.0, 58.0, 33.0, 26.0, 10.0, 11.0, 9.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.64776611328125, -4.4869384765625, -4.32611083984375, -4.165283203125, -4.00445556640625, -3.8436279296875, -3.68280029296875, -3.52197265625, -3.36114501953125, -3.2003173828125, -3.03948974609375, -2.878662109375, -2.71783447265625, -2.5570068359375, -2.39617919921875, -2.2353515625, -2.07452392578125, -1.9136962890625, -1.75286865234375, -1.592041015625, -1.43121337890625, -1.2703857421875, -1.10955810546875, -0.94873046875, -0.78790283203125, -0.6270751953125, -0.46624755859375, -0.305419921875, -0.14459228515625, 0.0162353515625, 0.17706298828125, 0.337890625, 0.49871826171875, 0.6595458984375, 0.82037353515625, 0.981201171875, 1.14202880859375, 1.3028564453125, 1.46368408203125, 1.62451171875, 1.78533935546875, 1.9461669921875, 2.10699462890625, 2.267822265625, 2.42864990234375, 2.5894775390625, 2.75030517578125, 2.9111328125, 3.07196044921875, 3.2327880859375, 3.39361572265625, 3.554443359375, 3.71527099609375, 3.8760986328125, 4.03692626953125, 4.19775390625, 4.35858154296875, 4.5194091796875, 4.68023681640625, 4.841064453125, 5.00189208984375, 5.1627197265625, 5.32354736328125, 5.484375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 8.0, 7.0, 13.0, 9.0, 19.0, 17.0, 20.0, 17.0, 11.0, 31.0, 20.0, 38.0, 29.0, 34.0, 44.0, 41.0, 42.0, 38.0, 41.0, 48.0, 35.0, 40.0, 36.0, 49.0, 30.0, 41.0, 32.0, 34.0, 22.0, 30.0, 18.0, 24.0, 15.0, 13.0, 8.0, 11.0, 10.0, 8.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.8583984375, -1.8057098388671875, -1.753021240234375, -1.7003326416015625, -1.64764404296875, -1.5949554443359375, -1.542266845703125, -1.4895782470703125, -1.4368896484375, -1.3842010498046875, -1.331512451171875, -1.2788238525390625, -1.22613525390625, -1.1734466552734375, -1.120758056640625, -1.0680694580078125, -1.015380859375, -0.9626922607421875, -0.910003662109375, -0.8573150634765625, -0.80462646484375, -0.7519378662109375, -0.699249267578125, -0.6465606689453125, -0.5938720703125, -0.5411834716796875, -0.488494873046875, -0.4358062744140625, -0.38311767578125, -0.3304290771484375, -0.277740478515625, -0.2250518798828125, -0.17236328125, -0.1196746826171875, -0.066986083984375, -0.0142974853515625, 0.03839111328125, 0.0910797119140625, 0.143768310546875, 0.1964569091796875, 0.2491455078125, 0.3018341064453125, 0.354522705078125, 0.4072113037109375, 0.45989990234375, 0.5125885009765625, 0.565277099609375, 0.6179656982421875, 0.670654296875, 0.7233428955078125, 0.776031494140625, 0.8287200927734375, 0.88140869140625, 0.9340972900390625, 0.986785888671875, 1.0394744873046875, 1.0921630859375, 1.1448516845703125, 1.197540283203125, 1.2502288818359375, 1.30291748046875, 1.3556060791015625, 1.408294677734375, 1.4609832763671875, 1.513671875]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 8.0, 15.0, 20.0, 31.0, 33.0, 54.0, 86.0, 126.0, 180.0, 296.0, 420.0, 613.0, 970.0, 1446.0, 2363.0, 4023.0, 6676.0, 11517.0, 20180.0, 37937.0, 72101.0, 141521.0, 287879.0, 578844.0, 980187.0, 950174.0, 543755.0, 269077.0, 133547.0, 67561.0, 35751.0, 19595.0, 10842.0, 6314.0, 3635.0, 2349.0, 1418.0, 925.0, 592.0, 385.0, 253.0, 174.0, 123.0, 86.0, 62.0, 34.0, 24.0, 20.0, 16.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-4.07421875, -3.94671630859375, -3.8192138671875, -3.69171142578125, -3.564208984375, -3.43670654296875, -3.3092041015625, -3.18170166015625, -3.05419921875, -2.92669677734375, -2.7991943359375, -2.67169189453125, -2.544189453125, -2.41668701171875, -2.2891845703125, -2.16168212890625, -2.0341796875, -1.90667724609375, -1.7791748046875, -1.65167236328125, -1.524169921875, -1.39666748046875, -1.2691650390625, -1.14166259765625, -1.01416015625, -0.88665771484375, -0.7591552734375, -0.63165283203125, -0.504150390625, -0.37664794921875, -0.2491455078125, -0.12164306640625, 0.005859375, 0.13336181640625, 0.2608642578125, 0.38836669921875, 0.515869140625, 0.64337158203125, 0.7708740234375, 0.89837646484375, 1.02587890625, 1.15338134765625, 1.2808837890625, 1.40838623046875, 1.535888671875, 1.66339111328125, 1.7908935546875, 1.91839599609375, 2.0458984375, 2.17340087890625, 2.3009033203125, 2.42840576171875, 2.555908203125, 2.68341064453125, 2.8109130859375, 2.93841552734375, 3.06591796875, 3.19342041015625, 3.3209228515625, 3.44842529296875, 3.575927734375, 3.70343017578125, 3.8309326171875, 3.95843505859375, 4.0859375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 7.0, 11.0, 7.0, 10.0, 12.0, 16.0, 25.0, 24.0, 51.0, 51.0, 73.0, 68.0, 77.0, 107.0, 114.0, 135.0, 164.0, 200.0, 215.0, 219.0, 247.0, 272.0, 272.0, 241.0, 227.0, 205.0, 181.0, 159.0, 144.0, 105.0, 98.0, 61.0, 51.0, 47.0, 42.0, 36.0, 27.0, 12.0, 15.0, 13.0, 12.0, 9.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91748046875, -0.8853073120117188, -0.8531341552734375, -0.8209609985351562, -0.788787841796875, -0.7566146850585938, -0.7244415283203125, -0.6922683715820312, -0.66009521484375, -0.6279220581054688, -0.5957489013671875, -0.5635757446289062, -0.531402587890625, -0.49922943115234375, -0.4670562744140625, -0.43488311767578125, -0.4027099609375, -0.37053680419921875, -0.3383636474609375, -0.30619049072265625, -0.274017333984375, -0.24184417724609375, -0.2096710205078125, -0.17749786376953125, -0.14532470703125, -0.11315155029296875, -0.0809783935546875, -0.04880523681640625, -0.016632080078125, 0.01554107666015625, 0.0477142333984375, 0.07988739013671875, 0.112060546875, 0.14423370361328125, 0.1764068603515625, 0.20858001708984375, 0.240753173828125, 0.27292633056640625, 0.3050994873046875, 0.33727264404296875, 0.36944580078125, 0.40161895751953125, 0.4337921142578125, 0.46596527099609375, 0.498138427734375, 0.5303115844726562, 0.5624847412109375, 0.5946578979492188, 0.6268310546875, 0.6590042114257812, 0.6911773681640625, 0.7233505249023438, 0.755523681640625, 0.7876968383789062, 0.8198699951171875, 0.8520431518554688, 0.88421630859375, 0.9163894653320312, 0.9485626220703125, 0.9807357788085938, 1.012908935546875, 1.0450820922851562, 1.0772552490234375, 1.1094284057617188, 1.1416015625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 6.0, 7.0, 11.0, 14.0, 18.0, 26.0, 41.0, 37.0, 50.0, 53.0, 86.0, 95.0, 67.0, 86.0, 84.0, 51.0, 59.0, 59.0, 33.0, 25.0, 19.0, 16.0, 13.0, 12.0, 6.0, 3.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.172397613525391, -6.000027179718018, -5.8276567459106445, -5.655285835266113, -5.48291540145874, -5.310544967651367, -5.138174533843994, -4.965804100036621, -4.79343318939209, -4.621062755584717, -4.448692321777344, -4.2763214111328125, -4.1039509773254395, -3.9315805435180664, -3.7592101097106934, -3.5868396759033203, -3.4144692420959473, -3.242098808288574, -3.069728136062622, -2.897357702255249, -2.724987030029297, -2.552616596221924, -2.380246162414551, -2.2078757286071777, -2.0355050563812256, -1.863134503364563, -1.6907639503479004, -1.5183935165405273, -1.3460229635238647, -1.1736524105072021, -1.001281976699829, -0.8289114236831665, -0.6565403938293457, -0.4841698706150055, -0.3117993474006653, -0.13942885398864746, 0.03294169902801514, 0.20531225204467773, 0.3776826858520508, 0.5500532388687134, 0.722423791885376, 0.8947943449020386, 1.0671648979187012, 1.2395353317260742, 1.4119058847427368, 1.5842764377593994, 1.7566468715667725, 1.929017424583435, 2.1013879776000977, 2.2737584114074707, 2.446129083633423, 2.618499517440796, 2.790870189666748, 2.963240623474121, 3.135611057281494, 3.307981491088867, 3.4803521633148193, 3.6527225971221924, 3.8250932693481445, 3.9974637031555176, 4.169834136962891, 4.342205047607422, 4.514575004577637, 4.686945915222168, 4.859316349029541]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 12.0, 10.0, 5.0, 16.0, 14.0, 19.0, 24.0, 11.0, 20.0, 18.0, 19.0, 20.0, 33.0, 30.0, 33.0, 32.0, 34.0, 28.0, 40.0, 35.0, 31.0, 40.0, 42.0, 44.0, 33.0, 25.0, 30.0, 35.0, 24.0, 21.0, 30.0, 26.0, 25.0, 26.0, 11.0, 11.0, 11.0, 8.0, 10.0, 9.0, 2.0, 8.0, 11.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.6643472909927368, -1.6124193668365479, -1.5604914426803589, -1.50856351852417, -1.4566354751586914, -1.4047075510025024, -1.3527796268463135, -1.3008517026901245, -1.2489237785339355, -1.1969958543777466, -1.1450679302215576, -1.093139886856079, -1.0412119626998901, -0.9892840385437012, -0.9373561143875122, -0.8854281902313232, -0.8335001468658447, -0.7815722227096558, -0.729644238948822, -0.6777163147926331, -0.6257883310317993, -0.5738604068756104, -0.5219324827194214, -0.47000452876091003, -0.4180765748023987, -0.36614862084388733, -0.314220666885376, -0.262292742729187, -0.21036478877067566, -0.1584368348121643, -0.10650891065597534, -0.05458095669746399, -0.0026531219482421875, 0.04927482455968857, 0.10120277106761932, 0.15313071012496948, 0.20505866408348083, 0.2569866180419922, 0.30891454219818115, 0.3608424961566925, 0.41277045011520386, 0.4646984040737152, 0.5166263580322266, 0.5685542821884155, 0.6204822063446045, 0.6724101901054382, 0.7243381142616272, 0.7762660980224609, 0.8281940221786499, 0.8801219463348389, 0.9320499300956726, 0.9839778542518616, 1.0359058380126953, 1.0878337621688843, 1.1397616863250732, 1.1916896104812622, 1.2436175346374512, 1.2955454587936401, 1.347473382949829, 1.3994014263153076, 1.4513293504714966, 1.5032572746276855, 1.5551851987838745, 1.6071131229400635, 1.659041166305542]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 6.0, 22.0, 31.0, 37.0, 36.0, 70.0, 101.0, 195.0, 276.0, 458.0, 765.0, 1103.0, 1784.0, 2949.0, 4554.0, 7714.0, 12976.0, 22532.0, 39025.0, 68688.0, 119159.0, 180762.0, 204086.0, 156394.0, 94745.0, 54244.0, 31093.0, 17896.0, 10541.0, 6200.0, 3717.0, 2431.0, 1392.0, 928.0, 577.0, 410.0, 250.0, 128.0, 94.0, 58.0, 46.0, 23.0, 20.0, 15.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2666015625, -0.25749969482421875, -0.2483978271484375, -0.23929595947265625, -0.230194091796875, -0.22109222412109375, -0.2119903564453125, -0.20288848876953125, -0.19378662109375, -0.18468475341796875, -0.1755828857421875, -0.16648101806640625, -0.157379150390625, -0.14827728271484375, -0.1391754150390625, -0.13007354736328125, -0.1209716796875, -0.11186981201171875, -0.1027679443359375, -0.09366607666015625, -0.084564208984375, -0.07546234130859375, -0.0663604736328125, -0.05725860595703125, -0.04815673828125, -0.03905487060546875, -0.0299530029296875, -0.02085113525390625, -0.011749267578125, -0.00264739990234375, 0.0064544677734375, 0.01555633544921875, 0.024658203125, 0.03376007080078125, 0.0428619384765625, 0.05196380615234375, 0.061065673828125, 0.07016754150390625, 0.0792694091796875, 0.08837127685546875, 0.09747314453125, 0.10657501220703125, 0.1156768798828125, 0.12477874755859375, 0.133880615234375, 0.14298248291015625, 0.1520843505859375, 0.16118621826171875, 0.1702880859375, 0.17938995361328125, 0.1884918212890625, 0.19759368896484375, 0.206695556640625, 0.21579742431640625, 0.2248992919921875, 0.23400115966796875, 0.24310302734375, 0.25220489501953125, 0.2613067626953125, 0.27040863037109375, 0.279510498046875, 0.28861236572265625, 0.2977142333984375, 0.30681610107421875, 0.31591796875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 2.0, 8.0, 10.0, 12.0, 14.0, 10.0, 15.0, 19.0, 16.0, 22.0, 31.0, 23.0, 37.0, 47.0, 32.0, 45.0, 39.0, 44.0, 33.0, 32.0, 47.0, 55.0, 47.0, 36.0, 38.0, 40.0, 30.0, 33.0, 25.0, 32.0, 20.0, 23.0, 13.0, 9.0, 17.0, 7.0, 11.0, 5.0, 7.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.087554931640625, -2.01495361328125, -1.942352294921875, -1.8697509765625, -1.797149658203125, -1.72454833984375, -1.651947021484375, -1.579345703125, -1.506744384765625, -1.43414306640625, -1.361541748046875, -1.2889404296875, -1.216339111328125, -1.14373779296875, -1.071136474609375, -0.99853515625, -0.925933837890625, -0.85333251953125, -0.780731201171875, -0.7081298828125, -0.635528564453125, -0.56292724609375, -0.490325927734375, -0.417724609375, -0.345123291015625, -0.27252197265625, -0.199920654296875, -0.1273193359375, -0.054718017578125, 0.01788330078125, 0.090484619140625, 0.1630859375, 0.235687255859375, 0.30828857421875, 0.380889892578125, 0.4534912109375, 0.526092529296875, 0.59869384765625, 0.671295166015625, 0.743896484375, 0.816497802734375, 0.88909912109375, 0.961700439453125, 1.0343017578125, 1.106903076171875, 1.17950439453125, 1.252105712890625, 1.32470703125, 1.397308349609375, 1.46990966796875, 1.542510986328125, 1.6151123046875, 1.687713623046875, 1.76031494140625, 1.832916259765625, 1.905517578125, 1.978118896484375, 2.05072021484375, 2.123321533203125, 2.1959228515625, 2.268524169921875, 2.34112548828125, 2.413726806640625, 2.486328125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 13.0, 13.0, 16.0, 26.0, 33.0, 38.0, 63.0, 88.0, 136.0, 176.0, 337.0, 570.0, 958.0, 1697.0, 3674.0, 8331.0, 23168.0, 211303.0, 747447.0, 30491.0, 10686.0, 4421.0, 2013.0, 1126.0, 582.0, 397.0, 259.0, 139.0, 92.0, 74.0, 59.0, 31.0, 25.0, 18.0, 8.0, 13.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0], "bins": [-1.21484375, -1.1770172119140625, -1.139190673828125, -1.1013641357421875, -1.06353759765625, -1.0257110595703125, -0.987884521484375, -0.9500579833984375, -0.9122314453125, -0.8744049072265625, -0.836578369140625, -0.7987518310546875, -0.76092529296875, -0.7230987548828125, -0.685272216796875, -0.6474456787109375, -0.609619140625, -0.5717926025390625, -0.533966064453125, -0.4961395263671875, -0.45831298828125, -0.4204864501953125, -0.382659912109375, -0.3448333740234375, -0.3070068359375, -0.2691802978515625, -0.231353759765625, -0.1935272216796875, -0.15570068359375, -0.1178741455078125, -0.080047607421875, -0.0422210693359375, -0.00439453125, 0.0334320068359375, 0.071258544921875, 0.1090850830078125, 0.14691162109375, 0.1847381591796875, 0.222564697265625, 0.2603912353515625, 0.2982177734375, 0.3360443115234375, 0.373870849609375, 0.4116973876953125, 0.44952392578125, 0.4873504638671875, 0.525177001953125, 0.5630035400390625, 0.600830078125, 0.6386566162109375, 0.676483154296875, 0.7143096923828125, 0.75213623046875, 0.7899627685546875, 0.827789306640625, 0.8656158447265625, 0.9034423828125, 0.9412689208984375, 0.979095458984375, 1.0169219970703125, 1.05474853515625, 1.0925750732421875, 1.130401611328125, 1.1682281494140625, 1.2060546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 8.0, 5.0, 6.0, 11.0, 11.0, 17.0, 11.0, 22.0, 18.0, 24.0, 30.0, 36.0, 30.0, 30.0, 42.0, 37.0, 32.0, 31.0, 40.0, 45.0, 51.0, 41.0, 34.0, 45.0, 47.0, 40.0, 38.0, 38.0, 28.0, 21.0, 19.0, 24.0, 16.0, 12.0, 13.0, 9.0, 5.0, 10.0, 4.0, 4.0, 6.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.2974853515625, -1.250244140625, -1.2030029296875, -1.15576171875, -1.1085205078125, -1.061279296875, -1.0140380859375, -0.966796875, -0.9195556640625, -0.872314453125, -0.8250732421875, -0.77783203125, -0.7305908203125, -0.683349609375, -0.6361083984375, -0.5888671875, -0.5416259765625, -0.494384765625, -0.4471435546875, -0.39990234375, -0.3526611328125, -0.305419921875, -0.2581787109375, -0.2109375, -0.1636962890625, -0.116455078125, -0.0692138671875, -0.02197265625, 0.0252685546875, 0.072509765625, 0.1197509765625, 0.1669921875, 0.2142333984375, 0.261474609375, 0.3087158203125, 0.35595703125, 0.4031982421875, 0.450439453125, 0.4976806640625, 0.544921875, 0.5921630859375, 0.639404296875, 0.6866455078125, 0.73388671875, 0.7811279296875, 0.828369140625, 0.8756103515625, 0.9228515625, 0.9700927734375, 1.017333984375, 1.0645751953125, 1.11181640625, 1.1590576171875, 1.206298828125, 1.2535400390625, 1.30078125, 1.3480224609375, 1.395263671875, 1.4425048828125, 1.48974609375, 1.5369873046875, 1.584228515625, 1.6314697265625, 1.6787109375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 12.0, 7.0, 5.0, 8.0, 28.0, 32.0, 37.0, 60.0, 96.0, 124.0, 204.0, 299.0, 461.0, 809.0, 1405.0, 2594.0, 4836.0, 10603.0, 26809.0, 790727.0, 168339.0, 22337.0, 9116.0, 4222.0, 2181.0, 1224.0, 728.0, 478.0, 272.0, 161.0, 90.0, 66.0, 49.0, 43.0, 21.0, 23.0, 17.0, 8.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.275146484375, -0.26624298095703125, -0.2573394775390625, -0.24843597412109375, -0.239532470703125, -0.23062896728515625, -0.2217254638671875, -0.21282196044921875, -0.20391845703125, -0.19501495361328125, -0.1861114501953125, -0.17720794677734375, -0.168304443359375, -0.15940093994140625, -0.1504974365234375, -0.14159393310546875, -0.1326904296875, -0.12378692626953125, -0.1148834228515625, -0.10597991943359375, -0.097076416015625, -0.08817291259765625, -0.0792694091796875, -0.07036590576171875, -0.06146240234375, -0.05255889892578125, -0.0436553955078125, -0.03475189208984375, -0.025848388671875, -0.01694488525390625, -0.0080413818359375, 0.00086212158203125, 0.009765625, 0.01866912841796875, 0.0275726318359375, 0.03647613525390625, 0.045379638671875, 0.05428314208984375, 0.0631866455078125, 0.07209014892578125, 0.08099365234375, 0.08989715576171875, 0.0988006591796875, 0.10770416259765625, 0.116607666015625, 0.12551116943359375, 0.1344146728515625, 0.14331817626953125, 0.1522216796875, 0.16112518310546875, 0.1700286865234375, 0.17893218994140625, 0.187835693359375, 0.19673919677734375, 0.2056427001953125, 0.21454620361328125, 0.22344970703125, 0.23235321044921875, 0.2412567138671875, 0.25016021728515625, 0.259063720703125, 0.26796722412109375, 0.2768707275390625, 0.28577423095703125, 0.294677734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 6.0, 2.0, 4.0, 7.0, 14.0, 11.0, 13.0, 13.0, 22.0, 21.0, 18.0, 18.0, 29.0, 36.0, 44.0, 35.0, 49.0, 43.0, 41.0, 61.0, 51.0, 54.0, 41.0, 56.0, 41.0, 45.0, 28.0, 41.0, 21.0, 21.0, 26.0, 13.0, 18.0, 9.0, 9.0, 9.0, 3.0, 8.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.184246063232422e-05, -4.0601007640361786e-05, -3.935955464839935e-05, -3.811810165643692e-05, -3.687664866447449e-05, -3.5635195672512054e-05, -3.439374268054962e-05, -3.315228968858719e-05, -3.1910836696624756e-05, -3.066938370466232e-05, -2.942793071269989e-05, -2.8186477720737457e-05, -2.6945024728775024e-05, -2.570357173681259e-05, -2.446211874485016e-05, -2.3220665752887726e-05, -2.1979212760925293e-05, -2.073775976896286e-05, -1.9496306777000427e-05, -1.8254853785037994e-05, -1.701340079307556e-05, -1.577194780111313e-05, -1.4530494809150696e-05, -1.3289041817188263e-05, -1.204758882522583e-05, -1.0806135833263397e-05, -9.564682841300964e-06, -8.323229849338531e-06, -7.081776857376099e-06, -5.840323865413666e-06, -4.598870873451233e-06, -3.3574178814888e-06, -2.115964889526367e-06, -8.745118975639343e-07, 3.6694109439849854e-07, 1.6083940863609314e-06, 2.8498470783233643e-06, 4.091300070285797e-06, 5.33275306224823e-06, 6.574206054210663e-06, 7.815659046173096e-06, 9.057112038135529e-06, 1.0298565030097961e-05, 1.1540018022060394e-05, 1.2781471014022827e-05, 1.402292400598526e-05, 1.5264376997947693e-05, 1.6505829989910126e-05, 1.774728298187256e-05, 1.898873597383499e-05, 2.0230188965797424e-05, 2.1471641957759857e-05, 2.271309494972229e-05, 2.3954547941684723e-05, 2.5196000933647156e-05, 2.643745392560959e-05, 2.767890691757202e-05, 2.8920359909534454e-05, 3.0161812901496887e-05, 3.140326589345932e-05, 3.264471888542175e-05, 3.3886171877384186e-05, 3.512762486934662e-05, 3.636907786130905e-05, 3.7610530853271484e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [6.0, 5.0, 5.0, 4.0, 8.0, 14.0, 20.0, 23.0, 24.0, 39.0, 44.0, 77.0, 122.0, 153.0, 210.0, 279.0, 416.0, 558.0, 771.0, 1094.0, 1661.0, 2290.0, 3371.0, 5129.0, 7983.0, 13040.0, 21359.0, 37246.0, 66164.0, 116637.0, 185253.0, 213896.0, 153189.0, 90693.0, 50861.0, 28460.0, 16905.0, 10218.0, 6586.0, 4299.0, 2760.0, 1956.0, 1309.0, 965.0, 726.0, 506.0, 366.0, 227.0, 168.0, 129.0, 113.0, 67.0, 50.0, 34.0, 16.0, 21.0, 15.0, 12.0, 6.0, 9.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.0679931640625, -0.06581878662109375, -0.0636444091796875, -0.06147003173828125, -0.059295654296875, -0.05712127685546875, -0.0549468994140625, -0.05277252197265625, -0.05059814453125, -0.04842376708984375, -0.0462493896484375, -0.04407501220703125, -0.041900634765625, -0.03972625732421875, -0.0375518798828125, -0.03537750244140625, -0.033203125, -0.03102874755859375, -0.0288543701171875, -0.02667999267578125, -0.024505615234375, -0.02233123779296875, -0.0201568603515625, -0.01798248291015625, -0.01580810546875, -0.01363372802734375, -0.0114593505859375, -0.00928497314453125, -0.007110595703125, -0.00493621826171875, -0.0027618408203125, -0.00058746337890625, 0.0015869140625, 0.00376129150390625, 0.0059356689453125, 0.00811004638671875, 0.010284423828125, 0.01245880126953125, 0.0146331787109375, 0.01680755615234375, 0.01898193359375, 0.02115631103515625, 0.0233306884765625, 0.02550506591796875, 0.027679443359375, 0.02985382080078125, 0.0320281982421875, 0.03420257568359375, 0.036376953125, 0.03855133056640625, 0.0407257080078125, 0.04290008544921875, 0.045074462890625, 0.04724884033203125, 0.0494232177734375, 0.05159759521484375, 0.05377197265625, 0.05594635009765625, 0.0581207275390625, 0.06029510498046875, 0.062469482421875, 0.06464385986328125, 0.0668182373046875, 0.06899261474609375, 0.0711669921875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 8.0, 6.0, 11.0, 13.0, 17.0, 28.0, 28.0, 39.0, 42.0, 72.0, 44.0, 61.0, 62.0, 90.0, 73.0, 66.0, 68.0, 50.0, 46.0, 46.0, 31.0, 21.0, 23.0, 14.0, 9.0, 10.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.023406982421875, -0.022638797760009766, -0.02187061309814453, -0.021102428436279297, -0.020334243774414062, -0.019566059112548828, -0.018797874450683594, -0.01802968978881836, -0.017261505126953125, -0.01649332046508789, -0.015725135803222656, -0.014956951141357422, -0.014188766479492188, -0.013420581817626953, -0.012652397155761719, -0.011884212493896484, -0.01111602783203125, -0.010347843170166016, -0.009579658508300781, -0.008811473846435547, -0.008043289184570312, -0.007275104522705078, -0.006506919860839844, -0.005738735198974609, -0.004970550537109375, -0.004202365875244141, -0.0034341812133789062, -0.002665996551513672, -0.0018978118896484375, -0.0011296272277832031, -0.00036144256591796875, 0.0004067420959472656, 0.0011749267578125, 0.0019431114196777344, 0.0027112960815429688, 0.003479480743408203, 0.0042476654052734375, 0.005015850067138672, 0.005784034729003906, 0.006552219390869141, 0.007320404052734375, 0.00808858871459961, 0.008856773376464844, 0.009624958038330078, 0.010393142700195312, 0.011161327362060547, 0.011929512023925781, 0.012697696685791016, 0.01346588134765625, 0.014234066009521484, 0.015002250671386719, 0.015770435333251953, 0.016538619995117188, 0.017306804656982422, 0.018074989318847656, 0.01884317398071289, 0.019611358642578125, 0.02037954330444336, 0.021147727966308594, 0.021915912628173828, 0.022684097290039062, 0.023452281951904297, 0.02422046661376953, 0.024988651275634766, 0.0257568359375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 11.0, 17.0, 21.0, 31.0, 32.0, 47.0, 47.0, 58.0, 89.0, 99.0, 63.0, 95.0, 73.0, 57.0, 50.0, 59.0, 27.0, 23.0, 20.0, 17.0, 11.0, 9.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.15084171295166, -5.977791786193848, -5.804741859436035, -5.631691932678223, -5.45864200592041, -5.285592079162598, -5.112542152404785, -4.939492702484131, -4.766442775726318, -4.593392848968506, -4.420342922210693, -4.247292995452881, -4.074243068695068, -3.901193380355835, -3.7281434535980225, -3.555093765258789, -3.3820436000823975, -3.208993673324585, -3.0359437465667725, -2.862894058227539, -2.6898441314697266, -2.516794204711914, -2.3437442779541016, -2.170694351196289, -1.9976445436477661, -1.8245946168899536, -1.6515448093414307, -1.4784948825836182, -1.3054449558258057, -1.1323951482772827, -0.9593452215194702, -0.7862954139709473, -0.6132454872131348, -0.44019562005996704, -0.26714572310447693, -0.09409582614898682, 0.07895404100418091, 0.25200390815734863, 0.42505383491516113, 0.5981036424636841, 0.7711535692214966, 0.9442034363746643, 1.117253303527832, 1.2903032302856445, 1.463353157043457, 1.63640296459198, 1.8094528913497925, 1.9825026988983154, 2.155552625656128, 2.3286025524139404, 2.501652479171753, 2.6747021675109863, 2.847752094268799, 3.0208020210266113, 3.193851947784424, 3.3669018745422363, 3.539951801300049, 3.7130017280578613, 3.886051654815674, 4.059101581573486, 4.232151508331299, 4.405200958251953, 4.578250885009766, 4.751300811767578, 4.924350738525391]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 8.0, 11.0, 11.0, 6.0, 13.0, 15.0, 21.0, 23.0, 11.0, 20.0, 19.0, 16.0, 20.0, 36.0, 28.0, 32.0, 31.0, 40.0, 26.0, 39.0, 33.0, 32.0, 40.0, 42.0, 40.0, 35.0, 27.0, 28.0, 35.0, 28.0, 20.0, 25.0, 31.0, 24.0, 27.0, 10.0, 11.0, 10.0, 10.0, 8.0, 11.0, 1.0, 9.0, 9.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0], "bins": [-1.6304569244384766, -1.5789599418640137, -1.5274629592895508, -1.4759658575057983, -1.4244688749313354, -1.3729718923568726, -1.3214747905731201, -1.2699778079986572, -1.2184808254241943, -1.1669838428497314, -1.1154868602752686, -1.0639897584915161, -1.0124927759170532, -0.9609957933425903, -0.9094987511634827, -0.858001708984375, -0.8065047264099121, -0.7550077438354492, -0.7035107016563416, -0.6520136594772339, -0.600516676902771, -0.5490196943283081, -0.49752265214920044, -0.44602563977241516, -0.3945286273956299, -0.3430316150188446, -0.2915346026420593, -0.24003759026527405, -0.18854057788848877, -0.1370435655117035, -0.08554655313491821, -0.034049540758132935, 0.017447471618652344, 0.06894448399543762, 0.1204414963722229, 0.17193850874900818, 0.22343552112579346, 0.27493253350257874, 0.326429545879364, 0.3779265582561493, 0.42942357063293457, 0.48092058300971985, 0.5324175953865051, 0.5839146375656128, 0.6354116201400757, 0.6869086027145386, 0.7384056448936462, 0.7899026870727539, 0.8413996696472168, 0.8928966522216797, 0.9443936944007874, 0.995890736579895, 1.047387719154358, 1.0988847017288208, 1.1503818035125732, 1.2018787860870361, 1.253375768661499, 1.304872751235962, 1.3563697338104248, 1.4078668355941772, 1.4593638181686401, 1.510860800743103, 1.5623579025268555, 1.6138548851013184, 1.6653518676757812]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 2.0, 8.0, 2.0, 5.0, 13.0, 18.0, 23.0, 37.0, 41.0, 56.0, 83.0, 150.0, 159.0, 291.0, 432.0, 645.0, 1065.0, 1710.0, 3032.0, 5445.0, 10351.0, 19737.0, 38136.0, 72313.0, 125851.0, 184243.0, 202256.0, 161700.0, 101738.0, 56245.0, 29273.0, 14963.0, 7892.0, 4297.0, 2458.0, 1449.0, 853.0, 527.0, 359.0, 228.0, 140.0, 98.0, 63.0, 49.0, 35.0, 26.0, 19.0, 17.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.876953125, -2.77874755859375, -2.6805419921875, -2.58233642578125, -2.484130859375, -2.38592529296875, -2.2877197265625, -2.18951416015625, -2.09130859375, -1.99310302734375, -1.8948974609375, -1.79669189453125, -1.698486328125, -1.60028076171875, -1.5020751953125, -1.40386962890625, -1.3056640625, -1.20745849609375, -1.1092529296875, -1.01104736328125, -0.912841796875, -0.81463623046875, -0.7164306640625, -0.61822509765625, -0.52001953125, -0.42181396484375, -0.3236083984375, -0.22540283203125, -0.127197265625, -0.02899169921875, 0.0692138671875, 0.16741943359375, 0.265625, 0.36383056640625, 0.4620361328125, 0.56024169921875, 0.658447265625, 0.75665283203125, 0.8548583984375, 0.95306396484375, 1.05126953125, 1.14947509765625, 1.2476806640625, 1.34588623046875, 1.444091796875, 1.54229736328125, 1.6405029296875, 1.73870849609375, 1.8369140625, 1.93511962890625, 2.0333251953125, 2.13153076171875, 2.229736328125, 2.32794189453125, 2.4261474609375, 2.52435302734375, 2.62255859375, 2.72076416015625, 2.8189697265625, 2.91717529296875, 3.015380859375, 3.11358642578125, 3.2117919921875, 3.30999755859375, 3.408203125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 10.0, 8.0, 13.0, 8.0, 10.0, 20.0, 16.0, 20.0, 26.0, 24.0, 26.0, 22.0, 26.0, 34.0, 36.0, 37.0, 35.0, 43.0, 48.0, 39.0, 39.0, 34.0, 41.0, 30.0, 29.0, 26.0, 33.0, 29.0, 24.0, 20.0, 27.0, 27.0, 22.0, 13.0, 11.0, 14.0, 6.0, 11.0, 3.0, 8.0, 5.0, 10.0, 4.0, 3.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0], "bins": [-2.11328125, -2.0505828857421875, -1.987884521484375, -1.9251861572265625, -1.86248779296875, -1.7997894287109375, -1.737091064453125, -1.6743927001953125, -1.6116943359375, -1.5489959716796875, -1.486297607421875, -1.4235992431640625, -1.36090087890625, -1.2982025146484375, -1.235504150390625, -1.1728057861328125, -1.110107421875, -1.0474090576171875, -0.984710693359375, -0.9220123291015625, -0.85931396484375, -0.7966156005859375, -0.733917236328125, -0.6712188720703125, -0.6085205078125, -0.5458221435546875, -0.483123779296875, -0.4204254150390625, -0.35772705078125, -0.2950286865234375, -0.232330322265625, -0.1696319580078125, -0.10693359375, -0.0442352294921875, 0.018463134765625, 0.0811614990234375, 0.14385986328125, 0.2065582275390625, 0.269256591796875, 0.3319549560546875, 0.3946533203125, 0.4573516845703125, 0.520050048828125, 0.5827484130859375, 0.64544677734375, 0.7081451416015625, 0.770843505859375, 0.8335418701171875, 0.896240234375, 0.9589385986328125, 1.021636962890625, 1.0843353271484375, 1.14703369140625, 1.2097320556640625, 1.272430419921875, 1.3351287841796875, 1.3978271484375, 1.4605255126953125, 1.523223876953125, 1.5859222412109375, 1.64862060546875, 1.7113189697265625, 1.774017333984375, 1.8367156982421875, 1.8994140625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 20.0, 24.0, 42.0, 47.0, 63.0, 121.0, 145.0, 238.0, 337.0, 516.0, 768.0, 1332.0, 2067.0, 3346.0, 5718.0, 10038.0, 17773.0, 31894.0, 56072.0, 93595.0, 140919.0, 176733.0, 171636.0, 132193.0, 85378.0, 50266.0, 28599.0, 16047.0, 9050.0, 5158.0, 3048.0, 1917.0, 1223.0, 755.0, 493.0, 315.0, 208.0, 148.0, 87.0, 69.0, 38.0, 32.0, 28.0, 17.0, 10.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.720703125, -2.629730224609375, -2.53875732421875, -2.447784423828125, -2.3568115234375, -2.265838623046875, -2.17486572265625, -2.083892822265625, -1.992919921875, -1.901947021484375, -1.81097412109375, -1.720001220703125, -1.6290283203125, -1.538055419921875, -1.44708251953125, -1.356109619140625, -1.26513671875, -1.174163818359375, -1.08319091796875, -0.992218017578125, -0.9012451171875, -0.810272216796875, -0.71929931640625, -0.628326416015625, -0.537353515625, -0.446380615234375, -0.35540771484375, -0.264434814453125, -0.1734619140625, -0.082489013671875, 0.00848388671875, 0.099456787109375, 0.1904296875, 0.281402587890625, 0.37237548828125, 0.463348388671875, 0.5543212890625, 0.645294189453125, 0.73626708984375, 0.827239990234375, 0.918212890625, 1.009185791015625, 1.10015869140625, 1.191131591796875, 1.2821044921875, 1.373077392578125, 1.46405029296875, 1.555023193359375, 1.64599609375, 1.736968994140625, 1.82794189453125, 1.918914794921875, 2.0098876953125, 2.100860595703125, 2.19183349609375, 2.282806396484375, 2.373779296875, 2.464752197265625, 2.55572509765625, 2.646697998046875, 2.7376708984375, 2.828643798828125, 2.91961669921875, 3.010589599609375, 3.1015625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 4.0, 10.0, 10.0, 12.0, 12.0, 16.0, 23.0, 17.0, 18.0, 36.0, 24.0, 29.0, 41.0, 38.0, 37.0, 44.0, 36.0, 47.0, 44.0, 44.0, 43.0, 49.0, 37.0, 34.0, 42.0, 39.0, 24.0, 29.0, 22.0, 20.0, 19.0, 27.0, 16.0, 10.0, 8.0, 13.0, 6.0, 4.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2480316162109375, -1.202117919921875, -1.1562042236328125, -1.11029052734375, -1.0643768310546875, -1.018463134765625, -0.9725494384765625, -0.9266357421875, -0.8807220458984375, -0.834808349609375, -0.7888946533203125, -0.74298095703125, -0.6970672607421875, -0.651153564453125, -0.6052398681640625, -0.559326171875, -0.5134124755859375, -0.467498779296875, -0.4215850830078125, -0.37567138671875, -0.3297576904296875, -0.283843994140625, -0.2379302978515625, -0.1920166015625, -0.1461029052734375, -0.100189208984375, -0.0542755126953125, -0.00836181640625, 0.0375518798828125, 0.083465576171875, 0.1293792724609375, 0.17529296875, 0.2212066650390625, 0.267120361328125, 0.3130340576171875, 0.35894775390625, 0.4048614501953125, 0.450775146484375, 0.4966888427734375, 0.5426025390625, 0.5885162353515625, 0.634429931640625, 0.6803436279296875, 0.72625732421875, 0.7721710205078125, 0.818084716796875, 0.8639984130859375, 0.909912109375, 0.9558258056640625, 1.001739501953125, 1.0476531982421875, 1.09356689453125, 1.1394805908203125, 1.185394287109375, 1.2313079833984375, 1.2772216796875, 1.3231353759765625, 1.369049072265625, 1.4149627685546875, 1.46087646484375, 1.5067901611328125, 1.552703857421875, 1.5986175537109375, 1.64453125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 4.0, 6.0, 9.0, 22.0, 27.0, 41.0, 44.0, 86.0, 83.0, 160.0, 244.0, 282.0, 526.0, 796.0, 1060.0, 1803.0, 2731.0, 4513.0, 7348.0, 13007.0, 23521.0, 43775.0, 83187.0, 147416.0, 209129.0, 201800.0, 137558.0, 76417.0, 40513.0, 21775.0, 11933.0, 7084.0, 4149.0, 2584.0, 1680.0, 1117.0, 675.0, 476.0, 313.0, 198.0, 143.0, 107.0, 65.0, 45.0, 31.0, 27.0, 13.0, 17.0, 10.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7138671875, -1.6584625244140625, -1.603057861328125, -1.5476531982421875, -1.49224853515625, -1.4368438720703125, -1.381439208984375, -1.3260345458984375, -1.2706298828125, -1.2152252197265625, -1.159820556640625, -1.1044158935546875, -1.04901123046875, -0.9936065673828125, -0.938201904296875, -0.8827972412109375, -0.827392578125, -0.7719879150390625, -0.716583251953125, -0.6611785888671875, -0.60577392578125, -0.5503692626953125, -0.494964599609375, -0.4395599365234375, -0.3841552734375, -0.3287506103515625, -0.273345947265625, -0.2179412841796875, -0.16253662109375, -0.1071319580078125, -0.051727294921875, 0.0036773681640625, 0.05908203125, 0.1144866943359375, 0.169891357421875, 0.2252960205078125, 0.28070068359375, 0.3361053466796875, 0.391510009765625, 0.4469146728515625, 0.5023193359375, 0.5577239990234375, 0.613128662109375, 0.6685333251953125, 0.72393798828125, 0.7793426513671875, 0.834747314453125, 0.8901519775390625, 0.945556640625, 1.0009613037109375, 1.056365966796875, 1.1117706298828125, 1.16717529296875, 1.2225799560546875, 1.277984619140625, 1.3333892822265625, 1.3887939453125, 1.4441986083984375, 1.499603271484375, 1.5550079345703125, 1.61041259765625, 1.6658172607421875, 1.721221923828125, 1.7766265869140625, 1.83203125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 5.0, 14.0, 17.0, 14.0, 19.0, 29.0, 31.0, 39.0, 40.0, 45.0, 50.0, 65.0, 61.0, 65.0, 68.0, 75.0, 65.0, 52.0, 37.0, 36.0, 33.0, 26.0, 26.0, 13.0, 15.0, 12.0, 9.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00015115737915039062, -0.00014640763401985168, -0.00014165788888931274, -0.0001369081437587738, -0.00013215839862823486, -0.00012740865349769592, -0.00012265890836715698, -0.00011790916323661804, -0.0001131594181060791, -0.00010840967297554016, -0.00010365992784500122, -9.891018271446228e-05, -9.416043758392334e-05, -8.94106924533844e-05, -8.466094732284546e-05, -7.991120219230652e-05, -7.516145706176758e-05, -7.041171193122864e-05, -6.56619668006897e-05, -6.091222167015076e-05, -5.6162476539611816e-05, -5.1412731409072876e-05, -4.6662986278533936e-05, -4.1913241147994995e-05, -3.7163496017456055e-05, -3.2413750886917114e-05, -2.7664005756378174e-05, -2.2914260625839233e-05, -1.8164515495300293e-05, -1.3414770364761353e-05, -8.665025234222412e-06, -3.915280103683472e-06, 8.344650268554688e-07, 5.584210157394409e-06, 1.033395528793335e-05, 1.508370041847229e-05, 1.983344554901123e-05, 2.458319067955017e-05, 2.933293581008911e-05, 3.408268094062805e-05, 3.883242607116699e-05, 4.358217120170593e-05, 4.833191633224487e-05, 5.3081661462783813e-05, 5.7831406593322754e-05, 6.25811517238617e-05, 6.733089685440063e-05, 7.208064198493958e-05, 7.683038711547852e-05, 8.158013224601746e-05, 8.63298773765564e-05, 9.107962250709534e-05, 9.582936763763428e-05, 0.00010057911276817322, 0.00010532885789871216, 0.0001100786030292511, 0.00011482834815979004, 0.00011957809329032898, 0.00012432783842086792, 0.00012907758355140686, 0.0001338273286819458, 0.00013857707381248474, 0.00014332681894302368, 0.00014807656407356262, 0.00015282630920410156]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 10.0, 12.0, 21.0, 28.0, 64.0, 82.0, 120.0, 198.0, 337.0, 601.0, 1008.0, 1778.0, 3100.0, 5987.0, 11620.0, 22885.0, 46501.0, 92868.0, 166782.0, 229264.0, 205666.0, 127413.0, 65616.0, 32195.0, 16370.0, 8059.0, 4397.0, 2406.0, 1306.0, 771.0, 405.0, 256.0, 127.0, 92.0, 74.0, 51.0, 21.0, 25.0, 11.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7138671875, -1.6581268310546875, -1.602386474609375, -1.5466461181640625, -1.49090576171875, -1.4351654052734375, -1.379425048828125, -1.3236846923828125, -1.2679443359375, -1.2122039794921875, -1.156463623046875, -1.1007232666015625, -1.04498291015625, -0.9892425537109375, -0.933502197265625, -0.8777618408203125, -0.822021484375, -0.7662811279296875, -0.710540771484375, -0.6548004150390625, -0.59906005859375, -0.5433197021484375, -0.487579345703125, -0.4318389892578125, -0.3760986328125, -0.3203582763671875, -0.264617919921875, -0.2088775634765625, -0.15313720703125, -0.0973968505859375, -0.041656494140625, 0.0140838623046875, 0.06982421875, 0.1255645751953125, 0.181304931640625, 0.2370452880859375, 0.29278564453125, 0.3485260009765625, 0.404266357421875, 0.4600067138671875, 0.5157470703125, 0.5714874267578125, 0.627227783203125, 0.6829681396484375, 0.73870849609375, 0.7944488525390625, 0.850189208984375, 0.9059295654296875, 0.961669921875, 1.0174102783203125, 1.073150634765625, 1.1288909912109375, 1.18463134765625, 1.2403717041015625, 1.296112060546875, 1.3518524169921875, 1.4075927734375, 1.4633331298828125, 1.519073486328125, 1.5748138427734375, 1.63055419921875, 1.6862945556640625, 1.742034912109375, 1.7977752685546875, 1.853515625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 9.0, 10.0, 11.0, 11.0, 13.0, 12.0, 22.0, 21.0, 30.0, 39.0, 47.0, 49.0, 56.0, 80.0, 69.0, 56.0, 70.0, 54.0, 64.0, 43.0, 39.0, 36.0, 37.0, 36.0, 17.0, 13.0, 8.0, 16.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343017578125, -0.33078765869140625, -0.3185577392578125, -0.30632781982421875, -0.294097900390625, -0.28186798095703125, -0.2696380615234375, -0.25740814208984375, -0.24517822265625, -0.23294830322265625, -0.2207183837890625, -0.20848846435546875, -0.196258544921875, -0.18402862548828125, -0.1717987060546875, -0.15956878662109375, -0.1473388671875, -0.13510894775390625, -0.1228790283203125, -0.11064910888671875, -0.098419189453125, -0.08618927001953125, -0.0739593505859375, -0.06172943115234375, -0.04949951171875, -0.03726959228515625, -0.0250396728515625, -0.01280975341796875, -0.000579833984375, 0.01165008544921875, 0.0238800048828125, 0.03610992431640625, 0.04833984375, 0.06056976318359375, 0.0727996826171875, 0.08502960205078125, 0.097259521484375, 0.10948944091796875, 0.1217193603515625, 0.13394927978515625, 0.14617919921875, 0.15840911865234375, 0.1706390380859375, 0.18286895751953125, 0.195098876953125, 0.20732879638671875, 0.2195587158203125, 0.23178863525390625, 0.2440185546875, 0.25624847412109375, 0.2684783935546875, 0.28070831298828125, 0.292938232421875, 0.30516815185546875, 0.3173980712890625, 0.32962799072265625, 0.34185791015625, 0.35408782958984375, 0.3663177490234375, 0.37854766845703125, 0.390777587890625, 0.40300750732421875, 0.4152374267578125, 0.42746734619140625, 0.439697265625]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 6.0, 3.0, 10.0, 13.0, 22.0, 20.0, 39.0, 43.0, 57.0, 61.0, 78.0, 93.0, 95.0, 73.0, 93.0, 58.0, 51.0, 45.0, 34.0, 28.0, 17.0, 13.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.668394565582275, -6.490774154663086, -6.313153266906738, -6.135532855987549, -5.957912445068359, -5.78029203414917, -5.6026716232299805, -5.425050735473633, -5.247430324554443, -5.069809913635254, -4.892189025878906, -4.714568614959717, -4.536948204040527, -4.359327793121338, -4.181707382202148, -4.004086494445801, -3.8264660835266113, -3.648845672607422, -3.4712250232696533, -3.2936043739318848, -3.1159839630126953, -2.938363552093506, -2.7607429027557373, -2.5831222534179688, -2.4055018424987793, -2.22788143157959, -2.0502607822418213, -1.8726402521133423, -1.6950197219848633, -1.5173991918563843, -1.3397786617279053, -1.1621581315994263, -0.9845380783081055, -0.8069175481796265, -0.6292970180511475, -0.45167648792266846, -0.27405595779418945, -0.09643542766571045, 0.08118510246276855, 0.25880563259124756, 0.43642616271972656, 0.6140466928482056, 0.7916672229766846, 0.9692877531051636, 1.1469082832336426, 1.3245288133621216, 1.5021493434906006, 1.6797698736190796, 1.8573904037475586, 2.035010814666748, 2.2126314640045166, 2.390252113342285, 2.5678725242614746, 2.745492935180664, 2.9231135845184326, 3.100734233856201, 3.2783546447753906, 3.45597505569458, 3.6335957050323486, 3.811216354370117, 3.9888367652893066, 4.166457176208496, 4.344078063964844, 4.521698474884033, 4.699318885803223]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 1.0, 3.0, 6.0, 7.0, 12.0, 8.0, 13.0, 14.0, 27.0, 21.0, 14.0, 21.0, 27.0, 34.0, 19.0, 35.0, 35.0, 34.0, 35.0, 45.0, 52.0, 42.0, 44.0, 44.0, 47.0, 31.0, 32.0, 34.0, 41.0, 29.0, 21.0, 21.0, 26.0, 20.0, 13.0, 23.0, 17.0, 4.0, 13.0, 12.0, 4.0, 5.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9693043231964111, -1.907718539237976, -1.8461326360702515, -1.7845468521118164, -1.7229610681533813, -1.6613751649856567, -1.5997893810272217, -1.538203477859497, -1.476617693901062, -1.415031909942627, -1.3534460067749023, -1.2918602228164673, -1.2302744388580322, -1.1686885356903076, -1.1071027517318726, -1.0455169677734375, -0.9839311242103577, -0.9223452806472778, -0.8607594966888428, -0.7991736531257629, -0.7375878095626831, -0.676002025604248, -0.6144161820411682, -0.5528303384780884, -0.49124452471733093, -0.4296587109565735, -0.36807286739349365, -0.3064870536327362, -0.24490122497081757, -0.18331539630889893, -0.12172958254814148, -0.060143738985061646, 0.0014420747756958008, 0.06302790343761444, 0.12461372464895248, 0.18619954586029053, 0.24778537452220917, 0.3093712031841278, 0.37095701694488525, 0.4325428605079651, 0.49412867426872253, 0.55571448802948, 0.6173003315925598, 0.6788861751556396, 0.7404719591140747, 0.8020578026771545, 0.8636436462402344, 0.9252294301986694, 0.9868152737617493, 1.048401117324829, 1.1099869012832642, 1.1715726852416992, 1.2331585884094238, 1.2947443723678589, 1.356330156326294, 1.4179160594940186, 1.4795018434524536, 1.5410876274108887, 1.6026735305786133, 1.6642593145370483, 1.7258450984954834, 1.787431001663208, 1.849016785621643, 1.9106025695800781, 1.9721884727478027]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 17.0, 15.0, 30.0, 53.0, 72.0, 115.0, 159.0, 260.0, 440.0, 654.0, 1032.0, 1716.0, 3034.0, 5258.0, 9629.0, 18512.0, 37235.0, 80871.0, 193478.0, 512983.0, 1207863.0, 1228824.0, 534557.0, 197648.0, 81611.0, 37276.0, 18129.0, 9622.0, 5355.0, 3054.0, 1833.0, 1113.0, 654.0, 428.0, 257.0, 184.0, 96.0, 75.0, 53.0, 28.0, 22.0, 14.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.61328125, -4.46453857421875, -4.3157958984375, -4.16705322265625, -4.018310546875, -3.86956787109375, -3.7208251953125, -3.57208251953125, -3.42333984375, -3.27459716796875, -3.1258544921875, -2.97711181640625, -2.828369140625, -2.67962646484375, -2.5308837890625, -2.38214111328125, -2.2333984375, -2.08465576171875, -1.9359130859375, -1.78717041015625, -1.638427734375, -1.48968505859375, -1.3409423828125, -1.19219970703125, -1.04345703125, -0.89471435546875, -0.7459716796875, -0.59722900390625, -0.448486328125, -0.29974365234375, -0.1510009765625, -0.00225830078125, 0.146484375, 0.29522705078125, 0.4439697265625, 0.59271240234375, 0.741455078125, 0.89019775390625, 1.0389404296875, 1.18768310546875, 1.33642578125, 1.48516845703125, 1.6339111328125, 1.78265380859375, 1.931396484375, 2.08013916015625, 2.2288818359375, 2.37762451171875, 2.5263671875, 2.67510986328125, 2.8238525390625, 2.97259521484375, 3.121337890625, 3.27008056640625, 3.4188232421875, 3.56756591796875, 3.71630859375, 3.86505126953125, 4.0137939453125, 4.16253662109375, 4.311279296875, 4.46002197265625, 4.6087646484375, 4.75750732421875, 4.90625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 4.0, 1.0, 5.0, 5.0, 11.0, 15.0, 11.0, 17.0, 10.0, 19.0, 19.0, 25.0, 20.0, 28.0, 29.0, 36.0, 32.0, 30.0, 27.0, 36.0, 40.0, 49.0, 30.0, 46.0, 39.0, 27.0, 41.0, 34.0, 37.0, 30.0, 29.0, 28.0, 21.0, 22.0, 18.0, 12.0, 21.0, 18.0, 10.0, 10.0, 12.0, 11.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.521484375, -1.4746856689453125, -1.427886962890625, -1.3810882568359375, -1.33428955078125, -1.2874908447265625, -1.240692138671875, -1.1938934326171875, -1.1470947265625, -1.1002960205078125, -1.053497314453125, -1.0066986083984375, -0.95989990234375, -0.9131011962890625, -0.866302490234375, -0.8195037841796875, -0.772705078125, -0.7259063720703125, -0.679107666015625, -0.6323089599609375, -0.58551025390625, -0.5387115478515625, -0.491912841796875, -0.4451141357421875, -0.3983154296875, -0.3515167236328125, -0.304718017578125, -0.2579193115234375, -0.21112060546875, -0.1643218994140625, -0.117523193359375, -0.0707244873046875, -0.02392578125, 0.0228729248046875, 0.069671630859375, 0.1164703369140625, 0.16326904296875, 0.2100677490234375, 0.256866455078125, 0.3036651611328125, 0.3504638671875, 0.3972625732421875, 0.444061279296875, 0.4908599853515625, 0.53765869140625, 0.5844573974609375, 0.631256103515625, 0.6780548095703125, 0.724853515625, 0.7716522216796875, 0.818450927734375, 0.8652496337890625, 0.91204833984375, 0.9588470458984375, 1.005645751953125, 1.0524444580078125, 1.0992431640625, 1.1460418701171875, 1.192840576171875, 1.2396392822265625, 1.28643798828125, 1.3332366943359375, 1.380035400390625, 1.4268341064453125, 1.4736328125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 12.0, 18.0, 21.0, 34.0, 49.0, 85.0, 107.0, 132.0, 230.0, 328.0, 517.0, 746.0, 1216.0, 1900.0, 2960.0, 4741.0, 7636.0, 12945.0, 22377.0, 40009.0, 73152.0, 138658.0, 272854.0, 535096.0, 921368.0, 958471.0, 576936.0, 293593.0, 148977.0, 78048.0, 41927.0, 23661.0, 13667.0, 8188.0, 5038.0, 3014.0, 1946.0, 1255.0, 774.0, 538.0, 350.0, 230.0, 165.0, 98.0, 65.0, 49.0, 41.0, 14.0, 13.0, 14.0, 10.0, 4.0, 1.0, 5.0, 4.0, 1.0], "bins": [-4.10546875, -3.98126220703125, -3.8570556640625, -3.73284912109375, -3.608642578125, -3.48443603515625, -3.3602294921875, -3.23602294921875, -3.11181640625, -2.98760986328125, -2.8634033203125, -2.73919677734375, -2.614990234375, -2.49078369140625, -2.3665771484375, -2.24237060546875, -2.1181640625, -1.99395751953125, -1.8697509765625, -1.74554443359375, -1.621337890625, -1.49713134765625, -1.3729248046875, -1.24871826171875, -1.12451171875, -1.00030517578125, -0.8760986328125, -0.75189208984375, -0.627685546875, -0.50347900390625, -0.3792724609375, -0.25506591796875, -0.130859375, -0.00665283203125, 0.1175537109375, 0.24176025390625, 0.365966796875, 0.49017333984375, 0.6143798828125, 0.73858642578125, 0.86279296875, 0.98699951171875, 1.1112060546875, 1.23541259765625, 1.359619140625, 1.48382568359375, 1.6080322265625, 1.73223876953125, 1.8564453125, 1.98065185546875, 2.1048583984375, 2.22906494140625, 2.353271484375, 2.47747802734375, 2.6016845703125, 2.72589111328125, 2.85009765625, 2.97430419921875, 3.0985107421875, 3.22271728515625, 3.346923828125, 3.47113037109375, 3.5953369140625, 3.71954345703125, 3.84375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 9.0, 8.0, 6.0, 17.0, 32.0, 40.0, 34.0, 48.0, 57.0, 95.0, 94.0, 105.0, 141.0, 176.0, 209.0, 265.0, 260.0, 293.0, 294.0, 265.0, 263.0, 272.0, 205.0, 180.0, 148.0, 118.0, 98.0, 79.0, 61.0, 50.0, 43.0, 28.0, 16.0, 13.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.07647705078125, -1.0396728515625, -1.00286865234375, -0.966064453125, -0.92926025390625, -0.8924560546875, -0.85565185546875, -0.81884765625, -0.78204345703125, -0.7452392578125, -0.70843505859375, -0.671630859375, -0.63482666015625, -0.5980224609375, -0.56121826171875, -0.5244140625, -0.48760986328125, -0.4508056640625, -0.41400146484375, -0.377197265625, -0.34039306640625, -0.3035888671875, -0.26678466796875, -0.22998046875, -0.19317626953125, -0.1563720703125, -0.11956787109375, -0.082763671875, -0.04595947265625, -0.0091552734375, 0.02764892578125, 0.064453125, 0.10125732421875, 0.1380615234375, 0.17486572265625, 0.211669921875, 0.24847412109375, 0.2852783203125, 0.32208251953125, 0.35888671875, 0.39569091796875, 0.4324951171875, 0.46929931640625, 0.506103515625, 0.54290771484375, 0.5797119140625, 0.61651611328125, 0.6533203125, 0.69012451171875, 0.7269287109375, 0.76373291015625, 0.800537109375, 0.83734130859375, 0.8741455078125, 0.91094970703125, 0.94775390625, 0.98455810546875, 1.0213623046875, 1.05816650390625, 1.094970703125, 1.13177490234375, 1.1685791015625, 1.20538330078125, 1.2421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 9.0, 9.0, 14.0, 16.0, 14.0, 26.0, 41.0, 51.0, 63.0, 74.0, 95.0, 79.0, 92.0, 91.0, 64.0, 57.0, 60.0, 32.0, 27.0, 24.0, 20.0, 7.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.784271717071533, -7.594692707061768, -7.405113697052002, -7.2155351638793945, -7.025956153869629, -6.836377143859863, -6.646798133850098, -6.457219123840332, -6.267640113830566, -6.078061103820801, -5.888482093811035, -5.6989030838012695, -5.509324550628662, -5.3197455406188965, -5.130166530609131, -4.940587520599365, -4.751008987426758, -4.561429977416992, -4.371850967407227, -4.182271957397461, -3.9926934242248535, -3.803114414215088, -3.6135354042053223, -3.4239563941955566, -3.23437762260437, -3.0447986125946045, -2.855219841003418, -2.6656408309936523, -2.4760618209838867, -2.2864830493927, -2.0969040393829346, -1.9073251485824585, -1.7177457809448242, -1.5281668901443481, -1.338587999343872, -1.1490089893341064, -0.9594300985336304, -0.7698512077331543, -0.5802721977233887, -0.3906933069229126, -0.20111441612243652, -0.011535495519638062, 0.1780434250831604, 0.36762237548828125, 0.5572012662887573, 0.7467801570892334, 0.936359167098999, 1.125938057899475, 1.3155169486999512, 1.5050958395004272, 1.6946747303009033, 1.884253740310669, 2.0738325119018555, 2.263411521911621, 2.4529905319213867, 2.6425695419311523, 2.832148313522339, 3.0217273235321045, 3.211306095123291, 3.4008851051330566, 3.5904641151428223, 3.780042886734009, 3.9696218967437744, 4.159200668334961, 4.348779678344727]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 8.0, 7.0, 16.0, 10.0, 16.0, 22.0, 25.0, 14.0, 29.0, 20.0, 30.0, 30.0, 30.0, 42.0, 45.0, 33.0, 43.0, 42.0, 48.0, 38.0, 34.0, 36.0, 39.0, 46.0, 38.0, 34.0, 32.0, 27.0, 20.0, 22.0, 18.0, 19.0, 14.0, 11.0, 9.0, 14.0, 10.0, 4.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.2169461250305176, -2.1566765308380127, -2.096407175064087, -2.036137580871582, -1.9758681058883667, -1.9155986309051514, -1.855329155921936, -1.7950596809387207, -1.7347902059555054, -1.67452073097229, -1.6142512559890747, -1.5539817810058594, -1.4937121868133545, -1.4334427118301392, -1.3731732368469238, -1.3129037618637085, -1.2526342868804932, -1.1923648118972778, -1.1320953369140625, -1.0718257427215576, -1.0115562677383423, -0.951286792755127, -0.8910173177719116, -0.8307478427886963, -0.7704782485961914, -0.7102087736129761, -0.649939239025116, -0.5896697640419006, -0.5294002890586853, -0.4691307842731476, -0.40886127948760986, -0.34859180450439453, -0.2883223295211792, -0.22805283963680267, -0.16778334975242615, -0.10751384496688843, -0.0472443550825119, 0.013025134801864624, 0.07329463958740234, 0.13356411457061768, 0.1938336193561554, 0.2541031241416931, 0.31437259912490845, 0.37464210391044617, 0.4349116086959839, 0.4951810836791992, 0.5554505586624146, 0.6157200336456299, 0.67598956823349, 0.7362590432167053, 0.7965285778045654, 0.8567980527877808, 0.9170675277709961, 0.9773370027542114, 1.0376064777374268, 1.0978760719299316, 1.158145546913147, 1.2184150218963623, 1.2786844968795776, 1.338953971862793, 1.3992235660552979, 1.4594930410385132, 1.5197625160217285, 1.5800319910049438, 1.6403014659881592]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 2.0, 8.0, 16.0, 17.0, 23.0, 39.0, 50.0, 84.0, 135.0, 251.0, 375.0, 565.0, 1053.0, 1793.0, 3324.0, 6319.0, 11909.0, 23719.0, 48421.0, 98618.0, 185751.0, 251671.0, 197455.0, 109129.0, 53839.0, 25988.0, 12835.0, 6635.0, 3733.0, 2003.0, 1131.0, 661.0, 360.0, 212.0, 154.0, 97.0, 54.0, 37.0, 27.0, 14.0, 17.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.33935546875, -0.32747650146484375, -0.3155975341796875, -0.30371856689453125, -0.291839599609375, -0.27996063232421875, -0.2680816650390625, -0.25620269775390625, -0.24432373046875, -0.23244476318359375, -0.2205657958984375, -0.20868682861328125, -0.196807861328125, -0.18492889404296875, -0.1730499267578125, -0.16117095947265625, -0.1492919921875, -0.13741302490234375, -0.1255340576171875, -0.11365509033203125, -0.101776123046875, -0.08989715576171875, -0.0780181884765625, -0.06613922119140625, -0.05426025390625, -0.04238128662109375, -0.0305023193359375, -0.01862335205078125, -0.006744384765625, 0.00513458251953125, 0.0170135498046875, 0.02889251708984375, 0.040771484375, 0.05265045166015625, 0.0645294189453125, 0.07640838623046875, 0.088287353515625, 0.10016632080078125, 0.1120452880859375, 0.12392425537109375, 0.13580322265625, 0.14768218994140625, 0.1595611572265625, 0.17144012451171875, 0.183319091796875, 0.19519805908203125, 0.2070770263671875, 0.21895599365234375, 0.2308349609375, 0.24271392822265625, 0.2545928955078125, 0.26647186279296875, 0.278350830078125, 0.29022979736328125, 0.3021087646484375, 0.31398773193359375, 0.32586669921875, 0.33774566650390625, 0.3496246337890625, 0.36150360107421875, 0.373382568359375, 0.38526153564453125, 0.3971405029296875, 0.40901947021484375, 0.4208984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 7.0, 12.0, 14.0, 20.0, 20.0, 23.0, 23.0, 27.0, 33.0, 24.0, 48.0, 37.0, 36.0, 35.0, 35.0, 33.0, 45.0, 33.0, 51.0, 41.0, 41.0, 42.0, 39.0, 23.0, 35.0, 29.0, 19.0, 25.0, 22.0, 15.0, 18.0, 16.0, 13.0, 10.0, 4.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.147979736328125, -2.07916259765625, -2.010345458984375, -1.9415283203125, -1.872711181640625, -1.80389404296875, -1.735076904296875, -1.666259765625, -1.597442626953125, -1.52862548828125, -1.459808349609375, -1.3909912109375, -1.322174072265625, -1.25335693359375, -1.184539794921875, -1.11572265625, -1.046905517578125, -0.97808837890625, -0.909271240234375, -0.8404541015625, -0.771636962890625, -0.70281982421875, -0.634002685546875, -0.565185546875, -0.496368408203125, -0.42755126953125, -0.358734130859375, -0.2899169921875, -0.221099853515625, -0.15228271484375, -0.083465576171875, -0.0146484375, 0.054168701171875, 0.12298583984375, 0.191802978515625, 0.2606201171875, 0.329437255859375, 0.39825439453125, 0.467071533203125, 0.535888671875, 0.604705810546875, 0.67352294921875, 0.742340087890625, 0.8111572265625, 0.879974365234375, 0.94879150390625, 1.017608642578125, 1.08642578125, 1.155242919921875, 1.22406005859375, 1.292877197265625, 1.3616943359375, 1.430511474609375, 1.49932861328125, 1.568145751953125, 1.636962890625, 1.705780029296875, 1.77459716796875, 1.843414306640625, 1.9122314453125, 1.981048583984375, 2.04986572265625, 2.118682861328125, 2.1875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 8.0, 3.0, 7.0, 8.0, 14.0, 15.0, 22.0, 30.0, 44.0, 66.0, 98.0, 129.0, 183.0, 286.0, 450.0, 693.0, 1152.0, 2002.0, 3984.0, 8534.0, 20126.0, 79197.0, 858546.0, 43362.0, 15206.0, 6627.0, 3194.0, 1758.0, 1019.0, 582.0, 398.0, 280.0, 143.0, 99.0, 73.0, 54.0, 42.0, 29.0, 18.0, 16.0, 15.0, 12.0, 9.0, 5.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.080078125, -1.04669189453125, -1.0133056640625, -0.97991943359375, -0.946533203125, -0.91314697265625, -0.8797607421875, -0.84637451171875, -0.81298828125, -0.77960205078125, -0.7462158203125, -0.71282958984375, -0.679443359375, -0.64605712890625, -0.6126708984375, -0.57928466796875, -0.5458984375, -0.51251220703125, -0.4791259765625, -0.44573974609375, -0.412353515625, -0.37896728515625, -0.3455810546875, -0.31219482421875, -0.27880859375, -0.24542236328125, -0.2120361328125, -0.17864990234375, -0.145263671875, -0.11187744140625, -0.0784912109375, -0.04510498046875, -0.01171875, 0.02166748046875, 0.0550537109375, 0.08843994140625, 0.121826171875, 0.15521240234375, 0.1885986328125, 0.22198486328125, 0.25537109375, 0.28875732421875, 0.3221435546875, 0.35552978515625, 0.388916015625, 0.42230224609375, 0.4556884765625, 0.48907470703125, 0.5224609375, 0.55584716796875, 0.5892333984375, 0.62261962890625, 0.656005859375, 0.68939208984375, 0.7227783203125, 0.75616455078125, 0.78955078125, 0.82293701171875, 0.8563232421875, 0.88970947265625, 0.923095703125, 0.95648193359375, 0.9898681640625, 1.02325439453125, 1.056640625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 5.0, 4.0, 5.0, 9.0, 11.0, 23.0, 27.0, 16.0, 21.0, 21.0, 34.0, 36.0, 32.0, 35.0, 38.0, 34.0, 43.0, 44.0, 43.0, 37.0, 40.0, 30.0, 37.0, 35.0, 39.0, 39.0, 31.0, 25.0, 28.0, 20.0, 12.0, 14.0, 23.0, 24.0, 13.0, 9.0, 10.0, 6.0, 10.0, 6.0, 9.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.36328125, -1.320404052734375, -1.27752685546875, -1.234649658203125, -1.1917724609375, -1.148895263671875, -1.10601806640625, -1.063140869140625, -1.020263671875, -0.977386474609375, -0.93450927734375, -0.891632080078125, -0.8487548828125, -0.805877685546875, -0.76300048828125, -0.720123291015625, -0.67724609375, -0.634368896484375, -0.59149169921875, -0.548614501953125, -0.5057373046875, -0.462860107421875, -0.41998291015625, -0.377105712890625, -0.334228515625, -0.291351318359375, -0.24847412109375, -0.205596923828125, -0.1627197265625, -0.119842529296875, -0.07696533203125, -0.034088134765625, 0.0087890625, 0.051666259765625, 0.09454345703125, 0.137420654296875, 0.1802978515625, 0.223175048828125, 0.26605224609375, 0.308929443359375, 0.351806640625, 0.394683837890625, 0.43756103515625, 0.480438232421875, 0.5233154296875, 0.566192626953125, 0.60906982421875, 0.651947021484375, 0.69482421875, 0.737701416015625, 0.78057861328125, 0.823455810546875, 0.8663330078125, 0.909210205078125, 0.95208740234375, 0.994964599609375, 1.037841796875, 1.080718994140625, 1.12359619140625, 1.166473388671875, 1.2093505859375, 1.252227783203125, 1.29510498046875, 1.337982177734375, 1.380859375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 13.0, 19.0, 18.0, 37.0, 49.0, 61.0, 116.0, 173.0, 274.0, 426.0, 801.0, 1574.0, 3218.0, 7855.0, 24748.0, 888202.0, 93343.0, 16556.0, 5688.0, 2476.0, 1178.0, 661.0, 373.0, 228.0, 138.0, 100.0, 61.0, 43.0, 33.0, 24.0, 10.0, 9.0, 16.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.36058807373046875, -0.3471527099609375, -0.33371734619140625, -0.320281982421875, -0.30684661865234375, -0.2934112548828125, -0.27997589111328125, -0.26654052734375, -0.25310516357421875, -0.2396697998046875, -0.22623443603515625, -0.212799072265625, -0.19936370849609375, -0.1859283447265625, -0.17249298095703125, -0.1590576171875, -0.14562225341796875, -0.1321868896484375, -0.11875152587890625, -0.105316162109375, -0.09188079833984375, -0.0784454345703125, -0.06501007080078125, -0.05157470703125, -0.03813934326171875, -0.0247039794921875, -0.01126861572265625, 0.002166748046875, 0.01560211181640625, 0.0290374755859375, 0.04247283935546875, 0.055908203125, 0.06934356689453125, 0.0827789306640625, 0.09621429443359375, 0.109649658203125, 0.12308502197265625, 0.1365203857421875, 0.14995574951171875, 0.16339111328125, 0.17682647705078125, 0.1902618408203125, 0.20369720458984375, 0.217132568359375, 0.23056793212890625, 0.2440032958984375, 0.25743865966796875, 0.2708740234375, 0.28430938720703125, 0.2977447509765625, 0.31118011474609375, 0.324615478515625, 0.33805084228515625, 0.3514862060546875, 0.36492156982421875, 0.37835693359375, 0.39179229736328125, 0.4052276611328125, 0.41866302490234375, 0.432098388671875, 0.44553375244140625, 0.4589691162109375, 0.47240447998046875, 0.48583984375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 7.0, 6.0, 5.0, 5.0, 4.0, 14.0, 12.0, 20.0, 17.0, 10.0, 20.0, 33.0, 23.0, 33.0, 40.0, 47.0, 52.0, 45.0, 52.0, 42.0, 56.0, 41.0, 49.0, 32.0, 43.0, 34.0, 36.0, 22.0, 28.0, 30.0, 26.0, 18.0, 21.0, 13.0, 5.0, 11.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0], "bins": [-3.552436828613281e-05, -3.449525684118271e-05, -3.3466145396232605e-05, -3.24370339512825e-05, -3.14079225063324e-05, -3.0378811061382294e-05, -2.934969961643219e-05, -2.8320588171482086e-05, -2.7291476726531982e-05, -2.626236528158188e-05, -2.5233253836631775e-05, -2.420414239168167e-05, -2.3175030946731567e-05, -2.2145919501781464e-05, -2.111680805683136e-05, -2.0087696611881256e-05, -1.9058585166931152e-05, -1.802947372198105e-05, -1.7000362277030945e-05, -1.597125083208084e-05, -1.4942139387130737e-05, -1.3913027942180634e-05, -1.288391649723053e-05, -1.1854805052280426e-05, -1.0825693607330322e-05, -9.796582162380219e-06, -8.767470717430115e-06, -7.738359272480011e-06, -6.709247827529907e-06, -5.6801363825798035e-06, -4.6510249376297e-06, -3.621913492679596e-06, -2.592802047729492e-06, -1.5636906027793884e-06, -5.345791578292847e-07, 4.945322871208191e-07, 1.5236437320709229e-06, 2.5527551770210266e-06, 3.5818666219711304e-06, 4.610978066921234e-06, 5.640089511871338e-06, 6.669200956821442e-06, 7.698312401771545e-06, 8.72742384672165e-06, 9.756535291671753e-06, 1.0785646736621857e-05, 1.181475818157196e-05, 1.2843869626522064e-05, 1.3872981071472168e-05, 1.4902092516422272e-05, 1.5931203961372375e-05, 1.696031540632248e-05, 1.7989426851272583e-05, 1.9018538296222687e-05, 2.004764974117279e-05, 2.1076761186122894e-05, 2.2105872631072998e-05, 2.3134984076023102e-05, 2.4164095520973206e-05, 2.519320696592331e-05, 2.6222318410873413e-05, 2.7251429855823517e-05, 2.828054130077362e-05, 2.9309652745723724e-05, 3.0338764190673828e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 9.0, 10.0, 19.0, 17.0, 34.0, 40.0, 53.0, 88.0, 149.0, 160.0, 290.0, 409.0, 618.0, 961.0, 1615.0, 2530.0, 4381.0, 7540.0, 13486.0, 24816.0, 47368.0, 90314.0, 165173.0, 237697.0, 200850.0, 116604.0, 61069.0, 31787.0, 17113.0, 9409.0, 5472.0, 3112.0, 1890.0, 1208.0, 767.0, 506.0, 322.0, 198.0, 132.0, 116.0, 67.0, 37.0, 34.0, 19.0, 18.0, 12.0, 4.0, 6.0, 5.0, 9.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.082763671875, -0.08006763458251953, -0.07737159729003906, -0.0746755599975586, -0.07197952270507812, -0.06928348541259766, -0.06658744812011719, -0.06389141082763672, -0.06119537353515625, -0.05849933624267578, -0.05580329895019531, -0.053107261657714844, -0.050411224365234375, -0.047715187072753906, -0.04501914978027344, -0.04232311248779297, -0.0396270751953125, -0.03693103790283203, -0.03423500061035156, -0.031538963317871094, -0.028842926025390625, -0.026146888732910156, -0.023450851440429688, -0.02075481414794922, -0.01805877685546875, -0.015362739562988281, -0.012666702270507812, -0.009970664978027344, -0.007274627685546875, -0.004578590393066406, -0.0018825531005859375, 0.0008134841918945312, 0.003509521484375, 0.006205558776855469, 0.008901596069335938, 0.011597633361816406, 0.014293670654296875, 0.016989707946777344, 0.019685745239257812, 0.02238178253173828, 0.02507781982421875, 0.02777385711669922, 0.030469894409179688, 0.033165931701660156, 0.035861968994140625, 0.038558006286621094, 0.04125404357910156, 0.04395008087158203, 0.0466461181640625, 0.04934215545654297, 0.05203819274902344, 0.054734230041503906, 0.057430267333984375, 0.060126304626464844, 0.06282234191894531, 0.06551837921142578, 0.06821441650390625, 0.07091045379638672, 0.07360649108886719, 0.07630252838134766, 0.07899856567382812, 0.0816946029663086, 0.08439064025878906, 0.08708667755126953, 0.08978271484375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 5.0, 3.0, 11.0, 8.0, 9.0, 10.0, 17.0, 30.0, 26.0, 33.0, 39.0, 56.0, 67.0, 69.0, 88.0, 79.0, 95.0, 79.0, 70.0, 49.0, 30.0, 35.0, 16.0, 33.0, 5.0, 12.0, 5.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0224761962890625, -0.021753787994384766, -0.02103137969970703, -0.020308971405029297, -0.019586563110351562, -0.018864154815673828, -0.018141746520996094, -0.01741933822631836, -0.016696929931640625, -0.01597452163696289, -0.015252113342285156, -0.014529705047607422, -0.013807296752929688, -0.013084888458251953, -0.012362480163574219, -0.011640071868896484, -0.01091766357421875, -0.010195255279541016, -0.009472846984863281, -0.008750438690185547, -0.008028030395507812, -0.007305622100830078, -0.006583213806152344, -0.005860805511474609, -0.005138397216796875, -0.004415988922119141, -0.0036935806274414062, -0.002971172332763672, -0.0022487640380859375, -0.0015263557434082031, -0.0008039474487304688, -8.153915405273438e-05, 0.000640869140625, 0.0013632774353027344, 0.0020856857299804688, 0.002808094024658203, 0.0035305023193359375, 0.004252910614013672, 0.004975318908691406, 0.005697727203369141, 0.006420135498046875, 0.007142543792724609, 0.007864952087402344, 0.008587360382080078, 0.009309768676757812, 0.010032176971435547, 0.010754585266113281, 0.011476993560791016, 0.01219940185546875, 0.012921810150146484, 0.013644218444824219, 0.014366626739501953, 0.015089035034179688, 0.015811443328857422, 0.016533851623535156, 0.01725625991821289, 0.017978668212890625, 0.01870107650756836, 0.019423484802246094, 0.020145893096923828, 0.020868301391601562, 0.021590709686279297, 0.02231311798095703, 0.023035526275634766, 0.0237579345703125]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 8.0, 10.0, 10.0, 16.0, 19.0, 20.0, 35.0, 50.0, 63.0, 71.0, 95.0, 79.0, 86.0, 92.0, 76.0, 53.0, 60.0, 44.0, 25.0, 23.0, 20.0, 12.0, 9.0, 6.0, 7.0, 1.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.76797342300415, -7.5797271728515625, -7.391481399536133, -7.203235149383545, -7.014988899230957, -6.826742649078369, -6.638496398925781, -6.450250625610352, -6.262004375457764, -6.073758125305176, -5.885512351989746, -5.697266101837158, -5.50901985168457, -5.320773601531982, -5.1325273513793945, -4.944281578063965, -4.756035327911377, -4.567789077758789, -4.379543304443359, -4.1912970542907715, -4.003050804138184, -3.8148045539855957, -3.626558542251587, -3.438312530517578, -3.2500662803649902, -3.0618200302124023, -2.8735740184783936, -2.6853280067443848, -2.497081756591797, -2.308835506439209, -2.1205894947052, -1.9323433637619019, -1.7440977096557617, -1.5558515787124634, -1.367605447769165, -1.1793593168258667, -0.9911131858825684, -0.80286705493927, -0.6146209239959717, -0.42637479305267334, -0.238128662109375, -0.04988253116607666, 0.13836359977722168, 0.32660973072052, 0.5148558616638184, 0.7031019926071167, 0.891348123550415, 1.0795942544937134, 1.2678403854370117, 1.45608651638031, 1.6443326473236084, 1.8325787782669067, 2.020824909210205, 2.209071159362793, 2.3973171710968018, 2.5855631828308105, 2.7738094329833984, 2.9620556831359863, 3.150301694869995, 3.338547706604004, 3.526793956756592, 3.7150402069091797, 3.9032862186431885, 4.091532230377197, 4.279778480529785]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 8.0, 6.0, 14.0, 12.0, 14.0, 23.0, 23.0, 18.0, 24.0, 22.0, 29.0, 32.0, 28.0, 44.0, 41.0, 36.0, 37.0, 47.0, 43.0, 40.0, 34.0, 32.0, 46.0, 43.0, 36.0, 41.0, 30.0, 28.0, 21.0, 21.0, 21.0, 13.0, 18.0, 14.0, 8.0, 13.0, 10.0, 5.0, 4.0, 8.0, 2.0, 6.0, 3.0, 0.0, 3.0, 2.0], "bins": [-2.200934886932373, -2.141292095184326, -2.0816493034362793, -2.0220065116882324, -1.962363839149475, -1.9027210474014282, -1.8430782556533813, -1.7834354639053345, -1.7237927913665771, -1.6641499996185303, -1.6045072078704834, -1.5448644161224365, -1.4852217435836792, -1.4255789518356323, -1.3659361600875854, -1.3062933683395386, -1.2466505765914917, -1.1870077848434448, -1.127364993095398, -1.0677223205566406, -1.0080795288085938, -0.9484367370605469, -0.8887939453125, -0.8291511535644531, -0.769508421421051, -0.7098656296730042, -0.650222897529602, -0.5905801057815552, -0.5309373140335083, -0.4712945818901062, -0.4116517901420593, -0.35200902819633484, -0.2923663854598999, -0.23272362351417542, -0.17308084666728973, -0.11343806982040405, -0.053795307874679565, 0.005847454071044922, 0.0654902458190918, 0.12513300776481628, 0.18477576971054077, 0.24441853165626526, 0.30406129360198975, 0.3637040853500366, 0.4233468472957611, 0.4829896092414856, 0.5426324009895325, 0.6022751331329346, 0.6619179248809814, 0.7215607166290283, 0.7812034487724304, 0.8408462405204773, 0.9004889726638794, 0.9601317644119263, 1.0197745561599731, 1.07941734790802, 1.1390600204467773, 1.1987028121948242, 1.258345603942871, 1.317988395690918, 1.3776310682296753, 1.4372738599777222, 1.496916651725769, 1.556559443473816, 1.6162022352218628]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 6.0, 18.0, 22.0, 26.0, 30.0, 56.0, 108.0, 183.0, 315.0, 472.0, 717.0, 1156.0, 1993.0, 3203.0, 5447.0, 8809.0, 14767.0, 24315.0, 39148.0, 61162.0, 90567.0, 122147.0, 143693.0, 145157.0, 123860.0, 92996.0, 63414.0, 40142.0, 25287.0, 15660.0, 9342.0, 5619.0, 3415.0, 2149.0, 1272.0, 708.0, 406.0, 270.0, 182.0, 121.0, 75.0, 39.0, 21.0, 22.0, 15.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.24609375, -2.175994873046875, -2.10589599609375, -2.035797119140625, -1.9656982421875, -1.895599365234375, -1.82550048828125, -1.755401611328125, -1.685302734375, -1.615203857421875, -1.54510498046875, -1.475006103515625, -1.4049072265625, -1.334808349609375, -1.26470947265625, -1.194610595703125, -1.12451171875, -1.054412841796875, -0.98431396484375, -0.914215087890625, -0.8441162109375, -0.774017333984375, -0.70391845703125, -0.633819580078125, -0.563720703125, -0.493621826171875, -0.42352294921875, -0.353424072265625, -0.2833251953125, -0.213226318359375, -0.14312744140625, -0.073028564453125, -0.0029296875, 0.067169189453125, 0.13726806640625, 0.207366943359375, 0.2774658203125, 0.347564697265625, 0.41766357421875, 0.487762451171875, 0.557861328125, 0.627960205078125, 0.69805908203125, 0.768157958984375, 0.8382568359375, 0.908355712890625, 0.97845458984375, 1.048553466796875, 1.11865234375, 1.188751220703125, 1.25885009765625, 1.328948974609375, 1.3990478515625, 1.469146728515625, 1.53924560546875, 1.609344482421875, 1.679443359375, 1.749542236328125, 1.81964111328125, 1.889739990234375, 1.9598388671875, 2.029937744140625, 2.10003662109375, 2.170135498046875, 2.240234375]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 11.0, 8.0, 13.0, 12.0, 11.0, 9.0, 11.0, 24.0, 17.0, 25.0, 33.0, 30.0, 42.0, 24.0, 36.0, 29.0, 40.0, 32.0, 49.0, 45.0, 39.0, 46.0, 39.0, 49.0, 42.0, 32.0, 32.0, 26.0, 24.0, 32.0, 19.0, 18.0, 17.0, 14.0, 15.0, 9.0, 9.0, 7.0, 7.0, 2.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.341796875, -2.27349853515625, -2.2052001953125, -2.13690185546875, -2.068603515625, -2.00030517578125, -1.9320068359375, -1.86370849609375, -1.79541015625, -1.72711181640625, -1.6588134765625, -1.59051513671875, -1.522216796875, -1.45391845703125, -1.3856201171875, -1.31732177734375, -1.2490234375, -1.18072509765625, -1.1124267578125, -1.04412841796875, -0.975830078125, -0.90753173828125, -0.8392333984375, -0.77093505859375, -0.70263671875, -0.63433837890625, -0.5660400390625, -0.49774169921875, -0.429443359375, -0.36114501953125, -0.2928466796875, -0.22454833984375, -0.15625, -0.08795166015625, -0.0196533203125, 0.04864501953125, 0.116943359375, 0.18524169921875, 0.2535400390625, 0.32183837890625, 0.39013671875, 0.45843505859375, 0.5267333984375, 0.59503173828125, 0.663330078125, 0.73162841796875, 0.7999267578125, 0.86822509765625, 0.9365234375, 1.00482177734375, 1.0731201171875, 1.14141845703125, 1.209716796875, 1.27801513671875, 1.3463134765625, 1.41461181640625, 1.48291015625, 1.55120849609375, 1.6195068359375, 1.68780517578125, 1.756103515625, 1.82440185546875, 1.8927001953125, 1.96099853515625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 11.0, 24.0, 25.0, 37.0, 66.0, 108.0, 194.0, 271.0, 498.0, 773.0, 1300.0, 2156.0, 3589.0, 5979.0, 9990.0, 17235.0, 28268.0, 45354.0, 71001.0, 104484.0, 136716.0, 152765.0, 142265.0, 113275.0, 79743.0, 52043.0, 32112.0, 19446.0, 11701.0, 6750.0, 4192.0, 2370.0, 1476.0, 914.0, 555.0, 326.0, 198.0, 105.0, 78.0, 55.0, 37.0, 24.0, 15.0, 12.0, 4.0, 1.0, 4.0, 3.0], "bins": [-2.876953125, -2.800506591796875, -2.72406005859375, -2.647613525390625, -2.5711669921875, -2.494720458984375, -2.41827392578125, -2.341827392578125, -2.265380859375, -2.188934326171875, -2.11248779296875, -2.036041259765625, -1.9595947265625, -1.883148193359375, -1.80670166015625, -1.730255126953125, -1.65380859375, -1.577362060546875, -1.50091552734375, -1.424468994140625, -1.3480224609375, -1.271575927734375, -1.19512939453125, -1.118682861328125, -1.042236328125, -0.965789794921875, -0.88934326171875, -0.812896728515625, -0.7364501953125, -0.660003662109375, -0.58355712890625, -0.507110595703125, -0.4306640625, -0.354217529296875, -0.27777099609375, -0.201324462890625, -0.1248779296875, -0.048431396484375, 0.02801513671875, 0.104461669921875, 0.180908203125, 0.257354736328125, 0.33380126953125, 0.410247802734375, 0.4866943359375, 0.563140869140625, 0.63958740234375, 0.716033935546875, 0.79248046875, 0.868927001953125, 0.94537353515625, 1.021820068359375, 1.0982666015625, 1.174713134765625, 1.25115966796875, 1.327606201171875, 1.404052734375, 1.480499267578125, 1.55694580078125, 1.633392333984375, 1.7098388671875, 1.786285400390625, 1.86273193359375, 1.939178466796875, 2.015625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 8.0, 13.0, 11.0, 17.0, 21.0, 15.0, 32.0, 27.0, 24.0, 29.0, 42.0, 36.0, 43.0, 36.0, 27.0, 43.0, 54.0, 48.0, 38.0, 52.0, 42.0, 39.0, 35.0, 26.0, 34.0, 25.0, 25.0, 31.0, 27.0, 20.0, 12.0, 10.0, 10.0, 3.0, 10.0, 6.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5126953125, -1.4666748046875, -1.420654296875, -1.3746337890625, -1.32861328125, -1.2825927734375, -1.236572265625, -1.1905517578125, -1.14453125, -1.0985107421875, -1.052490234375, -1.0064697265625, -0.96044921875, -0.9144287109375, -0.868408203125, -0.8223876953125, -0.7763671875, -0.7303466796875, -0.684326171875, -0.6383056640625, -0.59228515625, -0.5462646484375, -0.500244140625, -0.4542236328125, -0.408203125, -0.3621826171875, -0.316162109375, -0.2701416015625, -0.22412109375, -0.1781005859375, -0.132080078125, -0.0860595703125, -0.0400390625, 0.0059814453125, 0.052001953125, 0.0980224609375, 0.14404296875, 0.1900634765625, 0.236083984375, 0.2821044921875, 0.328125, 0.3741455078125, 0.420166015625, 0.4661865234375, 0.51220703125, 0.5582275390625, 0.604248046875, 0.6502685546875, 0.6962890625, 0.7423095703125, 0.788330078125, 0.8343505859375, 0.88037109375, 0.9263916015625, 0.972412109375, 1.0184326171875, 1.064453125, 1.1104736328125, 1.156494140625, 1.2025146484375, 1.24853515625, 1.2945556640625, 1.340576171875, 1.3865966796875, 1.4326171875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 18.0, 22.0, 19.0, 44.0, 56.0, 77.0, 137.0, 182.0, 253.0, 404.0, 559.0, 915.0, 1305.0, 2045.0, 3171.0, 5291.0, 8580.0, 14272.0, 24335.0, 42283.0, 71904.0, 116646.0, 163621.0, 181668.0, 153042.0, 103390.0, 62840.0, 37000.0, 21404.0, 12633.0, 7488.0, 4469.0, 2871.0, 1857.0, 1222.0, 862.0, 528.0, 381.0, 219.0, 188.0, 119.0, 65.0, 50.0, 37.0, 28.0, 12.0, 11.0, 7.0, 6.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.44921875, -1.4015045166015625, -1.353790283203125, -1.3060760498046875, -1.25836181640625, -1.2106475830078125, -1.162933349609375, -1.1152191162109375, -1.0675048828125, -1.0197906494140625, -0.972076416015625, -0.9243621826171875, -0.87664794921875, -0.8289337158203125, -0.781219482421875, -0.7335052490234375, -0.685791015625, -0.6380767822265625, -0.590362548828125, -0.5426483154296875, -0.49493408203125, -0.4472198486328125, -0.399505615234375, -0.3517913818359375, -0.3040771484375, -0.2563629150390625, -0.208648681640625, -0.1609344482421875, -0.11322021484375, -0.0655059814453125, -0.017791748046875, 0.0299224853515625, 0.07763671875, 0.1253509521484375, 0.173065185546875, 0.2207794189453125, 0.26849365234375, 0.3162078857421875, 0.363922119140625, 0.4116363525390625, 0.4593505859375, 0.5070648193359375, 0.554779052734375, 0.6024932861328125, 0.65020751953125, 0.6979217529296875, 0.745635986328125, 0.7933502197265625, 0.841064453125, 0.8887786865234375, 0.936492919921875, 0.9842071533203125, 1.03192138671875, 1.0796356201171875, 1.127349853515625, 1.1750640869140625, 1.2227783203125, 1.2704925537109375, 1.318206787109375, 1.3659210205078125, 1.41363525390625, 1.4613494873046875, 1.509063720703125, 1.5567779541015625, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 11.0, 6.0, 21.0, 13.0, 25.0, 32.0, 37.0, 50.0, 50.0, 62.0, 63.0, 56.0, 79.0, 73.0, 71.0, 62.0, 42.0, 48.0, 41.0, 38.0, 24.0, 25.0, 11.0, 10.0, 7.0, 11.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015425682067871094, -0.0001490432769060135, -0.00014382973313331604, -0.0001386161893606186, -0.00013340264558792114, -0.0001281891018152237, -0.00012297555804252625, -0.0001177620142698288, -0.00011254847049713135, -0.0001073349267244339, -0.00010212138295173645, -9.6907839179039e-05, -9.169429540634155e-05, -8.64807516336441e-05, -8.126720786094666e-05, -7.60536640882492e-05, -7.084012031555176e-05, -6.562657654285431e-05, -6.041303277015686e-05, -5.519948899745941e-05, -4.998594522476196e-05, -4.4772401452064514e-05, -3.9558857679367065e-05, -3.434531390666962e-05, -2.9131770133972168e-05, -2.391822636127472e-05, -1.870468258857727e-05, -1.3491138815879822e-05, -8.277595043182373e-06, -3.0640512704849243e-06, 2.1494925022125244e-06, 7.363036274909973e-06, 1.2576580047607422e-05, 1.779012382030487e-05, 2.300366759300232e-05, 2.8217211365699768e-05, 3.343075513839722e-05, 3.8644298911094666e-05, 4.3857842683792114e-05, 4.907138645648956e-05, 5.428493022918701e-05, 5.949847400188446e-05, 6.471201777458191e-05, 6.992556154727936e-05, 7.51391053199768e-05, 8.035264909267426e-05, 8.55661928653717e-05, 9.077973663806915e-05, 9.59932804107666e-05, 0.00010120682418346405, 0.0001064203679561615, 0.00011163391172885895, 0.0001168474555015564, 0.00012206099927425385, 0.0001272745430469513, 0.00013248808681964874, 0.0001377016305923462, 0.00014291517436504364, 0.0001481287181377411, 0.00015334226191043854, 0.00015855580568313599, 0.00016376934945583344, 0.00016898289322853088, 0.00017419643700122833, 0.00017940998077392578]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 12.0, 28.0, 21.0, 50.0, 65.0, 89.0, 170.0, 259.0, 365.0, 624.0, 937.0, 1558.0, 2574.0, 4229.0, 7426.0, 13417.0, 24421.0, 43942.0, 78330.0, 128056.0, 178636.0, 190180.0, 150247.0, 96743.0, 55915.0, 30554.0, 16522.0, 9376.0, 5512.0, 3145.0, 1929.0, 1162.0, 710.0, 469.0, 298.0, 205.0, 104.0, 91.0, 56.0, 34.0, 18.0, 12.0, 13.0, 10.0, 9.0, 8.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4453125, -1.39898681640625, -1.3526611328125, -1.30633544921875, -1.260009765625, -1.21368408203125, -1.1673583984375, -1.12103271484375, -1.07470703125, -1.02838134765625, -0.9820556640625, -0.93572998046875, -0.889404296875, -0.84307861328125, -0.7967529296875, -0.75042724609375, -0.7041015625, -0.65777587890625, -0.6114501953125, -0.56512451171875, -0.518798828125, -0.47247314453125, -0.4261474609375, -0.37982177734375, -0.33349609375, -0.28717041015625, -0.2408447265625, -0.19451904296875, -0.148193359375, -0.10186767578125, -0.0555419921875, -0.00921630859375, 0.037109375, 0.08343505859375, 0.1297607421875, 0.17608642578125, 0.222412109375, 0.26873779296875, 0.3150634765625, 0.36138916015625, 0.40771484375, 0.45404052734375, 0.5003662109375, 0.54669189453125, 0.593017578125, 0.63934326171875, 0.6856689453125, 0.73199462890625, 0.7783203125, 0.82464599609375, 0.8709716796875, 0.91729736328125, 0.963623046875, 1.00994873046875, 1.0562744140625, 1.10260009765625, 1.14892578125, 1.19525146484375, 1.2415771484375, 1.28790283203125, 1.334228515625, 1.38055419921875, 1.4268798828125, 1.47320556640625, 1.51953125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 2.0, 3.0, 9.0, 10.0, 15.0, 14.0, 16.0, 15.0, 25.0, 33.0, 20.0, 45.0, 40.0, 72.0, 68.0, 52.0, 62.0, 77.0, 68.0, 55.0, 46.0, 51.0, 44.0, 31.0, 24.0, 23.0, 18.0, 7.0, 12.0, 7.0, 3.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41357421875, -0.4009056091308594, -0.38823699951171875, -0.3755683898925781, -0.3628997802734375, -0.3502311706542969, -0.33756256103515625, -0.3248939514160156, -0.312225341796875, -0.2995567321777344, -0.28688812255859375, -0.2742195129394531, -0.2615509033203125, -0.24888229370117188, -0.23621368408203125, -0.22354507446289062, -0.21087646484375, -0.19820785522460938, -0.18553924560546875, -0.17287063598632812, -0.1602020263671875, -0.14753341674804688, -0.13486480712890625, -0.12219619750976562, -0.109527587890625, -0.09685897827148438, -0.08419036865234375, -0.07152175903320312, -0.0588531494140625, -0.046184539794921875, -0.03351593017578125, -0.020847320556640625, -0.0081787109375, 0.004489898681640625, 0.01715850830078125, 0.029827117919921875, 0.0424957275390625, 0.055164337158203125, 0.06783294677734375, 0.08050155639648438, 0.093170166015625, 0.10583877563476562, 0.11850738525390625, 0.13117599487304688, 0.1438446044921875, 0.15651321411132812, 0.16918182373046875, 0.18185043334960938, 0.19451904296875, 0.20718765258789062, 0.21985626220703125, 0.23252487182617188, 0.2451934814453125, 0.2578620910644531, 0.27053070068359375, 0.2831993103027344, 0.295867919921875, 0.3085365295410156, 0.32120513916015625, 0.3338737487792969, 0.3465423583984375, 0.3592109680175781, 0.37187957763671875, 0.3845481872558594, 0.397216796875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 7.0, 8.0, 8.0, 27.0, 19.0, 37.0, 32.0, 51.0, 69.0, 80.0, 92.0, 104.0, 77.0, 83.0, 72.0, 65.0, 35.0, 32.0, 28.0, 17.0, 21.0, 13.0, 4.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.787813186645508, -7.59655237197876, -7.40529203414917, -7.214031219482422, -7.022770881652832, -6.831510066986084, -6.640249252319336, -6.448988914489746, -6.257728576660156, -6.066467761993408, -5.875207424163818, -5.68394660949707, -5.4926862716674805, -5.301425457000732, -5.110164642333984, -4.9189043045043945, -4.7276434898376465, -4.536382675170898, -4.345122337341309, -4.1538615226745605, -3.9626011848449707, -3.7713403701782227, -3.5800797939300537, -3.3888192176818848, -3.197558641433716, -3.006298065185547, -2.815037488937378, -2.623776912689209, -2.432516098022461, -2.241255760192871, -2.049994945526123, -1.858734369277954, -1.667473316192627, -1.476212739944458, -1.284952163696289, -1.0936914682388306, -0.9024308919906616, -0.7111703157424927, -0.5199096202850342, -0.32864904403686523, -0.1373884677886963, 0.053872138261795044, 0.24513274431228638, 0.4363933801651001, 0.627653956413269, 0.818914532661438, 1.0101752281188965, 1.2014358043670654, 1.3926963806152344, 1.5839569568634033, 1.7752175331115723, 1.9664782285690308, 2.15773868560791, 2.348999500274658, 2.540260076522827, 2.731520652770996, 2.922781229019165, 3.114041805267334, 3.305302381515503, 3.496562957763672, 3.68782377243042, 3.8790841102600098, 4.070344924926758, 4.261605262756348, 4.452866077423096]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 11.0, 10.0, 10.0, 13.0, 17.0, 17.0, 19.0, 18.0, 21.0, 33.0, 34.0, 29.0, 30.0, 37.0, 25.0, 37.0, 36.0, 42.0, 46.0, 46.0, 35.0, 39.0, 33.0, 33.0, 34.0, 22.0, 33.0, 16.0, 28.0, 27.0, 18.0, 23.0, 14.0, 16.0, 9.0, 19.0, 10.0, 17.0, 12.0, 6.0, 3.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-2.103912353515625, -2.04496431350708, -1.9860161542892456, -1.9270681142807007, -1.8681199550628662, -1.8091719150543213, -1.7502238750457764, -1.6912758350372314, -1.632327675819397, -1.573379635810852, -1.5144314765930176, -1.4554834365844727, -1.3965353965759277, -1.3375872373580933, -1.2786391973495483, -1.2196910381317139, -1.160742998123169, -1.101794958114624, -1.0428467988967896, -0.9838987588882446, -0.9249506592750549, -0.8660025596618652, -0.8070545196533203, -0.7481064200401306, -0.6891583204269409, -0.6302102208137512, -0.5712621212005615, -0.5123140811920166, -0.4533659815788269, -0.3944178819656372, -0.3354698121547699, -0.2765217423439026, -0.21757376194000244, -0.15862567722797394, -0.09967759251594543, -0.04072950780391693, 0.018218576908111572, 0.07716667652130127, 0.13611474633216858, 0.1950628161430359, 0.2540109157562256, 0.3129590153694153, 0.3719070851802826, 0.4308551549911499, 0.4898032546043396, 0.5487513542175293, 0.6076993942260742, 0.6666474938392639, 0.7255955934524536, 0.7845436930656433, 0.843491792678833, 0.9024398326873779, 0.9613879323005676, 1.0203360319137573, 1.0792840719223022, 1.1382322311401367, 1.1971802711486816, 1.2561283111572266, 1.315076470375061, 1.374024510383606, 1.4329726696014404, 1.4919207096099854, 1.5508687496185303, 1.6098167896270752, 1.6687649488449097]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 2.0, 10.0, 22.0, 25.0, 44.0, 76.0, 117.0, 191.0, 276.0, 462.0, 806.0, 1383.0, 2191.0, 3634.0, 6327.0, 11467.0, 20756.0, 39748.0, 81050.0, 178953.0, 436498.0, 997004.0, 1223554.0, 672831.0, 278304.0, 120663.0, 57059.0, 28288.0, 14712.0, 7811.0, 4306.0, 2382.0, 1377.0, 806.0, 441.0, 278.0, 170.0, 98.0, 50.0, 36.0, 25.0, 23.0, 5.0, 5.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.26519775390625, -4.1241455078125, -3.98309326171875, -3.842041015625, -3.70098876953125, -3.5599365234375, -3.41888427734375, -3.27783203125, -3.13677978515625, -2.9957275390625, -2.85467529296875, -2.713623046875, -2.57257080078125, -2.4315185546875, -2.29046630859375, -2.1494140625, -2.00836181640625, -1.8673095703125, -1.72625732421875, -1.585205078125, -1.44415283203125, -1.3031005859375, -1.16204833984375, -1.02099609375, -0.87994384765625, -0.7388916015625, -0.59783935546875, -0.456787109375, -0.31573486328125, -0.1746826171875, -0.03363037109375, 0.107421875, 0.24847412109375, 0.3895263671875, 0.53057861328125, 0.671630859375, 0.81268310546875, 0.9537353515625, 1.09478759765625, 1.23583984375, 1.37689208984375, 1.5179443359375, 1.65899658203125, 1.800048828125, 1.94110107421875, 2.0821533203125, 2.22320556640625, 2.3642578125, 2.50531005859375, 2.6463623046875, 2.78741455078125, 2.928466796875, 3.06951904296875, 3.2105712890625, 3.35162353515625, 3.49267578125, 3.63372802734375, 3.7747802734375, 3.91583251953125, 4.056884765625, 4.19793701171875, 4.3389892578125, 4.48004150390625, 4.62109375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 4.0, 5.0, 6.0, 22.0, 12.0, 19.0, 27.0, 25.0, 29.0, 26.0, 39.0, 38.0, 36.0, 43.0, 31.0, 44.0, 35.0, 36.0, 54.0, 35.0, 52.0, 49.0, 40.0, 23.0, 38.0, 37.0, 30.0, 21.0, 21.0, 35.0, 15.0, 9.0, 10.0, 6.0, 12.0, 6.0, 6.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.078125, -2.019866943359375, -1.96160888671875, -1.903350830078125, -1.8450927734375, -1.786834716796875, -1.72857666015625, -1.670318603515625, -1.612060546875, -1.553802490234375, -1.49554443359375, -1.437286376953125, -1.3790283203125, -1.320770263671875, -1.26251220703125, -1.204254150390625, -1.14599609375, -1.087738037109375, -1.02947998046875, -0.971221923828125, -0.9129638671875, -0.854705810546875, -0.79644775390625, -0.738189697265625, -0.679931640625, -0.621673583984375, -0.56341552734375, -0.505157470703125, -0.4468994140625, -0.388641357421875, -0.33038330078125, -0.272125244140625, -0.2138671875, -0.155609130859375, -0.09735107421875, -0.039093017578125, 0.0191650390625, 0.077423095703125, 0.13568115234375, 0.193939208984375, 0.252197265625, 0.310455322265625, 0.36871337890625, 0.426971435546875, 0.4852294921875, 0.543487548828125, 0.60174560546875, 0.660003662109375, 0.71826171875, 0.776519775390625, 0.83477783203125, 0.893035888671875, 0.9512939453125, 1.009552001953125, 1.06781005859375, 1.126068115234375, 1.184326171875, 1.242584228515625, 1.30084228515625, 1.359100341796875, 1.4173583984375, 1.475616455078125, 1.53387451171875, 1.592132568359375, 1.650390625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 11.0, 14.0, 27.0, 40.0, 45.0, 85.0, 134.0, 227.0, 335.0, 582.0, 967.0, 1473.0, 2510.0, 4315.0, 7428.0, 13143.0, 24089.0, 44776.0, 86996.0, 171692.0, 352864.0, 693910.0, 1039472.0, 840922.0, 451720.0, 221802.0, 110664.0, 56175.0, 29964.0, 16329.0, 9061.0, 4959.0, 3030.0, 1818.0, 1090.0, 646.0, 337.0, 231.0, 144.0, 103.0, 64.0, 32.0, 28.0, 10.0, 6.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.16015625, -4.0245361328125, -3.888916015625, -3.7532958984375, -3.61767578125, -3.4820556640625, -3.346435546875, -3.2108154296875, -3.0751953125, -2.9395751953125, -2.803955078125, -2.6683349609375, -2.53271484375, -2.3970947265625, -2.261474609375, -2.1258544921875, -1.990234375, -1.8546142578125, -1.718994140625, -1.5833740234375, -1.44775390625, -1.3121337890625, -1.176513671875, -1.0408935546875, -0.9052734375, -0.7696533203125, -0.634033203125, -0.4984130859375, -0.36279296875, -0.2271728515625, -0.091552734375, 0.0440673828125, 0.1796875, 0.3153076171875, 0.450927734375, 0.5865478515625, 0.72216796875, 0.8577880859375, 0.993408203125, 1.1290283203125, 1.2646484375, 1.4002685546875, 1.535888671875, 1.6715087890625, 1.80712890625, 1.9427490234375, 2.078369140625, 2.2139892578125, 2.349609375, 2.4852294921875, 2.620849609375, 2.7564697265625, 2.89208984375, 3.0277099609375, 3.163330078125, 3.2989501953125, 3.4345703125, 3.5701904296875, 3.705810546875, 3.8414306640625, 3.97705078125, 4.1126708984375, 4.248291015625, 4.3839111328125, 4.51953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 11.0, 11.0, 14.0, 20.0, 32.0, 33.0, 47.0, 68.0, 81.0, 97.0, 99.0, 135.0, 137.0, 181.0, 201.0, 219.0, 245.0, 230.0, 285.0, 258.0, 215.0, 241.0, 199.0, 165.0, 136.0, 137.0, 100.0, 87.0, 84.0, 71.0, 52.0, 40.0, 23.0, 15.0, 23.0, 17.0, 6.0, 9.0, 6.0, 6.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.99072265625, -0.9569778442382812, -0.9232330322265625, -0.8894882202148438, -0.855743408203125, -0.8219985961914062, -0.7882537841796875, -0.7545089721679688, -0.72076416015625, -0.6870193481445312, -0.6532745361328125, -0.6195297241210938, -0.585784912109375, -0.5520401000976562, -0.5182952880859375, -0.48455047607421875, -0.4508056640625, -0.41706085205078125, -0.3833160400390625, -0.34957122802734375, -0.315826416015625, -0.28208160400390625, -0.2483367919921875, -0.21459197998046875, -0.18084716796875, -0.14710235595703125, -0.1133575439453125, -0.07961273193359375, -0.045867919921875, -0.01212310791015625, 0.0216217041015625, 0.05536651611328125, 0.089111328125, 0.12285614013671875, 0.1566009521484375, 0.19034576416015625, 0.224090576171875, 0.25783538818359375, 0.2915802001953125, 0.32532501220703125, 0.35906982421875, 0.39281463623046875, 0.4265594482421875, 0.46030426025390625, 0.494049072265625, 0.5277938842773438, 0.5615386962890625, 0.5952835083007812, 0.6290283203125, 0.6627731323242188, 0.6965179443359375, 0.7302627563476562, 0.764007568359375, 0.7977523803710938, 0.8314971923828125, 0.8652420043945312, 0.89898681640625, 0.9327316284179688, 0.9664764404296875, 1.0002212524414062, 1.033966064453125, 1.0677108764648438, 1.1014556884765625, 1.1352005004882812, 1.1689453125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 12.0, 14.0, 12.0, 16.0, 16.0, 25.0, 49.0, 47.0, 55.0, 70.0, 64.0, 74.0, 84.0, 74.0, 80.0, 68.0, 57.0, 26.0, 30.0, 21.0, 25.0, 19.0, 8.0, 13.0, 14.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.886803150177002, -6.720529079437256, -6.554255485534668, -6.387981414794922, -6.221707344055176, -6.05543327331543, -5.889159202575684, -5.722885608673096, -5.55661153793335, -5.3903374671936035, -5.224063873291016, -5.0577898025512695, -4.891515731811523, -4.725241661071777, -4.558967590332031, -4.392693996429443, -4.226419925689697, -4.060145854949951, -3.893872022628784, -3.727598190307617, -3.561324119567871, -3.395050048828125, -3.228776216506958, -3.062502384185791, -2.896228313446045, -2.729954242706299, -2.563680410385132, -2.397406578063965, -2.2311325073242188, -2.0648584365844727, -1.8985846042633057, -1.7323106527328491, -1.5660364627838135, -1.399762511253357, -1.2334885597229004, -1.0672146081924438, -0.9009406566619873, -0.7346667051315308, -0.5683927536010742, -0.4021188020706177, -0.23584485054016113, -0.06957089900970459, 0.09670305252075195, 0.2629770040512085, 0.42925095558166504, 0.5955249071121216, 0.7617988586425781, 0.9280728101730347, 1.0943467617034912, 1.2606207132339478, 1.4268946647644043, 1.5931686162948608, 1.7594425678253174, 1.925716519355774, 2.0919904708862305, 2.2582645416259766, 2.4245383739471436, 2.5908122062683105, 2.7570862770080566, 2.9233603477478027, 3.0896341800689697, 3.2559080123901367, 3.422182083129883, 3.588456153869629, 3.754729986190796]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 4.0, 3.0, 5.0, 8.0, 4.0, 12.0, 20.0, 12.0, 25.0, 15.0, 20.0, 19.0, 26.0, 31.0, 31.0, 35.0, 33.0, 38.0, 50.0, 40.0, 32.0, 44.0, 44.0, 31.0, 42.0, 34.0, 29.0, 29.0, 20.0, 32.0, 25.0, 20.0, 19.0, 26.0, 20.0, 17.0, 14.0, 18.0, 11.0, 11.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8708324432373047, -1.8121438026428223, -1.7534551620483398, -1.6947665214538574, -1.636077880859375, -1.5773892402648926, -1.5187007188796997, -1.4600120782852173, -1.4013234376907349, -1.3426347970962524, -1.28394615650177, -1.2252575159072876, -1.1665689945220947, -1.1078803539276123, -1.0491917133331299, -0.9905030727386475, -0.931814432144165, -0.8731257915496826, -0.8144371509552002, -0.7557485699653625, -0.6970599293708801, -0.6383712887763977, -0.5796827077865601, -0.5209940671920776, -0.4623054265975952, -0.4036167860031128, -0.34492817521095276, -0.2862395644187927, -0.2275509238243103, -0.16886228322982788, -0.11017367243766785, -0.05148506164550781, 0.00720369815826416, 0.06589232385158539, 0.12458094954490662, 0.18326957523822784, 0.24195820093154907, 0.3006468415260315, 0.35933545231819153, 0.41802406311035156, 0.476712703704834, 0.5354013442993164, 0.5940899848937988, 0.6527785658836365, 0.7114672064781189, 0.7701558470726013, 0.828844428062439, 0.8875330686569214, 0.9462217092514038, 1.0049103498458862, 1.0635989904403687, 1.122287631034851, 1.180976152420044, 1.2396647930145264, 1.2983534336090088, 1.3570420742034912, 1.4157307147979736, 1.474419355392456, 1.5331079959869385, 1.591796636581421, 1.6504852771759033, 1.7091739177703857, 1.7678624391555786, 1.826551079750061, 1.8852397203445435]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 8.0, 15.0, 22.0, 37.0, 46.0, 98.0, 126.0, 216.0, 317.0, 495.0, 790.0, 1301.0, 2005.0, 3435.0, 5767.0, 10168.0, 18038.0, 32493.0, 58886.0, 105221.0, 169738.0, 210826.0, 175578.0, 111063.0, 62661.0, 34362.0, 19025.0, 10695.0, 5939.0, 3474.0, 2229.0, 1299.0, 751.0, 529.0, 307.0, 216.0, 148.0, 79.0, 44.0, 35.0, 17.0, 16.0, 12.0, 14.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.328125, -0.31862640380859375, -0.3091278076171875, -0.29962921142578125, -0.290130615234375, -0.28063201904296875, -0.2711334228515625, -0.26163482666015625, -0.25213623046875, -0.24263763427734375, -0.2331390380859375, -0.22364044189453125, -0.214141845703125, -0.20464324951171875, -0.1951446533203125, -0.18564605712890625, -0.1761474609375, -0.16664886474609375, -0.1571502685546875, -0.14765167236328125, -0.138153076171875, -0.12865447998046875, -0.1191558837890625, -0.10965728759765625, -0.10015869140625, -0.09066009521484375, -0.0811614990234375, -0.07166290283203125, -0.062164306640625, -0.05266571044921875, -0.0431671142578125, -0.03366851806640625, -0.024169921875, -0.01467132568359375, -0.0051727294921875, 0.00432586669921875, 0.013824462890625, 0.02332305908203125, 0.0328216552734375, 0.04232025146484375, 0.05181884765625, 0.06131744384765625, 0.0708160400390625, 0.08031463623046875, 0.089813232421875, 0.09931182861328125, 0.1088104248046875, 0.11830902099609375, 0.1278076171875, 0.13730621337890625, 0.1468048095703125, 0.15630340576171875, 0.165802001953125, 0.17530059814453125, 0.1847991943359375, 0.19429779052734375, 0.20379638671875, 0.21329498291015625, 0.2227935791015625, 0.23229217529296875, 0.241790771484375, 0.25128936767578125, 0.2607879638671875, 0.27028656005859375, 0.27978515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 4.0, 9.0, 10.0, 6.0, 14.0, 8.0, 16.0, 17.0, 18.0, 21.0, 26.0, 26.0, 31.0, 30.0, 46.0, 27.0, 45.0, 34.0, 48.0, 27.0, 43.0, 38.0, 37.0, 30.0, 39.0, 32.0, 36.0, 30.0, 31.0, 24.0, 19.0, 13.0, 19.0, 22.0, 21.0, 12.0, 11.0, 15.0, 12.0, 6.0, 8.0, 6.0, 6.0, 7.0, 6.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.296875, -2.228546142578125, -2.16021728515625, -2.091888427734375, -2.0235595703125, -1.955230712890625, -1.88690185546875, -1.818572998046875, -1.750244140625, -1.681915283203125, -1.61358642578125, -1.545257568359375, -1.4769287109375, -1.408599853515625, -1.34027099609375, -1.271942138671875, -1.20361328125, -1.135284423828125, -1.06695556640625, -0.998626708984375, -0.9302978515625, -0.861968994140625, -0.79364013671875, -0.725311279296875, -0.656982421875, -0.588653564453125, -0.52032470703125, -0.451995849609375, -0.3836669921875, -0.315338134765625, -0.24700927734375, -0.178680419921875, -0.1103515625, -0.042022705078125, 0.02630615234375, 0.094635009765625, 0.1629638671875, 0.231292724609375, 0.29962158203125, 0.367950439453125, 0.436279296875, 0.504608154296875, 0.57293701171875, 0.641265869140625, 0.7095947265625, 0.777923583984375, 0.84625244140625, 0.914581298828125, 0.98291015625, 1.051239013671875, 1.11956787109375, 1.187896728515625, 1.2562255859375, 1.324554443359375, 1.39288330078125, 1.461212158203125, 1.529541015625, 1.597869873046875, 1.66619873046875, 1.734527587890625, 1.8028564453125, 1.871185302734375, 1.93951416015625, 2.007843017578125, 2.076171875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 9.0, 5.0, 9.0, 11.0, 27.0, 29.0, 48.0, 71.0, 70.0, 132.0, 185.0, 259.0, 443.0, 791.0, 1316.0, 2533.0, 5318.0, 12331.0, 33200.0, 741366.0, 206411.0, 24797.0, 9747.0, 4332.0, 2118.0, 1162.0, 620.0, 423.0, 244.0, 185.0, 110.0, 73.0, 44.0, 39.0, 25.0, 23.0, 14.0, 9.0, 6.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.060546875, -1.0272674560546875, -0.993988037109375, -0.9607086181640625, -0.92742919921875, -0.8941497802734375, -0.860870361328125, -0.8275909423828125, -0.7943115234375, -0.7610321044921875, -0.727752685546875, -0.6944732666015625, -0.66119384765625, -0.6279144287109375, -0.594635009765625, -0.5613555908203125, -0.528076171875, -0.4947967529296875, -0.461517333984375, -0.4282379150390625, -0.39495849609375, -0.3616790771484375, -0.328399658203125, -0.2951202392578125, -0.2618408203125, -0.2285614013671875, -0.195281982421875, -0.1620025634765625, -0.12872314453125, -0.0954437255859375, -0.062164306640625, -0.0288848876953125, 0.00439453125, 0.0376739501953125, 0.070953369140625, 0.1042327880859375, 0.13751220703125, 0.1707916259765625, 0.204071044921875, 0.2373504638671875, 0.2706298828125, 0.3039093017578125, 0.337188720703125, 0.3704681396484375, 0.40374755859375, 0.4370269775390625, 0.470306396484375, 0.5035858154296875, 0.536865234375, 0.5701446533203125, 0.603424072265625, 0.6367034912109375, 0.66998291015625, 0.7032623291015625, 0.736541748046875, 0.7698211669921875, 0.8031005859375, 0.8363800048828125, 0.869659423828125, 0.9029388427734375, 0.93621826171875, 0.9694976806640625, 1.002777099609375, 1.0360565185546875, 1.0693359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 9.0, 7.0, 9.0, 10.0, 22.0, 21.0, 20.0, 27.0, 28.0, 25.0, 27.0, 26.0, 33.0, 33.0, 46.0, 38.0, 47.0, 46.0, 45.0, 35.0, 45.0, 43.0, 42.0, 55.0, 46.0, 29.0, 18.0, 30.0, 12.0, 24.0, 21.0, 16.0, 17.0, 9.0, 11.0, 7.0, 2.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.8232421875, -1.772857666015625, -1.72247314453125, -1.672088623046875, -1.6217041015625, -1.571319580078125, -1.52093505859375, -1.470550537109375, -1.420166015625, -1.369781494140625, -1.31939697265625, -1.269012451171875, -1.2186279296875, -1.168243408203125, -1.11785888671875, -1.067474365234375, -1.01708984375, -0.966705322265625, -0.91632080078125, -0.865936279296875, -0.8155517578125, -0.765167236328125, -0.71478271484375, -0.664398193359375, -0.614013671875, -0.563629150390625, -0.51324462890625, -0.462860107421875, -0.4124755859375, -0.362091064453125, -0.31170654296875, -0.261322021484375, -0.2109375, -0.160552978515625, -0.11016845703125, -0.059783935546875, -0.0093994140625, 0.040985107421875, 0.09136962890625, 0.141754150390625, 0.192138671875, 0.242523193359375, 0.29290771484375, 0.343292236328125, 0.3936767578125, 0.444061279296875, 0.49444580078125, 0.544830322265625, 0.59521484375, 0.645599365234375, 0.69598388671875, 0.746368408203125, 0.7967529296875, 0.847137451171875, 0.89752197265625, 0.947906494140625, 0.998291015625, 1.048675537109375, 1.09906005859375, 1.149444580078125, 1.1998291015625, 1.250213623046875, 1.30059814453125, 1.350982666015625, 1.4013671875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 14.0, 18.0, 27.0, 28.0, 28.0, 43.0, 54.0, 91.0, 151.0, 257.0, 448.0, 792.0, 1420.0, 2747.0, 5786.0, 13103.0, 36279.0, 903133.0, 53276.0, 16635.0, 6940.0, 3262.0, 1708.0, 913.0, 529.0, 292.0, 185.0, 119.0, 75.0, 51.0, 32.0, 31.0, 20.0, 15.0, 5.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0], "bins": [-0.338623046875, -0.3296241760253906, -0.32062530517578125, -0.3116264343261719, -0.3026275634765625, -0.2936286926269531, -0.28462982177734375, -0.2756309509277344, -0.266632080078125, -0.2576332092285156, -0.24863433837890625, -0.23963546752929688, -0.2306365966796875, -0.22163772583007812, -0.21263885498046875, -0.20363998413085938, -0.19464111328125, -0.18564224243164062, -0.17664337158203125, -0.16764450073242188, -0.1586456298828125, -0.14964675903320312, -0.14064788818359375, -0.13164901733398438, -0.122650146484375, -0.11365127563476562, -0.10465240478515625, -0.09565353393554688, -0.0866546630859375, -0.07765579223632812, -0.06865692138671875, -0.059658050537109375, -0.0506591796875, -0.041660308837890625, -0.03266143798828125, -0.023662567138671875, -0.0146636962890625, -0.005664825439453125, 0.00333404541015625, 0.012332916259765625, 0.021331787109375, 0.030330657958984375, 0.03932952880859375, 0.048328399658203125, 0.0573272705078125, 0.06632614135742188, 0.07532501220703125, 0.08432388305664062, 0.09332275390625, 0.10232162475585938, 0.11132049560546875, 0.12031936645507812, 0.1293182373046875, 0.13831710815429688, 0.14731597900390625, 0.15631484985351562, 0.165313720703125, 0.17431259155273438, 0.18331146240234375, 0.19231033325195312, 0.2013092041015625, 0.21030807495117188, 0.21930694580078125, 0.22830581665039062, 0.2373046875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 4.0, 4.0, 5.0, 10.0, 8.0, 17.0, 21.0, 18.0, 26.0, 20.0, 30.0, 40.0, 43.0, 37.0, 48.0, 47.0, 37.0, 56.0, 58.0, 51.0, 53.0, 54.0, 42.0, 45.0, 35.0, 30.0, 23.0, 18.0, 22.0, 9.0, 18.0, 14.0, 13.0, 7.0, 8.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.719329833984375e-05, -3.612879663705826e-05, -3.5064294934272766e-05, -3.3999793231487274e-05, -3.293529152870178e-05, -3.187078982591629e-05, -3.08062881231308e-05, -2.9741786420345306e-05, -2.8677284717559814e-05, -2.7612783014774323e-05, -2.654828131198883e-05, -2.548377960920334e-05, -2.4419277906417847e-05, -2.3354776203632355e-05, -2.2290274500846863e-05, -2.122577279806137e-05, -2.016127109527588e-05, -1.9096769392490387e-05, -1.8032267689704895e-05, -1.6967765986919403e-05, -1.590326428413391e-05, -1.483876258134842e-05, -1.3774260878562927e-05, -1.2709759175777435e-05, -1.1645257472991943e-05, -1.0580755770206451e-05, -9.51625406742096e-06, -8.451752364635468e-06, -7.387250661849976e-06, -6.322748959064484e-06, -5.258247256278992e-06, -4.1937455534935e-06, -3.129243850708008e-06, -2.064742147922516e-06, -1.000240445137024e-06, 6.426125764846802e-08, 1.12876296043396e-06, 2.193264663219452e-06, 3.257766366004944e-06, 4.322268068790436e-06, 5.386769771575928e-06, 6.45127147436142e-06, 7.515773177146912e-06, 8.580274879932404e-06, 9.644776582717896e-06, 1.0709278285503387e-05, 1.177377998828888e-05, 1.2838281691074371e-05, 1.3902783393859863e-05, 1.4967285096645355e-05, 1.6031786799430847e-05, 1.709628850221634e-05, 1.816079020500183e-05, 1.9225291907787323e-05, 2.0289793610572815e-05, 2.1354295313358307e-05, 2.24187970161438e-05, 2.348329871892929e-05, 2.4547800421714783e-05, 2.5612302124500275e-05, 2.6676803827285767e-05, 2.774130553007126e-05, 2.880580723285675e-05, 2.9870308935642242e-05, 3.0934810638427734e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 13.0, 26.0, 37.0, 44.0, 55.0, 83.0, 94.0, 138.0, 230.0, 340.0, 451.0, 632.0, 1040.0, 1523.0, 2276.0, 3626.0, 5991.0, 9577.0, 16396.0, 28144.0, 49759.0, 89647.0, 150337.0, 208660.0, 189692.0, 123210.0, 70081.0, 39741.0, 22222.0, 12958.0, 7688.0, 4773.0, 2958.0, 1933.0, 1293.0, 934.0, 623.0, 409.0, 259.0, 188.0, 161.0, 86.0, 63.0, 48.0, 28.0, 21.0, 19.0, 9.0, 10.0, 9.0, 2.0, 2.0, 2.0], "bins": [-0.07452392578125, -0.07238197326660156, -0.07024002075195312, -0.06809806823730469, -0.06595611572265625, -0.06381416320800781, -0.061672210693359375, -0.05953025817871094, -0.0573883056640625, -0.05524635314941406, -0.053104400634765625, -0.05096244812011719, -0.04882049560546875, -0.04667854309082031, -0.044536590576171875, -0.04239463806152344, -0.040252685546875, -0.03811073303222656, -0.035968780517578125, -0.03382682800292969, -0.03168487548828125, -0.029542922973632812, -0.027400970458984375, -0.025259017944335938, -0.0231170654296875, -0.020975112915039062, -0.018833160400390625, -0.016691207885742188, -0.01454925537109375, -0.012407302856445312, -0.010265350341796875, -0.008123397827148438, -0.0059814453125, -0.0038394927978515625, -0.001697540283203125, 0.0004444122314453125, 0.00258636474609375, 0.0047283172607421875, 0.006870269775390625, 0.009012222290039062, 0.0111541748046875, 0.013296127319335938, 0.015438079833984375, 0.017580032348632812, 0.01972198486328125, 0.021863937377929688, 0.024005889892578125, 0.026147842407226562, 0.028289794921875, 0.030431747436523438, 0.032573699951171875, 0.03471565246582031, 0.03685760498046875, 0.03899955749511719, 0.041141510009765625, 0.04328346252441406, 0.0454254150390625, 0.04756736755371094, 0.049709320068359375, 0.05185127258300781, 0.05399322509765625, 0.05613517761230469, 0.058277130126953125, 0.06041908264160156, 0.06256103515625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 7.0, 8.0, 12.0, 21.0, 22.0, 21.0, 32.0, 56.0, 74.0, 79.0, 79.0, 70.0, 78.0, 76.0, 73.0, 60.0, 57.0, 35.0, 32.0, 23.0, 20.0, 14.0, 12.0, 11.0, 5.0, 5.0, 2.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.020233154296875, -0.01952052116394043, -0.01880788803100586, -0.01809525489807129, -0.01738262176513672, -0.01666998863220215, -0.015957355499267578, -0.015244722366333008, -0.014532089233398438, -0.013819456100463867, -0.013106822967529297, -0.012394189834594727, -0.011681556701660156, -0.010968923568725586, -0.010256290435791016, -0.009543657302856445, -0.008831024169921875, -0.008118391036987305, -0.007405757904052734, -0.006693124771118164, -0.005980491638183594, -0.0052678585052490234, -0.004555225372314453, -0.003842592239379883, -0.0031299591064453125, -0.002417325973510742, -0.0017046928405761719, -0.0009920597076416016, -0.00027942657470703125, 0.00043320655822753906, 0.0011458396911621094, 0.0018584728240966797, 0.00257110595703125, 0.0032837390899658203, 0.003996372222900391, 0.004709005355834961, 0.005421638488769531, 0.0061342716217041016, 0.006846904754638672, 0.007559537887573242, 0.008272171020507812, 0.008984804153442383, 0.009697437286376953, 0.010410070419311523, 0.011122703552246094, 0.011835336685180664, 0.012547969818115234, 0.013260602951049805, 0.013973236083984375, 0.014685869216918945, 0.015398502349853516, 0.016111135482788086, 0.016823768615722656, 0.017536401748657227, 0.018249034881591797, 0.018961668014526367, 0.019674301147460938, 0.020386934280395508, 0.021099567413330078, 0.02181220054626465, 0.02252483367919922, 0.02323746681213379, 0.02395009994506836, 0.02466273307800293, 0.0253753662109375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 8.0, 19.0, 16.0, 27.0, 45.0, 48.0, 55.0, 71.0, 65.0, 71.0, 84.0, 83.0, 81.0, 66.0, 47.0, 29.0, 31.0, 23.0, 19.0, 22.0, 12.0, 9.0, 14.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.85531759262085, -6.689630031585693, -6.523942470550537, -6.358254432678223, -6.192566871643066, -6.02687931060791, -5.861191749572754, -5.695504188537598, -5.529816627502441, -5.364129066467285, -5.198441505432129, -5.0327534675598145, -4.867065906524658, -4.701378345489502, -4.535690784454346, -4.3700032234191895, -4.204315185546875, -4.038627624511719, -3.8729398250579834, -3.707252264022827, -3.541564464569092, -3.3758769035339355, -3.2101893424987793, -3.044501781463623, -2.8788139820098877, -2.7131264209747314, -2.547438621520996, -2.38175106048584, -2.2160634994506836, -2.0503756999969482, -1.884688138961792, -1.7190004587173462, -1.5533127784729004, -1.3876250982284546, -1.2219374179840088, -1.0562498569488525, -0.8905621767044067, -0.7248744964599609, -0.5591868758201599, -0.3934992551803589, -0.22781157493591309, -0.06212392449378967, 0.10356372594833374, 0.26925137639045715, 0.43493902683258057, 0.6006267070770264, 0.7663143277168274, 0.9320019483566284, 1.0976896286010742, 1.26337730884552, 1.4290649890899658, 1.594752550125122, 1.7604402303695679, 1.9261279106140137, 2.09181547164917, 2.257503032684326, 2.4231908321380615, 2.5888783931732178, 2.754566192626953, 2.9202537536621094, 3.0859413146972656, 3.251629114151001, 3.4173166751861572, 3.5830044746398926, 3.748692035675049]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 2.0, 3.0, 9.0, 6.0, 10.0, 16.0, 16.0, 20.0, 18.0, 18.0, 18.0, 27.0, 26.0, 36.0, 33.0, 35.0, 39.0, 46.0, 45.0, 29.0, 42.0, 45.0, 35.0, 40.0, 36.0, 28.0, 32.0, 22.0, 30.0, 22.0, 22.0, 22.0, 26.0, 21.0, 14.0, 15.0, 18.0, 10.0, 13.0, 6.0, 7.0, 5.0, 8.0, 2.0, 5.0, 2.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8758937120437622, -1.8173400163650513, -1.7587863206863403, -1.7002326250076294, -1.6416789293289185, -1.5831252336502075, -1.524571418762207, -1.466017723083496, -1.4074640274047852, -1.3489103317260742, -1.2903566360473633, -1.2318029403686523, -1.1732492446899414, -1.1146955490112305, -1.0561418533325195, -0.9975880980491638, -0.9390344619750977, -0.8804807662963867, -0.8219270706176758, -0.7633733749389648, -0.7048196792602539, -0.646265983581543, -0.5877122282981873, -0.5291585326194763, -0.4706048369407654, -0.41205114126205444, -0.3534974455833435, -0.2949437201023102, -0.23639002442359924, -0.1778363287448883, -0.11928260326385498, -0.06072890758514404, -0.0021750926971435547, 0.05637861043214798, 0.11493231356143951, 0.17348602414131165, 0.23203971982002258, 0.2905934154987335, 0.34914714097976685, 0.4077008366584778, 0.4662545323371887, 0.5248082280158997, 0.5833619236946106, 0.6419156789779663, 0.7004693746566772, 0.7590230703353882, 0.8175767660140991, 0.8761304616928101, 0.934684157371521, 0.9932378530502319, 1.0517915487289429, 1.1103452444076538, 1.1688989400863647, 1.2274526357650757, 1.2860064506530762, 1.344560146331787, 1.403113842010498, 1.461667537689209, 1.52022123336792, 1.5787749290466309, 1.6373286247253418, 1.6958823204040527, 1.7544360160827637, 1.8129897117614746, 1.8715434074401855]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 16.0, 23.0, 29.0, 52.0, 57.0, 75.0, 154.0, 233.0, 299.0, 463.0, 734.0, 1185.0, 1680.0, 2687.0, 4302.0, 6911.0, 10312.0, 16105.0, 24830.0, 37831.0, 55167.0, 77715.0, 102431.0, 123341.0, 131028.0, 120995.0, 99998.0, 75064.0, 52509.0, 35529.0, 23661.0, 15383.0, 9850.0, 6387.0, 4089.0, 2581.0, 1668.0, 1122.0, 721.0, 458.0, 312.0, 194.0, 120.0, 84.0, 55.0, 41.0, 26.0, 15.0, 9.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-2.22265625, -2.15618896484375, -2.0897216796875, -2.02325439453125, -1.956787109375, -1.89031982421875, -1.8238525390625, -1.75738525390625, -1.69091796875, -1.62445068359375, -1.5579833984375, -1.49151611328125, -1.425048828125, -1.35858154296875, -1.2921142578125, -1.22564697265625, -1.1591796875, -1.09271240234375, -1.0262451171875, -0.95977783203125, -0.893310546875, -0.82684326171875, -0.7603759765625, -0.69390869140625, -0.62744140625, -0.56097412109375, -0.4945068359375, -0.42803955078125, -0.361572265625, -0.29510498046875, -0.2286376953125, -0.16217041015625, -0.095703125, -0.02923583984375, 0.0372314453125, 0.10369873046875, 0.170166015625, 0.23663330078125, 0.3031005859375, 0.36956787109375, 0.43603515625, 0.50250244140625, 0.5689697265625, 0.63543701171875, 0.701904296875, 0.76837158203125, 0.8348388671875, 0.90130615234375, 0.9677734375, 1.03424072265625, 1.1007080078125, 1.16717529296875, 1.233642578125, 1.30010986328125, 1.3665771484375, 1.43304443359375, 1.49951171875, 1.56597900390625, 1.6324462890625, 1.69891357421875, 1.765380859375, 1.83184814453125, 1.8983154296875, 1.96478271484375, 2.03125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 11.0, 6.0, 11.0, 20.0, 19.0, 21.0, 29.0, 31.0, 33.0, 31.0, 41.0, 42.0, 47.0, 39.0, 46.0, 38.0, 48.0, 53.0, 33.0, 44.0, 39.0, 34.0, 37.0, 30.0, 29.0, 22.0, 24.0, 20.0, 27.0, 10.0, 8.0, 13.0, 10.0, 10.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.462890625, -2.3851318359375, -2.307373046875, -2.2296142578125, -2.15185546875, -2.0740966796875, -1.996337890625, -1.9185791015625, -1.8408203125, -1.7630615234375, -1.685302734375, -1.6075439453125, -1.52978515625, -1.4520263671875, -1.374267578125, -1.2965087890625, -1.21875, -1.1409912109375, -1.063232421875, -0.9854736328125, -0.90771484375, -0.8299560546875, -0.752197265625, -0.6744384765625, -0.5966796875, -0.5189208984375, -0.441162109375, -0.3634033203125, -0.28564453125, -0.2078857421875, -0.130126953125, -0.0523681640625, 0.025390625, 0.1031494140625, 0.180908203125, 0.2586669921875, 0.33642578125, 0.4141845703125, 0.491943359375, 0.5697021484375, 0.6474609375, 0.7252197265625, 0.802978515625, 0.8807373046875, 0.95849609375, 1.0362548828125, 1.114013671875, 1.1917724609375, 1.26953125, 1.3472900390625, 1.425048828125, 1.5028076171875, 1.58056640625, 1.6583251953125, 1.736083984375, 1.8138427734375, 1.8916015625, 1.9693603515625, 2.047119140625, 2.1248779296875, 2.20263671875, 2.2803955078125, 2.358154296875, 2.4359130859375, 2.513671875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 9.0, 11.0, 16.0, 22.0, 26.0, 56.0, 73.0, 121.0, 157.0, 250.0, 365.0, 621.0, 908.0, 1485.0, 2326.0, 3771.0, 6130.0, 10011.0, 16425.0, 26272.0, 42704.0, 65500.0, 95190.0, 125552.0, 144413.0, 141825.0, 118613.0, 87730.0, 58910.0, 37881.0, 23420.0, 14468.0, 8731.0, 5496.0, 3274.0, 2123.0, 1328.0, 848.0, 496.0, 368.0, 226.0, 143.0, 85.0, 66.0, 34.0, 27.0, 21.0, 13.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.4375, -2.358551025390625, -2.27960205078125, -2.200653076171875, -2.1217041015625, -2.042755126953125, -1.96380615234375, -1.884857177734375, -1.805908203125, -1.726959228515625, -1.64801025390625, -1.569061279296875, -1.4901123046875, -1.411163330078125, -1.33221435546875, -1.253265380859375, -1.17431640625, -1.095367431640625, -1.01641845703125, -0.937469482421875, -0.8585205078125, -0.779571533203125, -0.70062255859375, -0.621673583984375, -0.542724609375, -0.463775634765625, -0.38482666015625, -0.305877685546875, -0.2269287109375, -0.147979736328125, -0.06903076171875, 0.009918212890625, 0.0888671875, 0.167816162109375, 0.24676513671875, 0.325714111328125, 0.4046630859375, 0.483612060546875, 0.56256103515625, 0.641510009765625, 0.720458984375, 0.799407958984375, 0.87835693359375, 0.957305908203125, 1.0362548828125, 1.115203857421875, 1.19415283203125, 1.273101806640625, 1.35205078125, 1.430999755859375, 1.50994873046875, 1.588897705078125, 1.6678466796875, 1.746795654296875, 1.82574462890625, 1.904693603515625, 1.983642578125, 2.062591552734375, 2.14154052734375, 2.220489501953125, 2.2994384765625, 2.378387451171875, 2.45733642578125, 2.536285400390625, 2.615234375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 11.0, 10.0, 5.0, 7.0, 13.0, 12.0, 15.0, 22.0, 17.0, 20.0, 30.0, 25.0, 23.0, 37.0, 40.0, 32.0, 37.0, 28.0, 38.0, 35.0, 30.0, 39.0, 39.0, 36.0, 36.0, 31.0, 31.0, 23.0, 16.0, 34.0, 25.0, 20.0, 22.0, 14.0, 18.0, 16.0, 12.0, 11.0, 15.0, 7.0, 8.0, 6.0, 4.0, 9.0, 6.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0], "bins": [-1.3134765625, -1.274261474609375, -1.23504638671875, -1.195831298828125, -1.1566162109375, -1.117401123046875, -1.07818603515625, -1.038970947265625, -0.999755859375, -0.960540771484375, -0.92132568359375, -0.882110595703125, -0.8428955078125, -0.803680419921875, -0.76446533203125, -0.725250244140625, -0.68603515625, -0.646820068359375, -0.60760498046875, -0.568389892578125, -0.5291748046875, -0.489959716796875, -0.45074462890625, -0.411529541015625, -0.372314453125, -0.333099365234375, -0.29388427734375, -0.254669189453125, -0.2154541015625, -0.176239013671875, -0.13702392578125, -0.097808837890625, -0.05859375, -0.019378662109375, 0.01983642578125, 0.059051513671875, 0.0982666015625, 0.137481689453125, 0.17669677734375, 0.215911865234375, 0.255126953125, 0.294342041015625, 0.33355712890625, 0.372772216796875, 0.4119873046875, 0.451202392578125, 0.49041748046875, 0.529632568359375, 0.56884765625, 0.608062744140625, 0.64727783203125, 0.686492919921875, 0.7257080078125, 0.764923095703125, 0.80413818359375, 0.843353271484375, 0.882568359375, 0.921783447265625, 0.96099853515625, 1.000213623046875, 1.0394287109375, 1.078643798828125, 1.11785888671875, 1.157073974609375, 1.1962890625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 7.0, 16.0, 15.0, 29.0, 29.0, 40.0, 68.0, 96.0, 153.0, 235.0, 319.0, 577.0, 766.0, 1248.0, 1835.0, 2983.0, 4741.0, 7500.0, 12007.0, 19857.0, 33435.0, 55280.0, 89246.0, 133294.0, 168881.0, 167382.0, 128911.0, 85325.0, 52502.0, 31508.0, 18947.0, 11711.0, 7032.0, 4514.0, 2878.0, 1771.0, 1191.0, 783.0, 499.0, 297.0, 216.0, 148.0, 93.0, 69.0, 52.0, 25.0, 13.0, 13.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4228515625, -1.3737030029296875, -1.324554443359375, -1.2754058837890625, -1.22625732421875, -1.1771087646484375, -1.127960205078125, -1.0788116455078125, -1.0296630859375, -0.9805145263671875, -0.931365966796875, -0.8822174072265625, -0.83306884765625, -0.7839202880859375, -0.734771728515625, -0.6856231689453125, -0.636474609375, -0.5873260498046875, -0.538177490234375, -0.4890289306640625, -0.43988037109375, -0.3907318115234375, -0.341583251953125, -0.2924346923828125, -0.2432861328125, -0.1941375732421875, -0.144989013671875, -0.0958404541015625, -0.04669189453125, 0.0024566650390625, 0.051605224609375, 0.1007537841796875, 0.14990234375, 0.1990509033203125, 0.248199462890625, 0.2973480224609375, 0.34649658203125, 0.3956451416015625, 0.444793701171875, 0.4939422607421875, 0.5430908203125, 0.5922393798828125, 0.641387939453125, 0.6905364990234375, 0.73968505859375, 0.7888336181640625, 0.837982177734375, 0.8871307373046875, 0.936279296875, 0.9854278564453125, 1.034576416015625, 1.0837249755859375, 1.13287353515625, 1.1820220947265625, 1.231170654296875, 1.2803192138671875, 1.3294677734375, 1.3786163330078125, 1.427764892578125, 1.4769134521484375, 1.52606201171875, 1.5752105712890625, 1.624359130859375, 1.6735076904296875, 1.72265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 4.0, 1.0, 2.0, 6.0, 14.0, 11.0, 9.0, 20.0, 27.0, 26.0, 31.0, 42.0, 63.0, 50.0, 52.0, 61.0, 77.0, 64.0, 56.0, 52.0, 56.0, 42.0, 43.0, 39.0, 24.0, 20.0, 16.0, 20.0, 15.0, 11.0, 11.0, 13.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00019168853759765625, -0.0001863911747932434, -0.00018109381198883057, -0.00017579644918441772, -0.00017049908638000488, -0.00016520172357559204, -0.0001599043607711792, -0.00015460699796676636, -0.00014930963516235352, -0.00014401227235794067, -0.00013871490955352783, -0.000133417546749115, -0.00012812018394470215, -0.0001228228211402893, -0.00011752545833587646, -0.00011222809553146362, -0.00010693073272705078, -0.00010163336992263794, -9.63360071182251e-05, -9.103864431381226e-05, -8.574128150939941e-05, -8.044391870498657e-05, -7.514655590057373e-05, -6.984919309616089e-05, -6.455183029174805e-05, -5.9254467487335205e-05, -5.395710468292236e-05, -4.865974187850952e-05, -4.336237907409668e-05, -3.806501626968384e-05, -3.2767653465270996e-05, -2.7470290660858154e-05, -2.2172927856445312e-05, -1.687556505203247e-05, -1.1578202247619629e-05, -6.280839443206787e-06, -9.834766387939453e-07, 4.3138861656188965e-06, 9.611248970031738e-06, 1.490861177444458e-05, 2.0205974578857422e-05, 2.5503337383270264e-05, 3.0800700187683105e-05, 3.609806299209595e-05, 4.139542579650879e-05, 4.669278860092163e-05, 5.199015140533447e-05, 5.7287514209747314e-05, 6.258487701416016e-05, 6.7882239818573e-05, 7.317960262298584e-05, 7.847696542739868e-05, 8.377432823181152e-05, 8.907169103622437e-05, 9.436905384063721e-05, 9.966641664505005e-05, 0.00010496377944946289, 0.00011026114225387573, 0.00011555850505828857, 0.00012085586786270142, 0.00012615323066711426, 0.0001314505934715271, 0.00013674795627593994, 0.00014204531908035278, 0.00014734268188476562]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 3.0, 8.0, 9.0, 14.0, 34.0, 32.0, 45.0, 69.0, 93.0, 172.0, 243.0, 457.0, 735.0, 1195.0, 2130.0, 3774.0, 6844.0, 12355.0, 22021.0, 39530.0, 68820.0, 112243.0, 162020.0, 184841.0, 161134.0, 112501.0, 68200.0, 39165.0, 21908.0, 12127.0, 6843.0, 3727.0, 2162.0, 1235.0, 689.0, 452.0, 278.0, 164.0, 108.0, 53.0, 30.0, 35.0, 18.0, 16.0, 11.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.609375, -1.5613250732421875, -1.513275146484375, -1.4652252197265625, -1.41717529296875, -1.3691253662109375, -1.321075439453125, -1.2730255126953125, -1.2249755859375, -1.1769256591796875, -1.128875732421875, -1.0808258056640625, -1.03277587890625, -0.9847259521484375, -0.936676025390625, -0.8886260986328125, -0.840576171875, -0.7925262451171875, -0.744476318359375, -0.6964263916015625, -0.64837646484375, -0.6003265380859375, -0.552276611328125, -0.5042266845703125, -0.4561767578125, -0.4081268310546875, -0.360076904296875, -0.3120269775390625, -0.26397705078125, -0.2159271240234375, -0.167877197265625, -0.1198272705078125, -0.07177734375, -0.0237274169921875, 0.024322509765625, 0.0723724365234375, 0.12042236328125, 0.1684722900390625, 0.216522216796875, 0.2645721435546875, 0.3126220703125, 0.3606719970703125, 0.408721923828125, 0.4567718505859375, 0.50482177734375, 0.5528717041015625, 0.600921630859375, 0.6489715576171875, 0.697021484375, 0.7450714111328125, 0.793121337890625, 0.8411712646484375, 0.88922119140625, 0.9372711181640625, 0.985321044921875, 1.0333709716796875, 1.0814208984375, 1.1294708251953125, 1.177520751953125, 1.2255706787109375, 1.27362060546875, 1.3216705322265625, 1.369720458984375, 1.4177703857421875, 1.4658203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 12.0, 15.0, 21.0, 28.0, 23.0, 30.0, 50.0, 50.0, 72.0, 59.0, 71.0, 71.0, 74.0, 59.0, 55.0, 45.0, 64.0, 46.0, 42.0, 31.0, 24.0, 18.0, 10.0, 3.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5576171875, -0.5405807495117188, -0.5235443115234375, -0.5065078735351562, -0.489471435546875, -0.47243499755859375, -0.4553985595703125, -0.43836212158203125, -0.42132568359375, -0.40428924560546875, -0.3872528076171875, -0.37021636962890625, -0.353179931640625, -0.33614349365234375, -0.3191070556640625, -0.30207061767578125, -0.2850341796875, -0.26799774169921875, -0.2509613037109375, -0.23392486572265625, -0.216888427734375, -0.19985198974609375, -0.1828155517578125, -0.16577911376953125, -0.14874267578125, -0.13170623779296875, -0.1146697998046875, -0.09763336181640625, -0.080596923828125, -0.06356048583984375, -0.0465240478515625, -0.02948760986328125, -0.012451171875, 0.00458526611328125, 0.0216217041015625, 0.03865814208984375, 0.055694580078125, 0.07273101806640625, 0.0897674560546875, 0.10680389404296875, 0.12384033203125, 0.14087677001953125, 0.1579132080078125, 0.17494964599609375, 0.191986083984375, 0.20902252197265625, 0.2260589599609375, 0.24309539794921875, 0.2601318359375, 0.27716827392578125, 0.2942047119140625, 0.31124114990234375, 0.328277587890625, 0.34531402587890625, 0.3623504638671875, 0.37938690185546875, 0.39642333984375, 0.41345977783203125, 0.4304962158203125, 0.44753265380859375, 0.464569091796875, 0.48160552978515625, 0.4986419677734375, 0.5156784057617188, 0.53271484375]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 13.0, 11.0, 11.0, 18.0, 21.0, 24.0, 26.0, 41.0, 40.0, 61.0, 62.0, 75.0, 79.0, 75.0, 82.0, 49.0, 76.0, 41.0, 48.0, 19.0, 24.0, 20.0, 22.0, 14.0, 16.0, 14.0, 5.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.6054840087890625, -6.44195032119751, -6.278416633605957, -6.1148834228515625, -5.95134973526001, -5.787816047668457, -5.624282360076904, -5.460748672485352, -5.297215461730957, -5.133681774139404, -4.970148086547852, -4.806614875793457, -4.643081188201904, -4.479547500610352, -4.316013813018799, -4.152480125427246, -3.9889466762542725, -3.8254129886627197, -3.661879539489746, -3.4983458518981934, -3.3348124027252197, -3.171278715133667, -3.0077452659606934, -2.8442115783691406, -2.680677890777588, -2.517144203186035, -2.3536107540130615, -2.190077066421509, -2.026543617248535, -1.8630099296569824, -1.6994763612747192, -1.535942792892456, -1.3724095821380615, -1.2088760137557983, -1.0453424453735352, -0.8818088173866272, -0.718275249004364, -0.5547416806221008, -0.39120805263519287, -0.2276744842529297, -0.0641409158706665, 0.09939266741275787, 0.26292625069618225, 0.4264598488807678, 0.589993417263031, 0.7535269856452942, 0.9170606136322021, 1.0805941820144653, 1.2441277503967285, 1.4076613187789917, 1.5711948871612549, 1.7347285747528076, 1.8982620239257812, 2.061795711517334, 2.2253293991088867, 2.3888628482818604, 2.552396297454834, 2.7159299850463867, 2.8794634342193604, 3.042997121810913, 3.2065305709838867, 3.3700642585754395, 3.533597946166992, 3.697131395339966, 3.8606650829315186]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 2.0, 7.0, 12.0, 16.0, 11.0, 17.0, 17.0, 16.0, 26.0, 24.0, 19.0, 20.0, 30.0, 33.0, 19.0, 29.0, 35.0, 33.0, 32.0, 49.0, 39.0, 36.0, 35.0, 35.0, 39.0, 27.0, 34.0, 24.0, 17.0, 32.0, 21.0, 25.0, 21.0, 23.0, 13.0, 19.0, 14.0, 18.0, 14.0, 5.0, 10.0, 7.0, 10.0, 6.0, 2.0, 8.0, 3.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.917460560798645, -1.8577678203582764, -1.7980751991271973, -1.7383824586868286, -1.67868971824646, -1.6189970970153809, -1.5593043565750122, -1.4996116161346436, -1.4399189949035645, -1.3802262544631958, -1.3205336332321167, -1.260840892791748, -1.2011481523513794, -1.1414554119110107, -1.0817627906799316, -1.022070050239563, -0.9623773097991943, -0.9026846289634705, -0.8429918885231018, -0.7832992076873779, -0.7236064672470093, -0.6639137864112854, -0.6042211055755615, -0.5445283651351929, -0.484835684299469, -0.42514297366142273, -0.36545026302337646, -0.3057575821876526, -0.24606487154960632, -0.18637216091156006, -0.12667948007583618, -0.06698676943778992, -0.007294178009033203, 0.052398525178432465, 0.11209122836589813, 0.1717839241027832, 0.23147663474082947, 0.29116934537887573, 0.3508620262145996, 0.4105547368526459, 0.47024744749069214, 0.529940128326416, 0.5896328687667847, 0.6493255496025085, 0.7090182304382324, 0.7687109708786011, 0.828403651714325, 0.8880963325500488, 0.9477890729904175, 1.0074818134307861, 1.0671744346618652, 1.1268671751022339, 1.1865599155426025, 1.2462525367736816, 1.3059452772140503, 1.365638017654419, 1.425330638885498, 1.4850233793258667, 1.5447160005569458, 1.6044087409973145, 1.664101481437683, 1.7237942218780518, 1.7834868431091309, 1.8431795835494995, 1.9028723239898682]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 8.0, 15.0, 26.0, 44.0, 60.0, 100.0, 166.0, 224.0, 320.0, 479.0, 768.0, 1343.0, 2017.0, 3275.0, 5534.0, 9909.0, 17397.0, 32985.0, 65687.0, 141046.0, 332614.0, 793353.0, 1249471.0, 856099.0, 369269.0, 158618.0, 73510.0, 36634.0, 19020.0, 10270.0, 5696.0, 3384.0, 1934.0, 1102.0, 692.0, 422.0, 281.0, 169.0, 113.0, 72.0, 44.0, 21.0, 27.0, 10.0, 12.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.41015625, -4.26092529296875, -4.1116943359375, -3.96246337890625, -3.813232421875, -3.66400146484375, -3.5147705078125, -3.36553955078125, -3.21630859375, -3.06707763671875, -2.9178466796875, -2.76861572265625, -2.619384765625, -2.47015380859375, -2.3209228515625, -2.17169189453125, -2.0224609375, -1.87322998046875, -1.7239990234375, -1.57476806640625, -1.425537109375, -1.27630615234375, -1.1270751953125, -0.97784423828125, -0.82861328125, -0.67938232421875, -0.5301513671875, -0.38092041015625, -0.231689453125, -0.08245849609375, 0.0667724609375, 0.21600341796875, 0.365234375, 0.51446533203125, 0.6636962890625, 0.81292724609375, 0.962158203125, 1.11138916015625, 1.2606201171875, 1.40985107421875, 1.55908203125, 1.70831298828125, 1.8575439453125, 2.00677490234375, 2.156005859375, 2.30523681640625, 2.4544677734375, 2.60369873046875, 2.7529296875, 2.90216064453125, 3.0513916015625, 3.20062255859375, 3.349853515625, 3.49908447265625, 3.6483154296875, 3.79754638671875, 3.94677734375, 4.09600830078125, 4.2452392578125, 4.39447021484375, 4.543701171875, 4.69293212890625, 4.8421630859375, 4.99139404296875, 5.140625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 6.0, 11.0, 7.0, 18.0, 20.0, 22.0, 21.0, 18.0, 25.0, 18.0, 24.0, 28.0, 44.0, 31.0, 35.0, 38.0, 37.0, 26.0, 36.0, 35.0, 42.0, 32.0, 36.0, 33.0, 37.0, 28.0, 24.0, 37.0, 29.0, 15.0, 28.0, 27.0, 15.0, 14.0, 18.0, 14.0, 9.0, 4.0, 15.0, 6.0, 8.0, 4.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7802734375, -1.7282562255859375, -1.676239013671875, -1.6242218017578125, -1.57220458984375, -1.5201873779296875, -1.468170166015625, -1.4161529541015625, -1.3641357421875, -1.3121185302734375, -1.260101318359375, -1.2080841064453125, -1.15606689453125, -1.1040496826171875, -1.052032470703125, -1.0000152587890625, -0.947998046875, -0.8959808349609375, -0.843963623046875, -0.7919464111328125, -0.73992919921875, -0.6879119873046875, -0.635894775390625, -0.5838775634765625, -0.5318603515625, -0.4798431396484375, -0.427825927734375, -0.3758087158203125, -0.32379150390625, -0.2717742919921875, -0.219757080078125, -0.1677398681640625, -0.11572265625, -0.0637054443359375, -0.011688232421875, 0.0403289794921875, 0.09234619140625, 0.1443634033203125, 0.196380615234375, 0.2483978271484375, 0.3004150390625, 0.3524322509765625, 0.404449462890625, 0.4564666748046875, 0.50848388671875, 0.5605010986328125, 0.612518310546875, 0.6645355224609375, 0.716552734375, 0.7685699462890625, 0.820587158203125, 0.8726043701171875, 0.92462158203125, 0.9766387939453125, 1.028656005859375, 1.0806732177734375, 1.1326904296875, 1.1847076416015625, 1.236724853515625, 1.2887420654296875, 1.34075927734375, 1.3927764892578125, 1.444793701171875, 1.4968109130859375, 1.548828125]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 9.0, 3.0, 11.0, 19.0, 26.0, 35.0, 63.0, 93.0, 155.0, 196.0, 322.0, 534.0, 826.0, 1419.0, 2301.0, 4004.0, 6839.0, 12235.0, 22022.0, 40720.0, 78965.0, 152623.0, 302319.0, 587283.0, 952865.0, 915299.0, 540664.0, 275901.0, 138908.0, 72020.0, 37760.0, 20745.0, 11339.0, 6498.0, 3679.0, 2098.0, 1331.0, 795.0, 512.0, 324.0, 207.0, 118.0, 69.0, 50.0, 34.0, 16.0, 16.0, 8.0, 8.0, 1.0, 2.0, 3.0], "bins": [-5.29296875, -5.149658203125, -5.00634765625, -4.863037109375, -4.7197265625, -4.576416015625, -4.43310546875, -4.289794921875, -4.146484375, -4.003173828125, -3.85986328125, -3.716552734375, -3.5732421875, -3.429931640625, -3.28662109375, -3.143310546875, -3.0, -2.856689453125, -2.71337890625, -2.570068359375, -2.4267578125, -2.283447265625, -2.14013671875, -1.996826171875, -1.853515625, -1.710205078125, -1.56689453125, -1.423583984375, -1.2802734375, -1.136962890625, -0.99365234375, -0.850341796875, -0.70703125, -0.563720703125, -0.42041015625, -0.277099609375, -0.1337890625, 0.009521484375, 0.15283203125, 0.296142578125, 0.439453125, 0.582763671875, 0.72607421875, 0.869384765625, 1.0126953125, 1.156005859375, 1.29931640625, 1.442626953125, 1.5859375, 1.729248046875, 1.87255859375, 2.015869140625, 2.1591796875, 2.302490234375, 2.44580078125, 2.589111328125, 2.732421875, 2.875732421875, 3.01904296875, 3.162353515625, 3.3056640625, 3.448974609375, 3.59228515625, 3.735595703125, 3.87890625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 12.0, 14.0, 20.0, 27.0, 35.0, 52.0, 52.0, 70.0, 92.0, 112.0, 122.0, 153.0, 190.0, 215.0, 242.0, 252.0, 278.0, 304.0, 265.0, 256.0, 234.0, 176.0, 178.0, 144.0, 101.0, 98.0, 87.0, 66.0, 40.0, 48.0, 40.0, 20.0, 15.0, 16.0, 7.0, 6.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.86334228515625, -0.8243408203125, -0.78533935546875, -0.746337890625, -0.70733642578125, -0.6683349609375, -0.62933349609375, -0.59033203125, -0.55133056640625, -0.5123291015625, -0.47332763671875, -0.434326171875, -0.39532470703125, -0.3563232421875, -0.31732177734375, -0.2783203125, -0.23931884765625, -0.2003173828125, -0.16131591796875, -0.122314453125, -0.08331298828125, -0.0443115234375, -0.00531005859375, 0.03369140625, 0.07269287109375, 0.1116943359375, 0.15069580078125, 0.189697265625, 0.22869873046875, 0.2677001953125, 0.30670166015625, 0.345703125, 0.38470458984375, 0.4237060546875, 0.46270751953125, 0.501708984375, 0.54071044921875, 0.5797119140625, 0.61871337890625, 0.65771484375, 0.69671630859375, 0.7357177734375, 0.77471923828125, 0.813720703125, 0.85272216796875, 0.8917236328125, 0.93072509765625, 0.9697265625, 1.00872802734375, 1.0477294921875, 1.08673095703125, 1.125732421875, 1.16473388671875, 1.2037353515625, 1.24273681640625, 1.28173828125, 1.32073974609375, 1.3597412109375, 1.39874267578125, 1.437744140625, 1.47674560546875, 1.5157470703125, 1.55474853515625, 1.59375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 17.0, 12.0, 19.0, 21.0, 23.0, 23.0, 33.0, 40.0, 46.0, 36.0, 49.0, 55.0, 60.0, 72.0, 52.0, 68.0, 42.0, 55.0, 42.0, 28.0, 33.0, 26.0, 22.0, 15.0, 21.0, 15.0, 10.0, 7.0, 11.0, 8.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.709427356719971, -4.573078155517578, -4.4367289543151855, -4.300380229949951, -4.164031028747559, -4.027681827545166, -3.8913326263427734, -3.75498366355896, -3.6186347007751465, -3.482285499572754, -3.3459365367889404, -3.209587335586548, -3.0732383728027344, -2.936889171600342, -2.800539970397949, -2.6641910076141357, -2.527841806411743, -2.3914926052093506, -2.255143642425537, -2.1187944412231445, -1.982445478439331, -1.8460962772369385, -1.7097471952438354, -1.5733981132507324, -1.4370490312576294, -1.3006999492645264, -1.1643508672714233, -1.0280017852783203, -0.8916526436805725, -0.7553035616874695, -0.6189544200897217, -0.48260533809661865, -0.3462562561035156, -0.2099071592092514, -0.07355806231498718, 0.06279104948043823, 0.19914013147354126, 0.3354892134666443, 0.4718383550643921, 0.6081874370574951, 0.7445365190505981, 0.8808856010437012, 1.0172346830368042, 1.1535837650299072, 1.2899329662322998, 1.4262819290161133, 1.5626311302185059, 1.6989802122116089, 1.835329294204712, 1.971678376197815, 2.108027458190918, 2.2443766593933105, 2.380725622177124, 2.5170748233795166, 2.65342378616333, 2.7897729873657227, 2.9261221885681152, 3.062471389770508, 3.1988203525543213, 3.335169553756714, 3.4715185165405273, 3.60786771774292, 3.7442169189453125, 3.880565881729126, 4.0169148445129395]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 10.0, 4.0, 10.0, 16.0, 20.0, 12.0, 18.0, 14.0, 22.0, 26.0, 18.0, 27.0, 35.0, 30.0, 45.0, 36.0, 41.0, 48.0, 44.0, 41.0, 48.0, 28.0, 39.0, 35.0, 27.0, 31.0, 27.0, 30.0, 29.0, 28.0, 31.0, 16.0, 19.0, 13.0, 10.0, 10.0, 17.0, 12.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.2914984226226807, -2.2230279445648193, -2.154557704925537, -2.086087226867676, -2.0176169872283936, -1.9491465091705322, -1.8806761503219604, -1.8122057914733887, -1.7437353134155273, -1.6752649545669556, -1.6067945957183838, -1.5383241176605225, -1.4698537588119507, -1.401383399963379, -1.3329130411148071, -1.2644426822662354, -1.1959723234176636, -1.1275019645690918, -1.05903160572052, -0.9905611872673035, -0.9220907688140869, -0.8536204099655151, -0.7851500511169434, -0.7166796922683716, -0.648209273815155, -0.5797389149665833, -0.5112684965133667, -0.4427981376647949, -0.37432774901390076, -0.3058573603630066, -0.23738700151443481, -0.16891661286354065, -0.10044622421264648, -0.031975843012332916, 0.03649453818798065, 0.10496491193771362, 0.1734353005886078, 0.24190568923950195, 0.31037604808807373, 0.3788464367389679, 0.44731682538986206, 0.5157871842384338, 0.5842576026916504, 0.6527279615402222, 0.721198320388794, 0.7896687388420105, 0.8581390976905823, 0.9266095161437988, 0.9950798749923706, 1.0635502338409424, 1.1320205926895142, 1.200490951538086, 1.2689614295959473, 1.337431788444519, 1.4059021472930908, 1.4743725061416626, 1.5428428649902344, 1.6113132238388062, 1.679783582687378, 1.7482540607452393, 1.816724419593811, 1.8851947784423828, 1.9536651372909546, 2.0221354961395264, 2.0906059741973877]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 14.0, 8.0, 9.0, 19.0, 22.0, 41.0, 89.0, 108.0, 185.0, 356.0, 575.0, 941.0, 1618.0, 2973.0, 5166.0, 9340.0, 17459.0, 31990.0, 59581.0, 108846.0, 174694.0, 213955.0, 176805.0, 110523.0, 61422.0, 32451.0, 17742.0, 9366.0, 5227.0, 2963.0, 1671.0, 995.0, 552.0, 340.0, 205.0, 111.0, 74.0, 40.0, 32.0, 16.0, 11.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.3935546875, -0.38306427001953125, -0.3725738525390625, -0.36208343505859375, -0.351593017578125, -0.34110260009765625, -0.3306121826171875, -0.32012176513671875, -0.30963134765625, -0.29914093017578125, -0.2886505126953125, -0.27816009521484375, -0.267669677734375, -0.25717926025390625, -0.2466888427734375, -0.23619842529296875, -0.2257080078125, -0.21521759033203125, -0.2047271728515625, -0.19423675537109375, -0.183746337890625, -0.17325592041015625, -0.1627655029296875, -0.15227508544921875, -0.14178466796875, -0.13129425048828125, -0.1208038330078125, -0.11031341552734375, -0.099822998046875, -0.08933258056640625, -0.0788421630859375, -0.06835174560546875, -0.057861328125, -0.04737091064453125, -0.0368804931640625, -0.02639007568359375, -0.015899658203125, -0.00540924072265625, 0.0050811767578125, 0.01557159423828125, 0.02606201171875, 0.03655242919921875, 0.0470428466796875, 0.05753326416015625, 0.068023681640625, 0.07851409912109375, 0.0890045166015625, 0.09949493408203125, 0.1099853515625, 0.12047576904296875, 0.1309661865234375, 0.14145660400390625, 0.151947021484375, 0.16243743896484375, 0.1729278564453125, 0.18341827392578125, 0.19390869140625, 0.20439910888671875, 0.2148895263671875, 0.22537994384765625, 0.235870361328125, 0.24636077880859375, 0.2568511962890625, 0.26734161376953125, 0.27783203125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 5.0, 5.0, 7.0, 6.0, 13.0, 12.0, 11.0, 13.0, 19.0, 12.0, 25.0, 16.0, 22.0, 34.0, 34.0, 41.0, 45.0, 50.0, 29.0, 46.0, 34.0, 36.0, 29.0, 39.0, 32.0, 28.0, 30.0, 26.0, 33.0, 29.0, 26.0, 28.0, 39.0, 27.0, 20.0, 16.0, 19.0, 10.0, 9.0, 8.0, 9.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-2.609375, -2.532440185546875, -2.45550537109375, -2.378570556640625, -2.3016357421875, -2.224700927734375, -2.14776611328125, -2.070831298828125, -1.993896484375, -1.916961669921875, -1.84002685546875, -1.763092041015625, -1.6861572265625, -1.609222412109375, -1.53228759765625, -1.455352783203125, -1.37841796875, -1.301483154296875, -1.22454833984375, -1.147613525390625, -1.0706787109375, -0.993743896484375, -0.91680908203125, -0.839874267578125, -0.762939453125, -0.686004638671875, -0.60906982421875, -0.532135009765625, -0.4552001953125, -0.378265380859375, -0.30133056640625, -0.224395751953125, -0.1474609375, -0.070526123046875, 0.00640869140625, 0.083343505859375, 0.1602783203125, 0.237213134765625, 0.31414794921875, 0.391082763671875, 0.468017578125, 0.544952392578125, 0.62188720703125, 0.698822021484375, 0.7757568359375, 0.852691650390625, 0.92962646484375, 1.006561279296875, 1.08349609375, 1.160430908203125, 1.23736572265625, 1.314300537109375, 1.3912353515625, 1.468170166015625, 1.54510498046875, 1.622039794921875, 1.698974609375, 1.775909423828125, 1.85284423828125, 1.929779052734375, 2.0067138671875, 2.083648681640625, 2.16058349609375, 2.237518310546875, 2.314453125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 4.0, 11.0, 28.0, 13.0, 31.0, 39.0, 80.0, 98.0, 145.0, 261.0, 375.0, 625.0, 1033.0, 1892.0, 3760.0, 8173.0, 20007.0, 75853.0, 859439.0, 46672.0, 15879.0, 6871.0, 3249.0, 1599.0, 880.0, 563.0, 323.0, 209.0, 119.0, 90.0, 69.0, 41.0, 39.0, 31.0, 16.0, 9.0, 5.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2973480224609375, -1.261688232421875, -1.2260284423828125, -1.19036865234375, -1.1547088623046875, -1.119049072265625, -1.0833892822265625, -1.0477294921875, -1.0120697021484375, -0.976409912109375, -0.9407501220703125, -0.90509033203125, -0.8694305419921875, -0.833770751953125, -0.7981109619140625, -0.762451171875, -0.7267913818359375, -0.691131591796875, -0.6554718017578125, -0.61981201171875, -0.5841522216796875, -0.548492431640625, -0.5128326416015625, -0.4771728515625, -0.4415130615234375, -0.405853271484375, -0.3701934814453125, -0.33453369140625, -0.2988739013671875, -0.263214111328125, -0.2275543212890625, -0.19189453125, -0.1562347412109375, -0.120574951171875, -0.0849151611328125, -0.04925537109375, -0.0135955810546875, 0.022064208984375, 0.0577239990234375, 0.0933837890625, 0.1290435791015625, 0.164703369140625, 0.2003631591796875, 0.23602294921875, 0.2716827392578125, 0.307342529296875, 0.3430023193359375, 0.378662109375, 0.4143218994140625, 0.449981689453125, 0.4856414794921875, 0.52130126953125, 0.5569610595703125, 0.592620849609375, 0.6282806396484375, 0.6639404296875, 0.6996002197265625, 0.735260009765625, 0.7709197998046875, 0.80657958984375, 0.8422393798828125, 0.877899169921875, 0.9135589599609375, 0.94921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 8.0, 13.0, 12.0, 14.0, 17.0, 20.0, 20.0, 26.0, 25.0, 29.0, 30.0, 32.0, 30.0, 39.0, 31.0, 31.0, 38.0, 43.0, 33.0, 49.0, 38.0, 31.0, 28.0, 43.0, 26.0, 35.0, 35.0, 24.0, 36.0, 20.0, 19.0, 26.0, 18.0, 5.0, 10.0, 9.0, 14.0, 12.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.6064453125, -1.558135986328125, -1.50982666015625, -1.461517333984375, -1.4132080078125, -1.364898681640625, -1.31658935546875, -1.268280029296875, -1.219970703125, -1.171661376953125, -1.12335205078125, -1.075042724609375, -1.0267333984375, -0.978424072265625, -0.93011474609375, -0.881805419921875, -0.83349609375, -0.785186767578125, -0.73687744140625, -0.688568115234375, -0.6402587890625, -0.591949462890625, -0.54364013671875, -0.495330810546875, -0.447021484375, -0.398712158203125, -0.35040283203125, -0.302093505859375, -0.2537841796875, -0.205474853515625, -0.15716552734375, -0.108856201171875, -0.060546875, -0.012237548828125, 0.03607177734375, 0.084381103515625, 0.1326904296875, 0.180999755859375, 0.22930908203125, 0.277618408203125, 0.325927734375, 0.374237060546875, 0.42254638671875, 0.470855712890625, 0.5191650390625, 0.567474365234375, 0.61578369140625, 0.664093017578125, 0.71240234375, 0.760711669921875, 0.80902099609375, 0.857330322265625, 0.9056396484375, 0.953948974609375, 1.00225830078125, 1.050567626953125, 1.098876953125, 1.147186279296875, 1.19549560546875, 1.243804931640625, 1.2921142578125, 1.340423583984375, 1.38873291015625, 1.437042236328125, 1.4853515625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 10.0, 9.0, 18.0, 14.0, 23.0, 39.0, 51.0, 76.0, 83.0, 137.0, 165.0, 300.0, 489.0, 799.0, 1275.0, 2336.0, 4387.0, 8698.0, 18496.0, 54712.0, 886998.0, 38410.0, 15121.0, 7190.0, 3663.0, 1967.0, 1105.0, 685.0, 432.0, 266.0, 179.0, 123.0, 70.0, 49.0, 40.0, 23.0, 20.0, 21.0, 13.0, 10.0, 8.0, 7.0, 8.0, 9.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.275146484375, -0.2669029235839844, -0.25865936279296875, -0.2504158020019531, -0.2421722412109375, -0.23392868041992188, -0.22568511962890625, -0.21744155883789062, -0.209197998046875, -0.20095443725585938, -0.19271087646484375, -0.18446731567382812, -0.1762237548828125, -0.16798019409179688, -0.15973663330078125, -0.15149307250976562, -0.14324951171875, -0.13500595092773438, -0.12676239013671875, -0.11851882934570312, -0.1102752685546875, -0.10203170776367188, -0.09378814697265625, -0.08554458618164062, -0.077301025390625, -0.06905746459960938, -0.06081390380859375, -0.052570343017578125, -0.0443267822265625, -0.036083221435546875, -0.02783966064453125, -0.019596099853515625, -0.0113525390625, -0.003108978271484375, 0.00513458251953125, 0.013378143310546875, 0.0216217041015625, 0.029865264892578125, 0.03810882568359375, 0.046352386474609375, 0.054595947265625, 0.06283950805664062, 0.07108306884765625, 0.07932662963867188, 0.0875701904296875, 0.09581375122070312, 0.10405731201171875, 0.11230087280273438, 0.12054443359375, 0.12878799438476562, 0.13703155517578125, 0.14527511596679688, 0.1535186767578125, 0.16176223754882812, 0.17000579833984375, 0.17824935913085938, 0.186492919921875, 0.19473648071289062, 0.20298004150390625, 0.21122360229492188, 0.2194671630859375, 0.22771072387695312, 0.23595428466796875, 0.24419784545898438, 0.25244140625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 7.0, 8.0, 9.0, 10.0, 19.0, 21.0, 21.0, 34.0, 30.0, 41.0, 33.0, 52.0, 39.0, 53.0, 51.0, 63.0, 64.0, 57.0, 57.0, 38.0, 52.0, 36.0, 34.0, 29.0, 27.0, 24.0, 12.0, 18.0, 11.0, 10.0, 9.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.1961669921875e-05, -4.06922772526741e-05, -3.9422884583473206e-05, -3.815349191427231e-05, -3.688409924507141e-05, -3.5614706575870514e-05, -3.434531390666962e-05, -3.307592123746872e-05, -3.180652856826782e-05, -3.0537135899066925e-05, -2.9267743229866028e-05, -2.799835056066513e-05, -2.6728957891464233e-05, -2.5459565222263336e-05, -2.419017255306244e-05, -2.2920779883861542e-05, -2.1651387214660645e-05, -2.0381994545459747e-05, -1.911260187625885e-05, -1.7843209207057953e-05, -1.6573816537857056e-05, -1.530442386865616e-05, -1.4035031199455261e-05, -1.2765638530254364e-05, -1.1496245861053467e-05, -1.022685319185257e-05, -8.957460522651672e-06, -7.688067853450775e-06, -6.418675184249878e-06, -5.149282515048981e-06, -3.8798898458480835e-06, -2.6104971766471863e-06, -1.341104507446289e-06, -7.171183824539185e-08, 1.1976808309555054e-06, 2.4670735001564026e-06, 3.7364661693573e-06, 5.005858838558197e-06, 6.275251507759094e-06, 7.5446441769599915e-06, 8.814036846160889e-06, 1.0083429515361786e-05, 1.1352822184562683e-05, 1.262221485376358e-05, 1.3891607522964478e-05, 1.5161000192165375e-05, 1.6430392861366272e-05, 1.769978553056717e-05, 1.8969178199768066e-05, 2.0238570868968964e-05, 2.150796353816986e-05, 2.2777356207370758e-05, 2.4046748876571655e-05, 2.5316141545772552e-05, 2.658553421497345e-05, 2.7854926884174347e-05, 2.9124319553375244e-05, 3.039371222257614e-05, 3.166310489177704e-05, 3.2932497560977936e-05, 3.420189023017883e-05, 3.547128289937973e-05, 3.674067556858063e-05, 3.8010068237781525e-05, 3.927946090698242e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 5.0, 6.0, 13.0, 13.0, 21.0, 22.0, 28.0, 41.0, 50.0, 69.0, 78.0, 142.0, 211.0, 273.0, 384.0, 579.0, 862.0, 1117.0, 1807.0, 2723.0, 4531.0, 7361.0, 12519.0, 22290.0, 39328.0, 70702.0, 123129.0, 189927.0, 208815.0, 151944.0, 90199.0, 50321.0, 28339.0, 15918.0, 9122.0, 5512.0, 3421.0, 2218.0, 1374.0, 921.0, 594.0, 413.0, 362.0, 223.0, 163.0, 139.0, 86.0, 77.0, 56.0, 32.0, 20.0, 19.0, 17.0, 12.0, 9.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.07623291015625, -0.0737905502319336, -0.07134819030761719, -0.06890583038330078, -0.06646347045898438, -0.06402111053466797, -0.06157875061035156, -0.059136390686035156, -0.05669403076171875, -0.054251670837402344, -0.05180931091308594, -0.04936695098876953, -0.046924591064453125, -0.04448223114013672, -0.04203987121582031, -0.039597511291503906, -0.0371551513671875, -0.034712791442871094, -0.03227043151855469, -0.02982807159423828, -0.027385711669921875, -0.02494335174560547, -0.022500991821289062, -0.020058631896972656, -0.01761627197265625, -0.015173912048339844, -0.012731552124023438, -0.010289192199707031, -0.007846832275390625, -0.005404472351074219, -0.0029621124267578125, -0.0005197525024414062, 0.001922607421875, 0.004364967346191406, 0.0068073272705078125, 0.009249687194824219, 0.011692047119140625, 0.014134407043457031, 0.016576766967773438, 0.019019126892089844, 0.02146148681640625, 0.023903846740722656, 0.026346206665039062, 0.02878856658935547, 0.031230926513671875, 0.03367328643798828, 0.03611564636230469, 0.038558006286621094, 0.0410003662109375, 0.043442726135253906, 0.04588508605957031, 0.04832744598388672, 0.050769805908203125, 0.05321216583251953, 0.05565452575683594, 0.058096885681152344, 0.06053924560546875, 0.06298160552978516, 0.06542396545410156, 0.06786632537841797, 0.07030868530273438, 0.07275104522705078, 0.07519340515136719, 0.0776357650756836, 0.080078125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 7.0, 6.0, 15.0, 15.0, 16.0, 26.0, 19.0, 32.0, 27.0, 48.0, 50.0, 50.0, 66.0, 68.0, 52.0, 75.0, 74.0, 57.0, 59.0, 47.0, 44.0, 29.0, 28.0, 21.0, 13.0, 16.0, 9.0, 7.0, 7.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0164947509765625, -0.015921354293823242, -0.015347957611083984, -0.014774560928344727, -0.014201164245605469, -0.013627767562866211, -0.013054370880126953, -0.012480974197387695, -0.011907577514648438, -0.01133418083190918, -0.010760784149169922, -0.010187387466430664, -0.009613990783691406, -0.009040594100952148, -0.00846719741821289, -0.007893800735473633, -0.007320404052734375, -0.006747007369995117, -0.006173610687255859, -0.0056002140045166016, -0.005026817321777344, -0.004453420639038086, -0.003880023956298828, -0.0033066272735595703, -0.0027332305908203125, -0.0021598339080810547, -0.0015864372253417969, -0.001013040542602539, -0.00043964385986328125, 0.00013375282287597656, 0.0007071495056152344, 0.0012805461883544922, 0.00185394287109375, 0.002427339553833008, 0.0030007362365722656, 0.0035741329193115234, 0.004147529602050781, 0.004720926284790039, 0.005294322967529297, 0.005867719650268555, 0.0064411163330078125, 0.00701451301574707, 0.007587909698486328, 0.008161306381225586, 0.008734703063964844, 0.009308099746704102, 0.00988149642944336, 0.010454893112182617, 0.011028289794921875, 0.011601686477661133, 0.01217508316040039, 0.012748479843139648, 0.013321876525878906, 0.013895273208618164, 0.014468669891357422, 0.01504206657409668, 0.015615463256835938, 0.016188859939575195, 0.016762256622314453, 0.01733565330505371, 0.01790904998779297, 0.018482446670532227, 0.019055843353271484, 0.019629240036010742, 0.02020263671875]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 6.0, 17.0, 11.0, 17.0, 23.0, 26.0, 23.0, 29.0, 37.0, 50.0, 36.0, 47.0, 51.0, 62.0, 77.0, 56.0, 62.0, 42.0, 47.0, 51.0, 29.0, 33.0, 24.0, 21.0, 19.0, 18.0, 16.0, 11.0, 5.0, 14.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.703352451324463, -4.567334175109863, -4.431316375732422, -4.295298099517822, -4.159279823303223, -4.023262023925781, -3.8872437477111816, -3.751225709915161, -3.6152076721191406, -3.47918963432312, -3.3431715965270996, -3.2071533203125, -3.0711352825164795, -2.935117244720459, -2.7990989685058594, -2.663080930709839, -2.5270628929138184, -2.391044855117798, -2.2550268173217773, -2.1190085411071777, -1.9829905033111572, -1.8469724655151367, -1.7109543085098267, -1.5749361515045166, -1.438918113708496, -1.3029000759124756, -1.1668819189071655, -1.0308637619018555, -0.894845724105835, -0.7588276267051697, -0.6228095293045044, -0.4867914319038391, -0.35077333450317383, -0.21475523710250854, -0.07873713970184326, 0.05728095769882202, 0.1932990550994873, 0.3293171525001526, 0.46533524990081787, 0.6013533473014832, 0.7373714447021484, 0.8733895421028137, 1.009407639503479, 1.145425796508789, 1.2814438343048096, 1.41746187210083, 1.5534800291061401, 1.6894981861114502, 1.8255162239074707, 1.9615342617034912, 2.0975522994995117, 2.2335705757141113, 2.369588613510132, 2.5056066513061523, 2.641624927520752, 2.7776429653167725, 2.913661003112793, 3.0496790409088135, 3.185697078704834, 3.3217153549194336, 3.457733392715454, 3.5937514305114746, 3.729769706726074, 3.8657877445220947, 4.001805782318115]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 5.0, 1.0, 1.0, 10.0, 10.0, 2.0, 6.0, 21.0, 17.0, 14.0, 14.0, 19.0, 21.0, 24.0, 22.0, 23.0, 38.0, 30.0, 47.0, 35.0, 34.0, 49.0, 51.0, 42.0, 41.0, 31.0, 41.0, 34.0, 26.0, 31.0, 29.0, 31.0, 29.0, 27.0, 30.0, 18.0, 15.0, 15.0, 11.0, 8.0, 18.0, 13.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.3029496669769287, -2.2345986366271973, -2.1662473678588867, -2.0978963375091553, -2.0295450687408447, -1.9611940383911133, -1.8928428888320923, -1.8244917392730713, -1.7561405897140503, -1.6877894401550293, -1.6194382905960083, -1.5510871410369873, -1.4827361106872559, -1.4143848419189453, -1.3460338115692139, -1.2776826620101929, -1.2093315124511719, -1.1409803628921509, -1.0726292133331299, -1.0042780637741089, -0.9359269738197327, -0.8675758242607117, -0.7992247343063354, -0.7308735847473145, -0.6625224351882935, -0.5941712856292725, -0.5258201360702515, -0.45746904611587524, -0.38911789655685425, -0.32076674699783325, -0.25241562724113464, -0.18406450748443604, -0.11571335792541504, -0.04736222326755524, 0.020988911390304565, 0.08934004604816437, 0.15769118070602417, 0.22604233026504517, 0.2943934500217438, 0.3627445697784424, 0.4310957193374634, 0.4994468688964844, 0.5677980184555054, 0.6361491084098816, 0.7045002579689026, 0.7728514075279236, 0.8412024974822998, 0.9095536470413208, 0.9779047966003418, 1.0462559461593628, 1.1146070957183838, 1.1829582452774048, 1.2513093948364258, 1.3196604251861572, 1.3880115747451782, 1.4563627243041992, 1.5247138738632202, 1.5930650234222412, 1.6614161729812622, 1.7297673225402832, 1.7981183528900146, 1.8664696216583252, 1.9348206520080566, 2.003171920776367, 2.0715229511260986]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 11.0, 16.0, 20.0, 33.0, 52.0, 104.0, 145.0, 233.0, 400.0, 685.0, 1169.0, 1926.0, 3260.0, 5428.0, 9318.0, 15524.0, 25828.0, 42270.0, 65918.0, 95814.0, 126941.0, 145913.0, 143131.0, 120443.0, 88683.0, 59615.0, 38254.0, 23097.0, 14061.0, 8248.0, 4847.0, 2863.0, 1707.0, 1088.0, 605.0, 349.0, 234.0, 107.0, 83.0, 60.0, 28.0, 19.0, 10.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86328125, -2.77349853515625, -2.6837158203125, -2.59393310546875, -2.504150390625, -2.41436767578125, -2.3245849609375, -2.23480224609375, -2.14501953125, -2.05523681640625, -1.9654541015625, -1.87567138671875, -1.785888671875, -1.69610595703125, -1.6063232421875, -1.51654052734375, -1.4267578125, -1.33697509765625, -1.2471923828125, -1.15740966796875, -1.067626953125, -0.97784423828125, -0.8880615234375, -0.79827880859375, -0.70849609375, -0.61871337890625, -0.5289306640625, -0.43914794921875, -0.349365234375, -0.25958251953125, -0.1697998046875, -0.08001708984375, 0.009765625, 0.09954833984375, 0.1893310546875, 0.27911376953125, 0.368896484375, 0.45867919921875, 0.5484619140625, 0.63824462890625, 0.72802734375, 0.81781005859375, 0.9075927734375, 0.99737548828125, 1.087158203125, 1.17694091796875, 1.2667236328125, 1.35650634765625, 1.4462890625, 1.53607177734375, 1.6258544921875, 1.71563720703125, 1.805419921875, 1.89520263671875, 1.9849853515625, 2.07476806640625, 2.16455078125, 2.25433349609375, 2.3441162109375, 2.43389892578125, 2.523681640625, 2.61346435546875, 2.7032470703125, 2.79302978515625, 2.8828125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 2.0, 6.0, 8.0, 11.0, 13.0, 7.0, 9.0, 12.0, 21.0, 17.0, 24.0, 30.0, 30.0, 28.0, 35.0, 30.0, 40.0, 54.0, 51.0, 47.0, 39.0, 52.0, 52.0, 32.0, 41.0, 43.0, 32.0, 36.0, 33.0, 24.0, 22.0, 16.0, 27.0, 17.0, 11.0, 12.0, 7.0, 7.0, 8.0, 5.0, 1.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.783203125, -2.69830322265625, -2.6134033203125, -2.52850341796875, -2.443603515625, -2.35870361328125, -2.2738037109375, -2.18890380859375, -2.10400390625, -2.01910400390625, -1.9342041015625, -1.84930419921875, -1.764404296875, -1.67950439453125, -1.5946044921875, -1.50970458984375, -1.4248046875, -1.33990478515625, -1.2550048828125, -1.17010498046875, -1.085205078125, -1.00030517578125, -0.9154052734375, -0.83050537109375, -0.74560546875, -0.66070556640625, -0.5758056640625, -0.49090576171875, -0.406005859375, -0.32110595703125, -0.2362060546875, -0.15130615234375, -0.06640625, 0.01849365234375, 0.1033935546875, 0.18829345703125, 0.273193359375, 0.35809326171875, 0.4429931640625, 0.52789306640625, 0.61279296875, 0.69769287109375, 0.7825927734375, 0.86749267578125, 0.952392578125, 1.03729248046875, 1.1221923828125, 1.20709228515625, 1.2919921875, 1.37689208984375, 1.4617919921875, 1.54669189453125, 1.631591796875, 1.71649169921875, 1.8013916015625, 1.88629150390625, 1.97119140625, 2.05609130859375, 2.1409912109375, 2.22589111328125, 2.310791015625, 2.39569091796875, 2.4805908203125, 2.56549072265625, 2.650390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [7.0, 4.0, 10.0, 7.0, 9.0, 17.0, 24.0, 31.0, 47.0, 73.0, 103.0, 185.0, 257.0, 328.0, 540.0, 869.0, 1343.0, 1948.0, 3217.0, 4800.0, 7691.0, 11740.0, 18029.0, 26917.0, 39656.0, 56290.0, 76811.0, 98115.0, 115070.0, 121740.0, 115073.0, 98111.0, 76621.0, 56326.0, 39183.0, 26356.0, 17872.0, 11873.0, 7636.0, 4804.0, 3134.0, 1936.0, 1287.0, 846.0, 551.0, 377.0, 236.0, 157.0, 111.0, 56.0, 53.0, 30.0, 19.0, 13.0, 7.0, 7.0, 11.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.353515625, -2.273712158203125, -2.19390869140625, -2.114105224609375, -2.0343017578125, -1.954498291015625, -1.87469482421875, -1.794891357421875, -1.715087890625, -1.635284423828125, -1.55548095703125, -1.475677490234375, -1.3958740234375, -1.316070556640625, -1.23626708984375, -1.156463623046875, -1.07666015625, -0.996856689453125, -0.91705322265625, -0.837249755859375, -0.7574462890625, -0.677642822265625, -0.59783935546875, -0.518035888671875, -0.438232421875, -0.358428955078125, -0.27862548828125, -0.198822021484375, -0.1190185546875, -0.039215087890625, 0.04058837890625, 0.120391845703125, 0.2001953125, 0.279998779296875, 0.35980224609375, 0.439605712890625, 0.5194091796875, 0.599212646484375, 0.67901611328125, 0.758819580078125, 0.838623046875, 0.918426513671875, 0.99822998046875, 1.078033447265625, 1.1578369140625, 1.237640380859375, 1.31744384765625, 1.397247314453125, 1.47705078125, 1.556854248046875, 1.63665771484375, 1.716461181640625, 1.7962646484375, 1.876068115234375, 1.95587158203125, 2.035675048828125, 2.115478515625, 2.195281982421875, 2.27508544921875, 2.354888916015625, 2.4346923828125, 2.514495849609375, 2.59429931640625, 2.674102783203125, 2.75390625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 4.0, 7.0, 8.0, 11.0, 12.0, 12.0, 27.0, 18.0, 25.0, 27.0, 25.0, 23.0, 32.0, 38.0, 41.0, 45.0, 49.0, 57.0, 38.0, 38.0, 42.0, 47.0, 33.0, 43.0, 30.0, 30.0, 32.0, 40.0, 23.0, 29.0, 14.0, 14.0, 9.0, 16.0, 14.0, 15.0, 12.0, 8.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4817047119140625, -1.429229736328125, -1.3767547607421875, -1.32427978515625, -1.2718048095703125, -1.219329833984375, -1.1668548583984375, -1.1143798828125, -1.0619049072265625, -1.009429931640625, -0.9569549560546875, -0.90447998046875, -0.8520050048828125, -0.799530029296875, -0.7470550537109375, -0.694580078125, -0.6421051025390625, -0.589630126953125, -0.5371551513671875, -0.48468017578125, -0.4322052001953125, -0.379730224609375, -0.3272552490234375, -0.2747802734375, -0.2223052978515625, -0.169830322265625, -0.1173553466796875, -0.06488037109375, -0.0124053955078125, 0.040069580078125, 0.0925445556640625, 0.14501953125, 0.1974945068359375, 0.249969482421875, 0.3024444580078125, 0.35491943359375, 0.4073944091796875, 0.459869384765625, 0.5123443603515625, 0.5648193359375, 0.6172943115234375, 0.669769287109375, 0.7222442626953125, 0.77471923828125, 0.8271942138671875, 0.879669189453125, 0.9321441650390625, 0.984619140625, 1.0370941162109375, 1.089569091796875, 1.1420440673828125, 1.19451904296875, 1.2469940185546875, 1.299468994140625, 1.3519439697265625, 1.4044189453125, 1.4568939208984375, 1.509368896484375, 1.5618438720703125, 1.61431884765625, 1.6667938232421875, 1.719268798828125, 1.7717437744140625, 1.82421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 10.0, 12.0, 13.0, 19.0, 19.0, 38.0, 58.0, 101.0, 138.0, 169.0, 271.0, 376.0, 576.0, 891.0, 1442.0, 2243.0, 3948.0, 7350.0, 14212.0, 29975.0, 67393.0, 149151.0, 262970.0, 252250.0, 136940.0, 60883.0, 27424.0, 13226.0, 6649.0, 3808.0, 2159.0, 1301.0, 831.0, 587.0, 356.0, 223.0, 182.0, 117.0, 91.0, 45.0, 40.0, 24.0, 21.0, 9.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.65234375, -3.5343017578125, -3.416259765625, -3.2982177734375, -3.18017578125, -3.0621337890625, -2.944091796875, -2.8260498046875, -2.7080078125, -2.5899658203125, -2.471923828125, -2.3538818359375, -2.23583984375, -2.1177978515625, -1.999755859375, -1.8817138671875, -1.763671875, -1.6456298828125, -1.527587890625, -1.4095458984375, -1.29150390625, -1.1734619140625, -1.055419921875, -0.9373779296875, -0.8193359375, -0.7012939453125, -0.583251953125, -0.4652099609375, -0.34716796875, -0.2291259765625, -0.111083984375, 0.0069580078125, 0.125, 0.2430419921875, 0.361083984375, 0.4791259765625, 0.59716796875, 0.7152099609375, 0.833251953125, 0.9512939453125, 1.0693359375, 1.1873779296875, 1.305419921875, 1.4234619140625, 1.54150390625, 1.6595458984375, 1.777587890625, 1.8956298828125, 2.013671875, 2.1317138671875, 2.249755859375, 2.3677978515625, 2.48583984375, 2.6038818359375, 2.721923828125, 2.8399658203125, 2.9580078125, 3.0760498046875, 3.194091796875, 3.3121337890625, 3.43017578125, 3.5482177734375, 3.666259765625, 3.7843017578125, 3.90234375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 6.0, 12.0, 12.0, 19.0, 41.0, 75.0, 86.0, 126.0, 133.0, 142.0, 125.0, 68.0, 43.0, 32.0, 15.0, 13.0, 14.0, 8.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006952285766601562, -0.0006757825613021851, -0.0006563365459442139, -0.0006368905305862427, -0.0006174445152282715, -0.0005979984998703003, -0.0005785524845123291, -0.0005591064691543579, -0.0005396604537963867, -0.0005202144384384155, -0.0005007684230804443, -0.00048132240772247314, -0.00046187639236450195, -0.00044243037700653076, -0.00042298436164855957, -0.0004035383462905884, -0.0003840923309326172, -0.000364646315574646, -0.0003452003002166748, -0.0003257542848587036, -0.0003063082695007324, -0.00028686225414276123, -0.00026741623878479004, -0.00024797022342681885, -0.00022852420806884766, -0.00020907819271087646, -0.00018963217735290527, -0.00017018616199493408, -0.0001507401466369629, -0.0001312941312789917, -0.00011184811592102051, -9.240210056304932e-05, -7.295608520507812e-05, -5.3510069847106934e-05, -3.406405448913574e-05, -1.461803913116455e-05, 4.827976226806641e-06, 2.4273991584777832e-05, 4.3720006942749023e-05, 6.316602230072021e-05, 8.26120376586914e-05, 0.0001020580530166626, 0.00012150406837463379, 0.00014095008373260498, 0.00016039609909057617, 0.00017984211444854736, 0.00019928812980651855, 0.00021873414516448975, 0.00023818016052246094, 0.00025762617588043213, 0.0002770721912384033, 0.0002965182065963745, 0.0003159642219543457, 0.0003354102373123169, 0.0003548562526702881, 0.0003743022680282593, 0.00039374828338623047, 0.00041319429874420166, 0.00043264031410217285, 0.00045208632946014404, 0.00047153234481811523, 0.0004909783601760864, 0.0005104243755340576, 0.0005298703908920288, 0.00054931640625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 7.0, 4.0, 9.0, 9.0, 13.0, 18.0, 28.0, 51.0, 43.0, 68.0, 108.0, 156.0, 252.0, 335.0, 451.0, 677.0, 1043.0, 1639.0, 2499.0, 4097.0, 6827.0, 11936.0, 21632.0, 39723.0, 73011.0, 129017.0, 193036.0, 207174.0, 152723.0, 89910.0, 49047.0, 26647.0, 14712.0, 8121.0, 4901.0, 3002.0, 1853.0, 1173.0, 828.0, 538.0, 386.0, 267.0, 170.0, 127.0, 87.0, 62.0, 50.0, 22.0, 31.0, 11.0, 8.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.431640625, -2.3536376953125, -2.275634765625, -2.1976318359375, -2.11962890625, -2.0416259765625, -1.963623046875, -1.8856201171875, -1.8076171875, -1.7296142578125, -1.651611328125, -1.5736083984375, -1.49560546875, -1.4176025390625, -1.339599609375, -1.2615966796875, -1.18359375, -1.1055908203125, -1.027587890625, -0.9495849609375, -0.87158203125, -0.7935791015625, -0.715576171875, -0.6375732421875, -0.5595703125, -0.4815673828125, -0.403564453125, -0.3255615234375, -0.24755859375, -0.1695556640625, -0.091552734375, -0.0135498046875, 0.064453125, 0.1424560546875, 0.220458984375, 0.2984619140625, 0.37646484375, 0.4544677734375, 0.532470703125, 0.6104736328125, 0.6884765625, 0.7664794921875, 0.844482421875, 0.9224853515625, 1.00048828125, 1.0784912109375, 1.156494140625, 1.2344970703125, 1.3125, 1.3905029296875, 1.468505859375, 1.5465087890625, 1.62451171875, 1.7025146484375, 1.780517578125, 1.8585205078125, 1.9365234375, 2.0145263671875, 2.092529296875, 2.1705322265625, 2.24853515625, 2.3265380859375, 2.404541015625, 2.4825439453125, 2.560546875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 0.0, 8.0, 10.0, 11.0, 17.0, 16.0, 27.0, 33.0, 38.0, 49.0, 44.0, 54.0, 58.0, 60.0, 79.0, 72.0, 66.0, 59.0, 55.0, 52.0, 23.0, 28.0, 23.0, 16.0, 14.0, 11.0, 11.0, 9.0, 8.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.71875, -0.696044921875, -0.67333984375, -0.650634765625, -0.6279296875, -0.605224609375, -0.58251953125, -0.559814453125, -0.537109375, -0.514404296875, -0.49169921875, -0.468994140625, -0.4462890625, -0.423583984375, -0.40087890625, -0.378173828125, -0.35546875, -0.332763671875, -0.31005859375, -0.287353515625, -0.2646484375, -0.241943359375, -0.21923828125, -0.196533203125, -0.173828125, -0.151123046875, -0.12841796875, -0.105712890625, -0.0830078125, -0.060302734375, -0.03759765625, -0.014892578125, 0.0078125, 0.030517578125, 0.05322265625, 0.075927734375, 0.0986328125, 0.121337890625, 0.14404296875, 0.166748046875, 0.189453125, 0.212158203125, 0.23486328125, 0.257568359375, 0.2802734375, 0.302978515625, 0.32568359375, 0.348388671875, 0.37109375, 0.393798828125, 0.41650390625, 0.439208984375, 0.4619140625, 0.484619140625, 0.50732421875, 0.530029296875, 0.552734375, 0.575439453125, 0.59814453125, 0.620849609375, 0.6435546875, 0.666259765625, 0.68896484375, 0.711669921875, 0.734375]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 3.0, 10.0, 13.0, 14.0, 16.0, 12.0, 29.0, 17.0, 30.0, 33.0, 34.0, 48.0, 37.0, 61.0, 58.0, 61.0, 57.0, 66.0, 66.0, 46.0, 49.0, 38.0, 35.0, 27.0, 19.0, 22.0, 23.0, 7.0, 7.0, 13.0, 4.0, 11.0, 11.0, 7.0, 4.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.617569446563721, -4.47745418548584, -4.337339401245117, -4.197224140167236, -4.0571088790893555, -3.9169936180114746, -3.776878595352173, -3.636763572692871, -3.4966483116149902, -3.3565330505371094, -3.2164180278778076, -3.076303005218506, -2.936187744140625, -2.796072483062744, -2.6559574604034424, -2.5158424377441406, -2.3757271766662598, -2.235611915588379, -2.095496892929077, -1.9553817510604858, -1.8152666091918945, -1.6751514673233032, -1.535036325454712, -1.3949211835861206, -1.2548060417175293, -1.114690899848938, -0.9745757579803467, -0.8344606161117554, -0.6943454742431641, -0.5542303323745728, -0.41411519050598145, -0.27400004863739014, -0.13388490676879883, 0.0062302350997924805, 0.1463453769683838, 0.2864605188369751, 0.4265756607055664, 0.5666908025741577, 0.706805944442749, 0.8469210863113403, 0.9870362281799316, 1.127151370048523, 1.2672665119171143, 1.4073816537857056, 1.5474967956542969, 1.6876119375228882, 1.8277270793914795, 1.9678422212600708, 2.107957363128662, 2.248072624206543, 2.3881876468658447, 2.5283026695251465, 2.6684179306030273, 2.808533191680908, 2.94864821434021, 3.0887632369995117, 3.2288784980773926, 3.3689937591552734, 3.509108781814575, 3.649223804473877, 3.789339065551758, 3.9294543266296387, 4.0695695877075195, 4.209684371948242, 4.349799633026123]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 9.0, 9.0, 10.0, 13.0, 17.0, 10.0, 18.0, 21.0, 33.0, 14.0, 33.0, 31.0, 38.0, 31.0, 33.0, 33.0, 43.0, 30.0, 39.0, 41.0, 38.0, 34.0, 34.0, 30.0, 40.0, 28.0, 33.0, 28.0, 31.0, 39.0, 14.0, 20.0, 15.0, 24.0, 6.0, 19.0, 11.0, 8.0, 5.0, 5.0, 5.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0], "bins": [-2.5560855865478516, -2.4842679500579834, -2.412450075149536, -2.340632438659668, -2.2688148021698, -2.1969971656799316, -2.1251792907714844, -2.053361654281616, -1.9815438985824585, -1.9097261428833008, -1.8379085063934326, -1.766090750694275, -1.6942729949951172, -1.622455358505249, -1.5506376028060913, -1.4788198471069336, -1.4070022106170654, -1.3351844549179077, -1.2633668184280396, -1.1915490627288818, -1.1197314262390137, -1.047913670539856, -0.9760959148406982, -0.9042782187461853, -0.8324605226516724, -0.7606428265571594, -0.6888251304626465, -0.6170073747634888, -0.5451896786689758, -0.4733719825744629, -0.40155425667762756, -0.32973653078079224, -0.2579185962677002, -0.18610088527202606, -0.11428317427635193, -0.042465463280677795, 0.029352247714996338, 0.10116994380950928, 0.1729876697063446, 0.24480539560317993, 0.31662309169769287, 0.3884407877922058, 0.46025851368904114, 0.5320762395858765, 0.6038939356803894, 0.6757116317749023, 0.7475293874740601, 0.819347083568573, 0.8911647796630859, 0.9629824757575989, 1.0348001718521118, 1.1066179275512695, 1.1784355640411377, 1.2502533197402954, 1.3220710754394531, 1.3938887119293213, 1.465706467628479, 1.5375242233276367, 1.6093418598175049, 1.6811596155166626, 1.7529773712158203, 1.8247950077056885, 1.8966127634048462, 1.968430519104004, 2.040248155593872]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 17.0, 17.0, 30.0, 26.0, 41.0, 84.0, 134.0, 181.0, 324.0, 457.0, 765.0, 1264.0, 2062.0, 3540.0, 6323.0, 11072.0, 20599.0, 39078.0, 77915.0, 164238.0, 369744.0, 805057.0, 1157518.0, 819576.0, 379241.0, 168429.0, 79440.0, 39743.0, 21030.0, 11352.0, 6233.0, 3606.0, 2044.0, 1215.0, 753.0, 441.0, 255.0, 153.0, 98.0, 72.0, 41.0, 29.0, 17.0, 7.0, 6.0, 9.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.9453125, -4.793212890625, -4.64111328125, -4.489013671875, -4.3369140625, -4.184814453125, -4.03271484375, -3.880615234375, -3.728515625, -3.576416015625, -3.42431640625, -3.272216796875, -3.1201171875, -2.968017578125, -2.81591796875, -2.663818359375, -2.51171875, -2.359619140625, -2.20751953125, -2.055419921875, -1.9033203125, -1.751220703125, -1.59912109375, -1.447021484375, -1.294921875, -1.142822265625, -0.99072265625, -0.838623046875, -0.6865234375, -0.534423828125, -0.38232421875, -0.230224609375, -0.078125, 0.073974609375, 0.22607421875, 0.378173828125, 0.5302734375, 0.682373046875, 0.83447265625, 0.986572265625, 1.138671875, 1.290771484375, 1.44287109375, 1.594970703125, 1.7470703125, 1.899169921875, 2.05126953125, 2.203369140625, 2.35546875, 2.507568359375, 2.65966796875, 2.811767578125, 2.9638671875, 3.115966796875, 3.26806640625, 3.420166015625, 3.572265625, 3.724365234375, 3.87646484375, 4.028564453125, 4.1806640625, 4.332763671875, 4.48486328125, 4.636962890625, 4.7890625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 9.0, 9.0, 5.0, 9.0, 16.0, 17.0, 14.0, 20.0, 23.0, 29.0, 24.0, 32.0, 35.0, 42.0, 45.0, 33.0, 35.0, 42.0, 50.0, 35.0, 45.0, 49.0, 44.0, 35.0, 31.0, 29.0, 24.0, 33.0, 22.0, 26.0, 24.0, 24.0, 15.0, 12.0, 18.0, 9.0, 7.0, 6.0, 9.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.353515625, -2.2865753173828125, -2.219635009765625, -2.1526947021484375, -2.08575439453125, -2.0188140869140625, -1.951873779296875, -1.8849334716796875, -1.8179931640625, -1.7510528564453125, -1.684112548828125, -1.6171722412109375, -1.55023193359375, -1.4832916259765625, -1.416351318359375, -1.3494110107421875, -1.282470703125, -1.2155303955078125, -1.148590087890625, -1.0816497802734375, -1.01470947265625, -0.9477691650390625, -0.880828857421875, -0.8138885498046875, -0.7469482421875, -0.6800079345703125, -0.613067626953125, -0.5461273193359375, -0.47918701171875, -0.4122467041015625, -0.345306396484375, -0.2783660888671875, -0.21142578125, -0.1444854736328125, -0.077545166015625, -0.0106048583984375, 0.05633544921875, 0.1232757568359375, 0.190216064453125, 0.2571563720703125, 0.3240966796875, 0.3910369873046875, 0.457977294921875, 0.5249176025390625, 0.59185791015625, 0.6587982177734375, 0.725738525390625, 0.7926788330078125, 0.859619140625, 0.9265594482421875, 0.993499755859375, 1.0604400634765625, 1.12738037109375, 1.1943206787109375, 1.261260986328125, 1.3282012939453125, 1.3951416015625, 1.4620819091796875, 1.529022216796875, 1.5959625244140625, 1.66290283203125, 1.7298431396484375, 1.796783447265625, 1.8637237548828125, 1.9306640625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 15.0, 18.0, 15.0, 34.0, 57.0, 99.0, 138.0, 227.0, 335.0, 570.0, 937.0, 1575.0, 2800.0, 4571.0, 8458.0, 15048.0, 27894.0, 52572.0, 102349.0, 205976.0, 416428.0, 775062.0, 1021311.0, 750665.0, 398872.0, 198723.0, 98801.0, 50510.0, 26396.0, 14582.0, 7974.0, 4599.0, 2648.0, 1580.0, 907.0, 577.0, 345.0, 212.0, 132.0, 91.0, 61.0, 44.0, 21.0, 18.0, 12.0, 7.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-5.3359375, -5.176513671875, -5.01708984375, -4.857666015625, -4.6982421875, -4.538818359375, -4.37939453125, -4.219970703125, -4.060546875, -3.901123046875, -3.74169921875, -3.582275390625, -3.4228515625, -3.263427734375, -3.10400390625, -2.944580078125, -2.78515625, -2.625732421875, -2.46630859375, -2.306884765625, -2.1474609375, -1.988037109375, -1.82861328125, -1.669189453125, -1.509765625, -1.350341796875, -1.19091796875, -1.031494140625, -0.8720703125, -0.712646484375, -0.55322265625, -0.393798828125, -0.234375, -0.074951171875, 0.08447265625, 0.243896484375, 0.4033203125, 0.562744140625, 0.72216796875, 0.881591796875, 1.041015625, 1.200439453125, 1.35986328125, 1.519287109375, 1.6787109375, 1.838134765625, 1.99755859375, 2.156982421875, 2.31640625, 2.475830078125, 2.63525390625, 2.794677734375, 2.9541015625, 3.113525390625, 3.27294921875, 3.432373046875, 3.591796875, 3.751220703125, 3.91064453125, 4.070068359375, 4.2294921875, 4.388916015625, 4.54833984375, 4.707763671875, 4.8671875]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 6.0, 6.0, 15.0, 19.0, 24.0, 30.0, 40.0, 55.0, 57.0, 52.0, 81.0, 81.0, 110.0, 121.0, 165.0, 164.0, 185.0, 219.0, 219.0, 253.0, 261.0, 255.0, 232.0, 201.0, 179.0, 186.0, 147.0, 119.0, 103.0, 81.0, 66.0, 67.0, 61.0, 39.0, 33.0, 34.0, 19.0, 16.0, 10.0, 10.0, 10.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 3.0], "bins": [-1.19921875, -1.161041259765625, -1.12286376953125, -1.084686279296875, -1.0465087890625, -1.008331298828125, -0.97015380859375, -0.931976318359375, -0.893798828125, -0.855621337890625, -0.81744384765625, -0.779266357421875, -0.7410888671875, -0.702911376953125, -0.66473388671875, -0.626556396484375, -0.58837890625, -0.550201416015625, -0.51202392578125, -0.473846435546875, -0.4356689453125, -0.397491455078125, -0.35931396484375, -0.321136474609375, -0.282958984375, -0.244781494140625, -0.20660400390625, -0.168426513671875, -0.1302490234375, -0.092071533203125, -0.05389404296875, -0.015716552734375, 0.0224609375, 0.060638427734375, 0.09881591796875, 0.136993408203125, 0.1751708984375, 0.213348388671875, 0.25152587890625, 0.289703369140625, 0.327880859375, 0.366058349609375, 0.40423583984375, 0.442413330078125, 0.4805908203125, 0.518768310546875, 0.55694580078125, 0.595123291015625, 0.63330078125, 0.671478271484375, 0.70965576171875, 0.747833251953125, 0.7860107421875, 0.824188232421875, 0.86236572265625, 0.900543212890625, 0.938720703125, 0.976898193359375, 1.01507568359375, 1.053253173828125, 1.0914306640625, 1.129608154296875, 1.16778564453125, 1.205963134765625, 1.244140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 8.0, 12.0, 10.0, 16.0, 23.0, 17.0, 28.0, 34.0, 34.0, 38.0, 49.0, 52.0, 56.0, 39.0, 49.0, 56.0, 46.0, 49.0, 48.0, 45.0, 46.0, 35.0, 37.0, 29.0, 15.0, 14.0, 16.0, 13.0, 15.0, 11.0, 8.0, 6.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-4.763072967529297, -4.624141216278076, -4.485208988189697, -4.346277236938477, -4.207345008850098, -4.068413257598877, -3.9294815063476562, -3.7905495166778564, -3.6516175270080566, -3.512685537338257, -3.373753547668457, -3.2348217964172363, -3.0958898067474365, -2.9569578170776367, -2.818026065826416, -2.679094076156616, -2.5401620864868164, -2.4012300968170166, -2.262298107147217, -2.123366355895996, -1.9844343662261963, -1.8455023765563965, -1.7065705060958862, -1.567638635635376, -1.4287066459655762, -1.2897746562957764, -1.1508427858352661, -1.0119109153747559, -0.872978925704956, -0.734046995639801, -0.595115065574646, -0.45618313550949097, -0.31725120544433594, -0.1783192753791809, -0.03938734531402588, 0.09954458475112915, 0.23847651481628418, 0.3774084448814392, 0.5163403749465942, 0.6552723050117493, 0.7942042350769043, 0.9331361651420593, 1.0720680952072144, 1.2109999656677246, 1.3499319553375244, 1.4888639450073242, 1.6277958154678345, 1.7667276859283447, 1.9056596755981445, 2.0445916652679443, 2.183523654937744, 2.322455406188965, 2.4613873958587646, 2.6003193855285645, 2.739251136779785, 2.878183126449585, 3.0171151161193848, 3.1560471057891846, 3.2949790954589844, 3.433910846710205, 3.572842836380005, 3.7117748260498047, 3.8507065773010254, 3.989638566970825, 4.128570556640625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 11.0, 10.0, 15.0, 12.0, 9.0, 12.0, 13.0, 28.0, 28.0, 29.0, 30.0, 38.0, 38.0, 35.0, 28.0, 44.0, 49.0, 32.0, 39.0, 37.0, 32.0, 35.0, 41.0, 48.0, 37.0, 30.0, 28.0, 24.0, 20.0, 21.0, 21.0, 20.0, 15.0, 11.0, 21.0, 11.0, 9.0, 4.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4725818634033203, -2.394728183746338, -2.3168742656707764, -2.239020586013794, -2.1611669063568115, -2.08331298828125, -2.0054593086242676, -1.9276056289672852, -1.8497518301010132, -1.7718980312347412, -1.6940443515777588, -1.6161905527114868, -1.5383367538452148, -1.4604830741882324, -1.3826292753219604, -1.3047754764556885, -1.226921796798706, -1.149067997932434, -1.0712143182754517, -0.9933605194091797, -0.9155067801475525, -0.8376530408859253, -0.7597992420196533, -0.6819455027580261, -0.6040917634963989, -0.5262380242347717, -0.44838425517082214, -0.37053048610687256, -0.29267674684524536, -0.21482300758361816, -0.13696923851966858, -0.059115469455718994, 0.0187380313873291, 0.09659178555011749, 0.17444553971290588, 0.25229930877685547, 0.33015304803848267, 0.40800678730010986, 0.48586055636405945, 0.563714325428009, 0.6415680646896362, 0.7194218039512634, 0.7972755432128906, 0.8751293420791626, 0.9529830813407898, 1.030836820602417, 1.108690619468689, 1.186544418334961, 1.2643980979919434, 1.3422518968582153, 1.4201055765151978, 1.4979593753814697, 1.5758130550384521, 1.6536668539047241, 1.731520652770996, 1.8093743324279785, 1.8872281312942505, 1.9650819301605225, 2.042935609817505, 2.1207892894744873, 2.198643207550049, 2.2764968872070312, 2.3543505668640137, 2.432204484939575, 2.5100581645965576]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 6.0, 13.0, 14.0, 24.0, 43.0, 54.0, 93.0, 148.0, 222.0, 315.0, 506.0, 850.0, 1292.0, 1911.0, 3270.0, 4887.0, 8554.0, 14897.0, 27116.0, 50646.0, 97522.0, 178512.0, 246931.0, 186547.0, 103047.0, 53550.0, 28704.0, 15543.0, 9175.0, 5243.0, 3185.0, 2096.0, 1256.0, 808.0, 536.0, 365.0, 234.0, 146.0, 103.0, 65.0, 53.0, 24.0, 23.0, 12.0, 9.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.65673828125, -0.637725830078125, -0.61871337890625, -0.599700927734375, -0.5806884765625, -0.561676025390625, -0.54266357421875, -0.523651123046875, -0.504638671875, -0.485626220703125, -0.46661376953125, -0.447601318359375, -0.4285888671875, -0.409576416015625, -0.39056396484375, -0.371551513671875, -0.3525390625, -0.333526611328125, -0.31451416015625, -0.295501708984375, -0.2764892578125, -0.257476806640625, -0.23846435546875, -0.219451904296875, -0.200439453125, -0.181427001953125, -0.16241455078125, -0.143402099609375, -0.1243896484375, -0.105377197265625, -0.08636474609375, -0.067352294921875, -0.04833984375, -0.029327392578125, -0.01031494140625, 0.008697509765625, 0.0277099609375, 0.046722412109375, 0.06573486328125, 0.084747314453125, 0.103759765625, 0.122772216796875, 0.14178466796875, 0.160797119140625, 0.1798095703125, 0.198822021484375, 0.21783447265625, 0.236846923828125, 0.255859375, 0.274871826171875, 0.29388427734375, 0.312896728515625, 0.3319091796875, 0.350921630859375, 0.36993408203125, 0.388946533203125, 0.407958984375, 0.426971435546875, 0.44598388671875, 0.464996337890625, 0.4840087890625, 0.503021240234375, 0.52203369140625, 0.541046142578125, 0.56005859375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 12.0, 11.0, 10.0, 17.0, 17.0, 26.0, 26.0, 32.0, 43.0, 36.0, 41.0, 39.0, 50.0, 50.0, 46.0, 41.0, 43.0, 38.0, 46.0, 44.0, 36.0, 33.0, 27.0, 23.0, 32.0, 25.0, 21.0, 24.0, 14.0, 11.0, 13.0, 15.0, 6.0, 9.0, 8.0, 5.0, 7.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.34375, -3.24462890625, -3.1455078125, -3.04638671875, -2.947265625, -2.84814453125, -2.7490234375, -2.64990234375, -2.55078125, -2.45166015625, -2.3525390625, -2.25341796875, -2.154296875, -2.05517578125, -1.9560546875, -1.85693359375, -1.7578125, -1.65869140625, -1.5595703125, -1.46044921875, -1.361328125, -1.26220703125, -1.1630859375, -1.06396484375, -0.96484375, -0.86572265625, -0.7666015625, -0.66748046875, -0.568359375, -0.46923828125, -0.3701171875, -0.27099609375, -0.171875, -0.07275390625, 0.0263671875, 0.12548828125, 0.224609375, 0.32373046875, 0.4228515625, 0.52197265625, 0.62109375, 0.72021484375, 0.8193359375, 0.91845703125, 1.017578125, 1.11669921875, 1.2158203125, 1.31494140625, 1.4140625, 1.51318359375, 1.6123046875, 1.71142578125, 1.810546875, 1.90966796875, 2.0087890625, 2.10791015625, 2.20703125, 2.30615234375, 2.4052734375, 2.50439453125, 2.603515625, 2.70263671875, 2.8017578125, 2.90087890625, 3.0]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 9.0, 7.0, 9.0, 13.0, 23.0, 24.0, 20.0, 39.0, 53.0, 93.0, 101.0, 183.0, 288.0, 442.0, 749.0, 1208.0, 2079.0, 4072.0, 8481.0, 20916.0, 143793.0, 813254.0, 30291.0, 10956.0, 5045.0, 2600.0, 1400.0, 872.0, 521.0, 329.0, 214.0, 143.0, 89.0, 66.0, 54.0, 24.0, 35.0, 23.0, 14.0, 9.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.068389892578125, -2.00201416015625, -1.935638427734375, -1.8692626953125, -1.802886962890625, -1.73651123046875, -1.670135498046875, -1.603759765625, -1.537384033203125, -1.47100830078125, -1.404632568359375, -1.3382568359375, -1.271881103515625, -1.20550537109375, -1.139129638671875, -1.07275390625, -1.006378173828125, -0.94000244140625, -0.873626708984375, -0.8072509765625, -0.740875244140625, -0.67449951171875, -0.608123779296875, -0.541748046875, -0.475372314453125, -0.40899658203125, -0.342620849609375, -0.2762451171875, -0.209869384765625, -0.14349365234375, -0.077117919921875, -0.0107421875, 0.055633544921875, 0.12200927734375, 0.188385009765625, 0.2547607421875, 0.321136474609375, 0.38751220703125, 0.453887939453125, 0.520263671875, 0.586639404296875, 0.65301513671875, 0.719390869140625, 0.7857666015625, 0.852142333984375, 0.91851806640625, 0.984893798828125, 1.05126953125, 1.117645263671875, 1.18402099609375, 1.250396728515625, 1.3167724609375, 1.383148193359375, 1.44952392578125, 1.515899658203125, 1.582275390625, 1.648651123046875, 1.71502685546875, 1.781402587890625, 1.8477783203125, 1.914154052734375, 1.98052978515625, 2.046905517578125, 2.11328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 7.0, 10.0, 9.0, 16.0, 20.0, 19.0, 22.0, 25.0, 24.0, 21.0, 29.0, 37.0, 42.0, 52.0, 53.0, 43.0, 43.0, 51.0, 47.0, 52.0, 33.0, 39.0, 38.0, 42.0, 34.0, 27.0, 20.0, 25.0, 20.0, 18.0, 15.0, 9.0, 13.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.041015625, -1.97149658203125, -1.9019775390625, -1.83245849609375, -1.762939453125, -1.69342041015625, -1.6239013671875, -1.55438232421875, -1.48486328125, -1.41534423828125, -1.3458251953125, -1.27630615234375, -1.206787109375, -1.13726806640625, -1.0677490234375, -0.99822998046875, -0.9287109375, -0.85919189453125, -0.7896728515625, -0.72015380859375, -0.650634765625, -0.58111572265625, -0.5115966796875, -0.44207763671875, -0.37255859375, -0.30303955078125, -0.2335205078125, -0.16400146484375, -0.094482421875, -0.02496337890625, 0.0445556640625, 0.11407470703125, 0.18359375, 0.25311279296875, 0.3226318359375, 0.39215087890625, 0.461669921875, 0.53118896484375, 0.6007080078125, 0.67022705078125, 0.73974609375, 0.80926513671875, 0.8787841796875, 0.94830322265625, 1.017822265625, 1.08734130859375, 1.1568603515625, 1.22637939453125, 1.2958984375, 1.36541748046875, 1.4349365234375, 1.50445556640625, 1.573974609375, 1.64349365234375, 1.7130126953125, 1.78253173828125, 1.85205078125, 1.92156982421875, 1.9910888671875, 2.06060791015625, 2.130126953125, 2.19964599609375, 2.2691650390625, 2.33868408203125, 2.408203125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 6.0, 9.0, 13.0, 4.0, 16.0, 10.0, 27.0, 43.0, 48.0, 79.0, 86.0, 157.0, 225.0, 315.0, 475.0, 725.0, 1092.0, 1873.0, 3142.0, 6158.0, 14804.0, 57839.0, 905037.0, 32810.0, 11298.0, 5070.0, 2660.0, 1561.0, 936.0, 647.0, 417.0, 301.0, 206.0, 128.0, 97.0, 58.0, 46.0, 37.0, 27.0, 18.0, 13.0, 10.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6018905639648438, -0.5826873779296875, -0.5634841918945312, -0.544281005859375, -0.5250778198242188, -0.5058746337890625, -0.48667144775390625, -0.46746826171875, -0.44826507568359375, -0.4290618896484375, -0.40985870361328125, -0.390655517578125, -0.37145233154296875, -0.3522491455078125, -0.33304595947265625, -0.3138427734375, -0.29463958740234375, -0.2754364013671875, -0.25623321533203125, -0.237030029296875, -0.21782684326171875, -0.1986236572265625, -0.17942047119140625, -0.16021728515625, -0.14101409912109375, -0.1218109130859375, -0.10260772705078125, -0.083404541015625, -0.06420135498046875, -0.0449981689453125, -0.02579498291015625, -0.006591796875, 0.01261138916015625, 0.0318145751953125, 0.05101776123046875, 0.070220947265625, 0.08942413330078125, 0.1086273193359375, 0.12783050537109375, 0.14703369140625, 0.16623687744140625, 0.1854400634765625, 0.20464324951171875, 0.223846435546875, 0.24304962158203125, 0.2622528076171875, 0.28145599365234375, 0.3006591796875, 0.31986236572265625, 0.3390655517578125, 0.35826873779296875, 0.377471923828125, 0.39667510986328125, 0.4158782958984375, 0.43508148193359375, 0.45428466796875, 0.47348785400390625, 0.4926910400390625, 0.5118942260742188, 0.531097412109375, 0.5503005981445312, 0.5695037841796875, 0.5887069702148438, 0.60791015625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 8.0, 5.0, 7.0, 2.0, 9.0, 11.0, 15.0, 18.0, 23.0, 22.0, 21.0, 20.0, 40.0, 40.0, 68.0, 75.0, 65.0, 74.0, 61.0, 53.0, 61.0, 50.0, 56.0, 33.0, 39.0, 21.0, 21.0, 14.0, 14.0, 11.0, 7.0, 6.0, 4.0, 8.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6684017181396484e-05, -5.498994141817093e-05, -5.3295865654945374e-05, -5.160178989171982e-05, -4.990771412849426e-05, -4.821363836526871e-05, -4.651956260204315e-05, -4.4825486838817596e-05, -4.313141107559204e-05, -4.1437335312366486e-05, -3.974325954914093e-05, -3.8049183785915375e-05, -3.635510802268982e-05, -3.4661032259464264e-05, -3.296695649623871e-05, -3.127288073301315e-05, -2.9578804969787598e-05, -2.7884729206562042e-05, -2.6190653443336487e-05, -2.449657768011093e-05, -2.2802501916885376e-05, -2.110842615365982e-05, -1.9414350390434265e-05, -1.772027462720871e-05, -1.6026198863983154e-05, -1.4332123100757599e-05, -1.2638047337532043e-05, -1.0943971574306488e-05, -9.249895811080933e-06, -7.555820047855377e-06, -5.861744284629822e-06, -4.167668521404266e-06, -2.473592758178711e-06, -7.795169949531555e-07, 9.145587682723999e-07, 2.6086345314979553e-06, 4.302710294723511e-06, 5.996786057949066e-06, 7.690861821174622e-06, 9.384937584400177e-06, 1.1079013347625732e-05, 1.2773089110851288e-05, 1.4467164874076843e-05, 1.61612406373024e-05, 1.7855316400527954e-05, 1.954939216375351e-05, 2.1243467926979065e-05, 2.293754369020462e-05, 2.4631619453430176e-05, 2.632569521665573e-05, 2.8019770979881287e-05, 2.9713846743106842e-05, 3.14079225063324e-05, 3.310199826955795e-05, 3.479607403278351e-05, 3.6490149796009064e-05, 3.818422555923462e-05, 3.9878301322460175e-05, 4.157237708568573e-05, 4.3266452848911285e-05, 4.496052861213684e-05, 4.6654604375362396e-05, 4.834868013858795e-05, 5.004275590181351e-05, 5.173683166503906e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 5.0, 5.0, 11.0, 15.0, 25.0, 45.0, 68.0, 96.0, 152.0, 199.0, 300.0, 536.0, 798.0, 1264.0, 1904.0, 3070.0, 4864.0, 7931.0, 13622.0, 23944.0, 47753.0, 118924.0, 319582.0, 297300.0, 106111.0, 44387.0, 22404.0, 12769.0, 7663.0, 4668.0, 2899.0, 1861.0, 1164.0, 788.0, 486.0, 276.0, 217.0, 136.0, 83.0, 77.0, 52.0, 31.0, 19.0, 12.0, 9.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.242431640625, -0.23433685302734375, -0.2262420654296875, -0.21814727783203125, -0.210052490234375, -0.20195770263671875, -0.1938629150390625, -0.18576812744140625, -0.17767333984375, -0.16957855224609375, -0.1614837646484375, -0.15338897705078125, -0.145294189453125, -0.13719940185546875, -0.1291046142578125, -0.12100982666015625, -0.1129150390625, -0.10482025146484375, -0.0967254638671875, -0.08863067626953125, -0.080535888671875, -0.07244110107421875, -0.0643463134765625, -0.05625152587890625, -0.04815673828125, -0.04006195068359375, -0.0319671630859375, -0.02387237548828125, -0.015777587890625, -0.00768280029296875, 0.0004119873046875, 0.00850677490234375, 0.0166015625, 0.02469635009765625, 0.0327911376953125, 0.04088592529296875, 0.048980712890625, 0.05707550048828125, 0.0651702880859375, 0.07326507568359375, 0.08135986328125, 0.08945465087890625, 0.0975494384765625, 0.10564422607421875, 0.113739013671875, 0.12183380126953125, 0.1299285888671875, 0.13802337646484375, 0.1461181640625, 0.15421295166015625, 0.1623077392578125, 0.17040252685546875, 0.178497314453125, 0.18659210205078125, 0.1946868896484375, 0.20278167724609375, 0.21087646484375, 0.21897125244140625, 0.2270660400390625, 0.23516082763671875, 0.243255615234375, 0.25135040283203125, 0.2594451904296875, 0.26753997802734375, 0.275634765625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 9.0, 6.0, 7.0, 12.0, 8.0, 18.0, 18.0, 21.0, 22.0, 30.0, 35.0, 55.0, 85.0, 61.0, 89.0, 102.0, 81.0, 84.0, 48.0, 36.0, 24.0, 21.0, 24.0, 15.0, 9.0, 13.0, 8.0, 5.0, 4.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05096435546875, -0.04932594299316406, -0.047687530517578125, -0.04604911804199219, -0.04441070556640625, -0.04277229309082031, -0.041133880615234375, -0.03949546813964844, -0.0378570556640625, -0.03621864318847656, -0.034580230712890625, -0.03294181823730469, -0.03130340576171875, -0.029664993286132812, -0.028026580810546875, -0.026388168334960938, -0.024749755859375, -0.023111343383789062, -0.021472930908203125, -0.019834518432617188, -0.01819610595703125, -0.016557693481445312, -0.014919281005859375, -0.013280868530273438, -0.0116424560546875, -0.010004043579101562, -0.008365631103515625, -0.0067272186279296875, -0.00508880615234375, -0.0034503936767578125, -0.001811981201171875, -0.0001735687255859375, 0.00146484375, 0.0031032562255859375, 0.004741668701171875, 0.0063800811767578125, 0.00801849365234375, 0.009656906127929688, 0.011295318603515625, 0.012933731079101562, 0.0145721435546875, 0.016210556030273438, 0.017848968505859375, 0.019487380981445312, 0.02112579345703125, 0.022764205932617188, 0.024402618408203125, 0.026041030883789062, 0.027679443359375, 0.029317855834960938, 0.030956268310546875, 0.03259468078613281, 0.03423309326171875, 0.03587150573730469, 0.037509918212890625, 0.03914833068847656, 0.0407867431640625, 0.04242515563964844, 0.044063568115234375, 0.04570198059082031, 0.04734039306640625, 0.04897880554199219, 0.050617218017578125, 0.05225563049316406, 0.05389404296875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 10.0, 9.0, 6.0, 11.0, 9.0, 10.0, 17.0, 21.0, 15.0, 22.0, 41.0, 31.0, 37.0, 39.0, 56.0, 54.0, 42.0, 43.0, 52.0, 54.0, 41.0, 47.0, 50.0, 40.0, 39.0, 40.0, 33.0, 25.0, 11.0, 11.0, 14.0, 16.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.538368225097656, -4.402956008911133, -4.267544269561768, -4.132132053375244, -3.996720314025879, -3.8613083362579346, -3.7258963584899902, -3.590484142303467, -3.4550724029541016, -3.3196604251861572, -3.184248447418213, -3.0488364696502686, -2.913424491882324, -2.77801251411438, -2.6426005363464355, -2.507188320159912, -2.3717763423919678, -2.2363643646240234, -2.100952386856079, -1.9655404090881348, -1.8301284313201904, -1.694716453552246, -1.5593043565750122, -1.4238923788070679, -1.2884804010391235, -1.1530684232711792, -1.0176564455032349, -0.8822444081306458, -0.7468324303627014, -0.6114204525947571, -0.47600841522216797, -0.34059643745422363, -0.2051844596862793, -0.06977246701717377, 0.06563952565193176, 0.2010515332221985, 0.3364635109901428, 0.47187548875808716, 0.6072875261306763, 0.7426995038986206, 0.8781114816665649, 1.0135234594345093, 1.1489354372024536, 1.2843475341796875, 1.4197595119476318, 1.5551714897155762, 1.6905834674835205, 1.8259954452514648, 1.9614074230194092, 2.0968194007873535, 2.232231378555298, 2.367643356323242, 2.5030553340911865, 2.638467311859131, 2.7738795280456543, 2.9092912673950195, 3.044703483581543, 3.1801154613494873, 3.3155274391174316, 3.450939416885376, 3.5863513946533203, 3.7217633724212646, 3.857175350189209, 3.9925875663757324, 4.127999305725098]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 4.0, 12.0, 11.0, 10.0, 15.0, 9.0, 15.0, 7.0, 19.0, 33.0, 25.0, 30.0, 27.0, 40.0, 34.0, 35.0, 31.0, 40.0, 48.0, 41.0, 33.0, 35.0, 35.0, 31.0, 40.0, 50.0, 37.0, 27.0, 27.0, 26.0, 18.0, 23.0, 20.0, 17.0, 14.0, 14.0, 19.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.394810438156128, -2.318641185760498, -2.2424721717834473, -2.1663029193878174, -2.0901339054107666, -2.0139646530151367, -1.9377955198287964, -1.861626386642456, -1.7854571342468262, -1.7092880010604858, -1.6331188678741455, -1.5569496154785156, -1.4807804822921753, -1.404611349105835, -1.3284422159194946, -1.2522730827331543, -1.176103949546814, -1.0999348163604736, -1.0237656831741333, -0.9475964903831482, -0.8714272975921631, -0.7952581644058228, -0.7190890312194824, -0.6429198384284973, -0.566750705242157, -0.49058154225349426, -0.41441237926483154, -0.3382432460784912, -0.2620740830898285, -0.18590492010116577, -0.10973578691482544, -0.03356659412384033, 0.0426025390625, 0.11877169460058212, 0.19494085013866425, 0.27110999822616577, 0.3472791612148285, 0.4234483242034912, 0.49961745738983154, 0.5757866501808167, 0.651955783367157, 0.7281249165534973, 0.8042941093444824, 0.8804632425308228, 0.9566323757171631, 1.032801628112793, 1.1089706420898438, 1.1851398944854736, 1.261309027671814, 1.3374781608581543, 1.4136472940444946, 1.489816427230835, 1.5659856796264648, 1.6421548128128052, 1.7183239459991455, 1.7944931983947754, 1.8706622123718262, 1.9468313455581665, 2.023000478744507, 2.0991697311401367, 2.1753387451171875, 2.2515079975128174, 2.3276772499084473, 2.403846263885498, 2.480015516281128]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 4.0, 9.0, 11.0, 25.0, 30.0, 48.0, 78.0, 86.0, 121.0, 205.0, 309.0, 524.0, 939.0, 1610.0, 2642.0, 4895.0, 8901.0, 16857.0, 31385.0, 58225.0, 100608.0, 154838.0, 189809.0, 176991.0, 127582.0, 77803.0, 43249.0, 22905.0, 12488.0, 6612.0, 3661.0, 2078.0, 1170.0, 689.0, 421.0, 255.0, 169.0, 91.0, 71.0, 59.0, 35.0, 18.0, 11.0, 9.0, 13.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.265625, -4.13128662109375, -3.9969482421875, -3.86260986328125, -3.728271484375, -3.59393310546875, -3.4595947265625, -3.32525634765625, -3.19091796875, -3.05657958984375, -2.9222412109375, -2.78790283203125, -2.653564453125, -2.51922607421875, -2.3848876953125, -2.25054931640625, -2.1162109375, -1.98187255859375, -1.8475341796875, -1.71319580078125, -1.578857421875, -1.44451904296875, -1.3101806640625, -1.17584228515625, -1.04150390625, -0.90716552734375, -0.7728271484375, -0.63848876953125, -0.504150390625, -0.36981201171875, -0.2354736328125, -0.10113525390625, 0.033203125, 0.16754150390625, 0.3018798828125, 0.43621826171875, 0.570556640625, 0.70489501953125, 0.8392333984375, 0.97357177734375, 1.10791015625, 1.24224853515625, 1.3765869140625, 1.51092529296875, 1.645263671875, 1.77960205078125, 1.9139404296875, 2.04827880859375, 2.1826171875, 2.31695556640625, 2.4512939453125, 2.58563232421875, 2.719970703125, 2.85430908203125, 2.9886474609375, 3.12298583984375, 3.25732421875, 3.39166259765625, 3.5260009765625, 3.66033935546875, 3.794677734375, 3.92901611328125, 4.0633544921875, 4.19769287109375, 4.33203125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 3.0, 7.0, 9.0, 13.0, 12.0, 13.0, 19.0, 23.0, 27.0, 40.0, 31.0, 42.0, 39.0, 45.0, 49.0, 44.0, 44.0, 41.0, 35.0, 38.0, 40.0, 37.0, 41.0, 42.0, 30.0, 29.0, 40.0, 22.0, 25.0, 20.0, 10.0, 16.0, 12.0, 12.0, 11.0, 8.0, 6.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.19921875, -3.10540771484375, -3.0115966796875, -2.91778564453125, -2.823974609375, -2.73016357421875, -2.6363525390625, -2.54254150390625, -2.44873046875, -2.35491943359375, -2.2611083984375, -2.16729736328125, -2.073486328125, -1.97967529296875, -1.8858642578125, -1.79205322265625, -1.6982421875, -1.60443115234375, -1.5106201171875, -1.41680908203125, -1.322998046875, -1.22918701171875, -1.1353759765625, -1.04156494140625, -0.94775390625, -0.85394287109375, -0.7601318359375, -0.66632080078125, -0.572509765625, -0.47869873046875, -0.3848876953125, -0.29107666015625, -0.197265625, -0.10345458984375, -0.0096435546875, 0.08416748046875, 0.177978515625, 0.27178955078125, 0.3656005859375, 0.45941162109375, 0.55322265625, 0.64703369140625, 0.7408447265625, 0.83465576171875, 0.928466796875, 1.02227783203125, 1.1160888671875, 1.20989990234375, 1.3037109375, 1.39752197265625, 1.4913330078125, 1.58514404296875, 1.678955078125, 1.77276611328125, 1.8665771484375, 1.96038818359375, 2.05419921875, 2.14801025390625, 2.2418212890625, 2.33563232421875, 2.429443359375, 2.52325439453125, 2.6170654296875, 2.71087646484375, 2.8046875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 17.0, 16.0, 22.0, 29.0, 54.0, 79.0, 142.0, 169.0, 318.0, 479.0, 813.0, 1300.0, 2166.0, 3702.0, 6402.0, 11074.0, 18402.0, 31268.0, 51294.0, 80654.0, 116918.0, 148935.0, 157984.0, 138826.0, 102753.0, 68981.0, 42734.0, 25952.0, 15233.0, 8960.0, 5053.0, 3093.0, 1814.0, 1077.0, 697.0, 417.0, 247.0, 150.0, 116.0, 60.0, 44.0, 31.0, 22.0, 16.0, 10.0, 5.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.71484375, -3.599884033203125, -3.48492431640625, -3.369964599609375, -3.2550048828125, -3.140045166015625, -3.02508544921875, -2.910125732421875, -2.795166015625, -2.680206298828125, -2.56524658203125, -2.450286865234375, -2.3353271484375, -2.220367431640625, -2.10540771484375, -1.990447998046875, -1.87548828125, -1.760528564453125, -1.64556884765625, -1.530609130859375, -1.4156494140625, -1.300689697265625, -1.18572998046875, -1.070770263671875, -0.955810546875, -0.840850830078125, -0.72589111328125, -0.610931396484375, -0.4959716796875, -0.381011962890625, -0.26605224609375, -0.151092529296875, -0.0361328125, 0.078826904296875, 0.19378662109375, 0.308746337890625, 0.4237060546875, 0.538665771484375, 0.65362548828125, 0.768585205078125, 0.883544921875, 0.998504638671875, 1.11346435546875, 1.228424072265625, 1.3433837890625, 1.458343505859375, 1.57330322265625, 1.688262939453125, 1.80322265625, 1.918182373046875, 2.03314208984375, 2.148101806640625, 2.2630615234375, 2.378021240234375, 2.49298095703125, 2.607940673828125, 2.722900390625, 2.837860107421875, 2.95281982421875, 3.067779541015625, 3.1827392578125, 3.297698974609375, 3.41265869140625, 3.527618408203125, 3.642578125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 10.0, 11.0, 12.0, 10.0, 13.0, 11.0, 13.0, 15.0, 23.0, 26.0, 26.0, 28.0, 26.0, 35.0, 33.0, 39.0, 34.0, 48.0, 36.0, 43.0, 32.0, 35.0, 31.0, 32.0, 25.0, 33.0, 27.0, 34.0, 27.0, 27.0, 20.0, 23.0, 16.0, 23.0, 14.0, 9.0, 18.0, 14.0, 3.0, 12.0, 2.0, 11.0, 8.0, 1.0, 5.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0], "bins": [-1.66796875, -1.618438720703125, -1.56890869140625, -1.519378662109375, -1.4698486328125, -1.420318603515625, -1.37078857421875, -1.321258544921875, -1.271728515625, -1.222198486328125, -1.17266845703125, -1.123138427734375, -1.0736083984375, -1.024078369140625, -0.97454833984375, -0.925018310546875, -0.87548828125, -0.825958251953125, -0.77642822265625, -0.726898193359375, -0.6773681640625, -0.627838134765625, -0.57830810546875, -0.528778076171875, -0.479248046875, -0.429718017578125, -0.38018798828125, -0.330657958984375, -0.2811279296875, -0.231597900390625, -0.18206787109375, -0.132537841796875, -0.0830078125, -0.033477783203125, 0.01605224609375, 0.065582275390625, 0.1151123046875, 0.164642333984375, 0.21417236328125, 0.263702392578125, 0.313232421875, 0.362762451171875, 0.41229248046875, 0.461822509765625, 0.5113525390625, 0.560882568359375, 0.61041259765625, 0.659942626953125, 0.70947265625, 0.759002685546875, 0.80853271484375, 0.858062744140625, 0.9075927734375, 0.957122802734375, 1.00665283203125, 1.056182861328125, 1.105712890625, 1.155242919921875, 1.20477294921875, 1.254302978515625, 1.3038330078125, 1.353363037109375, 1.40289306640625, 1.452423095703125, 1.501953125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 4.0, 7.0, 13.0, 13.0, 20.0, 31.0, 33.0, 50.0, 55.0, 85.0, 89.0, 140.0, 158.0, 197.0, 271.0, 371.0, 463.0, 612.0, 853.0, 1121.0, 1565.0, 2179.0, 3323.0, 5623.0, 12627.0, 42964.0, 203496.0, 492337.0, 206416.0, 43399.0, 12877.0, 5642.0, 3226.0, 2102.0, 1521.0, 1102.0, 811.0, 670.0, 503.0, 379.0, 294.0, 211.0, 178.0, 146.0, 83.0, 76.0, 59.0, 49.0, 41.0, 22.0, 13.0, 15.0, 12.0, 9.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.8515625, -6.626953125, -6.40234375, -6.177734375, -5.953125, -5.728515625, -5.50390625, -5.279296875, -5.0546875, -4.830078125, -4.60546875, -4.380859375, -4.15625, -3.931640625, -3.70703125, -3.482421875, -3.2578125, -3.033203125, -2.80859375, -2.583984375, -2.359375, -2.134765625, -1.91015625, -1.685546875, -1.4609375, -1.236328125, -1.01171875, -0.787109375, -0.5625, -0.337890625, -0.11328125, 0.111328125, 0.3359375, 0.560546875, 0.78515625, 1.009765625, 1.234375, 1.458984375, 1.68359375, 1.908203125, 2.1328125, 2.357421875, 2.58203125, 2.806640625, 3.03125, 3.255859375, 3.48046875, 3.705078125, 3.9296875, 4.154296875, 4.37890625, 4.603515625, 4.828125, 5.052734375, 5.27734375, 5.501953125, 5.7265625, 5.951171875, 6.17578125, 6.400390625, 6.625, 6.849609375, 7.07421875, 7.298828125, 7.5234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 8.0, 7.0, 8.0, 25.0, 60.0, 102.0, 197.0, 213.0, 182.0, 96.0, 47.0, 15.0, 12.0, 5.0, 6.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009016990661621094, -0.0008754655718803406, -0.0008492320775985718, -0.000822998583316803, -0.0007967650890350342, -0.0007705315947532654, -0.0007442981004714966, -0.0007180646061897278, -0.000691831111907959, -0.0006655976176261902, -0.0006393641233444214, -0.0006131306290626526, -0.0005868971347808838, -0.000560663640499115, -0.0005344301462173462, -0.0005081966519355774, -0.0004819631576538086, -0.0004557296633720398, -0.000429496169090271, -0.0004032626748085022, -0.0003770291805267334, -0.0003507956862449646, -0.0003245621919631958, -0.000298328697681427, -0.0002720952033996582, -0.0002458617091178894, -0.0002196282148361206, -0.0001933947205543518, -0.000167161226272583, -0.0001409277319908142, -0.00011469423770904541, -8.846074342727661e-05, -6.222724914550781e-05, -3.5993754863739014e-05, -9.760260581970215e-06, 1.6473233699798584e-05, 4.270672798156738e-05, 6.894022226333618e-05, 9.517371654510498e-05, 0.00012140721082687378, 0.00014764070510864258, 0.00017387419939041138, 0.00020010769367218018, 0.00022634118795394897, 0.0002525746822357178, 0.00027880817651748657, 0.00030504167079925537, 0.00033127516508102417, 0.00035750865936279297, 0.00038374215364456177, 0.00040997564792633057, 0.00043620914220809937, 0.00046244263648986816, 0.000488676130771637, 0.0005149096250534058, 0.0005411431193351746, 0.0005673766136169434, 0.0005936101078987122, 0.000619843602180481, 0.0006460770964622498, 0.0006723105907440186, 0.0006985440850257874, 0.0007247775793075562, 0.000751011073589325, 0.0007772445678710938]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 13.0, 15.0, 18.0, 32.0, 41.0, 47.0, 60.0, 78.0, 143.0, 179.0, 275.0, 374.0, 533.0, 739.0, 1164.0, 1742.0, 2586.0, 4005.0, 9112.0, 52654.0, 457300.0, 445733.0, 50738.0, 9014.0, 3926.0, 2631.0, 1705.0, 1159.0, 750.0, 530.0, 358.0, 267.0, 187.0, 110.0, 84.0, 73.0, 43.0, 37.0, 25.0, 21.0, 18.0, 5.0, 9.0, 5.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-9.9375, -9.6451416015625, -9.352783203125, -9.0604248046875, -8.76806640625, -8.4757080078125, -8.183349609375, -7.8909912109375, -7.5986328125, -7.3062744140625, -7.013916015625, -6.7215576171875, -6.42919921875, -6.1368408203125, -5.844482421875, -5.5521240234375, -5.259765625, -4.9674072265625, -4.675048828125, -4.3826904296875, -4.09033203125, -3.7979736328125, -3.505615234375, -3.2132568359375, -2.9208984375, -2.6285400390625, -2.336181640625, -2.0438232421875, -1.75146484375, -1.4591064453125, -1.166748046875, -0.8743896484375, -0.58203125, -0.2896728515625, 0.002685546875, 0.2950439453125, 0.58740234375, 0.8797607421875, 1.172119140625, 1.4644775390625, 1.7568359375, 2.0491943359375, 2.341552734375, 2.6339111328125, 2.92626953125, 3.2186279296875, 3.510986328125, 3.8033447265625, 4.095703125, 4.3880615234375, 4.680419921875, 4.9727783203125, 5.26513671875, 5.5574951171875, 5.849853515625, 6.1422119140625, 6.4345703125, 6.7269287109375, 7.019287109375, 7.3116455078125, 7.60400390625, 7.8963623046875, 8.188720703125, 8.4810791015625, 8.7734375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 16.0, 36.0, 56.0, 108.0, 173.0, 202.0, 155.0, 113.0, 69.0, 27.0, 17.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9176177978515625, -1.847930908203125, -1.7782440185546875, -1.70855712890625, -1.6388702392578125, -1.569183349609375, -1.4994964599609375, -1.4298095703125, -1.3601226806640625, -1.290435791015625, -1.2207489013671875, -1.15106201171875, -1.0813751220703125, -1.011688232421875, -0.9420013427734375, -0.872314453125, -0.8026275634765625, -0.732940673828125, -0.6632537841796875, -0.59356689453125, -0.5238800048828125, -0.454193115234375, -0.3845062255859375, -0.3148193359375, -0.2451324462890625, -0.175445556640625, -0.1057586669921875, -0.03607177734375, 0.0336151123046875, 0.103302001953125, 0.1729888916015625, 0.24267578125, 0.3123626708984375, 0.382049560546875, 0.4517364501953125, 0.52142333984375, 0.5911102294921875, 0.660797119140625, 0.7304840087890625, 0.8001708984375, 0.8698577880859375, 0.939544677734375, 1.0092315673828125, 1.07891845703125, 1.1486053466796875, 1.218292236328125, 1.2879791259765625, 1.357666015625, 1.4273529052734375, 1.497039794921875, 1.5667266845703125, 1.63641357421875, 1.7061004638671875, 1.775787353515625, 1.8454742431640625, 1.9151611328125, 1.9848480224609375, 2.054534912109375, 2.1242218017578125, 2.19390869140625, 2.2635955810546875, 2.333282470703125, 2.4029693603515625, 2.47265625]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 4.0, 8.0, 8.0, 12.0, 18.0, 16.0, 17.0, 17.0, 18.0, 35.0, 21.0, 34.0, 42.0, 39.0, 44.0, 37.0, 52.0, 51.0, 74.0, 59.0, 37.0, 35.0, 41.0, 46.0, 38.0, 29.0, 28.0, 20.0, 17.0, 11.0, 21.0, 9.0, 7.0, 10.0, 3.0, 6.0, 5.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-4.421260833740234, -4.286639213562012, -4.152018070220947, -4.017396450042725, -3.882775068283081, -3.7481536865234375, -3.613532066345215, -3.4789106845855713, -3.3442893028259277, -3.209667921066284, -3.0750465393066406, -2.940424919128418, -2.8058035373687744, -2.671182155609131, -2.536560535430908, -2.4019391536712646, -2.267317771911621, -2.1326963901519775, -1.9980748891830444, -1.8634533882141113, -1.7288320064544678, -1.5942106246948242, -1.4595891237258911, -1.324967622756958, -1.1903462409973145, -1.055724859237671, -0.9211033582687378, -0.7864819169044495, -0.6518604755401611, -0.5172390341758728, -0.3826175928115845, -0.24799615144729614, -0.11337423324584961, 0.02124720811843872, 0.15586864948272705, 0.2904900908470154, 0.4251115322113037, 0.559732973575592, 0.6943544149398804, 0.8289758563041687, 0.963597297668457, 1.0982186794281006, 1.2328401803970337, 1.3674616813659668, 1.5020830631256104, 1.636704444885254, 1.771325945854187, 1.9059474468231201, 2.0405688285827637, 2.1751902103424072, 2.309811592102051, 2.4444332122802734, 2.579054594039917, 2.7136759757995605, 2.848297595977783, 2.9829189777374268, 3.1175403594970703, 3.252161741256714, 3.3867831230163574, 3.52140474319458, 3.6560261249542236, 3.790647506713867, 3.92526912689209, 4.059890270233154, 4.194511890411377]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 4.0, 6.0, 7.0, 8.0, 14.0, 21.0, 22.0, 15.0, 22.0, 23.0, 26.0, 20.0, 23.0, 36.0, 37.0, 38.0, 42.0, 37.0, 40.0, 27.0, 36.0, 34.0, 37.0, 36.0, 26.0, 40.0, 35.0, 35.0, 30.0, 28.0, 22.0, 22.0, 26.0, 20.0, 17.0, 5.0, 7.0, 14.0, 13.0, 5.0, 8.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.6036057472229004, -2.5236926078796387, -2.443779468536377, -2.3638663291931152, -2.2839531898498535, -2.204040050506592, -2.12412691116333, -2.0442137718200684, -1.9643006324768066, -1.884387493133545, -1.8044743537902832, -1.7245612144470215, -1.6446480751037598, -1.564734935760498, -1.4848217964172363, -1.4049086570739746, -1.3249953985214233, -1.2450822591781616, -1.1651691198349, -1.0852559804916382, -1.0053428411483765, -0.9254297018051147, -0.8455165028572083, -0.7656033635139465, -0.6856902241706848, -0.6057770848274231, -0.5258639454841614, -0.44595077633857727, -0.36603763699531555, -0.28612449765205383, -0.20621132850646973, -0.126298189163208, -0.04638504981994629, 0.03352809697389603, 0.11344124376773834, 0.19335439801216125, 0.273267537355423, 0.3531806766986847, 0.4330938458442688, 0.5130069851875305, 0.5929201245307922, 0.672833263874054, 0.7527464032173157, 0.8326596021652222, 0.9125727415084839, 0.9924858808517456, 1.0723990201950073, 1.152312159538269, 1.2322252988815308, 1.3121384382247925, 1.3920515775680542, 1.471964716911316, 1.5518778562545776, 1.6317909955978394, 1.7117042541503906, 1.7916173934936523, 1.871530532836914, 1.9514436721801758, 2.0313568115234375, 2.111269950866699, 2.191183090209961, 2.2710962295532227, 2.3510093688964844, 2.430922508239746, 2.510835647583008]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 12.0, 8.0, 28.0, 26.0, 32.0, 58.0, 99.0, 93.0, 168.0, 261.0, 368.0, 520.0, 783.0, 1111.0, 1782.0, 2639.0, 4183.0, 6756.0, 10744.0, 17625.0, 29981.0, 52567.0, 95982.0, 180449.0, 346564.0, 627920.0, 889814.0, 817818.0, 510290.0, 270558.0, 141820.0, 76576.0, 42805.0, 24500.0, 14710.0, 8873.0, 5612.0, 3596.0, 2236.0, 1481.0, 968.0, 616.0, 443.0, 268.0, 176.0, 126.0, 83.0, 54.0, 38.0, 23.0, 15.0, 8.0, 8.0, 2.0, 2.0, 3.0], "bins": [-4.6328125, -4.499725341796875, -4.36663818359375, -4.233551025390625, -4.1004638671875, -3.967376708984375, -3.83428955078125, -3.701202392578125, -3.568115234375, -3.435028076171875, -3.30194091796875, -3.168853759765625, -3.0357666015625, -2.902679443359375, -2.76959228515625, -2.636505126953125, -2.50341796875, -2.370330810546875, -2.23724365234375, -2.104156494140625, -1.9710693359375, -1.837982177734375, -1.70489501953125, -1.571807861328125, -1.438720703125, -1.305633544921875, -1.17254638671875, -1.039459228515625, -0.9063720703125, -0.773284912109375, -0.64019775390625, -0.507110595703125, -0.3740234375, -0.240936279296875, -0.10784912109375, 0.025238037109375, 0.1583251953125, 0.291412353515625, 0.42449951171875, 0.557586669921875, 0.690673828125, 0.823760986328125, 0.95684814453125, 1.089935302734375, 1.2230224609375, 1.356109619140625, 1.48919677734375, 1.622283935546875, 1.75537109375, 1.888458251953125, 2.02154541015625, 2.154632568359375, 2.2877197265625, 2.420806884765625, 2.55389404296875, 2.686981201171875, 2.820068359375, 2.953155517578125, 3.08624267578125, 3.219329833984375, 3.3524169921875, 3.485504150390625, 3.61859130859375, 3.751678466796875, 3.884765625]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 5.0, 2.0, 9.0, 11.0, 9.0, 10.0, 10.0, 22.0, 22.0, 19.0, 27.0, 25.0, 22.0, 30.0, 31.0, 41.0, 31.0, 46.0, 37.0, 40.0, 34.0, 40.0, 33.0, 37.0, 42.0, 43.0, 39.0, 26.0, 35.0, 34.0, 24.0, 23.0, 23.0, 21.0, 19.0, 16.0, 8.0, 12.0, 6.0, 4.0, 6.0, 3.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.345703125, -2.2724609375, -2.19921875, -2.1259765625, -2.052734375, -1.9794921875, -1.90625, -1.8330078125, -1.759765625, -1.6865234375, -1.61328125, -1.5400390625, -1.466796875, -1.3935546875, -1.3203125, -1.2470703125, -1.173828125, -1.1005859375, -1.02734375, -0.9541015625, -0.880859375, -0.8076171875, -0.734375, -0.6611328125, -0.587890625, -0.5146484375, -0.44140625, -0.3681640625, -0.294921875, -0.2216796875, -0.1484375, -0.0751953125, -0.001953125, 0.0712890625, 0.14453125, 0.2177734375, 0.291015625, 0.3642578125, 0.4375, 0.5107421875, 0.583984375, 0.6572265625, 0.73046875, 0.8037109375, 0.876953125, 0.9501953125, 1.0234375, 1.0966796875, 1.169921875, 1.2431640625, 1.31640625, 1.3896484375, 1.462890625, 1.5361328125, 1.609375, 1.6826171875, 1.755859375, 1.8291015625, 1.90234375, 1.9755859375, 2.048828125, 2.1220703125, 2.1953125, 2.2685546875, 2.341796875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 7.0, 10.0, 18.0, 33.0, 31.0, 52.0, 81.0, 112.0, 204.0, 286.0, 404.0, 675.0, 1115.0, 1652.0, 2733.0, 4343.0, 7060.0, 11690.0, 19764.0, 34120.0, 59776.0, 107753.0, 195242.0, 353582.0, 604979.0, 838242.0, 780767.0, 512215.0, 290859.0, 159397.0, 87459.0, 49180.0, 27997.0, 16448.0, 9874.0, 5990.0, 3713.0, 2310.0, 1463.0, 889.0, 631.0, 381.0, 264.0, 154.0, 91.0, 85.0, 55.0, 30.0, 21.0, 14.0, 13.0, 7.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.38690185546875, -4.2347412109375, -4.08258056640625, -3.930419921875, -3.77825927734375, -3.6260986328125, -3.47393798828125, -3.32177734375, -3.16961669921875, -3.0174560546875, -2.86529541015625, -2.713134765625, -2.56097412109375, -2.4088134765625, -2.25665283203125, -2.1044921875, -1.95233154296875, -1.8001708984375, -1.64801025390625, -1.495849609375, -1.34368896484375, -1.1915283203125, -1.03936767578125, -0.88720703125, -0.73504638671875, -0.5828857421875, -0.43072509765625, -0.278564453125, -0.12640380859375, 0.0257568359375, 0.17791748046875, 0.330078125, 0.48223876953125, 0.6343994140625, 0.78656005859375, 0.938720703125, 1.09088134765625, 1.2430419921875, 1.39520263671875, 1.54736328125, 1.69952392578125, 1.8516845703125, 2.00384521484375, 2.156005859375, 2.30816650390625, 2.4603271484375, 2.61248779296875, 2.7646484375, 2.91680908203125, 3.0689697265625, 3.22113037109375, 3.373291015625, 3.52545166015625, 3.6776123046875, 3.82977294921875, 3.98193359375, 4.13409423828125, 4.2862548828125, 4.43841552734375, 4.590576171875, 4.74273681640625, 4.8948974609375, 5.04705810546875, 5.19921875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 2.0, 10.0, 10.0, 12.0, 18.0, 26.0, 29.0, 31.0, 40.0, 71.0, 67.0, 89.0, 102.0, 132.0, 170.0, 198.0, 247.0, 226.0, 270.0, 289.0, 268.0, 246.0, 258.0, 220.0, 218.0, 165.0, 148.0, 123.0, 84.0, 78.0, 62.0, 44.0, 36.0, 24.0, 15.0, 13.0, 8.0, 8.0, 2.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6845703125, -1.633544921875, -1.58251953125, -1.531494140625, -1.48046875, -1.429443359375, -1.37841796875, -1.327392578125, -1.2763671875, -1.225341796875, -1.17431640625, -1.123291015625, -1.072265625, -1.021240234375, -0.97021484375, -0.919189453125, -0.8681640625, -0.817138671875, -0.76611328125, -0.715087890625, -0.6640625, -0.613037109375, -0.56201171875, -0.510986328125, -0.4599609375, -0.408935546875, -0.35791015625, -0.306884765625, -0.255859375, -0.204833984375, -0.15380859375, -0.102783203125, -0.0517578125, -0.000732421875, 0.05029296875, 0.101318359375, 0.15234375, 0.203369140625, 0.25439453125, 0.305419921875, 0.3564453125, 0.407470703125, 0.45849609375, 0.509521484375, 0.560546875, 0.611572265625, 0.66259765625, 0.713623046875, 0.7646484375, 0.815673828125, 0.86669921875, 0.917724609375, 0.96875, 1.019775390625, 1.07080078125, 1.121826171875, 1.1728515625, 1.223876953125, 1.27490234375, 1.325927734375, 1.376953125, 1.427978515625, 1.47900390625, 1.530029296875, 1.5810546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 2.0, 1.0, 5.0, 3.0, 11.0, 11.0, 9.0, 18.0, 18.0, 21.0, 27.0, 38.0, 35.0, 54.0, 45.0, 60.0, 57.0, 70.0, 72.0, 53.0, 62.0, 44.0, 46.0, 44.0, 32.0, 41.0, 21.0, 21.0, 17.0, 16.0, 9.0, 12.0, 10.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.877341270446777, -5.695503234863281, -5.513665199279785, -5.331827163696289, -5.149989604949951, -4.968151569366455, -4.786313533782959, -4.604475498199463, -4.422637939453125, -4.240799903869629, -4.058961868286133, -3.877124071121216, -3.695286273956299, -3.5134482383728027, -3.3316102027893066, -3.1497721672058105, -2.9679341316223145, -2.7860960960388184, -2.6042582988739014, -2.4224202632904053, -2.2405824661254883, -2.058744430541992, -1.876906394958496, -1.6950684785842896, -1.513230562210083, -1.3313926458358765, -1.14955472946167, -0.9677166938781738, -0.7858787775039673, -0.6040408611297607, -0.42220282554626465, -0.2403649091720581, -0.05852651596069336, 0.12331143021583557, 0.3051493763923645, 0.4869873523712158, 0.6688252687454224, 0.8506631851196289, 1.032501220703125, 1.2143391370773315, 1.396177053451538, 1.5780149698257446, 1.7598528861999512, 1.9416909217834473, 2.1235289573669434, 2.3053667545318604, 2.4872047901153564, 2.6690425872802734, 2.8508806228637695, 3.0327186584472656, 3.2145564556121826, 3.3963944911956787, 3.5782322883605957, 3.760070323944092, 3.941908359527588, 4.123746395111084, 4.305583953857422, 4.487421989440918, 4.669260025024414, 4.85109806060791, 5.032935619354248, 5.214773654937744, 5.39661169052124, 5.578449726104736, 5.760287761688232]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 0.0, 6.0, 4.0, 1.0, 2.0, 6.0, 4.0, 6.0, 15.0, 12.0, 9.0, 17.0, 11.0, 18.0, 22.0, 24.0, 22.0, 38.0, 28.0, 35.0, 26.0, 33.0, 33.0, 36.0, 34.0, 52.0, 40.0, 34.0, 38.0, 33.0, 37.0, 36.0, 38.0, 31.0, 24.0, 22.0, 19.0, 21.0, 27.0, 14.0, 11.0, 13.0, 19.0, 3.0, 17.0, 7.0, 2.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0], "bins": [-2.9414868354797363, -2.855492115020752, -2.7694976329803467, -2.6835029125213623, -2.597508430480957, -2.5115137100219727, -2.4255189895629883, -2.339524507522583, -2.2535300254821777, -2.1675353050231934, -2.081540822982788, -1.9955461025238037, -1.9095516204833984, -1.823556900024414, -1.7375622987747192, -1.6515676975250244, -1.56557297706604, -1.4795783758163452, -1.3935837745666504, -1.307589054107666, -1.2215945720672607, -1.1355998516082764, -1.0496052503585815, -0.9636106491088867, -0.8776160478591919, -0.7916214466094971, -0.7056268453598022, -0.6196321845054626, -0.5336375832557678, -0.447642982006073, -0.3616483211517334, -0.2756537199020386, -0.18965911865234375, -0.10366450250148773, -0.017669886350631714, 0.0683247447013855, 0.15431934595108032, 0.24031394720077515, 0.32630860805511475, 0.41230320930480957, 0.4982978105545044, 0.5842924118041992, 0.670287013053894, 0.7562816739082336, 0.8422762751579285, 0.9282708764076233, 1.014265537261963, 1.1002601385116577, 1.1862547397613525, 1.2722493410110474, 1.3582439422607422, 1.4442386627197266, 1.5302331447601318, 1.6162278652191162, 1.702222466468811, 1.7882170677185059, 1.8742116689682007, 1.9602062702178955, 2.04620099067688, 2.132195472717285, 2.2181901931762695, 2.304184675216675, 2.390179395675659, 2.4761738777160645, 2.562168598175049]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 13.0, 15.0, 29.0, 45.0, 62.0, 97.0, 193.0, 365.0, 643.0, 1373.0, 2880.0, 6527.0, 15368.0, 38433.0, 103326.0, 266688.0, 345720.0, 164898.0, 60674.0, 23282.0, 9698.0, 4349.0, 1962.0, 894.0, 443.0, 212.0, 144.0, 79.0, 44.0, 33.0, 21.0, 9.0, 15.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8525390625, -0.8223419189453125, -0.792144775390625, -0.7619476318359375, -0.73175048828125, -0.7015533447265625, -0.671356201171875, -0.6411590576171875, -0.6109619140625, -0.5807647705078125, -0.550567626953125, -0.5203704833984375, -0.49017333984375, -0.4599761962890625, -0.429779052734375, -0.3995819091796875, -0.369384765625, -0.3391876220703125, -0.308990478515625, -0.2787933349609375, -0.24859619140625, -0.2183990478515625, -0.188201904296875, -0.1580047607421875, -0.1278076171875, -0.0976104736328125, -0.067413330078125, -0.0372161865234375, -0.00701904296875, 0.0231781005859375, 0.053375244140625, 0.0835723876953125, 0.11376953125, 0.1439666748046875, 0.174163818359375, 0.2043609619140625, 0.23455810546875, 0.2647552490234375, 0.294952392578125, 0.3251495361328125, 0.3553466796875, 0.3855438232421875, 0.415740966796875, 0.4459381103515625, 0.47613525390625, 0.5063323974609375, 0.536529541015625, 0.5667266845703125, 0.596923828125, 0.6271209716796875, 0.657318115234375, 0.6875152587890625, 0.71771240234375, 0.7479095458984375, 0.778106689453125, 0.8083038330078125, 0.8385009765625, 0.8686981201171875, 0.898895263671875, 0.9290924072265625, 0.95928955078125, 0.9894866943359375, 1.019683837890625, 1.0498809814453125, 1.080078125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 11.0, 19.0, 17.0, 25.0, 33.0, 21.0, 33.0, 28.0, 36.0, 44.0, 31.0, 40.0, 43.0, 56.0, 51.0, 47.0, 55.0, 41.0, 41.0, 39.0, 43.0, 26.0, 24.0, 28.0, 17.0, 20.0, 17.0, 17.0, 17.0, 10.0, 12.0, 12.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59765625, -3.479827880859375, -3.36199951171875, -3.244171142578125, -3.1263427734375, -3.008514404296875, -2.89068603515625, -2.772857666015625, -2.655029296875, -2.537200927734375, -2.41937255859375, -2.301544189453125, -2.1837158203125, -2.065887451171875, -1.94805908203125, -1.830230712890625, -1.71240234375, -1.594573974609375, -1.47674560546875, -1.358917236328125, -1.2410888671875, -1.123260498046875, -1.00543212890625, -0.887603759765625, -0.769775390625, -0.651947021484375, -0.53411865234375, -0.416290283203125, -0.2984619140625, -0.180633544921875, -0.06280517578125, 0.055023193359375, 0.1728515625, 0.290679931640625, 0.40850830078125, 0.526336669921875, 0.6441650390625, 0.761993408203125, 0.87982177734375, 0.997650146484375, 1.115478515625, 1.233306884765625, 1.35113525390625, 1.468963623046875, 1.5867919921875, 1.704620361328125, 1.82244873046875, 1.940277099609375, 2.05810546875, 2.175933837890625, 2.29376220703125, 2.411590576171875, 2.5294189453125, 2.647247314453125, 2.76507568359375, 2.882904052734375, 3.000732421875, 3.118560791015625, 3.23638916015625, 3.354217529296875, 3.4720458984375, 3.589874267578125, 3.70770263671875, 3.825531005859375, 3.943359375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 9.0, 8.0, 14.0, 16.0, 29.0, 36.0, 70.0, 111.0, 188.0, 315.0, 606.0, 1145.0, 2283.0, 5561.0, 16564.0, 92937.0, 884183.0, 29265.0, 8795.0, 3258.0, 1482.0, 727.0, 374.0, 240.0, 118.0, 87.0, 53.0, 30.0, 26.0, 6.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.017669677734375, -1.93768310546875, -1.857696533203125, -1.7777099609375, -1.697723388671875, -1.61773681640625, -1.537750244140625, -1.457763671875, -1.377777099609375, -1.29779052734375, -1.217803955078125, -1.1378173828125, -1.057830810546875, -0.97784423828125, -0.897857666015625, -0.81787109375, -0.737884521484375, -0.65789794921875, -0.577911376953125, -0.4979248046875, -0.417938232421875, -0.33795166015625, -0.257965087890625, -0.177978515625, -0.097991943359375, -0.01800537109375, 0.061981201171875, 0.1419677734375, 0.221954345703125, 0.30194091796875, 0.381927490234375, 0.4619140625, 0.541900634765625, 0.62188720703125, 0.701873779296875, 0.7818603515625, 0.861846923828125, 0.94183349609375, 1.021820068359375, 1.101806640625, 1.181793212890625, 1.26177978515625, 1.341766357421875, 1.4217529296875, 1.501739501953125, 1.58172607421875, 1.661712646484375, 1.74169921875, 1.821685791015625, 1.90167236328125, 1.981658935546875, 2.0616455078125, 2.141632080078125, 2.22161865234375, 2.301605224609375, 2.381591796875, 2.461578369140625, 2.54156494140625, 2.621551513671875, 2.7015380859375, 2.781524658203125, 2.86151123046875, 2.941497802734375, 3.021484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 10.0, 12.0, 10.0, 17.0, 16.0, 20.0, 27.0, 38.0, 23.0, 31.0, 41.0, 33.0, 43.0, 40.0, 39.0, 40.0, 37.0, 52.0, 46.0, 46.0, 42.0, 37.0, 26.0, 27.0, 41.0, 31.0, 19.0, 23.0, 18.0, 15.0, 13.0, 17.0, 10.0, 5.0, 8.0, 8.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.255859375, -2.185516357421875, -2.11517333984375, -2.044830322265625, -1.9744873046875, -1.904144287109375, -1.83380126953125, -1.763458251953125, -1.693115234375, -1.622772216796875, -1.55242919921875, -1.482086181640625, -1.4117431640625, -1.341400146484375, -1.27105712890625, -1.200714111328125, -1.13037109375, -1.060028076171875, -0.98968505859375, -0.919342041015625, -0.8489990234375, -0.778656005859375, -0.70831298828125, -0.637969970703125, -0.567626953125, -0.497283935546875, -0.42694091796875, -0.356597900390625, -0.2862548828125, -0.215911865234375, -0.14556884765625, -0.075225830078125, -0.0048828125, 0.065460205078125, 0.13580322265625, 0.206146240234375, 0.2764892578125, 0.346832275390625, 0.41717529296875, 0.487518310546875, 0.557861328125, 0.628204345703125, 0.69854736328125, 0.768890380859375, 0.8392333984375, 0.909576416015625, 0.97991943359375, 1.050262451171875, 1.12060546875, 1.190948486328125, 1.26129150390625, 1.331634521484375, 1.4019775390625, 1.472320556640625, 1.54266357421875, 1.613006591796875, 1.683349609375, 1.753692626953125, 1.82403564453125, 1.894378662109375, 1.9647216796875, 2.035064697265625, 2.10540771484375, 2.175750732421875, 2.24609375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 5.0, 0.0, 3.0, 10.0, 17.0, 24.0, 27.0, 33.0, 73.0, 97.0, 163.0, 221.0, 371.0, 675.0, 1736.0, 6957.0, 84252.0, 938120.0, 11626.0, 2206.0, 801.0, 389.0, 240.0, 167.0, 110.0, 62.0, 53.0, 34.0, 20.0, 24.0, 4.0, 5.0, 4.0, 5.0, 1.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2275390625, -1.1881103515625, -1.148681640625, -1.1092529296875, -1.06982421875, -1.0303955078125, -0.990966796875, -0.9515380859375, -0.912109375, -0.8726806640625, -0.833251953125, -0.7938232421875, -0.75439453125, -0.7149658203125, -0.675537109375, -0.6361083984375, -0.5966796875, -0.5572509765625, -0.517822265625, -0.4783935546875, -0.43896484375, -0.3995361328125, -0.360107421875, -0.3206787109375, -0.28125, -0.2418212890625, -0.202392578125, -0.1629638671875, -0.12353515625, -0.0841064453125, -0.044677734375, -0.0052490234375, 0.0341796875, 0.0736083984375, 0.113037109375, 0.1524658203125, 0.19189453125, 0.2313232421875, 0.270751953125, 0.3101806640625, 0.349609375, 0.3890380859375, 0.428466796875, 0.4678955078125, 0.50732421875, 0.5467529296875, 0.586181640625, 0.6256103515625, 0.6650390625, 0.7044677734375, 0.743896484375, 0.7833251953125, 0.82275390625, 0.8621826171875, 0.901611328125, 0.9410400390625, 0.98046875, 1.0198974609375, 1.059326171875, 1.0987548828125, 1.13818359375, 1.1776123046875, 1.217041015625, 1.2564697265625, 1.2958984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 20.0, 41.0, 67.0, 86.0, 150.0, 166.0, 152.0, 99.0, 96.0, 53.0, 24.0, 13.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012135505676269531, -0.00011796876788139343, -0.00011458247900009155, -0.00011119619011878967, -0.00010780990123748779, -0.00010442361235618591, -0.00010103732347488403, -9.765103459358215e-05, -9.426474571228027e-05, -9.08784568309784e-05, -8.749216794967651e-05, -8.410587906837463e-05, -8.071959018707275e-05, -7.733330130577087e-05, -7.3947012424469e-05, -7.056072354316711e-05, -6.717443466186523e-05, -6.378814578056335e-05, -6.0401856899261475e-05, -5.7015568017959595e-05, -5.3629279136657715e-05, -5.0242990255355835e-05, -4.6856701374053955e-05, -4.3470412492752075e-05, -4.0084123611450195e-05, -3.6697834730148315e-05, -3.3311545848846436e-05, -2.9925256967544556e-05, -2.6538968086242676e-05, -2.3152679204940796e-05, -1.9766390323638916e-05, -1.6380101442337036e-05, -1.2993812561035156e-05, -9.607523679733276e-06, -6.2212347984313965e-06, -2.8349459171295166e-06, 5.513429641723633e-07, 3.937631845474243e-06, 7.323920726776123e-06, 1.0710209608078003e-05, 1.4096498489379883e-05, 1.7482787370681763e-05, 2.0869076251983643e-05, 2.4255365133285522e-05, 2.7641654014587402e-05, 3.102794289588928e-05, 3.441423177719116e-05, 3.780052065849304e-05, 4.118680953979492e-05, 4.45730984210968e-05, 4.795938730239868e-05, 5.134567618370056e-05, 5.473196506500244e-05, 5.811825394630432e-05, 6.15045428276062e-05, 6.489083170890808e-05, 6.827712059020996e-05, 7.166340947151184e-05, 7.504969835281372e-05, 7.84359872341156e-05, 8.182227611541748e-05, 8.520856499671936e-05, 8.859485387802124e-05, 9.198114275932312e-05, 9.5367431640625e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 6.0, 5.0, 18.0, 22.0, 25.0, 35.0, 53.0, 52.0, 83.0, 122.0, 158.0, 287.0, 451.0, 743.0, 1266.0, 2051.0, 3426.0, 6426.0, 19152.0, 192160.0, 728236.0, 69760.0, 11734.0, 5010.0, 2768.0, 1706.0, 1027.0, 606.0, 371.0, 243.0, 175.0, 113.0, 76.0, 54.0, 44.0, 23.0, 20.0, 18.0, 5.0, 12.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.71533203125, -0.6938629150390625, -0.672393798828125, -0.6509246826171875, -0.62945556640625, -0.6079864501953125, -0.586517333984375, -0.5650482177734375, -0.5435791015625, -0.5221099853515625, -0.500640869140625, -0.4791717529296875, -0.45770263671875, -0.4362335205078125, -0.414764404296875, -0.3932952880859375, -0.371826171875, -0.3503570556640625, -0.328887939453125, -0.3074188232421875, -0.28594970703125, -0.2644805908203125, -0.243011474609375, -0.2215423583984375, -0.2000732421875, -0.1786041259765625, -0.157135009765625, -0.1356658935546875, -0.11419677734375, -0.0927276611328125, -0.071258544921875, -0.0497894287109375, -0.0283203125, -0.0068511962890625, 0.014617919921875, 0.0360870361328125, 0.05755615234375, 0.0790252685546875, 0.100494384765625, 0.1219635009765625, 0.1434326171875, 0.1649017333984375, 0.186370849609375, 0.2078399658203125, 0.22930908203125, 0.2507781982421875, 0.272247314453125, 0.2937164306640625, 0.315185546875, 0.3366546630859375, 0.358123779296875, 0.3795928955078125, 0.40106201171875, 0.4225311279296875, 0.444000244140625, 0.4654693603515625, 0.4869384765625, 0.5084075927734375, 0.529876708984375, 0.5513458251953125, 0.57281494140625, 0.5942840576171875, 0.615753173828125, 0.6372222900390625, 0.65869140625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 9.0, 17.0, 39.0, 104.0, 249.0, 325.0, 145.0, 55.0, 22.0, 14.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180908203125, -0.17509841918945312, -0.16928863525390625, -0.16347885131835938, -0.1576690673828125, -0.15185928344726562, -0.14604949951171875, -0.14023971557617188, -0.134429931640625, -0.12862014770507812, -0.12281036376953125, -0.11700057983398438, -0.1111907958984375, -0.10538101196289062, -0.09957122802734375, -0.09376144409179688, -0.08795166015625, -0.08214187622070312, -0.07633209228515625, -0.07052230834960938, -0.0647125244140625, -0.058902740478515625, -0.05309295654296875, -0.047283172607421875, -0.041473388671875, -0.035663604736328125, -0.02985382080078125, -0.024044036865234375, -0.0182342529296875, -0.012424468994140625, -0.00661468505859375, -0.000804901123046875, 0.0050048828125, 0.010814666748046875, 0.01662445068359375, 0.022434234619140625, 0.0282440185546875, 0.034053802490234375, 0.03986358642578125, 0.045673370361328125, 0.051483154296875, 0.057292938232421875, 0.06310272216796875, 0.06891250610351562, 0.0747222900390625, 0.08053207397460938, 0.08634185791015625, 0.09215164184570312, 0.09796142578125, 0.10377120971679688, 0.10958099365234375, 0.11539077758789062, 0.1212005615234375, 0.12701034545898438, 0.13282012939453125, 0.13862991333007812, 0.144439697265625, 0.15024948120117188, 0.15605926513671875, 0.16186904907226562, 0.1676788330078125, 0.17348861694335938, 0.17929840087890625, 0.18510818481445312, 0.19091796875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 6.0, 10.0, 12.0, 14.0, 20.0, 16.0, 24.0, 32.0, 37.0, 43.0, 56.0, 49.0, 56.0, 71.0, 67.0, 68.0, 66.0, 45.0, 52.0, 35.0, 39.0, 43.0, 25.0, 23.0, 17.0, 16.0, 16.0, 10.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.0382232666015625, -5.853695869445801, -5.669168472290039, -5.484641075134277, -5.300113201141357, -5.115585803985596, -4.931058406829834, -4.746531009674072, -4.562003135681152, -4.377475738525391, -4.192948341369629, -4.008420944213867, -3.8238930702209473, -3.6393656730651855, -3.454838275909424, -3.270310878753662, -3.0857834815979004, -2.9012560844421387, -2.716728448867798, -2.532201051712036, -2.3476734161376953, -2.1631460189819336, -1.9786186218261719, -1.7940911054611206, -1.6095635890960693, -1.425036072731018, -1.2405085563659668, -1.055981159210205, -0.8714536428451538, -0.6869261264801025, -0.5023987293243408, -0.31787121295928955, -0.13334321975708008, 0.051184266805648804, 0.23571175336837769, 0.4202392101287842, 0.6047667264938354, 0.7892942428588867, 0.9738216400146484, 1.1583491563796997, 1.342876672744751, 1.5274041891098022, 1.7119317054748535, 1.8964591026306152, 2.080986499786377, 2.2655141353607178, 2.4500415325164795, 2.6345691680908203, 2.819096565246582, 3.0036239624023438, 3.1881515979766846, 3.3726789951324463, 3.557206630706787, 3.741734027862549, 3.9262614250183105, 4.110788822174072, 4.295316696166992, 4.479844093322754, 4.664371490478516, 4.848898887634277, 5.033426761627197, 5.217954158782959, 5.402481555938721, 5.587008953094482, 5.771536350250244]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 6.0, 4.0, 7.0, 16.0, 9.0, 11.0, 17.0, 12.0, 16.0, 18.0, 23.0, 24.0, 33.0, 37.0, 29.0, 26.0, 33.0, 28.0, 38.0, 38.0, 44.0, 47.0, 35.0, 35.0, 30.0, 39.0, 40.0, 37.0, 31.0, 26.0, 21.0, 22.0, 20.0, 22.0, 20.0, 11.0, 13.0, 11.0, 13.0, 13.0, 8.0, 3.0, 4.0, 5.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 2.0], "bins": [-2.915468454360962, -2.8307132720947266, -2.745957851409912, -2.6612026691436768, -2.5764474868774414, -2.491692304611206, -2.4069368839263916, -2.3221817016601562, -2.237426519393921, -2.1526713371276855, -2.067915916442871, -1.9831607341766357, -1.8984055519104004, -1.8136502504348755, -1.7288949489593506, -1.6441397666931152, -1.5593844652175903, -1.4746291637420654, -1.38987398147583, -1.3051186800003052, -1.2203634977340698, -1.135608196258545, -1.0508530139923096, -0.9660977125167847, -0.8813424706459045, -0.7965872287750244, -0.7118319869041443, -0.6270767450332642, -0.5423214435577393, -0.4575662314891815, -0.372810959815979, -0.2880557179450989, -0.20330047607421875, -0.11854522675275803, -0.0337899774312973, 0.05096527934074402, 0.13572052121162415, 0.22047576308250427, 0.3052310347557068, 0.3899862766265869, 0.47474151849746704, 0.5594967603683472, 0.6442520022392273, 0.7290072441101074, 0.8137625455856323, 0.8985177278518677, 0.9832730293273926, 1.068028211593628, 1.1527835130691528, 1.2375388145446777, 1.322293996810913, 1.407049298286438, 1.4918044805526733, 1.5765597820281982, 1.6613149642944336, 1.7460702657699585, 1.8308255672454834, 1.9155808687210083, 2.000336170196533, 2.0850913524627686, 2.169846534729004, 2.2546017169952393, 2.3393571376800537, 2.424112319946289, 2.5088675022125244]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 6.0, 17.0, 27.0, 35.0, 57.0, 88.0, 122.0, 185.0, 286.0, 431.0, 696.0, 1111.0, 1903.0, 3288.0, 5812.0, 10544.0, 18859.0, 33677.0, 57791.0, 93381.0, 135890.0, 167106.0, 166151.0, 132296.0, 89937.0, 55354.0, 32104.0, 18091.0, 10067.0, 5515.0, 3052.0, 1833.0, 1064.0, 644.0, 374.0, 256.0, 156.0, 120.0, 65.0, 46.0, 29.0, 28.0, 19.0, 10.0, 10.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.2265625, -4.09429931640625, -3.9620361328125, -3.82977294921875, -3.697509765625, -3.56524658203125, -3.4329833984375, -3.30072021484375, -3.16845703125, -3.03619384765625, -2.9039306640625, -2.77166748046875, -2.639404296875, -2.50714111328125, -2.3748779296875, -2.24261474609375, -2.1103515625, -1.97808837890625, -1.8458251953125, -1.71356201171875, -1.581298828125, -1.44903564453125, -1.3167724609375, -1.18450927734375, -1.05224609375, -0.91998291015625, -0.7877197265625, -0.65545654296875, -0.523193359375, -0.39093017578125, -0.2586669921875, -0.12640380859375, 0.005859375, 0.13812255859375, 0.2703857421875, 0.40264892578125, 0.534912109375, 0.66717529296875, 0.7994384765625, 0.93170166015625, 1.06396484375, 1.19622802734375, 1.3284912109375, 1.46075439453125, 1.593017578125, 1.72528076171875, 1.8575439453125, 1.98980712890625, 2.1220703125, 2.25433349609375, 2.3865966796875, 2.51885986328125, 2.651123046875, 2.78338623046875, 2.9156494140625, 3.04791259765625, 3.18017578125, 3.31243896484375, 3.4447021484375, 3.57696533203125, 3.709228515625, 3.84149169921875, 3.9737548828125, 4.10601806640625, 4.23828125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 7.0, 6.0, 6.0, 6.0, 8.0, 4.0, 9.0, 10.0, 24.0, 13.0, 19.0, 21.0, 21.0, 20.0, 22.0, 40.0, 27.0, 39.0, 33.0, 40.0, 51.0, 33.0, 41.0, 41.0, 40.0, 37.0, 32.0, 37.0, 41.0, 34.0, 23.0, 33.0, 19.0, 27.0, 20.0, 18.0, 16.0, 18.0, 8.0, 9.0, 7.0, 14.0, 6.0, 5.0, 1.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.064453125, -2.968017578125, -2.87158203125, -2.775146484375, -2.6787109375, -2.582275390625, -2.48583984375, -2.389404296875, -2.29296875, -2.196533203125, -2.10009765625, -2.003662109375, -1.9072265625, -1.810791015625, -1.71435546875, -1.617919921875, -1.521484375, -1.425048828125, -1.32861328125, -1.232177734375, -1.1357421875, -1.039306640625, -0.94287109375, -0.846435546875, -0.75, -0.653564453125, -0.55712890625, -0.460693359375, -0.3642578125, -0.267822265625, -0.17138671875, -0.074951171875, 0.021484375, 0.117919921875, 0.21435546875, 0.310791015625, 0.4072265625, 0.503662109375, 0.60009765625, 0.696533203125, 0.79296875, 0.889404296875, 0.98583984375, 1.082275390625, 1.1787109375, 1.275146484375, 1.37158203125, 1.468017578125, 1.564453125, 1.660888671875, 1.75732421875, 1.853759765625, 1.9501953125, 2.046630859375, 2.14306640625, 2.239501953125, 2.3359375, 2.432373046875, 2.52880859375, 2.625244140625, 2.7216796875, 2.818115234375, 2.91455078125, 3.010986328125, 3.107421875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 7.0, 18.0, 36.0, 49.0, 73.0, 117.0, 165.0, 317.0, 503.0, 798.0, 1360.0, 2190.0, 3784.0, 6525.0, 10644.0, 18411.0, 29744.0, 48212.0, 73391.0, 103778.0, 133679.0, 147435.0, 138712.0, 111602.0, 80247.0, 52811.0, 33582.0, 20618.0, 11946.0, 7128.0, 4295.0, 2587.0, 1464.0, 880.0, 554.0, 314.0, 199.0, 137.0, 75.0, 53.0, 30.0, 26.0, 21.0, 12.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.88671875, -3.771087646484375, -3.65545654296875, -3.539825439453125, -3.4241943359375, -3.308563232421875, -3.19293212890625, -3.077301025390625, -2.961669921875, -2.846038818359375, -2.73040771484375, -2.614776611328125, -2.4991455078125, -2.383514404296875, -2.26788330078125, -2.152252197265625, -2.03662109375, -1.920989990234375, -1.80535888671875, -1.689727783203125, -1.5740966796875, -1.458465576171875, -1.34283447265625, -1.227203369140625, -1.111572265625, -0.995941162109375, -0.88031005859375, -0.764678955078125, -0.6490478515625, -0.533416748046875, -0.41778564453125, -0.302154541015625, -0.1865234375, -0.070892333984375, 0.04473876953125, 0.160369873046875, 0.2760009765625, 0.391632080078125, 0.50726318359375, 0.622894287109375, 0.738525390625, 0.854156494140625, 0.96978759765625, 1.085418701171875, 1.2010498046875, 1.316680908203125, 1.43231201171875, 1.547943115234375, 1.66357421875, 1.779205322265625, 1.89483642578125, 2.010467529296875, 2.1260986328125, 2.241729736328125, 2.35736083984375, 2.472991943359375, 2.588623046875, 2.704254150390625, 2.81988525390625, 2.935516357421875, 3.0511474609375, 3.166778564453125, 3.28240966796875, 3.398040771484375, 3.513671875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 6.0, 3.0, 7.0, 17.0, 13.0, 17.0, 18.0, 16.0, 24.0, 28.0, 27.0, 28.0, 48.0, 30.0, 46.0, 43.0, 39.0, 34.0, 44.0, 44.0, 47.0, 38.0, 40.0, 40.0, 36.0, 33.0, 23.0, 22.0, 26.0, 28.0, 23.0, 23.0, 19.0, 14.0, 15.0, 4.0, 8.0, 5.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.099609375, -2.035552978515625, -1.97149658203125, -1.907440185546875, -1.8433837890625, -1.779327392578125, -1.71527099609375, -1.651214599609375, -1.587158203125, -1.523101806640625, -1.45904541015625, -1.394989013671875, -1.3309326171875, -1.266876220703125, -1.20281982421875, -1.138763427734375, -1.07470703125, -1.010650634765625, -0.94659423828125, -0.882537841796875, -0.8184814453125, -0.754425048828125, -0.69036865234375, -0.626312255859375, -0.562255859375, -0.498199462890625, -0.43414306640625, -0.370086669921875, -0.3060302734375, -0.241973876953125, -0.17791748046875, -0.113861083984375, -0.0498046875, 0.014251708984375, 0.07830810546875, 0.142364501953125, 0.2064208984375, 0.270477294921875, 0.33453369140625, 0.398590087890625, 0.462646484375, 0.526702880859375, 0.59075927734375, 0.654815673828125, 0.7188720703125, 0.782928466796875, 0.84698486328125, 0.911041259765625, 0.97509765625, 1.039154052734375, 1.10321044921875, 1.167266845703125, 1.2313232421875, 1.295379638671875, 1.35943603515625, 1.423492431640625, 1.487548828125, 1.551605224609375, 1.61566162109375, 1.679718017578125, 1.7437744140625, 1.807830810546875, 1.87188720703125, 1.935943603515625, 2.0]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 9.0, 12.0, 11.0, 27.0, 39.0, 47.0, 69.0, 116.0, 163.0, 244.0, 376.0, 698.0, 1120.0, 1787.0, 3114.0, 5363.0, 9602.0, 17432.0, 32410.0, 59348.0, 104130.0, 160288.0, 196487.0, 176084.0, 120811.0, 71256.0, 39184.0, 21067.0, 11568.0, 6369.0, 3703.0, 2170.0, 1301.0, 795.0, 493.0, 298.0, 208.0, 115.0, 79.0, 49.0, 39.0, 28.0, 12.0, 8.0, 8.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.384765625, -2.311737060546875, -2.23870849609375, -2.165679931640625, -2.0926513671875, -2.019622802734375, -1.94659423828125, -1.873565673828125, -1.800537109375, -1.727508544921875, -1.65447998046875, -1.581451416015625, -1.5084228515625, -1.435394287109375, -1.36236572265625, -1.289337158203125, -1.21630859375, -1.143280029296875, -1.07025146484375, -0.997222900390625, -0.9241943359375, -0.851165771484375, -0.77813720703125, -0.705108642578125, -0.632080078125, -0.559051513671875, -0.48602294921875, -0.412994384765625, -0.3399658203125, -0.266937255859375, -0.19390869140625, -0.120880126953125, -0.0478515625, 0.025177001953125, 0.09820556640625, 0.171234130859375, 0.2442626953125, 0.317291259765625, 0.39031982421875, 0.463348388671875, 0.536376953125, 0.609405517578125, 0.68243408203125, 0.755462646484375, 0.8284912109375, 0.901519775390625, 0.97454833984375, 1.047576904296875, 1.12060546875, 1.193634033203125, 1.26666259765625, 1.339691162109375, 1.4127197265625, 1.485748291015625, 1.55877685546875, 1.631805419921875, 1.704833984375, 1.777862548828125, 1.85089111328125, 1.923919677734375, 1.9969482421875, 2.069976806640625, 2.14300537109375, 2.216033935546875, 2.2890625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 11.0, 10.0, 22.0, 15.0, 53.0, 58.0, 82.0, 87.0, 106.0, 113.0, 104.0, 91.0, 78.0, 55.0, 38.0, 24.0, 13.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004456043243408203, -0.00043368712067604065, -0.000421769917011261, -0.0004098527133464813, -0.00039793550968170166, -0.000386018306016922, -0.00037410110235214233, -0.00036218389868736267, -0.000350266695022583, -0.00033834949135780334, -0.0003264322876930237, -0.000314515084028244, -0.00030259788036346436, -0.0002906806766986847, -0.00027876347303390503, -0.00026684626936912537, -0.0002549290657043457, -0.00024301186203956604, -0.00023109465837478638, -0.00021917745471000671, -0.00020726025104522705, -0.0001953430473804474, -0.00018342584371566772, -0.00017150864005088806, -0.0001595914363861084, -0.00014767423272132874, -0.00013575702905654907, -0.0001238398253917694, -0.00011192262172698975, -0.00010000541806221008, -8.808821439743042e-05, -7.617101073265076e-05, -6.42538070678711e-05, -5.233660340309143e-05, -4.041939973831177e-05, -2.8502196073532104e-05, -1.658499240875244e-05, -4.667788743972778e-06, 7.249414920806885e-06, 1.9166618585586548e-05, 3.108382225036621e-05, 4.3001025915145874e-05, 5.491822957992554e-05, 6.68354332447052e-05, 7.875263690948486e-05, 9.066984057426453e-05, 0.00010258704423904419, 0.00011450424790382385, 0.00012642145156860352, 0.00013833865523338318, 0.00015025585889816284, 0.0001621730625629425, 0.00017409026622772217, 0.00018600746989250183, 0.0001979246735572815, 0.00020984187722206116, 0.00022175908088684082, 0.00023367628455162048, 0.00024559348821640015, 0.0002575106918811798, 0.00026942789554595947, 0.00028134509921073914, 0.0002932623028755188, 0.00030517950654029846, 0.0003170967102050781]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 12.0, 16.0, 25.0, 17.0, 37.0, 52.0, 58.0, 98.0, 130.0, 170.0, 240.0, 350.0, 577.0, 883.0, 1376.0, 2336.0, 3973.0, 6767.0, 12000.0, 21484.0, 39239.0, 69864.0, 118888.0, 173203.0, 193835.0, 160429.0, 104667.0, 60084.0, 33658.0, 18785.0, 10251.0, 5812.0, 3471.0, 1993.0, 1304.0, 823.0, 552.0, 350.0, 220.0, 153.0, 98.0, 88.0, 52.0, 33.0, 28.0, 21.0, 19.0, 10.0, 11.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.384765625, -2.31109619140625, -2.2374267578125, -2.16375732421875, -2.090087890625, -2.01641845703125, -1.9427490234375, -1.86907958984375, -1.79541015625, -1.72174072265625, -1.6480712890625, -1.57440185546875, -1.500732421875, -1.42706298828125, -1.3533935546875, -1.27972412109375, -1.2060546875, -1.13238525390625, -1.0587158203125, -0.98504638671875, -0.911376953125, -0.83770751953125, -0.7640380859375, -0.69036865234375, -0.61669921875, -0.54302978515625, -0.4693603515625, -0.39569091796875, -0.322021484375, -0.24835205078125, -0.1746826171875, -0.10101318359375, -0.02734375, 0.04632568359375, 0.1199951171875, 0.19366455078125, 0.267333984375, 0.34100341796875, 0.4146728515625, 0.48834228515625, 0.56201171875, 0.63568115234375, 0.7093505859375, 0.78302001953125, 0.856689453125, 0.93035888671875, 1.0040283203125, 1.07769775390625, 1.1513671875, 1.22503662109375, 1.2987060546875, 1.37237548828125, 1.446044921875, 1.51971435546875, 1.5933837890625, 1.66705322265625, 1.74072265625, 1.81439208984375, 1.8880615234375, 1.96173095703125, 2.035400390625, 2.10906982421875, 2.1827392578125, 2.25640869140625, 2.330078125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 4.0, 9.0, 5.0, 11.0, 13.0, 16.0, 24.0, 25.0, 35.0, 32.0, 38.0, 38.0, 50.0, 48.0, 66.0, 57.0, 55.0, 60.0, 43.0, 52.0, 45.0, 47.0, 34.0, 30.0, 24.0, 14.0, 26.0, 15.0, 16.0, 13.0, 8.0, 9.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.642578125, -0.6241302490234375, -0.605682373046875, -0.5872344970703125, -0.56878662109375, -0.5503387451171875, -0.531890869140625, -0.5134429931640625, -0.4949951171875, -0.4765472412109375, -0.458099365234375, -0.4396514892578125, -0.42120361328125, -0.4027557373046875, -0.384307861328125, -0.3658599853515625, -0.347412109375, -0.3289642333984375, -0.310516357421875, -0.2920684814453125, -0.27362060546875, -0.2551727294921875, -0.236724853515625, -0.2182769775390625, -0.1998291015625, -0.1813812255859375, -0.162933349609375, -0.1444854736328125, -0.12603759765625, -0.1075897216796875, -0.089141845703125, -0.0706939697265625, -0.05224609375, -0.0337982177734375, -0.015350341796875, 0.0030975341796875, 0.02154541015625, 0.0399932861328125, 0.058441162109375, 0.0768890380859375, 0.0953369140625, 0.1137847900390625, 0.132232666015625, 0.1506805419921875, 0.16912841796875, 0.1875762939453125, 0.206024169921875, 0.2244720458984375, 0.242919921875, 0.2613677978515625, 0.279815673828125, 0.2982635498046875, 0.31671142578125, 0.3351593017578125, 0.353607177734375, 0.3720550537109375, 0.3905029296875, 0.4089508056640625, 0.427398681640625, 0.4458465576171875, 0.46429443359375, 0.4827423095703125, 0.501190185546875, 0.5196380615234375, 0.5380859375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 1.0, 6.0, 8.0, 11.0, 16.0, 21.0, 21.0, 30.0, 32.0, 35.0, 44.0, 48.0, 68.0, 58.0, 63.0, 81.0, 74.0, 58.0, 59.0, 49.0, 39.0, 27.0, 31.0, 33.0, 23.0, 11.0, 9.0, 12.0, 6.0, 7.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.592738151550293, -6.400635719299316, -6.20853328704834, -6.016430854797363, -5.824328422546387, -5.63222599029541, -5.440123558044434, -5.248021125793457, -5.0559186935424805, -4.863816261291504, -4.671713829040527, -4.479611396789551, -4.287508964538574, -4.095406532287598, -3.9033043384552, -3.7112019062042236, -3.519099712371826, -3.3269972801208496, -3.134894847869873, -2.9427924156188965, -2.75068998336792, -2.5585875511169434, -2.366485357284546, -2.1743829250335693, -1.9822804927825928, -1.7901780605316162, -1.5980756282806396, -1.4059733152389526, -1.213870882987976, -1.0217684507369995, -0.8296661376953125, -0.6375637054443359, -0.4454612731933594, -0.2533588707447052, -0.061256468296051025, 0.13084590435028076, 0.3229483366012573, 0.5150507688522339, 0.7071530818939209, 0.8992555141448975, 1.091357946395874, 1.2834603786468506, 1.4755628108978271, 1.6676651239395142, 1.8597675561904907, 2.0518698692321777, 2.2439723014831543, 2.436074733734131, 2.6281771659851074, 2.820279598236084, 3.0123820304870605, 3.204484462738037, 3.3965868949890137, 3.5886893272399902, 3.7807915210723877, 3.9728939533233643, 4.164996147155762, 4.357098579406738, 4.549201011657715, 4.741303443908691, 4.933405876159668, 5.1255083084106445, 5.317610740661621, 5.509713172912598, 5.701815605163574]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 10.0, 12.0, 16.0, 22.0, 15.0, 18.0, 24.0, 27.0, 28.0, 35.0, 32.0, 32.0, 37.0, 50.0, 42.0, 39.0, 37.0, 57.0, 40.0, 42.0, 38.0, 47.0, 30.0, 34.0, 25.0, 28.0, 28.0, 18.0, 27.0, 17.0, 15.0, 11.0, 5.0, 11.0, 8.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.537686347961426, -3.4350030422210693, -3.332319498062134, -3.2296361923217773, -3.126952886581421, -3.0242693424224854, -2.921586036682129, -2.8189024925231934, -2.716219186782837, -2.6135358810424805, -2.510852336883545, -2.4081690311431885, -2.305485725402832, -2.2028021812438965, -2.10011887550354, -1.997435450553894, -1.8947521448135376, -1.7920687198638916, -1.6893854141235352, -1.5867019891738892, -1.4840185642242432, -1.3813352584838867, -1.2786518335342407, -1.1759684085845947, -1.0732851028442383, -0.9706017374992371, -0.8679183125495911, -0.7652349472045898, -0.6625515222549438, -0.5598681569099426, -0.4571847915649414, -0.3545013666152954, -0.2518179416656494, -0.1491345465183258, -0.04645116627216339, 0.05623221397399902, 0.15891560912132263, 0.26159900426864624, 0.36428236961364746, 0.46696579456329346, 0.5696491599082947, 0.6723325252532959, 0.7750159502029419, 0.8776993155479431, 0.9803826808929443, 1.0830661058425903, 1.1857495307922363, 1.2884328365325928, 1.3911162614822388, 1.4937996864318848, 1.5964829921722412, 1.6991664171218872, 1.8018498420715332, 1.9045331478118896, 2.007216453552246, 2.1098999977111816, 2.212583303451538, 2.3152666091918945, 2.41795015335083, 2.5206334590911865, 2.623316764831543, 2.7260003089904785, 2.828683614730835, 2.9313669204711914, 3.034050464630127]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 9.0, 7.0, 10.0, 22.0, 20.0, 29.0, 35.0, 60.0, 77.0, 126.0, 169.0, 253.0, 401.0, 579.0, 967.0, 1484.0, 2329.0, 3797.0, 6305.0, 10285.0, 18535.0, 34119.0, 65099.0, 132402.0, 281641.0, 586474.0, 970300.0, 954120.0, 568134.0, 274482.0, 133205.0, 66654.0, 35300.0, 19418.0, 11036.0, 6572.0, 3785.0, 2356.0, 1392.0, 902.0, 518.0, 368.0, 191.0, 127.0, 77.0, 47.0, 40.0, 8.0, 4.0, 11.0, 5.0, 3.0, 1.0, 3.0], "bins": [-6.375, -6.20263671875, -6.0302734375, -5.85791015625, -5.685546875, -5.51318359375, -5.3408203125, -5.16845703125, -4.99609375, -4.82373046875, -4.6513671875, -4.47900390625, -4.306640625, -4.13427734375, -3.9619140625, -3.78955078125, -3.6171875, -3.44482421875, -3.2724609375, -3.10009765625, -2.927734375, -2.75537109375, -2.5830078125, -2.41064453125, -2.23828125, -2.06591796875, -1.8935546875, -1.72119140625, -1.548828125, -1.37646484375, -1.2041015625, -1.03173828125, -0.859375, -0.68701171875, -0.5146484375, -0.34228515625, -0.169921875, 0.00244140625, 0.1748046875, 0.34716796875, 0.51953125, 0.69189453125, 0.8642578125, 1.03662109375, 1.208984375, 1.38134765625, 1.5537109375, 1.72607421875, 1.8984375, 2.07080078125, 2.2431640625, 2.41552734375, 2.587890625, 2.76025390625, 2.9326171875, 3.10498046875, 3.27734375, 3.44970703125, 3.6220703125, 3.79443359375, 3.966796875, 4.13916015625, 4.3115234375, 4.48388671875, 4.65625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 10.0, 14.0, 7.0, 16.0, 13.0, 15.0, 22.0, 20.0, 21.0, 25.0, 27.0, 24.0, 32.0, 39.0, 34.0, 41.0, 52.0, 49.0, 41.0, 43.0, 29.0, 53.0, 45.0, 40.0, 35.0, 38.0, 22.0, 33.0, 22.0, 13.0, 25.0, 12.0, 13.0, 11.0, 9.0, 8.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.052734375, -2.965850830078125, -2.87896728515625, -2.792083740234375, -2.7052001953125, -2.618316650390625, -2.53143310546875, -2.444549560546875, -2.357666015625, -2.270782470703125, -2.18389892578125, -2.097015380859375, -2.0101318359375, -1.923248291015625, -1.83636474609375, -1.749481201171875, -1.66259765625, -1.575714111328125, -1.48883056640625, -1.401947021484375, -1.3150634765625, -1.228179931640625, -1.14129638671875, -1.054412841796875, -0.967529296875, -0.880645751953125, -0.79376220703125, -0.706878662109375, -0.6199951171875, -0.533111572265625, -0.44622802734375, -0.359344482421875, -0.2724609375, -0.185577392578125, -0.09869384765625, -0.011810302734375, 0.0750732421875, 0.161956787109375, 0.24884033203125, 0.335723876953125, 0.422607421875, 0.509490966796875, 0.59637451171875, 0.683258056640625, 0.7701416015625, 0.857025146484375, 0.94390869140625, 1.030792236328125, 1.11767578125, 1.204559326171875, 1.29144287109375, 1.378326416015625, 1.4652099609375, 1.552093505859375, 1.63897705078125, 1.725860595703125, 1.812744140625, 1.899627685546875, 1.98651123046875, 2.073394775390625, 2.1602783203125, 2.247161865234375, 2.33404541015625, 2.420928955078125, 2.5078125]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 7.0, 10.0, 29.0, 34.0, 45.0, 74.0, 102.0, 171.0, 232.0, 376.0, 577.0, 905.0, 1361.0, 2128.0, 3283.0, 5203.0, 8395.0, 13655.0, 22872.0, 38670.0, 66692.0, 117931.0, 211257.0, 372398.0, 612727.0, 810640.0, 739668.0, 494160.0, 288017.0, 162159.0, 91197.0, 52108.0, 30061.0, 17832.0, 10897.0, 6661.0, 4154.0, 2649.0, 1666.0, 1098.0, 760.0, 476.0, 332.0, 202.0, 145.0, 99.0, 65.0, 50.0, 20.0, 20.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.390625, -5.220947265625, -5.05126953125, -4.881591796875, -4.7119140625, -4.542236328125, -4.37255859375, -4.202880859375, -4.033203125, -3.863525390625, -3.69384765625, -3.524169921875, -3.3544921875, -3.184814453125, -3.01513671875, -2.845458984375, -2.67578125, -2.506103515625, -2.33642578125, -2.166748046875, -1.9970703125, -1.827392578125, -1.65771484375, -1.488037109375, -1.318359375, -1.148681640625, -0.97900390625, -0.809326171875, -0.6396484375, -0.469970703125, -0.30029296875, -0.130615234375, 0.0390625, 0.208740234375, 0.37841796875, 0.548095703125, 0.7177734375, 0.887451171875, 1.05712890625, 1.226806640625, 1.396484375, 1.566162109375, 1.73583984375, 1.905517578125, 2.0751953125, 2.244873046875, 2.41455078125, 2.584228515625, 2.75390625, 2.923583984375, 3.09326171875, 3.262939453125, 3.4326171875, 3.602294921875, 3.77197265625, 3.941650390625, 4.111328125, 4.281005859375, 4.45068359375, 4.620361328125, 4.7900390625, 4.959716796875, 5.12939453125, 5.299072265625, 5.46875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 14.0, 13.0, 16.0, 13.0, 26.0, 35.0, 35.0, 30.0, 61.0, 75.0, 83.0, 98.0, 101.0, 149.0, 203.0, 193.0, 189.0, 214.0, 284.0, 264.0, 260.0, 254.0, 220.0, 190.0, 183.0, 157.0, 142.0, 109.0, 82.0, 71.0, 78.0, 50.0, 33.0, 33.0, 19.0, 16.0, 20.0, 12.0, 12.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.623046875, -1.569915771484375, -1.51678466796875, -1.463653564453125, -1.4105224609375, -1.357391357421875, -1.30426025390625, -1.251129150390625, -1.197998046875, -1.144866943359375, -1.09173583984375, -1.038604736328125, -0.9854736328125, -0.932342529296875, -0.87921142578125, -0.826080322265625, -0.77294921875, -0.719818115234375, -0.66668701171875, -0.613555908203125, -0.5604248046875, -0.507293701171875, -0.45416259765625, -0.401031494140625, -0.347900390625, -0.294769287109375, -0.24163818359375, -0.188507080078125, -0.1353759765625, -0.082244873046875, -0.02911376953125, 0.024017333984375, 0.0771484375, 0.130279541015625, 0.18341064453125, 0.236541748046875, 0.2896728515625, 0.342803955078125, 0.39593505859375, 0.449066162109375, 0.502197265625, 0.555328369140625, 0.60845947265625, 0.661590576171875, 0.7147216796875, 0.767852783203125, 0.82098388671875, 0.874114990234375, 0.92724609375, 0.980377197265625, 1.03350830078125, 1.086639404296875, 1.1397705078125, 1.192901611328125, 1.24603271484375, 1.299163818359375, 1.352294921875, 1.405426025390625, 1.45855712890625, 1.511688232421875, 1.5648193359375, 1.617950439453125, 1.67108154296875, 1.724212646484375, 1.77734375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 4.0, 4.0, 4.0, 9.0, 13.0, 18.0, 15.0, 16.0, 24.0, 32.0, 34.0, 32.0, 50.0, 59.0, 52.0, 45.0, 43.0, 51.0, 50.0, 43.0, 53.0, 55.0, 52.0, 42.0, 26.0, 29.0, 28.0, 23.0, 14.0, 12.0, 11.0, 10.0, 13.0, 7.0, 3.0, 9.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.2430925369262695, -5.061591148376465, -4.88008975982666, -4.6985883712768555, -4.517086982727051, -4.335585594177246, -4.154084205627441, -3.9725828170776367, -3.791081428527832, -3.6095800399780273, -3.4280786514282227, -3.246577262878418, -3.0650758743286133, -2.8835744857788086, -2.702073097229004, -2.520571708679199, -2.3390703201293945, -2.15756893157959, -1.9760675430297852, -1.7945661544799805, -1.6130647659301758, -1.431563377380371, -1.2500619888305664, -1.0685606002807617, -0.887059211730957, -0.7055578231811523, -0.5240564346313477, -0.34255504608154297, -0.16105365753173828, 0.020447731018066406, 0.2019491195678711, 0.3834505081176758, 0.5649518966674805, 0.7464532852172852, 0.9279546737670898, 1.1094560623168945, 1.2909574508666992, 1.472458839416504, 1.6539602279663086, 1.8354616165161133, 2.016963005065918, 2.1984643936157227, 2.3799657821655273, 2.561467170715332, 2.7429685592651367, 2.9244699478149414, 3.105971336364746, 3.287472724914551, 3.4689741134643555, 3.65047550201416, 3.831976890563965, 4.0134782791137695, 4.194979667663574, 4.376481056213379, 4.557982444763184, 4.739483833312988, 4.920985221862793, 5.102486610412598, 5.283987998962402, 5.465489387512207, 5.646990776062012, 5.828492164611816, 6.009993553161621, 6.191494941711426, 6.3729963302612305]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 6.0, 12.0, 11.0, 17.0, 15.0, 8.0, 17.0, 34.0, 20.0, 18.0, 29.0, 38.0, 38.0, 33.0, 46.0, 31.0, 29.0, 45.0, 45.0, 46.0, 41.0, 37.0, 50.0, 33.0, 38.0, 35.0, 31.0, 21.0, 33.0, 16.0, 13.0, 14.0, 17.0, 19.0, 2.0, 9.0, 9.0, 12.0, 5.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.1414031982421875, -4.029458999633789, -3.9175145626068115, -3.805570363998413, -3.6936261653900146, -3.581681728363037, -3.4697375297546387, -3.3577933311462402, -3.2458488941192627, -3.1339046955108643, -3.0219602584838867, -2.9100160598754883, -2.79807186126709, -2.6861274242401123, -2.574183225631714, -2.4622387886047363, -2.350294589996338, -2.2383503913879395, -2.126405954360962, -2.0144617557525635, -1.9025174379348755, -1.7905731201171875, -1.678628921508789, -1.566684603691101, -1.4547405242919922, -1.3427962064743042, -1.2308520078659058, -1.1189076900482178, -1.0069633722305298, -0.8950191140174866, -0.7830748558044434, -0.6711305379867554, -0.5591862201690674, -0.4472419321537018, -0.3352976441383362, -0.22335338592529297, -0.11140909790992737, 0.0005351901054382324, 0.11247944831848145, 0.22442376613616943, 0.33636802434921265, 0.44831231236457825, 0.5602566003799438, 0.6722008585929871, 0.7841451168060303, 0.8960894346237183, 1.0080337524414062, 1.1199779510498047, 1.2319222688674927, 1.3438665866851807, 1.455810785293579, 1.567755103111267, 1.679699420928955, 1.7916436195373535, 1.9035879373550415, 2.0155322551727295, 2.127476453781128, 2.2394206523895264, 2.351365089416504, 2.4633092880249023, 2.575253486633301, 2.6871979236602783, 2.7991421222686768, 2.9110865592956543, 3.0230307579040527]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 12.0, 5.0, 14.0, 19.0, 27.0, 49.0, 59.0, 70.0, 137.0, 221.0, 334.0, 484.0, 769.0, 1317.0, 2010.0, 3393.0, 5778.0, 9869.0, 16975.0, 30169.0, 54598.0, 96809.0, 159514.0, 208051.0, 183464.0, 118416.0, 67481.0, 37606.0, 21276.0, 12061.0, 6941.0, 4078.0, 2457.0, 1405.0, 969.0, 622.0, 348.0, 262.0, 151.0, 113.0, 76.0, 40.0, 23.0, 27.0, 12.0, 9.0, 15.0, 9.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.58251953125, -0.564697265625, -0.546875, -0.529052734375, -0.51123046875, -0.493408203125, -0.4755859375, -0.457763671875, -0.43994140625, -0.422119140625, -0.404296875, -0.386474609375, -0.36865234375, -0.350830078125, -0.3330078125, -0.315185546875, -0.29736328125, -0.279541015625, -0.26171875, -0.243896484375, -0.22607421875, -0.208251953125, -0.1904296875, -0.172607421875, -0.15478515625, -0.136962890625, -0.119140625, -0.101318359375, -0.08349609375, -0.065673828125, -0.0478515625, -0.030029296875, -0.01220703125, 0.005615234375, 0.0234375, 0.041259765625, 0.05908203125, 0.076904296875, 0.0947265625, 0.112548828125, 0.13037109375, 0.148193359375, 0.166015625, 0.183837890625, 0.20166015625, 0.219482421875, 0.2373046875, 0.255126953125, 0.27294921875, 0.290771484375, 0.30859375, 0.326416015625, 0.34423828125, 0.362060546875, 0.3798828125, 0.397705078125, 0.41552734375, 0.433349609375, 0.451171875, 0.468994140625, 0.48681640625, 0.504638671875, 0.5224609375, 0.540283203125, 0.55810546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 14.0, 17.0, 17.0, 31.0, 19.0, 27.0, 32.0, 33.0, 45.0, 48.0, 50.0, 46.0, 46.0, 49.0, 57.0, 58.0, 45.0, 50.0, 30.0, 43.0, 30.0, 26.0, 29.0, 22.0, 22.0, 22.0, 24.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.37109375, -4.2186279296875, -4.066162109375, -3.9136962890625, -3.76123046875, -3.6087646484375, -3.456298828125, -3.3038330078125, -3.1513671875, -2.9989013671875, -2.846435546875, -2.6939697265625, -2.54150390625, -2.3890380859375, -2.236572265625, -2.0841064453125, -1.931640625, -1.7791748046875, -1.626708984375, -1.4742431640625, -1.32177734375, -1.1693115234375, -1.016845703125, -0.8643798828125, -0.7119140625, -0.5594482421875, -0.406982421875, -0.2545166015625, -0.10205078125, 0.0504150390625, 0.202880859375, 0.3553466796875, 0.5078125, 0.6602783203125, 0.812744140625, 0.9652099609375, 1.11767578125, 1.2701416015625, 1.422607421875, 1.5750732421875, 1.7275390625, 1.8800048828125, 2.032470703125, 2.1849365234375, 2.33740234375, 2.4898681640625, 2.642333984375, 2.7947998046875, 2.947265625, 3.0997314453125, 3.252197265625, 3.4046630859375, 3.55712890625, 3.7095947265625, 3.862060546875, 4.0145263671875, 4.1669921875, 4.3194580078125, 4.471923828125, 4.6243896484375, 4.77685546875, 4.9293212890625, 5.081787109375, 5.2342529296875, 5.38671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 15.0, 14.0, 30.0, 32.0, 40.0, 106.0, 127.0, 168.0, 258.0, 441.0, 698.0, 1220.0, 2296.0, 4421.0, 9500.0, 22672.0, 109613.0, 828059.0, 39704.0, 14855.0, 6762.0, 3215.0, 1724.0, 953.0, 576.0, 368.0, 252.0, 129.0, 101.0, 63.0, 46.0, 31.0, 20.0, 6.0, 14.0, 7.0, 3.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7646484375, -1.7063446044921875, -1.648040771484375, -1.5897369384765625, -1.53143310546875, -1.4731292724609375, -1.414825439453125, -1.3565216064453125, -1.2982177734375, -1.2399139404296875, -1.181610107421875, -1.1233062744140625, -1.06500244140625, -1.0066986083984375, -0.948394775390625, -0.8900909423828125, -0.831787109375, -0.7734832763671875, -0.715179443359375, -0.6568756103515625, -0.59857177734375, -0.5402679443359375, -0.481964111328125, -0.4236602783203125, -0.3653564453125, -0.3070526123046875, -0.248748779296875, -0.1904449462890625, -0.13214111328125, -0.0738372802734375, -0.015533447265625, 0.0427703857421875, 0.10107421875, 0.1593780517578125, 0.217681884765625, 0.2759857177734375, 0.33428955078125, 0.3925933837890625, 0.450897216796875, 0.5092010498046875, 0.5675048828125, 0.6258087158203125, 0.684112548828125, 0.7424163818359375, 0.80072021484375, 0.8590240478515625, 0.917327880859375, 0.9756317138671875, 1.033935546875, 1.0922393798828125, 1.150543212890625, 1.2088470458984375, 1.26715087890625, 1.3254547119140625, 1.383758544921875, 1.4420623779296875, 1.5003662109375, 1.5586700439453125, 1.616973876953125, 1.6752777099609375, 1.73358154296875, 1.7918853759765625, 1.850189208984375, 1.9084930419921875, 1.966796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 7.0, 8.0, 15.0, 13.0, 19.0, 14.0, 19.0, 31.0, 19.0, 32.0, 40.0, 39.0, 51.0, 40.0, 36.0, 42.0, 51.0, 40.0, 46.0, 45.0, 45.0, 43.0, 39.0, 28.0, 22.0, 27.0, 34.0, 25.0, 20.0, 19.0, 13.0, 14.0, 12.0, 8.0, 7.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.3424072265625, -2.251220703125, -2.1600341796875, -2.06884765625, -1.9776611328125, -1.886474609375, -1.7952880859375, -1.7041015625, -1.6129150390625, -1.521728515625, -1.4305419921875, -1.33935546875, -1.2481689453125, -1.156982421875, -1.0657958984375, -0.974609375, -0.8834228515625, -0.792236328125, -0.7010498046875, -0.60986328125, -0.5186767578125, -0.427490234375, -0.3363037109375, -0.2451171875, -0.1539306640625, -0.062744140625, 0.0284423828125, 0.11962890625, 0.2108154296875, 0.302001953125, 0.3931884765625, 0.484375, 0.5755615234375, 0.666748046875, 0.7579345703125, 0.84912109375, 0.9403076171875, 1.031494140625, 1.1226806640625, 1.2138671875, 1.3050537109375, 1.396240234375, 1.4874267578125, 1.57861328125, 1.6697998046875, 1.760986328125, 1.8521728515625, 1.943359375, 2.0345458984375, 2.125732421875, 2.2169189453125, 2.30810546875, 2.3992919921875, 2.490478515625, 2.5816650390625, 2.6728515625, 2.7640380859375, 2.855224609375, 2.9464111328125, 3.03759765625, 3.1287841796875, 3.219970703125, 3.3111572265625, 3.40234375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 4.0, 8.0, 2.0, 11.0, 8.0, 12.0, 16.0, 28.0, 41.0, 48.0, 50.0, 96.0, 131.0, 194.0, 333.0, 475.0, 793.0, 1296.0, 2049.0, 3709.0, 6809.0, 13414.0, 30020.0, 809480.0, 131997.0, 23126.0, 10830.0, 5520.0, 3199.0, 1736.0, 1107.0, 691.0, 457.0, 269.0, 210.0, 116.0, 68.0, 45.0, 50.0, 29.0, 25.0, 12.0, 15.0, 10.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.318115234375, -0.30626678466796875, -0.2944183349609375, -0.28256988525390625, -0.270721435546875, -0.25887298583984375, -0.2470245361328125, -0.23517608642578125, -0.22332763671875, -0.21147918701171875, -0.1996307373046875, -0.18778228759765625, -0.175933837890625, -0.16408538818359375, -0.1522369384765625, -0.14038848876953125, -0.1285400390625, -0.11669158935546875, -0.1048431396484375, -0.09299468994140625, -0.081146240234375, -0.06929779052734375, -0.0574493408203125, -0.04560089111328125, -0.03375244140625, -0.02190399169921875, -0.0100555419921875, 0.00179290771484375, 0.013641357421875, 0.02548980712890625, 0.0373382568359375, 0.04918670654296875, 0.06103515625, 0.07288360595703125, 0.0847320556640625, 0.09658050537109375, 0.108428955078125, 0.12027740478515625, 0.1321258544921875, 0.14397430419921875, 0.15582275390625, 0.16767120361328125, 0.1795196533203125, 0.19136810302734375, 0.203216552734375, 0.21506500244140625, 0.2269134521484375, 0.23876190185546875, 0.2506103515625, 0.26245880126953125, 0.2743072509765625, 0.28615570068359375, 0.298004150390625, 0.30985260009765625, 0.3217010498046875, 0.33354949951171875, 0.34539794921875, 0.35724639892578125, 0.3690948486328125, 0.38094329833984375, 0.392791748046875, 0.40464019775390625, 0.4164886474609375, 0.42833709716796875, 0.440185546875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 12.0, 7.0, 13.0, 18.0, 16.0, 26.0, 21.0, 30.0, 19.0, 43.0, 30.0, 45.0, 41.0, 53.0, 60.0, 38.0, 54.0, 58.0, 58.0, 45.0, 45.0, 36.0, 21.0, 39.0, 24.0, 32.0, 17.0, 22.0, 13.0, 9.0, 10.0, 13.0, 4.0, 6.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2067298889160156e-05, -3.103725612163544e-05, -3.0007213354110718e-05, -2.8977170586586e-05, -2.794712781906128e-05, -2.691708505153656e-05, -2.588704228401184e-05, -2.485699951648712e-05, -2.3826956748962402e-05, -2.2796913981437683e-05, -2.1766871213912964e-05, -2.0736828446388245e-05, -1.9706785678863525e-05, -1.8676742911338806e-05, -1.7646700143814087e-05, -1.6616657376289368e-05, -1.558661460876465e-05, -1.455657184123993e-05, -1.352652907371521e-05, -1.249648630619049e-05, -1.1466443538665771e-05, -1.0436400771141052e-05, -9.406358003616333e-06, -8.376315236091614e-06, -7.3462724685668945e-06, -6.316229701042175e-06, -5.286186933517456e-06, -4.256144165992737e-06, -3.2261013984680176e-06, -2.1960586309432983e-06, -1.166015863418579e-06, -1.3597309589385986e-07, 8.940696716308594e-07, 1.9241124391555786e-06, 2.954155206680298e-06, 3.984197974205017e-06, 5.014240741729736e-06, 6.0442835092544556e-06, 7.074326276779175e-06, 8.104369044303894e-06, 9.134411811828613e-06, 1.0164454579353333e-05, 1.1194497346878052e-05, 1.2224540114402771e-05, 1.325458288192749e-05, 1.428462564945221e-05, 1.531466841697693e-05, 1.6344711184501648e-05, 1.7374753952026367e-05, 1.8404796719551086e-05, 1.9434839487075806e-05, 2.0464882254600525e-05, 2.1494925022125244e-05, 2.2524967789649963e-05, 2.3555010557174683e-05, 2.4585053324699402e-05, 2.561509609222412e-05, 2.664513885974884e-05, 2.767518162727356e-05, 2.870522439479828e-05, 2.9735267162322998e-05, 3.076530992984772e-05, 3.1795352697372437e-05, 3.2825395464897156e-05, 3.3855438232421875e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 19.0, 22.0, 29.0, 27.0, 49.0, 53.0, 98.0, 117.0, 154.0, 238.0, 352.0, 536.0, 825.0, 1222.0, 2055.0, 3467.0, 6248.0, 11312.0, 21582.0, 43809.0, 88449.0, 170722.0, 255350.0, 209157.0, 114180.0, 56987.0, 28100.0, 14410.0, 7706.0, 4267.0, 2555.0, 1561.0, 928.0, 605.0, 404.0, 252.0, 189.0, 122.0, 77.0, 67.0, 45.0, 43.0, 27.0, 26.0, 25.0, 16.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 4.0], "bins": [-0.1854248046875, -0.17957305908203125, -0.1737213134765625, -0.16786956787109375, -0.162017822265625, -0.15616607666015625, -0.1503143310546875, -0.14446258544921875, -0.13861083984375, -0.13275909423828125, -0.1269073486328125, -0.12105560302734375, -0.115203857421875, -0.10935211181640625, -0.1035003662109375, -0.09764862060546875, -0.091796875, -0.08594512939453125, -0.0800933837890625, -0.07424163818359375, -0.068389892578125, -0.06253814697265625, -0.0566864013671875, -0.05083465576171875, -0.04498291015625, -0.03913116455078125, -0.0332794189453125, -0.02742767333984375, -0.021575927734375, -0.01572418212890625, -0.0098724365234375, -0.00402069091796875, 0.0018310546875, 0.00768280029296875, 0.0135345458984375, 0.01938629150390625, 0.025238037109375, 0.03108978271484375, 0.0369415283203125, 0.04279327392578125, 0.04864501953125, 0.05449676513671875, 0.0603485107421875, 0.06620025634765625, 0.072052001953125, 0.07790374755859375, 0.0837554931640625, 0.08960723876953125, 0.095458984375, 0.10131072998046875, 0.1071624755859375, 0.11301422119140625, 0.118865966796875, 0.12471771240234375, 0.1305694580078125, 0.13642120361328125, 0.14227294921875, 0.14812469482421875, 0.1539764404296875, 0.15982818603515625, 0.165679931640625, 0.17153167724609375, 0.1773834228515625, 0.18323516845703125, 0.1890869140625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 7.0, 3.0, 5.0, 13.0, 14.0, 17.0, 12.0, 22.0, 26.0, 24.0, 33.0, 25.0, 48.0, 44.0, 55.0, 56.0, 60.0, 73.0, 53.0, 60.0, 54.0, 28.0, 49.0, 36.0, 26.0, 27.0, 17.0, 18.0, 14.0, 15.0, 10.0, 4.0, 8.0, 4.0, 4.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.03509521484375, -0.033934593200683594, -0.03277397155761719, -0.03161334991455078, -0.030452728271484375, -0.02929210662841797, -0.028131484985351562, -0.026970863342285156, -0.02581024169921875, -0.024649620056152344, -0.023488998413085938, -0.02232837677001953, -0.021167755126953125, -0.02000713348388672, -0.018846511840820312, -0.017685890197753906, -0.0165252685546875, -0.015364646911621094, -0.014204025268554688, -0.013043403625488281, -0.011882781982421875, -0.010722160339355469, -0.009561538696289062, -0.008400917053222656, -0.00724029541015625, -0.006079673767089844, -0.0049190521240234375, -0.0037584304809570312, -0.002597808837890625, -0.0014371871948242188, -0.0002765655517578125, 0.0008840560913085938, 0.002044677734375, 0.0032052993774414062, 0.0043659210205078125, 0.005526542663574219, 0.006687164306640625, 0.007847785949707031, 0.009008407592773438, 0.010169029235839844, 0.01132965087890625, 0.012490272521972656, 0.013650894165039062, 0.014811515808105469, 0.015972137451171875, 0.01713275909423828, 0.018293380737304688, 0.019454002380371094, 0.0206146240234375, 0.021775245666503906, 0.022935867309570312, 0.02409648895263672, 0.025257110595703125, 0.02641773223876953, 0.027578353881835938, 0.028738975524902344, 0.02989959716796875, 0.031060218811035156, 0.03222084045410156, 0.03338146209716797, 0.034542083740234375, 0.03570270538330078, 0.03686332702636719, 0.038023948669433594, 0.0391845703125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 6.0, 3.0, 11.0, 14.0, 16.0, 14.0, 17.0, 27.0, 28.0, 43.0, 31.0, 51.0, 60.0, 55.0, 45.0, 44.0, 56.0, 44.0, 46.0, 60.0, 49.0, 45.0, 43.0, 32.0, 23.0, 28.0, 16.0, 14.0, 13.0, 12.0, 13.0, 8.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.221388816833496, -5.038038730621338, -4.85468864440918, -4.6713385581970215, -4.487988471984863, -4.304637908935547, -4.121288299560547, -3.9379377365112305, -3.7545876502990723, -3.571237564086914, -3.387887477874756, -3.2045373916625977, -3.0211870670318604, -2.837836980819702, -2.654486894607544, -2.4711365699768066, -2.2877867221832275, -2.1044366359710693, -1.9210864305496216, -1.7377363443374634, -1.5543861389160156, -1.3710360527038574, -1.1876859664916992, -1.0043357610702515, -0.8209856748580933, -0.6376355290412903, -0.4542854130268097, -0.2709352970123291, -0.08758515119552612, 0.09576499462127686, 0.27911508083343506, 0.4624652862548828, 0.645815372467041, 0.829165518283844, 1.012515664100647, 1.1958657503128052, 1.379215955734253, 1.5625660419464111, 1.7459161281585693, 1.929266333580017, 2.112616539001465, 2.295966625213623, 2.4793167114257812, 2.6626667976379395, 2.8460171222686768, 3.029367208480835, 3.212717294692993, 3.3960676193237305, 3.5794174671173096, 3.7627675533294678, 3.946117639541626, 4.129467964172363, 4.3128180503845215, 4.49616813659668, 4.679518222808838, 4.862868309020996, 5.046218395233154, 5.2295684814453125, 5.412918567657471, 5.596268653869629, 5.779618740081787, 5.962968826293945, 6.146319389343262, 6.32966947555542, 6.513019561767578]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 11.0, 17.0, 11.0, 14.0, 15.0, 31.0, 22.0, 18.0, 29.0, 39.0, 38.0, 36.0, 43.0, 29.0, 32.0, 45.0, 45.0, 44.0, 41.0, 36.0, 54.0, 34.0, 34.0, 33.0, 34.0, 21.0, 30.0, 19.0, 12.0, 15.0, 17.0, 18.0, 3.0, 10.0, 7.0, 11.0, 9.0, 7.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.09265661239624, -3.9814138412475586, -3.870170831680298, -3.758928060531616, -3.6476850509643555, -3.536442279815674, -3.425199508666992, -3.3139567375183105, -3.20271372795105, -3.091470956802368, -2.9802279472351074, -2.868985176086426, -2.757742404937744, -2.6464993953704834, -2.5352566242218018, -2.424013614654541, -2.3127708435058594, -2.2015280723571777, -2.090285062789917, -1.9790422916412354, -1.8677994012832642, -1.756556510925293, -1.6453137397766113, -1.5340708494186401, -1.422827959060669, -1.3115850687026978, -1.2003421783447266, -1.089099407196045, -0.9778565168380737, -0.8666136264801025, -0.7553707957267761, -0.6441279649734497, -0.5328850746154785, -0.4216422140598297, -0.3103993535041809, -0.1991564929485321, -0.0879136323928833, 0.02332925796508789, 0.1345720887184143, 0.24581491947174072, 0.3570578098297119, 0.4683006703853607, 0.5795435309410095, 0.6907863616943359, 0.8020292520523071, 0.9132721424102783, 1.02451491355896, 1.1357578039169312, 1.2470006942749023, 1.3582435846328735, 1.4694864749908447, 1.5807292461395264, 1.6919721364974976, 1.8032150268554688, 1.9144577980041504, 2.025700569152832, 2.1369435787200928, 2.2481863498687744, 2.359429359436035, 2.470672130584717, 2.5819149017333984, 2.693157911300659, 2.804400682449341, 2.9156436920166016, 3.026886463165283]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 14.0, 15.0, 26.0, 43.0, 64.0, 86.0, 149.0, 210.0, 388.0, 666.0, 1034.0, 1773.0, 3069.0, 5580.0, 10332.0, 19473.0, 36804.0, 66839.0, 112644.0, 165928.0, 190714.0, 167139.0, 115680.0, 68165.0, 37485.0, 20077.0, 10823.0, 5652.0, 3185.0, 1798.0, 1030.0, 626.0, 379.0, 244.0, 139.0, 78.0, 56.0, 60.0, 30.0, 17.0, 8.0, 9.0, 6.0, 4.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2578125, -5.0797119140625, -4.901611328125, -4.7235107421875, -4.54541015625, -4.3673095703125, -4.189208984375, -4.0111083984375, -3.8330078125, -3.6549072265625, -3.476806640625, -3.2987060546875, -3.12060546875, -2.9425048828125, -2.764404296875, -2.5863037109375, -2.408203125, -2.2301025390625, -2.052001953125, -1.8739013671875, -1.69580078125, -1.5177001953125, -1.339599609375, -1.1614990234375, -0.9833984375, -0.8052978515625, -0.627197265625, -0.4490966796875, -0.27099609375, -0.0928955078125, 0.085205078125, 0.2633056640625, 0.44140625, 0.6195068359375, 0.797607421875, 0.9757080078125, 1.15380859375, 1.3319091796875, 1.510009765625, 1.6881103515625, 1.8662109375, 2.0443115234375, 2.222412109375, 2.4005126953125, 2.57861328125, 2.7567138671875, 2.934814453125, 3.1129150390625, 3.291015625, 3.4691162109375, 3.647216796875, 3.8253173828125, 4.00341796875, 4.1815185546875, 4.359619140625, 4.5377197265625, 4.7158203125, 4.8939208984375, 5.072021484375, 5.2501220703125, 5.42822265625, 5.6063232421875, 5.784423828125, 5.9625244140625, 6.140625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 11.0, 4.0, 7.0, 14.0, 10.0, 21.0, 29.0, 20.0, 21.0, 21.0, 30.0, 38.0, 43.0, 41.0, 40.0, 55.0, 46.0, 51.0, 61.0, 41.0, 59.0, 50.0, 42.0, 47.0, 33.0, 32.0, 24.0, 23.0, 15.0, 15.0, 14.0, 6.0, 12.0, 8.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453125, -4.30718994140625, -4.1612548828125, -4.01531982421875, -3.869384765625, -3.72344970703125, -3.5775146484375, -3.43157958984375, -3.28564453125, -3.13970947265625, -2.9937744140625, -2.84783935546875, -2.701904296875, -2.55596923828125, -2.4100341796875, -2.26409912109375, -2.1181640625, -1.97222900390625, -1.8262939453125, -1.68035888671875, -1.534423828125, -1.38848876953125, -1.2425537109375, -1.09661865234375, -0.95068359375, -0.80474853515625, -0.6588134765625, -0.51287841796875, -0.366943359375, -0.22100830078125, -0.0750732421875, 0.07086181640625, 0.216796875, 0.36273193359375, 0.5086669921875, 0.65460205078125, 0.800537109375, 0.94647216796875, 1.0924072265625, 1.23834228515625, 1.38427734375, 1.53021240234375, 1.6761474609375, 1.82208251953125, 1.968017578125, 2.11395263671875, 2.2598876953125, 2.40582275390625, 2.5517578125, 2.69769287109375, 2.8436279296875, 2.98956298828125, 3.135498046875, 3.28143310546875, 3.4273681640625, 3.57330322265625, 3.71923828125, 3.86517333984375, 4.0111083984375, 4.15704345703125, 4.302978515625, 4.44891357421875, 4.5948486328125, 4.74078369140625, 4.88671875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 13.0, 12.0, 12.0, 17.0, 36.0, 33.0, 57.0, 79.0, 103.0, 196.0, 287.0, 405.0, 625.0, 1023.0, 1771.0, 3011.0, 5222.0, 9895.0, 17824.0, 34005.0, 62454.0, 107475.0, 161693.0, 193809.0, 173018.0, 119502.0, 70579.0, 38764.0, 20876.0, 11102.0, 6040.0, 3415.0, 1926.0, 1179.0, 701.0, 470.0, 318.0, 195.0, 133.0, 86.0, 56.0, 39.0, 38.0, 22.0, 13.0, 9.0, 4.0, 6.0, 6.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.86328125, -5.67779541015625, -5.4923095703125, -5.30682373046875, -5.121337890625, -4.93585205078125, -4.7503662109375, -4.56488037109375, -4.37939453125, -4.19390869140625, -4.0084228515625, -3.82293701171875, -3.637451171875, -3.45196533203125, -3.2664794921875, -3.08099365234375, -2.8955078125, -2.71002197265625, -2.5245361328125, -2.33905029296875, -2.153564453125, -1.96807861328125, -1.7825927734375, -1.59710693359375, -1.41162109375, -1.22613525390625, -1.0406494140625, -0.85516357421875, -0.669677734375, -0.48419189453125, -0.2987060546875, -0.11322021484375, 0.072265625, 0.25775146484375, 0.4432373046875, 0.62872314453125, 0.814208984375, 0.99969482421875, 1.1851806640625, 1.37066650390625, 1.55615234375, 1.74163818359375, 1.9271240234375, 2.11260986328125, 2.298095703125, 2.48358154296875, 2.6690673828125, 2.85455322265625, 3.0400390625, 3.22552490234375, 3.4110107421875, 3.59649658203125, 3.781982421875, 3.96746826171875, 4.1529541015625, 4.33843994140625, 4.52392578125, 4.70941162109375, 4.8948974609375, 5.08038330078125, 5.265869140625, 5.45135498046875, 5.6368408203125, 5.82232666015625, 6.0078125]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 4.0, 10.0, 4.0, 12.0, 13.0, 9.0, 19.0, 10.0, 15.0, 18.0, 31.0, 23.0, 33.0, 36.0, 43.0, 42.0, 47.0, 33.0, 43.0, 45.0, 34.0, 37.0, 41.0, 37.0, 44.0, 33.0, 30.0, 23.0, 35.0, 27.0, 23.0, 24.0, 16.0, 20.0, 20.0, 10.0, 15.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.111328125, -2.038421630859375, -1.96551513671875, -1.892608642578125, -1.8197021484375, -1.746795654296875, -1.67388916015625, -1.600982666015625, -1.528076171875, -1.455169677734375, -1.38226318359375, -1.309356689453125, -1.2364501953125, -1.163543701171875, -1.09063720703125, -1.017730712890625, -0.94482421875, -0.871917724609375, -0.79901123046875, -0.726104736328125, -0.6531982421875, -0.580291748046875, -0.50738525390625, -0.434478759765625, -0.361572265625, -0.288665771484375, -0.21575927734375, -0.142852783203125, -0.0699462890625, 0.002960205078125, 0.07586669921875, 0.148773193359375, 0.2216796875, 0.294586181640625, 0.36749267578125, 0.440399169921875, 0.5133056640625, 0.586212158203125, 0.65911865234375, 0.732025146484375, 0.804931640625, 0.877838134765625, 0.95074462890625, 1.023651123046875, 1.0965576171875, 1.169464111328125, 1.24237060546875, 1.315277099609375, 1.38818359375, 1.461090087890625, 1.53399658203125, 1.606903076171875, 1.6798095703125, 1.752716064453125, 1.82562255859375, 1.898529052734375, 1.971435546875, 2.044342041015625, 2.11724853515625, 2.190155029296875, 2.2630615234375, 2.335968017578125, 2.40887451171875, 2.481781005859375, 2.5546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 6.0, 4.0, 4.0, 9.0, 15.0, 19.0, 30.0, 41.0, 49.0, 97.0, 105.0, 151.0, 219.0, 380.0, 521.0, 824.0, 1320.0, 1920.0, 3121.0, 4948.0, 7873.0, 12922.0, 21075.0, 33874.0, 54983.0, 84998.0, 120953.0, 149523.0, 154529.0, 130626.0, 95465.0, 63379.0, 39858.0, 24656.0, 14939.0, 9342.0, 5648.0, 3578.0, 2248.0, 1489.0, 951.0, 647.0, 403.0, 258.0, 175.0, 116.0, 92.0, 61.0, 29.0, 37.0, 16.0, 11.0, 10.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0], "bins": [-2.416015625, -2.338470458984375, -2.26092529296875, -2.183380126953125, -2.1058349609375, -2.028289794921875, -1.95074462890625, -1.873199462890625, -1.795654296875, -1.718109130859375, -1.64056396484375, -1.563018798828125, -1.4854736328125, -1.407928466796875, -1.33038330078125, -1.252838134765625, -1.17529296875, -1.097747802734375, -1.02020263671875, -0.942657470703125, -0.8651123046875, -0.787567138671875, -0.71002197265625, -0.632476806640625, -0.554931640625, -0.477386474609375, -0.39984130859375, -0.322296142578125, -0.2447509765625, -0.167205810546875, -0.08966064453125, -0.012115478515625, 0.0654296875, 0.142974853515625, 0.22052001953125, 0.298065185546875, 0.3756103515625, 0.453155517578125, 0.53070068359375, 0.608245849609375, 0.685791015625, 0.763336181640625, 0.84088134765625, 0.918426513671875, 0.9959716796875, 1.073516845703125, 1.15106201171875, 1.228607177734375, 1.30615234375, 1.383697509765625, 1.46124267578125, 1.538787841796875, 1.6163330078125, 1.693878173828125, 1.77142333984375, 1.848968505859375, 1.926513671875, 2.004058837890625, 2.08160400390625, 2.159149169921875, 2.2366943359375, 2.314239501953125, 2.39178466796875, 2.469329833984375, 2.546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 10.0, 7.0, 3.0, 7.0, 27.0, 8.0, 19.0, 19.0, 26.0, 33.0, 38.0, 53.0, 46.0, 32.0, 55.0, 73.0, 52.0, 71.0, 59.0, 59.0, 60.0, 44.0, 42.0, 24.0, 27.0, 28.0, 19.0, 12.0, 9.0, 11.0, 3.0, 4.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003180503845214844, -0.0003085136413574219, -0.0002989768981933594, -0.0002894401550292969, -0.0002799034118652344, -0.0002703666687011719, -0.0002608299255371094, -0.0002512931823730469, -0.00024175643920898438, -0.00023221969604492188, -0.00022268295288085938, -0.00021314620971679688, -0.00020360946655273438, -0.00019407272338867188, -0.00018453598022460938, -0.00017499923706054688, -0.00016546249389648438, -0.00015592575073242188, -0.00014638900756835938, -0.00013685226440429688, -0.00012731552124023438, -0.00011777877807617188, -0.00010824203491210938, -9.870529174804688e-05, -8.916854858398438e-05, -7.963180541992188e-05, -7.009506225585938e-05, -6.0558319091796875e-05, -5.1021575927734375e-05, -4.1484832763671875e-05, -3.1948089599609375e-05, -2.2411346435546875e-05, -1.2874603271484375e-05, -3.337860107421875e-06, 6.198883056640625e-06, 1.5735626220703125e-05, 2.5272369384765625e-05, 3.4809112548828125e-05, 4.4345855712890625e-05, 5.3882598876953125e-05, 6.341934204101562e-05, 7.295608520507812e-05, 8.249282836914062e-05, 9.202957153320312e-05, 0.00010156631469726562, 0.00011110305786132812, 0.00012063980102539062, 0.00013017654418945312, 0.00013971328735351562, 0.00014925003051757812, 0.00015878677368164062, 0.00016832351684570312, 0.00017786026000976562, 0.00018739700317382812, 0.00019693374633789062, 0.00020647048950195312, 0.00021600723266601562, 0.00022554397583007812, 0.00023508071899414062, 0.0002446174621582031, 0.0002541542053222656, 0.0002636909484863281, 0.0002732276916503906, 0.0002827644348144531, 0.0002923011779785156]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 4.0, 9.0, 9.0, 13.0, 20.0, 29.0, 43.0, 50.0, 76.0, 117.0, 158.0, 252.0, 329.0, 542.0, 732.0, 1074.0, 1620.0, 2381.0, 3554.0, 5402.0, 8293.0, 12755.0, 20154.0, 31505.0, 48395.0, 72817.0, 102931.0, 130820.0, 143108.0, 133325.0, 106192.0, 76229.0, 50986.0, 33601.0, 21440.0, 13552.0, 8722.0, 5735.0, 3718.0, 2596.0, 1653.0, 1149.0, 764.0, 535.0, 368.0, 250.0, 177.0, 119.0, 85.0, 58.0, 33.0, 35.0, 24.0, 8.0, 11.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.0606689453125, -1.988525390625, -1.9163818359375, -1.84423828125, -1.7720947265625, -1.699951171875, -1.6278076171875, -1.5556640625, -1.4835205078125, -1.411376953125, -1.3392333984375, -1.26708984375, -1.1949462890625, -1.122802734375, -1.0506591796875, -0.978515625, -0.9063720703125, -0.834228515625, -0.7620849609375, -0.68994140625, -0.6177978515625, -0.545654296875, -0.4735107421875, -0.4013671875, -0.3292236328125, -0.257080078125, -0.1849365234375, -0.11279296875, -0.0406494140625, 0.031494140625, 0.1036376953125, 0.17578125, 0.2479248046875, 0.320068359375, 0.3922119140625, 0.46435546875, 0.5364990234375, 0.608642578125, 0.6807861328125, 0.7529296875, 0.8250732421875, 0.897216796875, 0.9693603515625, 1.04150390625, 1.1136474609375, 1.185791015625, 1.2579345703125, 1.330078125, 1.4022216796875, 1.474365234375, 1.5465087890625, 1.61865234375, 1.6907958984375, 1.762939453125, 1.8350830078125, 1.9072265625, 1.9793701171875, 2.051513671875, 2.1236572265625, 2.19580078125, 2.2679443359375, 2.340087890625, 2.4122314453125, 2.484375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 4.0, 7.0, 7.0, 5.0, 9.0, 7.0, 8.0, 6.0, 20.0, 25.0, 31.0, 15.0, 28.0, 25.0, 35.0, 47.0, 43.0, 40.0, 46.0, 52.0, 55.0, 52.0, 47.0, 58.0, 51.0, 37.0, 36.0, 31.0, 32.0, 26.0, 19.0, 15.0, 16.0, 16.0, 10.0, 7.0, 5.0, 10.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.71044921875, -0.686431884765625, -0.66241455078125, -0.638397216796875, -0.6143798828125, -0.590362548828125, -0.56634521484375, -0.542327880859375, -0.518310546875, -0.494293212890625, -0.47027587890625, -0.446258544921875, -0.4222412109375, -0.398223876953125, -0.37420654296875, -0.350189208984375, -0.326171875, -0.302154541015625, -0.27813720703125, -0.254119873046875, -0.2301025390625, -0.206085205078125, -0.18206787109375, -0.158050537109375, -0.134033203125, -0.110015869140625, -0.08599853515625, -0.061981201171875, -0.0379638671875, -0.013946533203125, 0.01007080078125, 0.034088134765625, 0.05810546875, 0.082122802734375, 0.10614013671875, 0.130157470703125, 0.1541748046875, 0.178192138671875, 0.20220947265625, 0.226226806640625, 0.250244140625, 0.274261474609375, 0.29827880859375, 0.322296142578125, 0.3463134765625, 0.370330810546875, 0.39434814453125, 0.418365478515625, 0.4423828125, 0.466400146484375, 0.49041748046875, 0.514434814453125, 0.5384521484375, 0.562469482421875, 0.58648681640625, 0.610504150390625, 0.634521484375, 0.658538818359375, 0.68255615234375, 0.706573486328125, 0.7305908203125, 0.754608154296875, 0.77862548828125, 0.802642822265625, 0.82666015625]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 6.0, 7.0, 4.0, 2.0, 10.0, 10.0, 15.0, 20.0, 19.0, 21.0, 19.0, 27.0, 44.0, 30.0, 38.0, 36.0, 50.0, 59.0, 59.0, 51.0, 50.0, 51.0, 53.0, 51.0, 29.0, 39.0, 38.0, 29.0, 28.0, 20.0, 22.0, 14.0, 11.0, 6.0, 10.0, 10.0, 5.0, 8.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.928782939910889, -4.745309829711914, -4.5618367195129395, -4.378363609313965, -4.19489049911499, -4.011417388916016, -3.827944040298462, -3.6444709300994873, -3.4609978199005127, -3.277524709701538, -3.0940515995025635, -2.9105782508850098, -2.727105140686035, -2.5436320304870605, -2.360158920288086, -2.1766858100891113, -1.9932126998901367, -1.809739589691162, -1.6262664794921875, -1.4427932500839233, -1.2593201398849487, -1.0758470296859741, -0.89237380027771, -0.7089006900787354, -0.5254275798797607, -0.34195443987846375, -0.15848129987716675, 0.024991869926452637, 0.20846498012542725, 0.39193809032440186, 0.575411319732666, 0.7588844299316406, 0.9423580169677734, 1.125831127166748, 1.3093042373657227, 1.4927774667739868, 1.6762505769729614, 1.859723687171936, 2.0431969165802, 2.226670026779175, 2.4101431369781494, 2.593616247177124, 2.7770893573760986, 2.9605627059936523, 3.144035816192627, 3.3275089263916016, 3.510982036590576, 3.694455146789551, 3.8779282569885254, 4.0614013671875, 4.244874477386475, 4.428347587585449, 4.611820697784424, 4.795293807983398, 4.978767395019531, 5.162240028381348, 5.3457136154174805, 5.529186725616455, 5.71265983581543, 5.896132946014404, 6.079606056213379, 6.2630791664123535, 6.446552276611328, 6.630025863647461, 6.813498497009277]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 14.0, 16.0, 13.0, 15.0, 15.0, 19.0, 22.0, 22.0, 20.0, 34.0, 28.0, 40.0, 36.0, 26.0, 35.0, 54.0, 39.0, 50.0, 44.0, 42.0, 44.0, 35.0, 29.0, 24.0, 31.0, 32.0, 22.0, 17.0, 18.0, 24.0, 16.0, 12.0, 16.0, 12.0, 16.0, 6.0, 5.0, 3.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0], "bins": [-3.8244690895080566, -3.712723970413208, -3.6009790897369385, -3.48923397064209, -3.3774890899658203, -3.2657439708709717, -3.153998851776123, -3.0422539710998535, -2.930508852005005, -2.8187637329101562, -2.7070188522338867, -2.595273733139038, -2.4835286140441895, -2.37178373336792, -2.2600386142730713, -2.1482934951782227, -2.036548614501953, -1.924803614616394, -1.813058614730835, -1.7013134956359863, -1.5895684957504272, -1.4778234958648682, -1.3660783767700195, -1.2543333768844604, -1.1425883769989014, -1.0308433771133423, -0.9190983176231384, -0.8073532581329346, -0.6956082582473755, -0.5838632583618164, -0.47211819887161255, -0.3603731393814087, -0.2486283779144287, -0.13688334822654724, -0.02513831853866577, 0.0866067111492157, 0.19835174083709717, 0.31009674072265625, 0.4218418002128601, 0.533586859703064, 0.645331859588623, 0.7570768594741821, 0.868821918964386, 0.9805669784545898, 1.092311978340149, 1.204056978225708, 1.3158020973205566, 1.4275470972061157, 1.5392920970916748, 1.6510370969772339, 1.762782096862793, 1.8745272159576416, 1.9862722158432007, 2.0980172157287598, 2.2097623348236084, 2.321507453918457, 2.4332523345947266, 2.544997453689575, 2.6567423343658447, 2.7684874534606934, 2.880232334136963, 2.9919774532318115, 3.10372257232666, 3.2154674530029297, 3.3272125720977783]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 22.0, 22.0, 39.0, 53.0, 64.0, 109.0, 174.0, 267.0, 385.0, 587.0, 891.0, 1554.0, 2707.0, 4293.0, 7585.0, 13128.0, 24379.0, 45902.0, 90837.0, 189045.0, 405765.0, 788998.0, 1039414.0, 785845.0, 406213.0, 191629.0, 92727.0, 46413.0, 24488.0, 13014.0, 7417.0, 4140.0, 2458.0, 1417.0, 881.0, 542.0, 325.0, 200.0, 122.0, 85.0, 46.0, 27.0, 19.0, 14.0, 8.0, 5.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.90234375, -6.6962890625, -6.490234375, -6.2841796875, -6.078125, -5.8720703125, -5.666015625, -5.4599609375, -5.25390625, -5.0478515625, -4.841796875, -4.6357421875, -4.4296875, -4.2236328125, -4.017578125, -3.8115234375, -3.60546875, -3.3994140625, -3.193359375, -2.9873046875, -2.78125, -2.5751953125, -2.369140625, -2.1630859375, -1.95703125, -1.7509765625, -1.544921875, -1.3388671875, -1.1328125, -0.9267578125, -0.720703125, -0.5146484375, -0.30859375, -0.1025390625, 0.103515625, 0.3095703125, 0.515625, 0.7216796875, 0.927734375, 1.1337890625, 1.33984375, 1.5458984375, 1.751953125, 1.9580078125, 2.1640625, 2.3701171875, 2.576171875, 2.7822265625, 2.98828125, 3.1943359375, 3.400390625, 3.6064453125, 3.8125, 4.0185546875, 4.224609375, 4.4306640625, 4.63671875, 4.8427734375, 5.048828125, 5.2548828125, 5.4609375, 5.6669921875, 5.873046875, 6.0791015625, 6.28515625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 9.0, 12.0, 7.0, 9.0, 18.0, 21.0, 21.0, 21.0, 14.0, 33.0, 41.0, 39.0, 29.0, 44.0, 51.0, 48.0, 45.0, 50.0, 60.0, 52.0, 48.0, 29.0, 46.0, 39.0, 31.0, 30.0, 20.0, 23.0, 15.0, 17.0, 20.0, 11.0, 9.0, 3.0, 8.0, 10.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.701171875, -3.58648681640625, -3.4718017578125, -3.35711669921875, -3.242431640625, -3.12774658203125, -3.0130615234375, -2.89837646484375, -2.78369140625, -2.66900634765625, -2.5543212890625, -2.43963623046875, -2.324951171875, -2.21026611328125, -2.0955810546875, -1.98089599609375, -1.8662109375, -1.75152587890625, -1.6368408203125, -1.52215576171875, -1.407470703125, -1.29278564453125, -1.1781005859375, -1.06341552734375, -0.94873046875, -0.83404541015625, -0.7193603515625, -0.60467529296875, -0.489990234375, -0.37530517578125, -0.2606201171875, -0.14593505859375, -0.03125, 0.08343505859375, 0.1981201171875, 0.31280517578125, 0.427490234375, 0.54217529296875, 0.6568603515625, 0.77154541015625, 0.88623046875, 1.00091552734375, 1.1156005859375, 1.23028564453125, 1.344970703125, 1.45965576171875, 1.5743408203125, 1.68902587890625, 1.8037109375, 1.91839599609375, 2.0330810546875, 2.14776611328125, 2.262451171875, 2.37713623046875, 2.4918212890625, 2.60650634765625, 2.72119140625, 2.83587646484375, 2.9505615234375, 3.06524658203125, 3.179931640625, 3.29461669921875, 3.4093017578125, 3.52398681640625, 3.638671875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 13.0, 25.0, 35.0, 48.0, 71.0, 115.0, 195.0, 239.0, 417.0, 589.0, 984.0, 1403.0, 2121.0, 3284.0, 5206.0, 8142.0, 13094.0, 21577.0, 35271.0, 59213.0, 99988.0, 168750.0, 285494.0, 459535.0, 654453.0, 734496.0, 608889.0, 410282.0, 251651.0, 147935.0, 86820.0, 52016.0, 30878.0, 18989.0, 11692.0, 7347.0, 4578.0, 2913.0, 1904.0, 1240.0, 843.0, 519.0, 366.0, 215.0, 147.0, 97.0, 71.0, 46.0, 20.0, 19.0, 20.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.765625, -5.58184814453125, -5.3980712890625, -5.21429443359375, -5.030517578125, -4.84674072265625, -4.6629638671875, -4.47918701171875, -4.29541015625, -4.11163330078125, -3.9278564453125, -3.74407958984375, -3.560302734375, -3.37652587890625, -3.1927490234375, -3.00897216796875, -2.8251953125, -2.64141845703125, -2.4576416015625, -2.27386474609375, -2.090087890625, -1.90631103515625, -1.7225341796875, -1.53875732421875, -1.35498046875, -1.17120361328125, -0.9874267578125, -0.80364990234375, -0.619873046875, -0.43609619140625, -0.2523193359375, -0.06854248046875, 0.115234375, 0.29901123046875, 0.4827880859375, 0.66656494140625, 0.850341796875, 1.03411865234375, 1.2178955078125, 1.40167236328125, 1.58544921875, 1.76922607421875, 1.9530029296875, 2.13677978515625, 2.320556640625, 2.50433349609375, 2.6881103515625, 2.87188720703125, 3.0556640625, 3.23944091796875, 3.4232177734375, 3.60699462890625, 3.790771484375, 3.97454833984375, 4.1583251953125, 4.34210205078125, 4.52587890625, 4.70965576171875, 4.8934326171875, 5.07720947265625, 5.260986328125, 5.44476318359375, 5.6285400390625, 5.81231689453125, 5.99609375]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 3.0, 5.0, 6.0, 9.0, 13.0, 12.0, 22.0, 30.0, 45.0, 40.0, 50.0, 70.0, 94.0, 135.0, 137.0, 162.0, 171.0, 233.0, 233.0, 258.0, 284.0, 266.0, 240.0, 232.0, 237.0, 215.0, 197.0, 143.0, 119.0, 89.0, 81.0, 56.0, 44.0, 30.0, 25.0, 19.0, 14.0, 15.0, 8.0, 5.0, 6.0, 6.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.091796875, -2.02386474609375, -1.9559326171875, -1.88800048828125, -1.820068359375, -1.75213623046875, -1.6842041015625, -1.61627197265625, -1.54833984375, -1.48040771484375, -1.4124755859375, -1.34454345703125, -1.276611328125, -1.20867919921875, -1.1407470703125, -1.07281494140625, -1.0048828125, -0.93695068359375, -0.8690185546875, -0.80108642578125, -0.733154296875, -0.66522216796875, -0.5972900390625, -0.52935791015625, -0.46142578125, -0.39349365234375, -0.3255615234375, -0.25762939453125, -0.189697265625, -0.12176513671875, -0.0538330078125, 0.01409912109375, 0.08203125, 0.14996337890625, 0.2178955078125, 0.28582763671875, 0.353759765625, 0.42169189453125, 0.4896240234375, 0.55755615234375, 0.62548828125, 0.69342041015625, 0.7613525390625, 0.82928466796875, 0.897216796875, 0.96514892578125, 1.0330810546875, 1.10101318359375, 1.1689453125, 1.23687744140625, 1.3048095703125, 1.37274169921875, 1.440673828125, 1.50860595703125, 1.5765380859375, 1.64447021484375, 1.71240234375, 1.78033447265625, 1.8482666015625, 1.91619873046875, 1.984130859375, 2.05206298828125, 2.1199951171875, 2.18792724609375, 2.255859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 9.0, 11.0, 10.0, 19.0, 16.0, 34.0, 29.0, 49.0, 42.0, 54.0, 57.0, 73.0, 62.0, 62.0, 52.0, 67.0, 65.0, 53.0, 38.0, 35.0, 36.0, 26.0, 33.0, 14.0, 10.0, 14.0, 6.0, 6.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.956415176391602, -7.686728477478027, -7.417041778564453, -7.147355079650879, -6.877668380737305, -6.6079816818237305, -6.338294982910156, -6.068608283996582, -5.798921585083008, -5.529234886169434, -5.259548187255859, -4.989861488342285, -4.720174789428711, -4.450488090515137, -4.1808013916015625, -3.9111149311065674, -3.6414284706115723, -3.371741771697998, -3.102055072784424, -2.8323683738708496, -2.5626816749572754, -2.292994976043701, -2.023308515548706, -1.7536218166351318, -1.4839351177215576, -1.2142484188079834, -0.944561779499054, -0.6748751401901245, -0.4051884412765503, -0.13550174236297607, 0.1341848373413086, 0.4038715362548828, 0.673558235168457, 0.9432449340820312, 1.2129316329956055, 1.4826182126998901, 1.7523049116134644, 2.021991729736328, 2.2916781902313232, 2.5613648891448975, 2.8310515880584717, 3.100738286972046, 3.37042498588562, 3.6401114463806152, 3.9097981452941895, 4.179484844207764, 4.449171543121338, 4.718858242034912, 4.988544940948486, 5.2582316398620605, 5.527918338775635, 5.797605037689209, 6.067291736602783, 6.336978435516357, 6.606664657592773, 6.876351356506348, 7.146038055419922, 7.415724754333496, 7.68541145324707, 7.9550981521606445, 8.224784851074219, 8.494471549987793, 8.764158248901367, 9.033844947814941, 9.303531646728516]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 7.0, 9.0, 7.0, 12.0, 11.0, 17.0, 12.0, 22.0, 22.0, 34.0, 20.0, 25.0, 39.0, 41.0, 30.0, 32.0, 33.0, 47.0, 47.0, 38.0, 46.0, 41.0, 50.0, 36.0, 40.0, 38.0, 36.0, 29.0, 20.0, 25.0, 17.0, 21.0, 18.0, 18.0, 14.0, 7.0, 8.0, 7.0, 5.0, 2.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.775452136993408, -4.6400041580200195, -4.504555702209473, -4.369107723236084, -4.233659744262695, -4.098211288452148, -3.9627633094787598, -3.827315092086792, -3.691866874694824, -3.5564186573028564, -3.4209704399108887, -3.2855224609375, -3.1500742435455322, -3.0146260261535645, -2.879178047180176, -2.743729829788208, -2.6082816123962402, -2.4728333950042725, -2.3373851776123047, -2.201937198638916, -2.0664889812469482, -1.9310407638549805, -1.7955926656723022, -1.660144567489624, -1.5246963500976562, -1.3892481327056885, -1.2538000345230103, -1.118351936340332, -0.9829037189483643, -0.8474555611610413, -0.7120074033737183, -0.5765592455863953, -0.44111084938049316, -0.30566269159317017, -0.17021453380584717, -0.03476637601852417, 0.10068178176879883, 0.23612993955612183, 0.3715780973434448, 0.5070262551307678, 0.6424744129180908, 0.7779225707054138, 0.9133707284927368, 1.048818826675415, 1.1842670440673828, 1.3197152614593506, 1.4551633596420288, 1.590611457824707, 1.7260596752166748, 1.8615078926086426, 1.9969559907913208, 2.132404088973999, 2.267852306365967, 2.4033005237579346, 2.5387487411499023, 2.674196720123291, 2.809644937515259, 2.9450931549072266, 3.0805411338806152, 3.215989351272583, 3.351437568664551, 3.4868857860565186, 3.6223340034484863, 3.757781982421875, 3.8932301998138428]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 10.0, 10.0, 27.0, 44.0, 59.0, 81.0, 155.0, 196.0, 344.0, 539.0, 967.0, 1597.0, 2658.0, 4677.0, 8303.0, 14445.0, 25468.0, 45088.0, 76950.0, 126681.0, 178772.0, 189858.0, 147354.0, 94600.0, 55407.0, 31703.0, 17956.0, 10395.0, 5807.0, 3459.0, 1920.0, 1151.0, 690.0, 462.0, 254.0, 165.0, 112.0, 73.0, 48.0, 24.0, 19.0, 14.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.54248046875, -0.5245132446289062, -0.5065460205078125, -0.48857879638671875, -0.470611572265625, -0.45264434814453125, -0.4346771240234375, -0.41670989990234375, -0.39874267578125, -0.38077545166015625, -0.3628082275390625, -0.34484100341796875, -0.326873779296875, -0.30890655517578125, -0.2909393310546875, -0.27297210693359375, -0.2550048828125, -0.23703765869140625, -0.2190704345703125, -0.20110321044921875, -0.183135986328125, -0.16516876220703125, -0.1472015380859375, -0.12923431396484375, -0.11126708984375, -0.09329986572265625, -0.0753326416015625, -0.05736541748046875, -0.039398193359375, -0.02143096923828125, -0.0034637451171875, 0.01450347900390625, 0.032470703125, 0.05043792724609375, 0.0684051513671875, 0.08637237548828125, 0.104339599609375, 0.12230682373046875, 0.1402740478515625, 0.15824127197265625, 0.17620849609375, 0.19417572021484375, 0.2121429443359375, 0.23011016845703125, 0.248077392578125, 0.26604461669921875, 0.2840118408203125, 0.30197906494140625, 0.3199462890625, 0.33791351318359375, 0.3558807373046875, 0.37384796142578125, 0.391815185546875, 0.40978240966796875, 0.4277496337890625, 0.44571685791015625, 0.46368408203125, 0.48165130615234375, 0.4996185302734375, 0.5175857543945312, 0.535552978515625, 0.5535202026367188, 0.5714874267578125, 0.5894546508789062, 0.607421875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 6.0, 7.0, 6.0, 16.0, 11.0, 18.0, 15.0, 28.0, 30.0, 20.0, 33.0, 33.0, 34.0, 37.0, 30.0, 42.0, 42.0, 35.0, 33.0, 45.0, 31.0, 53.0, 44.0, 44.0, 34.0, 35.0, 30.0, 36.0, 23.0, 27.0, 21.0, 14.0, 15.0, 16.0, 12.0, 9.0, 5.0, 8.0, 4.0, 3.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.6171875, -5.46527099609375, -5.3133544921875, -5.16143798828125, -5.009521484375, -4.85760498046875, -4.7056884765625, -4.55377197265625, -4.40185546875, -4.24993896484375, -4.0980224609375, -3.94610595703125, -3.794189453125, -3.64227294921875, -3.4903564453125, -3.33843994140625, -3.1865234375, -3.03460693359375, -2.8826904296875, -2.73077392578125, -2.578857421875, -2.42694091796875, -2.2750244140625, -2.12310791015625, -1.97119140625, -1.81927490234375, -1.6673583984375, -1.51544189453125, -1.363525390625, -1.21160888671875, -1.0596923828125, -0.90777587890625, -0.755859375, -0.60394287109375, -0.4520263671875, -0.30010986328125, -0.148193359375, 0.00372314453125, 0.1556396484375, 0.30755615234375, 0.45947265625, 0.61138916015625, 0.7633056640625, 0.91522216796875, 1.067138671875, 1.21905517578125, 1.3709716796875, 1.52288818359375, 1.6748046875, 1.82672119140625, 1.9786376953125, 2.13055419921875, 2.282470703125, 2.43438720703125, 2.5863037109375, 2.73822021484375, 2.89013671875, 3.04205322265625, 3.1939697265625, 3.34588623046875, 3.497802734375, 3.64971923828125, 3.8016357421875, 3.95355224609375, 4.10546875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 13.0, 11.0, 23.0, 20.0, 19.0, 29.0, 39.0, 45.0, 65.0, 111.0, 106.0, 167.0, 234.0, 363.0, 487.0, 742.0, 1143.0, 1845.0, 3083.0, 5634.0, 10447.0, 20734.0, 67814.0, 811320.0, 76479.0, 22257.0, 10723.0, 5734.0, 3237.0, 1920.0, 1193.0, 742.0, 515.0, 344.0, 230.0, 170.0, 138.0, 99.0, 67.0, 54.0, 43.0, 24.0, 20.0, 14.0, 14.0, 8.0, 5.0, 6.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.50390625, -1.457672119140625, -1.41143798828125, -1.365203857421875, -1.3189697265625, -1.272735595703125, -1.22650146484375, -1.180267333984375, -1.134033203125, -1.087799072265625, -1.04156494140625, -0.995330810546875, -0.9490966796875, -0.902862548828125, -0.85662841796875, -0.810394287109375, -0.76416015625, -0.717926025390625, -0.67169189453125, -0.625457763671875, -0.5792236328125, -0.532989501953125, -0.48675537109375, -0.440521240234375, -0.394287109375, -0.348052978515625, -0.30181884765625, -0.255584716796875, -0.2093505859375, -0.163116455078125, -0.11688232421875, -0.070648193359375, -0.0244140625, 0.021820068359375, 0.06805419921875, 0.114288330078125, 0.1605224609375, 0.206756591796875, 0.25299072265625, 0.299224853515625, 0.345458984375, 0.391693115234375, 0.43792724609375, 0.484161376953125, 0.5303955078125, 0.576629638671875, 0.62286376953125, 0.669097900390625, 0.71533203125, 0.761566162109375, 0.80780029296875, 0.854034423828125, 0.9002685546875, 0.946502685546875, 0.99273681640625, 1.038970947265625, 1.085205078125, 1.131439208984375, 1.17767333984375, 1.223907470703125, 1.2701416015625, 1.316375732421875, 1.36260986328125, 1.408843994140625, 1.455078125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 12.0, 8.0, 6.0, 8.0, 6.0, 23.0, 17.0, 16.0, 11.0, 24.0, 29.0, 21.0, 25.0, 28.0, 41.0, 44.0, 34.0, 40.0, 43.0, 38.0, 42.0, 38.0, 38.0, 41.0, 37.0, 28.0, 29.0, 30.0, 29.0, 29.0, 28.0, 24.0, 14.0, 10.0, 20.0, 18.0, 9.0, 8.0, 7.0, 7.0, 7.0, 6.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.80108642578125, -2.7115478515625, -2.62200927734375, -2.532470703125, -2.44293212890625, -2.3533935546875, -2.26385498046875, -2.17431640625, -2.08477783203125, -1.9952392578125, -1.90570068359375, -1.816162109375, -1.72662353515625, -1.6370849609375, -1.54754638671875, -1.4580078125, -1.36846923828125, -1.2789306640625, -1.18939208984375, -1.099853515625, -1.01031494140625, -0.9207763671875, -0.83123779296875, -0.74169921875, -0.65216064453125, -0.5626220703125, -0.47308349609375, -0.383544921875, -0.29400634765625, -0.2044677734375, -0.11492919921875, -0.025390625, 0.06414794921875, 0.1536865234375, 0.24322509765625, 0.332763671875, 0.42230224609375, 0.5118408203125, 0.60137939453125, 0.69091796875, 0.78045654296875, 0.8699951171875, 0.95953369140625, 1.049072265625, 1.13861083984375, 1.2281494140625, 1.31768798828125, 1.4072265625, 1.49676513671875, 1.5863037109375, 1.67584228515625, 1.765380859375, 1.85491943359375, 1.9444580078125, 2.03399658203125, 2.12353515625, 2.21307373046875, 2.3026123046875, 2.39215087890625, 2.481689453125, 2.57122802734375, 2.6607666015625, 2.75030517578125, 2.83984375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 8.0, 25.0, 30.0, 18.0, 39.0, 48.0, 57.0, 90.0, 120.0, 167.0, 249.0, 345.0, 505.0, 760.0, 1144.0, 1856.0, 2891.0, 4755.0, 8043.0, 14312.0, 28500.0, 591290.0, 333721.0, 26339.0, 13422.0, 7583.0, 4457.0, 2674.0, 1701.0, 1080.0, 686.0, 443.0, 342.0, 228.0, 168.0, 125.0, 90.0, 49.0, 42.0, 31.0, 19.0, 22.0, 15.0, 12.0, 7.0, 12.0, 4.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 4.0], "bins": [-0.3427734375, -0.3320465087890625, -0.321319580078125, -0.3105926513671875, -0.29986572265625, -0.2891387939453125, -0.278411865234375, -0.2676849365234375, -0.2569580078125, -0.2462310791015625, -0.235504150390625, -0.2247772216796875, -0.21405029296875, -0.2033233642578125, -0.192596435546875, -0.1818695068359375, -0.171142578125, -0.1604156494140625, -0.149688720703125, -0.1389617919921875, -0.12823486328125, -0.1175079345703125, -0.106781005859375, -0.0960540771484375, -0.0853271484375, -0.0746002197265625, -0.063873291015625, -0.0531463623046875, -0.04241943359375, -0.0316925048828125, -0.020965576171875, -0.0102386474609375, 0.00048828125, 0.0112152099609375, 0.021942138671875, 0.0326690673828125, 0.04339599609375, 0.0541229248046875, 0.064849853515625, 0.0755767822265625, 0.0863037109375, 0.0970306396484375, 0.107757568359375, 0.1184844970703125, 0.12921142578125, 0.1399383544921875, 0.150665283203125, 0.1613922119140625, 0.172119140625, 0.1828460693359375, 0.193572998046875, 0.2042999267578125, 0.21502685546875, 0.2257537841796875, 0.236480712890625, 0.2472076416015625, 0.2579345703125, 0.2686614990234375, 0.279388427734375, 0.2901153564453125, 0.30084228515625, 0.3115692138671875, 0.322296142578125, 0.3330230712890625, 0.34375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 10.0, 6.0, 7.0, 8.0, 11.0, 14.0, 20.0, 13.0, 23.0, 31.0, 26.0, 39.0, 34.0, 35.0, 47.0, 46.0, 50.0, 53.0, 43.0, 49.0, 42.0, 32.0, 45.0, 42.0, 36.0, 31.0, 38.0, 24.0, 29.0, 16.0, 21.0, 14.0, 14.0, 14.0, 8.0, 10.0, 4.0, 3.0, 8.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.8908252716064453e-05, -2.8051435947418213e-05, -2.7194619178771973e-05, -2.6337802410125732e-05, -2.5480985641479492e-05, -2.4624168872833252e-05, -2.3767352104187012e-05, -2.291053533554077e-05, -2.205371856689453e-05, -2.119690179824829e-05, -2.034008502960205e-05, -1.948326826095581e-05, -1.862645149230957e-05, -1.776963472366333e-05, -1.691281795501709e-05, -1.605600118637085e-05, -1.519918441772461e-05, -1.4342367649078369e-05, -1.3485550880432129e-05, -1.2628734111785889e-05, -1.1771917343139648e-05, -1.0915100574493408e-05, -1.0058283805847168e-05, -9.201467037200928e-06, -8.344650268554688e-06, -7.487833499908447e-06, -6.631016731262207e-06, -5.774199962615967e-06, -4.9173831939697266e-06, -4.060566425323486e-06, -3.203749656677246e-06, -2.346932888031006e-06, -1.4901161193847656e-06, -6.332993507385254e-07, 2.2351741790771484e-07, 1.080334186553955e-06, 1.9371509552001953e-06, 2.7939677238464355e-06, 3.6507844924926758e-06, 4.507601261138916e-06, 5.364418029785156e-06, 6.2212347984313965e-06, 7.078051567077637e-06, 7.934868335723877e-06, 8.791685104370117e-06, 9.648501873016357e-06, 1.0505318641662598e-05, 1.1362135410308838e-05, 1.2218952178955078e-05, 1.3075768947601318e-05, 1.3932585716247559e-05, 1.4789402484893799e-05, 1.564621925354004e-05, 1.650303602218628e-05, 1.735985279083252e-05, 1.821666955947876e-05, 1.9073486328125e-05, 1.993030309677124e-05, 2.078711986541748e-05, 2.164393663406372e-05, 2.250075340270996e-05, 2.33575701713562e-05, 2.421438694000244e-05, 2.507120370864868e-05, 2.5928020477294922e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 8.0, 17.0, 32.0, 35.0, 55.0, 71.0, 167.0, 222.0, 386.0, 528.0, 980.0, 1726.0, 2985.0, 5483.0, 10822.0, 22318.0, 49275.0, 113264.0, 239353.0, 294454.0, 167022.0, 73997.0, 32770.0, 15397.0, 7687.0, 3982.0, 2250.0, 1301.0, 732.0, 446.0, 279.0, 170.0, 119.0, 62.0, 45.0, 29.0, 27.0, 14.0, 10.0, 4.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.284912109375, -0.2765922546386719, -0.26827239990234375, -0.2599525451660156, -0.2516326904296875, -0.24331283569335938, -0.23499298095703125, -0.22667312622070312, -0.218353271484375, -0.21003341674804688, -0.20171356201171875, -0.19339370727539062, -0.1850738525390625, -0.17675399780273438, -0.16843414306640625, -0.16011428833007812, -0.15179443359375, -0.14347457885742188, -0.13515472412109375, -0.12683486938476562, -0.1185150146484375, -0.11019515991210938, -0.10187530517578125, -0.09355545043945312, -0.085235595703125, -0.07691574096679688, -0.06859588623046875, -0.060276031494140625, -0.0519561767578125, -0.043636322021484375, -0.03531646728515625, -0.026996612548828125, -0.0186767578125, -0.010356903076171875, -0.00203704833984375, 0.006282806396484375, 0.0146026611328125, 0.022922515869140625, 0.03124237060546875, 0.039562225341796875, 0.047882080078125, 0.056201934814453125, 0.06452178955078125, 0.07284164428710938, 0.0811614990234375, 0.08948135375976562, 0.09780120849609375, 0.10612106323242188, 0.11444091796875, 0.12276077270507812, 0.13108062744140625, 0.13940048217773438, 0.1477203369140625, 0.15604019165039062, 0.16436004638671875, 0.17267990112304688, 0.180999755859375, 0.18931961059570312, 0.19763946533203125, 0.20595932006835938, 0.2142791748046875, 0.22259902954101562, 0.23091888427734375, 0.23923873901367188, 0.24755859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 5.0, 5.0, 9.0, 15.0, 9.0, 10.0, 9.0, 18.0, 15.0, 21.0, 24.0, 34.0, 47.0, 34.0, 70.0, 54.0, 48.0, 64.0, 56.0, 56.0, 51.0, 47.0, 41.0, 35.0, 36.0, 33.0, 25.0, 29.0, 17.0, 10.0, 19.0, 12.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037353515625, -0.03598356246948242, -0.034613609313964844, -0.033243656158447266, -0.03187370300292969, -0.03050374984741211, -0.02913379669189453, -0.027763843536376953, -0.026393890380859375, -0.025023937225341797, -0.02365398406982422, -0.02228403091430664, -0.020914077758789062, -0.019544124603271484, -0.018174171447753906, -0.016804218292236328, -0.01543426513671875, -0.014064311981201172, -0.012694358825683594, -0.011324405670166016, -0.009954452514648438, -0.00858449935913086, -0.007214546203613281, -0.005844593048095703, -0.004474639892578125, -0.003104686737060547, -0.0017347335815429688, -0.0003647804260253906, 0.0010051727294921875, 0.0023751258850097656, 0.0037450790405273438, 0.005115032196044922, 0.0064849853515625, 0.007854938507080078, 0.009224891662597656, 0.010594844818115234, 0.011964797973632812, 0.01333475112915039, 0.014704704284667969, 0.016074657440185547, 0.017444610595703125, 0.018814563751220703, 0.02018451690673828, 0.02155447006225586, 0.022924423217773438, 0.024294376373291016, 0.025664329528808594, 0.027034282684326172, 0.02840423583984375, 0.029774188995361328, 0.031144142150878906, 0.032514095306396484, 0.03388404846191406, 0.03525400161743164, 0.03662395477294922, 0.0379939079284668, 0.039363861083984375, 0.04073381423950195, 0.04210376739501953, 0.04347372055053711, 0.04484367370605469, 0.046213626861572266, 0.047583580017089844, 0.04895353317260742, 0.050323486328125]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 10.0, 9.0, 15.0, 13.0, 23.0, 31.0, 33.0, 48.0, 45.0, 55.0, 65.0, 66.0, 63.0, 58.0, 62.0, 67.0, 57.0, 57.0, 34.0, 36.0, 36.0, 25.0, 31.0, 10.0, 13.0, 10.0, 8.0, 3.0, 1.0, 2.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.933457374572754, -7.662163257598877, -7.390869140625, -7.119575023651123, -6.848280906677246, -6.576986789703369, -6.305692672729492, -6.034398555755615, -5.763104438781738, -5.491810321807861, -5.220516204833984, -4.949222087860107, -4.6779279708862305, -4.4066338539123535, -4.135339736938477, -3.8640456199645996, -3.5927515029907227, -3.3214573860168457, -3.0501632690429688, -2.778869152069092, -2.507575035095215, -2.236280918121338, -1.964986801147461, -1.693692684173584, -1.422398567199707, -1.15110445022583, -0.8798103332519531, -0.6085162162780762, -0.3372220993041992, -0.06592798233032227, 0.2053661346435547, 0.47666025161743164, 0.7479534149169922, 1.0192475318908691, 1.290541648864746, 1.561835765838623, 1.8331298828125, 2.104423999786377, 2.375718116760254, 2.647012233734131, 2.918306350708008, 3.1896004676818848, 3.4608945846557617, 3.7321887016296387, 4.003482818603516, 4.274776935577393, 4.5460710525512695, 4.8173651695251465, 5.088659286499023, 5.3599534034729, 5.631247520446777, 5.902541637420654, 6.173835754394531, 6.445129871368408, 6.716423988342285, 6.987718105316162, 7.259012222290039, 7.530306339263916, 7.801600456237793, 8.072895050048828, 8.344188690185547, 8.615482330322266, 8.8867769241333, 9.158071517944336, 9.429365158081055]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 8.0, 4.0, 5.0, 11.0, 7.0, 9.0, 13.0, 18.0, 11.0, 20.0, 23.0, 32.0, 23.0, 23.0, 40.0, 35.0, 34.0, 35.0, 32.0, 40.0, 51.0, 42.0, 39.0, 43.0, 51.0, 38.0, 36.0, 42.0, 34.0, 30.0, 21.0, 26.0, 17.0, 22.0, 16.0, 17.0, 16.0, 8.0, 8.0, 7.0, 6.0, 2.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.752599716186523, -4.61810827255249, -4.483617305755615, -4.349125862121582, -4.214634895324707, -4.080143451690674, -3.9456522464752197, -3.8111610412597656, -3.6766698360443115, -3.5421786308288574, -3.4076874256134033, -3.273196220397949, -3.138704776763916, -3.004213809967041, -2.869722366333008, -2.7352311611175537, -2.6007399559020996, -2.4662487506866455, -2.3317575454711914, -2.1972663402557373, -2.062775135040283, -1.9282838106155396, -1.793792486190796, -1.6593012809753418, -1.5248100757598877, -1.3903188705444336, -1.2558276653289795, -1.1213363409042358, -0.9868451356887817, -0.8523539304733276, -0.7178626656532288, -0.5833714008331299, -0.4488801956176758, -0.3143889605998993, -0.1798977255821228, -0.045406490564346313, 0.08908474445343018, 0.22357594966888428, 0.35806721448898315, 0.49255847930908203, 0.6270496845245361, 0.7615408897399902, 0.8960321545600891, 1.030523419380188, 1.165014624595642, 1.2995058298110962, 1.4339971542358398, 1.568488359451294, 1.702979564666748, 1.8374707698822021, 1.9719619750976562, 2.1064531803131104, 2.2409443855285645, 2.3754358291625977, 2.5099270343780518, 2.644418239593506, 2.77890944480896, 2.913400650024414, 3.047891855239868, 3.1823830604553223, 3.3168745040893555, 3.4513654708862305, 3.5858569145202637, 3.7203481197357178, 3.854839324951172]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 14.0, 26.0, 38.0, 63.0, 84.0, 115.0, 179.0, 286.0, 426.0, 629.0, 969.0, 1481.0, 2389.0, 3808.0, 5710.0, 9054.0, 13802.0, 21247.0, 32086.0, 46996.0, 66732.0, 88452.0, 109439.0, 121545.0, 121791.0, 109076.0, 87754.0, 65971.0, 46994.0, 31963.0, 20821.0, 13694.0, 8710.0, 5664.0, 3668.0, 2378.0, 1554.0, 979.0, 618.0, 430.0, 284.0, 185.0, 134.0, 77.0, 75.0, 44.0, 27.0, 27.0, 14.0, 12.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0], "bins": [-3.681640625, -3.566558837890625, -3.45147705078125, -3.336395263671875, -3.2213134765625, -3.106231689453125, -2.99114990234375, -2.876068115234375, -2.760986328125, -2.645904541015625, -2.53082275390625, -2.415740966796875, -2.3006591796875, -2.185577392578125, -2.07049560546875, -1.955413818359375, -1.84033203125, -1.725250244140625, -1.61016845703125, -1.495086669921875, -1.3800048828125, -1.264923095703125, -1.14984130859375, -1.034759521484375, -0.919677734375, -0.804595947265625, -0.68951416015625, -0.574432373046875, -0.4593505859375, -0.344268798828125, -0.22918701171875, -0.114105224609375, 0.0009765625, 0.116058349609375, 0.23114013671875, 0.346221923828125, 0.4613037109375, 0.576385498046875, 0.69146728515625, 0.806549072265625, 0.921630859375, 1.036712646484375, 1.15179443359375, 1.266876220703125, 1.3819580078125, 1.497039794921875, 1.61212158203125, 1.727203369140625, 1.84228515625, 1.957366943359375, 2.07244873046875, 2.187530517578125, 2.3026123046875, 2.417694091796875, 2.53277587890625, 2.647857666015625, 2.762939453125, 2.878021240234375, 2.99310302734375, 3.108184814453125, 3.2232666015625, 3.338348388671875, 3.45343017578125, 3.568511962890625, 3.68359375]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 15.0, 8.0, 14.0, 17.0, 22.0, 23.0, 26.0, 31.0, 44.0, 28.0, 30.0, 34.0, 38.0, 35.0, 38.0, 37.0, 47.0, 33.0, 39.0, 42.0, 47.0, 30.0, 41.0, 22.0, 26.0, 24.0, 29.0, 20.0, 26.0, 14.0, 22.0, 8.0, 11.0, 7.0, 5.0, 7.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.09375, -4.95062255859375, -4.8074951171875, -4.66436767578125, -4.521240234375, -4.37811279296875, -4.2349853515625, -4.09185791015625, -3.94873046875, -3.80560302734375, -3.6624755859375, -3.51934814453125, -3.376220703125, -3.23309326171875, -3.0899658203125, -2.94683837890625, -2.8037109375, -2.66058349609375, -2.5174560546875, -2.37432861328125, -2.231201171875, -2.08807373046875, -1.9449462890625, -1.80181884765625, -1.65869140625, -1.51556396484375, -1.3724365234375, -1.22930908203125, -1.086181640625, -0.94305419921875, -0.7999267578125, -0.65679931640625, -0.513671875, -0.37054443359375, -0.2274169921875, -0.08428955078125, 0.058837890625, 0.20196533203125, 0.3450927734375, 0.48822021484375, 0.63134765625, 0.77447509765625, 0.9176025390625, 1.06072998046875, 1.203857421875, 1.34698486328125, 1.4901123046875, 1.63323974609375, 1.7763671875, 1.91949462890625, 2.0626220703125, 2.20574951171875, 2.348876953125, 2.49200439453125, 2.6351318359375, 2.77825927734375, 2.92138671875, 3.06451416015625, 3.2076416015625, 3.35076904296875, 3.493896484375, 3.63702392578125, 3.7801513671875, 3.92327880859375, 4.06640625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 11.0, 15.0, 20.0, 36.0, 67.0, 124.0, 179.0, 350.0, 596.0, 999.0, 1728.0, 3128.0, 5665.0, 9936.0, 17134.0, 30031.0, 50480.0, 79640.0, 116002.0, 148349.0, 158535.0, 141548.0, 106480.0, 71765.0, 44335.0, 26395.0, 14968.0, 8587.0, 4972.0, 2777.0, 1556.0, 867.0, 535.0, 305.0, 174.0, 93.0, 60.0, 43.0, 24.0, 12.0, 9.0, 7.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.03515625, -4.879638671875, -4.72412109375, -4.568603515625, -4.4130859375, -4.257568359375, -4.10205078125, -3.946533203125, -3.791015625, -3.635498046875, -3.47998046875, -3.324462890625, -3.1689453125, -3.013427734375, -2.85791015625, -2.702392578125, -2.546875, -2.391357421875, -2.23583984375, -2.080322265625, -1.9248046875, -1.769287109375, -1.61376953125, -1.458251953125, -1.302734375, -1.147216796875, -0.99169921875, -0.836181640625, -0.6806640625, -0.525146484375, -0.36962890625, -0.214111328125, -0.05859375, 0.096923828125, 0.25244140625, 0.407958984375, 0.5634765625, 0.718994140625, 0.87451171875, 1.030029296875, 1.185546875, 1.341064453125, 1.49658203125, 1.652099609375, 1.8076171875, 1.963134765625, 2.11865234375, 2.274169921875, 2.4296875, 2.585205078125, 2.74072265625, 2.896240234375, 3.0517578125, 3.207275390625, 3.36279296875, 3.518310546875, 3.673828125, 3.829345703125, 3.98486328125, 4.140380859375, 4.2958984375, 4.451416015625, 4.60693359375, 4.762451171875, 4.91796875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 5.0, 11.0, 8.0, 9.0, 2.0, 8.0, 14.0, 18.0, 27.0, 28.0, 36.0, 35.0, 40.0, 45.0, 59.0, 47.0, 46.0, 54.0, 64.0, 44.0, 30.0, 42.0, 53.0, 48.0, 31.0, 41.0, 21.0, 31.0, 18.0, 18.0, 22.0, 17.0, 6.0, 9.0, 4.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.796875, -2.6832275390625, -2.569580078125, -2.4559326171875, -2.34228515625, -2.2286376953125, -2.114990234375, -2.0013427734375, -1.8876953125, -1.7740478515625, -1.660400390625, -1.5467529296875, -1.43310546875, -1.3194580078125, -1.205810546875, -1.0921630859375, -0.978515625, -0.8648681640625, -0.751220703125, -0.6375732421875, -0.52392578125, -0.4102783203125, -0.296630859375, -0.1829833984375, -0.0693359375, 0.0443115234375, 0.157958984375, 0.2716064453125, 0.38525390625, 0.4989013671875, 0.612548828125, 0.7261962890625, 0.83984375, 0.9534912109375, 1.067138671875, 1.1807861328125, 1.29443359375, 1.4080810546875, 1.521728515625, 1.6353759765625, 1.7490234375, 1.8626708984375, 1.976318359375, 2.0899658203125, 2.20361328125, 2.3172607421875, 2.430908203125, 2.5445556640625, 2.658203125, 2.7718505859375, 2.885498046875, 2.9991455078125, 3.11279296875, 3.2264404296875, 3.340087890625, 3.4537353515625, 3.5673828125, 3.6810302734375, 3.794677734375, 3.9083251953125, 4.02197265625, 4.1356201171875, 4.249267578125, 4.3629150390625, 4.4765625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 10.0, 15.0, 17.0, 35.0, 47.0, 54.0, 72.0, 104.0, 169.0, 235.0, 282.0, 443.0, 624.0, 975.0, 1345.0, 2125.0, 3531.0, 6128.0, 11388.0, 22332.0, 47523.0, 102503.0, 199651.0, 258804.0, 194664.0, 100715.0, 45902.0, 21957.0, 10984.0, 6009.0, 3317.0, 2218.0, 1337.0, 885.0, 623.0, 432.0, 313.0, 246.0, 156.0, 104.0, 84.0, 54.0, 38.0, 29.0, 24.0, 17.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.1953125, -4.05767822265625, -3.9200439453125, -3.78240966796875, -3.644775390625, -3.50714111328125, -3.3695068359375, -3.23187255859375, -3.09423828125, -2.95660400390625, -2.8189697265625, -2.68133544921875, -2.543701171875, -2.40606689453125, -2.2684326171875, -2.13079833984375, -1.9931640625, -1.85552978515625, -1.7178955078125, -1.58026123046875, -1.442626953125, -1.30499267578125, -1.1673583984375, -1.02972412109375, -0.89208984375, -0.75445556640625, -0.6168212890625, -0.47918701171875, -0.341552734375, -0.20391845703125, -0.0662841796875, 0.07135009765625, 0.208984375, 0.34661865234375, 0.4842529296875, 0.62188720703125, 0.759521484375, 0.89715576171875, 1.0347900390625, 1.17242431640625, 1.31005859375, 1.44769287109375, 1.5853271484375, 1.72296142578125, 1.860595703125, 1.99822998046875, 2.1358642578125, 2.27349853515625, 2.4111328125, 2.54876708984375, 2.6864013671875, 2.82403564453125, 2.961669921875, 3.09930419921875, 3.2369384765625, 3.37457275390625, 3.51220703125, 3.64984130859375, 3.7874755859375, 3.92510986328125, 4.062744140625, 4.20037841796875, 4.3380126953125, 4.47564697265625, 4.61328125]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 4.0, 7.0, 8.0, 12.0, 15.0, 28.0, 19.0, 53.0, 29.0, 66.0, 61.0, 70.0, 75.0, 65.0, 68.0, 57.0, 67.0, 72.0, 47.0, 37.0, 31.0, 16.0, 18.0, 14.0, 9.0, 11.0, 6.0, 6.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00034999847412109375, -0.000339265912771225, -0.0003285333514213562, -0.0003178007900714874, -0.00030706822872161865, -0.0002963356673717499, -0.0002856031060218811, -0.00027487054467201233, -0.00026413798332214355, -0.0002534054219722748, -0.000242672860622406, -0.00023194029927253723, -0.00022120773792266846, -0.00021047517657279968, -0.0001997426152229309, -0.00018901005387306213, -0.00017827749252319336, -0.00016754493117332458, -0.0001568123698234558, -0.00014607980847358704, -0.00013534724712371826, -0.0001246146857738495, -0.00011388212442398071, -0.00010314956307411194, -9.241700172424316e-05, -8.168444037437439e-05, -7.095187902450562e-05, -6.021931767463684e-05, -4.9486756324768066e-05, -3.875419497489929e-05, -2.8021633625030518e-05, -1.7289072275161743e-05, -6.556510925292969e-06, 4.176050424575806e-06, 1.490861177444458e-05, 2.5641173124313354e-05, 3.637373447418213e-05, 4.71062958240509e-05, 5.783885717391968e-05, 6.857141852378845e-05, 7.930397987365723e-05, 9.0036541223526e-05, 0.00010076910257339478, 0.00011150166392326355, 0.00012223422527313232, 0.0001329667866230011, 0.00014369934797286987, 0.00015443190932273865, 0.00016516447067260742, 0.0001758970320224762, 0.00018662959337234497, 0.00019736215472221375, 0.00020809471607208252, 0.0002188272774219513, 0.00022955983877182007, 0.00024029240012168884, 0.0002510249614715576, 0.0002617575228214264, 0.00027249008417129517, 0.00028322264552116394, 0.0002939552068710327, 0.0003046877682209015, 0.00031542032957077026, 0.00032615289092063904, 0.0003368854522705078]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 7.0, 10.0, 9.0, 11.0, 22.0, 32.0, 37.0, 41.0, 57.0, 72.0, 131.0, 140.0, 204.0, 261.0, 364.0, 527.0, 823.0, 1193.0, 2008.0, 3404.0, 6605.0, 14010.0, 33634.0, 86192.0, 202408.0, 304137.0, 221869.0, 98510.0, 38463.0, 15892.0, 7354.0, 3825.0, 2154.0, 1248.0, 825.0, 571.0, 379.0, 296.0, 240.0, 141.0, 105.0, 79.0, 63.0, 51.0, 41.0, 34.0, 28.0, 16.0, 11.0, 6.0, 9.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.4765625, -5.3031005859375, -5.129638671875, -4.9561767578125, -4.78271484375, -4.6092529296875, -4.435791015625, -4.2623291015625, -4.0888671875, -3.9154052734375, -3.741943359375, -3.5684814453125, -3.39501953125, -3.2215576171875, -3.048095703125, -2.8746337890625, -2.701171875, -2.5277099609375, -2.354248046875, -2.1807861328125, -2.00732421875, -1.8338623046875, -1.660400390625, -1.4869384765625, -1.3134765625, -1.1400146484375, -0.966552734375, -0.7930908203125, -0.61962890625, -0.4461669921875, -0.272705078125, -0.0992431640625, 0.07421875, 0.2476806640625, 0.421142578125, 0.5946044921875, 0.76806640625, 0.9415283203125, 1.114990234375, 1.2884521484375, 1.4619140625, 1.6353759765625, 1.808837890625, 1.9822998046875, 2.15576171875, 2.3292236328125, 2.502685546875, 2.6761474609375, 2.849609375, 3.0230712890625, 3.196533203125, 3.3699951171875, 3.54345703125, 3.7169189453125, 3.890380859375, 4.0638427734375, 4.2373046875, 4.4107666015625, 4.584228515625, 4.7576904296875, 4.93115234375, 5.1046142578125, 5.278076171875, 5.4515380859375, 5.625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 11.0, 8.0, 11.0, 24.0, 26.0, 31.0, 40.0, 45.0, 63.0, 62.0, 71.0, 69.0, 55.0, 83.0, 62.0, 62.0, 58.0, 34.0, 35.0, 28.0, 26.0, 21.0, 11.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.1064453125, -1.0707550048828125, -1.035064697265625, -0.9993743896484375, -0.96368408203125, -0.9279937744140625, -0.892303466796875, -0.8566131591796875, -0.8209228515625, -0.7852325439453125, -0.749542236328125, -0.7138519287109375, -0.67816162109375, -0.6424713134765625, -0.606781005859375, -0.5710906982421875, -0.535400390625, -0.4997100830078125, -0.464019775390625, -0.4283294677734375, -0.39263916015625, -0.3569488525390625, -0.321258544921875, -0.2855682373046875, -0.2498779296875, -0.2141876220703125, -0.178497314453125, -0.1428070068359375, -0.10711669921875, -0.0714263916015625, -0.035736083984375, -4.57763671875e-05, 0.03564453125, 0.0713348388671875, 0.107025146484375, 0.1427154541015625, 0.17840576171875, 0.2140960693359375, 0.249786376953125, 0.2854766845703125, 0.3211669921875, 0.3568572998046875, 0.392547607421875, 0.4282379150390625, 0.46392822265625, 0.4996185302734375, 0.535308837890625, 0.5709991455078125, 0.606689453125, 0.6423797607421875, 0.678070068359375, 0.7137603759765625, 0.74945068359375, 0.7851409912109375, 0.820831298828125, 0.8565216064453125, 0.8922119140625, 0.9279022216796875, 0.963592529296875, 0.9992828369140625, 1.03497314453125, 1.0706634521484375, 1.106353759765625, 1.1420440673828125, 1.177734375]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 7.0, 14.0, 28.0, 23.0, 26.0, 33.0, 44.0, 46.0, 66.0, 67.0, 78.0, 79.0, 56.0, 62.0, 65.0, 60.0, 46.0, 44.0, 42.0, 25.0, 21.0, 25.0, 10.0, 10.0, 1.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.256855010986328, -7.958423614501953, -7.659992694854736, -7.361561298370361, -7.0631303787231445, -6.7646989822387695, -6.4662675857543945, -6.1678361892700195, -5.869405269622803, -5.570973873138428, -5.272542953491211, -4.974111557006836, -4.675680160522461, -4.377249240875244, -4.078817844390869, -3.7803866863250732, -3.4819555282592773, -3.1835243701934814, -2.8850932121276855, -2.5866618156433105, -2.2882306575775146, -1.9897994995117188, -1.6913682222366333, -1.3929369449615479, -1.094505786895752, -0.7960745692253113, -0.4976433515548706, -0.19921213388442993, 0.09921908378601074, 0.39765024185180664, 0.6960815191268921, 0.9945127964019775, 1.2929449081420898, 1.5913760662078857, 1.8898073434829712, 2.1882386207580566, 2.4866697788238525, 2.7851009368896484, 3.0835323333740234, 3.3819634914398193, 3.6803946495056152, 3.978825807571411, 4.277256965637207, 4.575688362121582, 4.874119758605957, 5.172550678253174, 5.470982074737549, 5.769412994384766, 6.067844390869141, 6.366275787353516, 6.664706707000732, 6.963138103485107, 7.261569023132324, 7.560000419616699, 7.858431816101074, 8.15686321258545, 8.455293655395508, 8.753725051879883, 9.052156448364258, 9.350586891174316, 9.649018287658691, 9.947449684143066, 10.245881080627441, 10.544312477111816, 10.842743873596191]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 8.0, 7.0, 12.0, 7.0, 8.0, 12.0, 6.0, 13.0, 18.0, 16.0, 24.0, 22.0, 18.0, 43.0, 19.0, 38.0, 32.0, 25.0, 41.0, 37.0, 40.0, 44.0, 39.0, 30.0, 43.0, 33.0, 33.0, 33.0, 35.0, 26.0, 36.0, 23.0, 19.0, 24.0, 18.0, 22.0, 25.0, 8.0, 15.0, 7.0, 9.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9709115028381348, -3.8391921520233154, -3.707473039627075, -3.575753688812256, -3.4440345764160156, -3.3123152256011963, -3.180595874786377, -3.0488767623901367, -2.9171574115753174, -2.785438060760498, -2.653718948364258, -2.5219995975494385, -2.390280246734619, -2.258561134338379, -2.1268417835235596, -1.9951225519180298, -1.8634033203125, -1.7316840887069702, -1.5999648571014404, -1.468245506286621, -1.3365262746810913, -1.2048070430755615, -1.0730876922607422, -0.9413684606552124, -0.8096492290496826, -0.6779299974441528, -0.5462107062339783, -0.4144914448261261, -0.2827721834182739, -0.15105295181274414, -0.01933366060256958, 0.11238563060760498, 0.24410486221313477, 0.37582412362098694, 0.5075433850288391, 0.6392626762390137, 0.7709819078445435, 0.9027011394500732, 1.0344204902648926, 1.1661397218704224, 1.2978589534759521, 1.429578185081482, 1.5612974166870117, 1.693016767501831, 1.8247359991073608, 1.9564552307128906, 2.08817458152771, 2.2198939323425293, 2.3516130447387695, 2.483332395553589, 2.615051507949829, 2.7467708587646484, 2.8784899711608887, 3.010209321975708, 3.1419286727905273, 3.2736477851867676, 3.405367136001587, 3.5370864868164062, 3.6688055992126465, 3.800524950027466, 3.932244300842285, 4.063963413238525, 4.195682525634766, 4.327402114868164, 4.459121227264404]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 5.0, 9.0, 7.0, 10.0, 12.0, 20.0, 23.0, 46.0, 61.0, 68.0, 139.0, 159.0, 281.0, 454.0, 678.0, 1048.0, 1851.0, 2975.0, 4947.0, 8522.0, 14791.0, 25915.0, 47929.0, 89841.0, 175287.0, 347675.0, 642379.0, 907245.0, 828155.0, 520793.0, 273099.0, 139445.0, 72378.0, 38121.0, 21033.0, 11995.0, 6807.0, 4018.0, 2342.0, 1363.0, 857.0, 562.0, 321.0, 214.0, 137.0, 93.0, 62.0, 50.0, 27.0, 13.0, 9.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.06640625, -6.84423828125, -6.6220703125, -6.39990234375, -6.177734375, -5.95556640625, -5.7333984375, -5.51123046875, -5.2890625, -5.06689453125, -4.8447265625, -4.62255859375, -4.400390625, -4.17822265625, -3.9560546875, -3.73388671875, -3.51171875, -3.28955078125, -3.0673828125, -2.84521484375, -2.623046875, -2.40087890625, -2.1787109375, -1.95654296875, -1.734375, -1.51220703125, -1.2900390625, -1.06787109375, -0.845703125, -0.62353515625, -0.4013671875, -0.17919921875, 0.04296875, 0.26513671875, 0.4873046875, 0.70947265625, 0.931640625, 1.15380859375, 1.3759765625, 1.59814453125, 1.8203125, 2.04248046875, 2.2646484375, 2.48681640625, 2.708984375, 2.93115234375, 3.1533203125, 3.37548828125, 3.59765625, 3.81982421875, 4.0419921875, 4.26416015625, 4.486328125, 4.70849609375, 4.9306640625, 5.15283203125, 5.375, 5.59716796875, 5.8193359375, 6.04150390625, 6.263671875, 6.48583984375, 6.7080078125, 6.93017578125, 7.15234375]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 3.0, 7.0, 7.0, 8.0, 12.0, 12.0, 10.0, 24.0, 32.0, 24.0, 31.0, 34.0, 38.0, 45.0, 41.0, 49.0, 59.0, 58.0, 47.0, 35.0, 36.0, 49.0, 36.0, 43.0, 42.0, 43.0, 35.0, 25.0, 31.0, 19.0, 13.0, 7.0, 9.0, 7.0, 9.0, 9.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.822662353515625, -3.67071533203125, -3.518768310546875, -3.3668212890625, -3.214874267578125, -3.06292724609375, -2.910980224609375, -2.759033203125, -2.607086181640625, -2.45513916015625, -2.303192138671875, -2.1512451171875, -1.999298095703125, -1.84735107421875, -1.695404052734375, -1.54345703125, -1.391510009765625, -1.23956298828125, -1.087615966796875, -0.9356689453125, -0.783721923828125, -0.63177490234375, -0.479827880859375, -0.327880859375, -0.175933837890625, -0.02398681640625, 0.127960205078125, 0.2799072265625, 0.431854248046875, 0.58380126953125, 0.735748291015625, 0.8876953125, 1.039642333984375, 1.19158935546875, 1.343536376953125, 1.4954833984375, 1.647430419921875, 1.79937744140625, 1.951324462890625, 2.103271484375, 2.255218505859375, 2.40716552734375, 2.559112548828125, 2.7110595703125, 2.863006591796875, 3.01495361328125, 3.166900634765625, 3.31884765625, 3.470794677734375, 3.62274169921875, 3.774688720703125, 3.9266357421875, 4.078582763671875, 4.23052978515625, 4.382476806640625, 4.534423828125, 4.686370849609375, 4.83831787109375, 4.990264892578125, 5.1422119140625, 5.294158935546875, 5.44610595703125, 5.598052978515625, 5.75]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 18.0, 35.0, 49.0, 110.0, 164.0, 253.0, 412.0, 727.0, 1243.0, 2199.0, 3628.0, 6580.0, 11854.0, 22001.0, 40766.0, 78443.0, 152811.0, 294116.0, 539645.0, 824988.0, 872000.0, 615402.0, 346684.0, 180697.0, 93642.0, 48797.0, 25480.0, 13776.0, 7642.0, 4294.0, 2400.0, 1336.0, 845.0, 474.0, 279.0, 186.0, 108.0, 59.0, 45.0, 22.0, 15.0, 19.0, 5.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.0723876953125, -7.785400390625, -7.4984130859375, -7.21142578125, -6.9244384765625, -6.637451171875, -6.3504638671875, -6.0634765625, -5.7764892578125, -5.489501953125, -5.2025146484375, -4.91552734375, -4.6285400390625, -4.341552734375, -4.0545654296875, -3.767578125, -3.4805908203125, -3.193603515625, -2.9066162109375, -2.61962890625, -2.3326416015625, -2.045654296875, -1.7586669921875, -1.4716796875, -1.1846923828125, -0.897705078125, -0.6107177734375, -0.32373046875, -0.0367431640625, 0.250244140625, 0.5372314453125, 0.82421875, 1.1112060546875, 1.398193359375, 1.6851806640625, 1.97216796875, 2.2591552734375, 2.546142578125, 2.8331298828125, 3.1201171875, 3.4071044921875, 3.694091796875, 3.9810791015625, 4.26806640625, 4.5550537109375, 4.842041015625, 5.1290283203125, 5.416015625, 5.7030029296875, 5.989990234375, 6.2769775390625, 6.56396484375, 6.8509521484375, 7.137939453125, 7.4249267578125, 7.7119140625, 7.9989013671875, 8.285888671875, 8.5728759765625, 8.85986328125, 9.1468505859375, 9.433837890625, 9.7208251953125, 10.0078125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 4.0, 6.0, 16.0, 15.0, 15.0, 29.0, 37.0, 37.0, 48.0, 61.0, 77.0, 111.0, 113.0, 143.0, 150.0, 204.0, 238.0, 254.0, 271.0, 257.0, 253.0, 202.0, 246.0, 233.0, 173.0, 152.0, 154.0, 110.0, 102.0, 70.0, 53.0, 43.0, 43.0, 37.0, 30.0, 23.0, 20.0, 9.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.716796875, -2.6339111328125, -2.551025390625, -2.4681396484375, -2.38525390625, -2.3023681640625, -2.219482421875, -2.1365966796875, -2.0537109375, -1.9708251953125, -1.887939453125, -1.8050537109375, -1.72216796875, -1.6392822265625, -1.556396484375, -1.4735107421875, -1.390625, -1.3077392578125, -1.224853515625, -1.1419677734375, -1.05908203125, -0.9761962890625, -0.893310546875, -0.8104248046875, -0.7275390625, -0.6446533203125, -0.561767578125, -0.4788818359375, -0.39599609375, -0.3131103515625, -0.230224609375, -0.1473388671875, -0.064453125, 0.0184326171875, 0.101318359375, 0.1842041015625, 0.26708984375, 0.3499755859375, 0.432861328125, 0.5157470703125, 0.5986328125, 0.6815185546875, 0.764404296875, 0.8472900390625, 0.93017578125, 1.0130615234375, 1.095947265625, 1.1788330078125, 1.26171875, 1.3446044921875, 1.427490234375, 1.5103759765625, 1.59326171875, 1.6761474609375, 1.759033203125, 1.8419189453125, 1.9248046875, 2.0076904296875, 2.090576171875, 2.1734619140625, 2.25634765625, 2.3392333984375, 2.422119140625, 2.5050048828125, 2.587890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 20.0, 23.0, 18.0, 22.0, 32.0, 26.0, 41.0, 41.0, 49.0, 48.0, 57.0, 53.0, 58.0, 72.0, 63.0, 61.0, 39.0, 40.0, 47.0, 37.0, 30.0, 24.0, 22.0, 11.0, 15.0, 3.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.052596092224121, -9.751803398132324, -9.451009750366211, -9.150217056274414, -8.849424362182617, -8.54863166809082, -8.247838020324707, -7.94704532623291, -7.646252155303955, -7.345458984375, -7.044666290283203, -6.743873119354248, -6.443079948425293, -6.142287254333496, -5.841494083404541, -5.540700912475586, -5.239908218383789, -4.939115047454834, -4.638322353363037, -4.337529182434082, -4.036736488342285, -3.73594331741333, -3.435150146484375, -3.134357213973999, -2.833564281463623, -2.532771348953247, -2.231978416442871, -1.931185245513916, -1.63039231300354, -1.329599380493164, -1.0288063287734985, -0.728013277053833, -0.42722129821777344, -0.12642830610275269, 0.17436468601226807, 0.4751576781272888, 0.7759506702423096, 1.0767436027526855, 1.377536654472351, 1.6783297061920166, 1.9791226387023926, 2.2799155712127686, 2.5807085037231445, 2.8815016746520996, 3.1822946071624756, 3.4830875396728516, 3.7838807106018066, 4.084673881530762, 4.385466575622559, 4.686259746551514, 4.9870524406433105, 5.287845611572266, 5.5886383056640625, 5.889431476593018, 6.190224647521973, 6.4910173416137695, 6.791810512542725, 7.09260368347168, 7.393396377563477, 7.694189548492432, 7.994982719421387, 8.295775413513184, 8.59656810760498, 8.897361755371094, 9.19815444946289]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 13.0, 12.0, 16.0, 11.0, 15.0, 10.0, 17.0, 36.0, 24.0, 32.0, 28.0, 21.0, 31.0, 30.0, 42.0, 38.0, 27.0, 43.0, 44.0, 28.0, 53.0, 37.0, 35.0, 40.0, 34.0, 36.0, 26.0, 30.0, 27.0, 26.0, 20.0, 17.0, 24.0, 12.0, 12.0, 8.0, 5.0, 11.0, 6.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.544286251068115, -5.38059663772583, -5.216907024383545, -5.05321741104126, -4.889527797698975, -4.7258381843566895, -4.562148571014404, -4.398458957672119, -4.234769344329834, -4.071079730987549, -3.9073901176452637, -3.7437005043029785, -3.5800108909606934, -3.416321277618408, -3.252631664276123, -3.088942050933838, -2.9252524375915527, -2.7615628242492676, -2.5978732109069824, -2.4341835975646973, -2.270493984222412, -2.106804370880127, -1.9431147575378418, -1.7794251441955566, -1.6157355308532715, -1.4520459175109863, -1.2883563041687012, -1.124666690826416, -0.9609770774841309, -0.7972874641418457, -0.6335978507995605, -0.4699082374572754, -0.30621910095214844, -0.14252948760986328, 0.021160125732421875, 0.18484973907470703, 0.3485393524169922, 0.5122289657592773, 0.6759185791015625, 0.8396081924438477, 1.0032978057861328, 1.166987419128418, 1.3306770324707031, 1.4943666458129883, 1.6580562591552734, 1.8217458724975586, 1.9854354858398438, 2.149125099182129, 2.312814712524414, 2.476504325866699, 2.6401939392089844, 2.8038835525512695, 2.9675731658935547, 3.13126277923584, 3.294952392578125, 3.45864200592041, 3.6223316192626953, 3.7860212326049805, 3.9497108459472656, 4.113400459289551, 4.277090072631836, 4.440779685974121, 4.604469299316406, 4.768158912658691, 4.931848526000977]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 1.0, 7.0, 11.0, 8.0, 23.0, 17.0, 35.0, 73.0, 93.0, 115.0, 194.0, 324.0, 501.0, 741.0, 1217.0, 2139.0, 3366.0, 5548.0, 9446.0, 16172.0, 27408.0, 47725.0, 81612.0, 132071.0, 183242.0, 187068.0, 139279.0, 87014.0, 51309.0, 29384.0, 17032.0, 10141.0, 5950.0, 3526.0, 2116.0, 1317.0, 812.0, 518.0, 330.0, 228.0, 139.0, 92.0, 66.0, 44.0, 25.0, 23.0, 14.0, 15.0, 12.0, 8.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6492996215820312, -0.6277008056640625, -0.6061019897460938, -0.584503173828125, -0.5629043579101562, -0.5413055419921875, -0.5197067260742188, -0.49810791015625, -0.47650909423828125, -0.4549102783203125, -0.43331146240234375, -0.411712646484375, -0.39011383056640625, -0.3685150146484375, -0.34691619873046875, -0.3253173828125, -0.30371856689453125, -0.2821197509765625, -0.26052093505859375, -0.238922119140625, -0.21732330322265625, -0.1957244873046875, -0.17412567138671875, -0.15252685546875, -0.13092803955078125, -0.1093292236328125, -0.08773040771484375, -0.066131591796875, -0.04453277587890625, -0.0229339599609375, -0.00133514404296875, 0.020263671875, 0.04186248779296875, 0.0634613037109375, 0.08506011962890625, 0.106658935546875, 0.12825775146484375, 0.1498565673828125, 0.17145538330078125, 0.19305419921875, 0.21465301513671875, 0.2362518310546875, 0.25785064697265625, 0.279449462890625, 0.30104827880859375, 0.3226470947265625, 0.34424591064453125, 0.3658447265625, 0.38744354248046875, 0.4090423583984375, 0.43064117431640625, 0.452239990234375, 0.47383880615234375, 0.4954376220703125, 0.5170364379882812, 0.53863525390625, 0.5602340698242188, 0.5818328857421875, 0.6034317016601562, 0.625030517578125, 0.6466293334960938, 0.6682281494140625, 0.6898269653320312, 0.71142578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 2.0, 3.0, 9.0, 9.0, 11.0, 12.0, 10.0, 7.0, 14.0, 17.0, 30.0, 23.0, 29.0, 29.0, 32.0, 28.0, 35.0, 35.0, 46.0, 42.0, 40.0, 58.0, 44.0, 39.0, 53.0, 29.0, 36.0, 38.0, 34.0, 41.0, 21.0, 26.0, 21.0, 18.0, 20.0, 17.0, 11.0, 7.0, 8.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.75775146484375, -5.5623779296875, -5.36700439453125, -5.171630859375, -4.97625732421875, -4.7808837890625, -4.58551025390625, -4.39013671875, -4.19476318359375, -3.9993896484375, -3.80401611328125, -3.608642578125, -3.41326904296875, -3.2178955078125, -3.02252197265625, -2.8271484375, -2.63177490234375, -2.4364013671875, -2.24102783203125, -2.045654296875, -1.85028076171875, -1.6549072265625, -1.45953369140625, -1.26416015625, -1.06878662109375, -0.8734130859375, -0.67803955078125, -0.482666015625, -0.28729248046875, -0.0919189453125, 0.10345458984375, 0.298828125, 0.49420166015625, 0.6895751953125, 0.88494873046875, 1.080322265625, 1.27569580078125, 1.4710693359375, 1.66644287109375, 1.86181640625, 2.05718994140625, 2.2525634765625, 2.44793701171875, 2.643310546875, 2.83868408203125, 3.0340576171875, 3.22943115234375, 3.4248046875, 3.62017822265625, 3.8155517578125, 4.01092529296875, 4.206298828125, 4.40167236328125, 4.5970458984375, 4.79241943359375, 4.98779296875, 5.18316650390625, 5.3785400390625, 5.57391357421875, 5.769287109375, 5.96466064453125, 6.1600341796875, 6.35540771484375, 6.55078125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 11.0, 5.0, 13.0, 13.0, 12.0, 18.0, 29.0, 38.0, 46.0, 56.0, 84.0, 120.0, 146.0, 212.0, 306.0, 506.0, 682.0, 1115.0, 1899.0, 3222.0, 6055.0, 12095.0, 26672.0, 184586.0, 736996.0, 39928.0, 15604.0, 7679.0, 4032.0, 2341.0, 1397.0, 809.0, 515.0, 356.0, 257.0, 196.0, 140.0, 96.0, 60.0, 54.0, 42.0, 21.0, 26.0, 23.0, 7.0, 6.0, 8.0, 5.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.912109375, -1.8487548828125, -1.785400390625, -1.7220458984375, -1.65869140625, -1.5953369140625, -1.531982421875, -1.4686279296875, -1.4052734375, -1.3419189453125, -1.278564453125, -1.2152099609375, -1.15185546875, -1.0885009765625, -1.025146484375, -0.9617919921875, -0.8984375, -0.8350830078125, -0.771728515625, -0.7083740234375, -0.64501953125, -0.5816650390625, -0.518310546875, -0.4549560546875, -0.3916015625, -0.3282470703125, -0.264892578125, -0.2015380859375, -0.13818359375, -0.0748291015625, -0.011474609375, 0.0518798828125, 0.115234375, 0.1785888671875, 0.241943359375, 0.3052978515625, 0.36865234375, 0.4320068359375, 0.495361328125, 0.5587158203125, 0.6220703125, 0.6854248046875, 0.748779296875, 0.8121337890625, 0.87548828125, 0.9388427734375, 1.002197265625, 1.0655517578125, 1.12890625, 1.1922607421875, 1.255615234375, 1.3189697265625, 1.38232421875, 1.4456787109375, 1.509033203125, 1.5723876953125, 1.6357421875, 1.6990966796875, 1.762451171875, 1.8258056640625, 1.88916015625, 1.9525146484375, 2.015869140625, 2.0792236328125, 2.142578125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 8.0, 7.0, 8.0, 8.0, 13.0, 11.0, 11.0, 19.0, 22.0, 22.0, 20.0, 22.0, 34.0, 33.0, 32.0, 40.0, 31.0, 33.0, 41.0, 40.0, 38.0, 43.0, 38.0, 46.0, 38.0, 32.0, 33.0, 29.0, 31.0, 36.0, 27.0, 30.0, 21.0, 15.0, 14.0, 12.0, 9.0, 10.0, 13.0, 3.0, 4.0, 9.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.703125, -3.583343505859375, -3.46356201171875, -3.343780517578125, -3.2239990234375, -3.104217529296875, -2.98443603515625, -2.864654541015625, -2.744873046875, -2.625091552734375, -2.50531005859375, -2.385528564453125, -2.2657470703125, -2.145965576171875, -2.02618408203125, -1.906402587890625, -1.78662109375, -1.666839599609375, -1.54705810546875, -1.427276611328125, -1.3074951171875, -1.187713623046875, -1.06793212890625, -0.948150634765625, -0.828369140625, -0.708587646484375, -0.58880615234375, -0.469024658203125, -0.3492431640625, -0.229461669921875, -0.10968017578125, 0.010101318359375, 0.1298828125, 0.249664306640625, 0.36944580078125, 0.489227294921875, 0.6090087890625, 0.728790283203125, 0.84857177734375, 0.968353271484375, 1.088134765625, 1.207916259765625, 1.32769775390625, 1.447479248046875, 1.5672607421875, 1.687042236328125, 1.80682373046875, 1.926605224609375, 2.04638671875, 2.166168212890625, 2.28594970703125, 2.405731201171875, 2.5255126953125, 2.645294189453125, 2.76507568359375, 2.884857177734375, 3.004638671875, 3.124420166015625, 3.24420166015625, 3.363983154296875, 3.4837646484375, 3.603546142578125, 3.72332763671875, 3.843109130859375, 3.962890625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 5.0, 5.0, 11.0, 12.0, 28.0, 25.0, 56.0, 65.0, 94.0, 115.0, 184.0, 285.0, 421.0, 642.0, 979.0, 1461.0, 2147.0, 3379.0, 5138.0, 8188.0, 13455.0, 23715.0, 108709.0, 799764.0, 34049.0, 17211.0, 10228.0, 6368.0, 3996.0, 2624.0, 1754.0, 1149.0, 754.0, 491.0, 336.0, 220.0, 154.0, 111.0, 72.0, 49.0, 32.0, 30.0, 14.0, 11.0, 7.0, 8.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.349609375, -0.33908843994140625, -0.3285675048828125, -0.31804656982421875, -0.307525634765625, -0.29700469970703125, -0.2864837646484375, -0.27596282958984375, -0.26544189453125, -0.25492095947265625, -0.2444000244140625, -0.23387908935546875, -0.223358154296875, -0.21283721923828125, -0.2023162841796875, -0.19179534912109375, -0.1812744140625, -0.17075347900390625, -0.1602325439453125, -0.14971160888671875, -0.139190673828125, -0.12866973876953125, -0.1181488037109375, -0.10762786865234375, -0.09710693359375, -0.08658599853515625, -0.0760650634765625, -0.06554412841796875, -0.055023193359375, -0.04450225830078125, -0.0339813232421875, -0.02346038818359375, -0.012939453125, -0.00241851806640625, 0.0081024169921875, 0.01862335205078125, 0.029144287109375, 0.03966522216796875, 0.0501861572265625, 0.06070709228515625, 0.07122802734375, 0.08174896240234375, 0.0922698974609375, 0.10279083251953125, 0.113311767578125, 0.12383270263671875, 0.1343536376953125, 0.14487457275390625, 0.1553955078125, 0.16591644287109375, 0.1764373779296875, 0.18695831298828125, 0.197479248046875, 0.20800018310546875, 0.2185211181640625, 0.22904205322265625, 0.23956298828125, 0.25008392333984375, 0.2606048583984375, 0.27112579345703125, 0.281646728515625, 0.29216766357421875, 0.3026885986328125, 0.31320953369140625, 0.32373046875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 10.0, 19.0, 19.0, 23.0, 26.0, 28.0, 33.0, 29.0, 24.0, 34.0, 30.0, 43.0, 37.0, 38.0, 29.0, 38.0, 44.0, 55.0, 57.0, 24.0, 38.0, 40.0, 34.0, 38.0, 26.0, 19.0, 21.0, 27.0, 9.0, 21.0, 12.0, 8.0, 11.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3769214749336243e-05, -2.2921711206436157e-05, -2.2074207663536072e-05, -2.1226704120635986e-05, -2.03792005777359e-05, -1.9531697034835815e-05, -1.868419349193573e-05, -1.7836689949035645e-05, -1.698918640613556e-05, -1.6141682863235474e-05, -1.5294179320335388e-05, -1.4446675777435303e-05, -1.3599172234535217e-05, -1.2751668691635132e-05, -1.1904165148735046e-05, -1.1056661605834961e-05, -1.0209158062934875e-05, -9.36165452003479e-06, -8.514150977134705e-06, -7.666647434234619e-06, -6.819143891334534e-06, -5.971640348434448e-06, -5.124136805534363e-06, -4.276633262634277e-06, -3.429129719734192e-06, -2.5816261768341064e-06, -1.734122633934021e-06, -8.866190910339355e-07, -3.91155481338501e-08, 8.083879947662354e-07, 1.6558915376663208e-06, 2.5033950805664062e-06, 3.3508986234664917e-06, 4.198402166366577e-06, 5.045905709266663e-06, 5.893409252166748e-06, 6.7409127950668335e-06, 7.588416337966919e-06, 8.435919880867004e-06, 9.28342342376709e-06, 1.0130926966667175e-05, 1.097843050956726e-05, 1.1825934052467346e-05, 1.2673437595367432e-05, 1.3520941138267517e-05, 1.4368444681167603e-05, 1.5215948224067688e-05, 1.6063451766967773e-05, 1.691095530986786e-05, 1.7758458852767944e-05, 1.860596239566803e-05, 1.9453465938568115e-05, 2.03009694814682e-05, 2.1148473024368286e-05, 2.199597656726837e-05, 2.2843480110168457e-05, 2.3690983653068542e-05, 2.4538487195968628e-05, 2.5385990738868713e-05, 2.62334942817688e-05, 2.7080997824668884e-05, 2.792850136756897e-05, 2.8776004910469055e-05, 2.962350845336914e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 17.0, 23.0, 28.0, 37.0, 54.0, 89.0, 119.0, 198.0, 294.0, 484.0, 829.0, 1229.0, 1873.0, 2948.0, 4883.0, 7726.0, 12928.0, 21809.0, 36345.0, 61327.0, 100451.0, 150181.0, 184201.0, 165239.0, 115510.0, 71664.0, 42942.0, 25444.0, 15322.0, 9088.0, 5701.0, 3518.0, 2197.0, 1380.0, 905.0, 567.0, 350.0, 222.0, 143.0, 98.0, 66.0, 43.0, 29.0, 17.0, 13.0, 8.0, 2.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1942138671875, -0.18826675415039062, -0.18231964111328125, -0.17637252807617188, -0.1704254150390625, -0.16447830200195312, -0.15853118896484375, -0.15258407592773438, -0.146636962890625, -0.14068984985351562, -0.13474273681640625, -0.12879562377929688, -0.1228485107421875, -0.11690139770507812, -0.11095428466796875, -0.10500717163085938, -0.09906005859375, -0.09311294555664062, -0.08716583251953125, -0.08121871948242188, -0.0752716064453125, -0.06932449340820312, -0.06337738037109375, -0.057430267333984375, -0.051483154296875, -0.045536041259765625, -0.03958892822265625, -0.033641815185546875, -0.0276947021484375, -0.021747589111328125, -0.01580047607421875, -0.009853363037109375, -0.00390625, 0.002040863037109375, 0.00798797607421875, 0.013935089111328125, 0.0198822021484375, 0.025829315185546875, 0.03177642822265625, 0.037723541259765625, 0.043670654296875, 0.049617767333984375, 0.05556488037109375, 0.061511993408203125, 0.0674591064453125, 0.07340621948242188, 0.07935333251953125, 0.08530044555664062, 0.09124755859375, 0.09719467163085938, 0.10314178466796875, 0.10908889770507812, 0.1150360107421875, 0.12098312377929688, 0.12693023681640625, 0.13287734985351562, 0.138824462890625, 0.14477157592773438, 0.15071868896484375, 0.15666580200195312, 0.1626129150390625, 0.16856002807617188, 0.17450714111328125, 0.18045425415039062, 0.1864013671875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 3.0, 4.0, 9.0, 15.0, 14.0, 16.0, 26.0, 34.0, 29.0, 43.0, 39.0, 47.0, 53.0, 44.0, 71.0, 56.0, 69.0, 50.0, 48.0, 54.0, 54.0, 39.0, 25.0, 30.0, 23.0, 19.0, 16.0, 13.0, 8.0, 9.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.055511474609375, -0.05358457565307617, -0.051657676696777344, -0.049730777740478516, -0.04780387878417969, -0.04587697982788086, -0.04395008087158203, -0.0420231819152832, -0.040096282958984375, -0.03816938400268555, -0.03624248504638672, -0.03431558609008789, -0.03238868713378906, -0.030461788177490234, -0.028534889221191406, -0.026607990264892578, -0.02468109130859375, -0.022754192352294922, -0.020827293395996094, -0.018900394439697266, -0.016973495483398438, -0.01504659652709961, -0.013119697570800781, -0.011192798614501953, -0.009265899658203125, -0.007339000701904297, -0.005412101745605469, -0.0034852027893066406, -0.0015583038330078125, 0.0003685951232910156, 0.0022954940795898438, 0.004222393035888672, 0.0061492919921875, 0.008076190948486328, 0.010003089904785156, 0.011929988861083984, 0.013856887817382812, 0.01578378677368164, 0.01771068572998047, 0.019637584686279297, 0.021564483642578125, 0.023491382598876953, 0.02541828155517578, 0.02734518051147461, 0.029272079467773438, 0.031198978424072266, 0.033125877380371094, 0.03505277633666992, 0.03697967529296875, 0.03890657424926758, 0.040833473205566406, 0.042760372161865234, 0.04468727111816406, 0.04661417007446289, 0.04854106903076172, 0.05046796798706055, 0.052394866943359375, 0.0543217658996582, 0.05624866485595703, 0.05817556381225586, 0.06010246276855469, 0.062029361724853516, 0.06395626068115234, 0.06588315963745117, 0.06781005859375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 6.0, 13.0, 22.0, 18.0, 22.0, 21.0, 37.0, 32.0, 41.0, 47.0, 47.0, 47.0, 58.0, 57.0, 65.0, 70.0, 48.0, 60.0, 41.0, 44.0, 37.0, 34.0, 31.0, 21.0, 18.0, 12.0, 10.0, 8.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.832262992858887, -9.5341215133667, -9.235980033874512, -8.937837600708008, -8.63969612121582, -8.341554641723633, -8.043413162231445, -7.745271682739258, -7.447129726409912, -7.148988246917725, -6.850846290588379, -6.552704811096191, -6.254563331604004, -5.956421375274658, -5.658279895782471, -5.360137939453125, -5.0619964599609375, -4.76385498046875, -4.465713024139404, -4.167571544647217, -3.86942982673645, -3.5712881088256836, -3.273146629333496, -2.9750049114227295, -2.676863193511963, -2.3787214756011963, -2.0805797576904297, -1.7824382781982422, -1.4842965602874756, -1.186154842376709, -0.8880132436752319, -0.5898716449737549, -0.2917299270629883, 0.006411731243133545, 0.30455338954925537, 0.6026950478553772, 0.900836706161499, 1.1989784240722656, 1.4971200227737427, 1.7952616214752197, 2.0934033393859863, 2.391545057296753, 2.6896867752075195, 2.987828254699707, 3.2859699726104736, 3.5841116905212402, 3.8822531700134277, 4.180395126342773, 4.478536605834961, 4.776678085327148, 5.074820041656494, 5.372961521148682, 5.671103477478027, 5.969244956970215, 6.267386436462402, 6.56552791595459, 6.8636698722839355, 7.161811351776123, 7.459953308105469, 7.758094787597656, 8.056236267089844, 8.354377746582031, 8.652520179748535, 8.950661659240723, 9.24880313873291]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 7.0, 7.0, 15.0, 12.0, 16.0, 9.0, 14.0, 12.0, 17.0, 35.0, 29.0, 30.0, 25.0, 23.0, 31.0, 36.0, 36.0, 37.0, 29.0, 51.0, 36.0, 31.0, 47.0, 45.0, 32.0, 38.0, 34.0, 32.0, 30.0, 30.0, 28.0, 25.0, 19.0, 14.0, 24.0, 12.0, 14.0, 7.0, 5.0, 10.0, 7.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.478827476501465, -5.315625190734863, -5.1524224281311035, -4.989220142364502, -4.8260178565979, -4.662815570831299, -4.499612808227539, -4.3364105224609375, -4.173208236694336, -4.010005950927734, -3.8468034267425537, -3.683600902557373, -3.5203986167907715, -3.357196092605591, -3.19399356842041, -3.0307912826538086, -2.867588758468628, -2.7043862342834473, -2.5411839485168457, -2.377981424331665, -2.2147791385650635, -2.051576614379883, -1.8883742094039917, -1.7251718044281006, -1.5619693994522095, -1.3987669944763184, -1.2355645895004272, -1.0723621845245361, -0.9091597199440002, -0.7459573149681091, -0.5827548503875732, -0.41955244541168213, -0.256350040435791, -0.09314762055873871, 0.0700547993183136, 0.2332572340965271, 0.3964596390724182, 0.5596620440483093, 0.7228645086288452, 0.8860669136047363, 1.0492693185806274, 1.2124717235565186, 1.3756741285324097, 1.5388765335083008, 1.7020790576934814, 1.865281343460083, 2.0284838676452637, 2.1916861534118652, 2.354888677597046, 2.5180912017822266, 2.681293487548828, 2.844496011734009, 3.0076982975006104, 3.170900821685791, 3.3341031074523926, 3.4973056316375732, 3.660508155822754, 3.8237106800079346, 3.986912965774536, 4.150115489959717, 4.313317775726318, 4.47652006149292, 4.63972282409668, 4.802925109863281, 4.966127395629883]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 9.0, 9.0, 22.0, 21.0, 47.0, 60.0, 94.0, 147.0, 229.0, 325.0, 463.0, 735.0, 1195.0, 1746.0, 2808.0, 4309.0, 6651.0, 9953.0, 14834.0, 22394.0, 32843.0, 46396.0, 63640.0, 82631.0, 99908.0, 110825.0, 112827.0, 104792.0, 89115.0, 70896.0, 53277.0, 37934.0, 25945.0, 17783.0, 11644.0, 7599.0, 5015.0, 3284.0, 2128.0, 1416.0, 900.0, 566.0, 363.0, 285.0, 163.0, 115.0, 72.0, 54.0, 34.0, 20.0, 18.0, 5.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-3.8984375, -3.77734375, -3.65625, -3.53515625, -3.4140625, -3.29296875, -3.171875, -3.05078125, -2.9296875, -2.80859375, -2.6875, -2.56640625, -2.4453125, -2.32421875, -2.203125, -2.08203125, -1.9609375, -1.83984375, -1.71875, -1.59765625, -1.4765625, -1.35546875, -1.234375, -1.11328125, -0.9921875, -0.87109375, -0.75, -0.62890625, -0.5078125, -0.38671875, -0.265625, -0.14453125, -0.0234375, 0.09765625, 0.21875, 0.33984375, 0.4609375, 0.58203125, 0.703125, 0.82421875, 0.9453125, 1.06640625, 1.1875, 1.30859375, 1.4296875, 1.55078125, 1.671875, 1.79296875, 1.9140625, 2.03515625, 2.15625, 2.27734375, 2.3984375, 2.51953125, 2.640625, 2.76171875, 2.8828125, 3.00390625, 3.125, 3.24609375, 3.3671875, 3.48828125, 3.609375, 3.73046875, 3.8515625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 9.0, 13.0, 14.0, 11.0, 24.0, 17.0, 18.0, 26.0, 37.0, 26.0, 32.0, 18.0, 32.0, 38.0, 46.0, 31.0, 40.0, 48.0, 28.0, 39.0, 47.0, 32.0, 39.0, 41.0, 25.0, 44.0, 30.0, 31.0, 23.0, 22.0, 24.0, 22.0, 7.0, 10.0, 9.0, 7.0, 5.0, 9.0, 6.0, 1.0, 7.0, 3.0, 2.0, 2.0, 1.0], "bins": [-6.69140625, -6.51092529296875, -6.3304443359375, -6.14996337890625, -5.969482421875, -5.78900146484375, -5.6085205078125, -5.42803955078125, -5.24755859375, -5.06707763671875, -4.8865966796875, -4.70611572265625, -4.525634765625, -4.34515380859375, -4.1646728515625, -3.98419189453125, -3.8037109375, -3.62322998046875, -3.4427490234375, -3.26226806640625, -3.081787109375, -2.90130615234375, -2.7208251953125, -2.54034423828125, -2.35986328125, -2.17938232421875, -1.9989013671875, -1.81842041015625, -1.637939453125, -1.45745849609375, -1.2769775390625, -1.09649658203125, -0.916015625, -0.73553466796875, -0.5550537109375, -0.37457275390625, -0.194091796875, -0.01361083984375, 0.1668701171875, 0.34735107421875, 0.52783203125, 0.70831298828125, 0.8887939453125, 1.06927490234375, 1.249755859375, 1.43023681640625, 1.6107177734375, 1.79119873046875, 1.9716796875, 2.15216064453125, 2.3326416015625, 2.51312255859375, 2.693603515625, 2.87408447265625, 3.0545654296875, 3.23504638671875, 3.41552734375, 3.59600830078125, 3.7764892578125, 3.95697021484375, 4.137451171875, 4.31793212890625, 4.4984130859375, 4.67889404296875, 4.859375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 7.0, 8.0, 7.0, 24.0, 21.0, 34.0, 52.0, 85.0, 112.0, 179.0, 275.0, 445.0, 679.0, 1075.0, 1722.0, 2652.0, 4383.0, 6939.0, 10829.0, 16856.0, 26276.0, 39140.0, 56839.0, 78006.0, 100234.0, 117554.0, 123762.0, 116502.0, 99299.0, 77704.0, 56173.0, 38992.0, 25871.0, 16858.0, 10662.0, 6653.0, 4335.0, 2684.0, 1675.0, 1064.0, 709.0, 397.0, 281.0, 165.0, 107.0, 67.0, 57.0, 39.0, 27.0, 13.0, 10.0, 11.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.40234375, -4.2579345703125, -4.113525390625, -3.9691162109375, -3.82470703125, -3.6802978515625, -3.535888671875, -3.3914794921875, -3.2470703125, -3.1026611328125, -2.958251953125, -2.8138427734375, -2.66943359375, -2.5250244140625, -2.380615234375, -2.2362060546875, -2.091796875, -1.9473876953125, -1.802978515625, -1.6585693359375, -1.51416015625, -1.3697509765625, -1.225341796875, -1.0809326171875, -0.9365234375, -0.7921142578125, -0.647705078125, -0.5032958984375, -0.35888671875, -0.2144775390625, -0.070068359375, 0.0743408203125, 0.21875, 0.3631591796875, 0.507568359375, 0.6519775390625, 0.79638671875, 0.9407958984375, 1.085205078125, 1.2296142578125, 1.3740234375, 1.5184326171875, 1.662841796875, 1.8072509765625, 1.95166015625, 2.0960693359375, 2.240478515625, 2.3848876953125, 2.529296875, 2.6737060546875, 2.818115234375, 2.9625244140625, 3.10693359375, 3.2513427734375, 3.395751953125, 3.5401611328125, 3.6845703125, 3.8289794921875, 3.973388671875, 4.1177978515625, 4.26220703125, 4.4066162109375, 4.551025390625, 4.6954345703125, 4.83984375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 3.0, 8.0, 6.0, 14.0, 10.0, 11.0, 14.0, 22.0, 30.0, 29.0, 41.0, 30.0, 37.0, 38.0, 33.0, 42.0, 62.0, 44.0, 39.0, 48.0, 60.0, 28.0, 58.0, 34.0, 34.0, 35.0, 29.0, 34.0, 21.0, 31.0, 23.0, 15.0, 9.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.12774658203125, -3.9976806640625, -3.86761474609375, -3.737548828125, -3.60748291015625, -3.4774169921875, -3.34735107421875, -3.21728515625, -3.08721923828125, -2.9571533203125, -2.82708740234375, -2.697021484375, -2.56695556640625, -2.4368896484375, -2.30682373046875, -2.1767578125, -2.04669189453125, -1.9166259765625, -1.78656005859375, -1.656494140625, -1.52642822265625, -1.3963623046875, -1.26629638671875, -1.13623046875, -1.00616455078125, -0.8760986328125, -0.74603271484375, -0.615966796875, -0.48590087890625, -0.3558349609375, -0.22576904296875, -0.095703125, 0.03436279296875, 0.1644287109375, 0.29449462890625, 0.424560546875, 0.55462646484375, 0.6846923828125, 0.81475830078125, 0.94482421875, 1.07489013671875, 1.2049560546875, 1.33502197265625, 1.465087890625, 1.59515380859375, 1.7252197265625, 1.85528564453125, 1.9853515625, 2.11541748046875, 2.2454833984375, 2.37554931640625, 2.505615234375, 2.63568115234375, 2.7657470703125, 2.89581298828125, 3.02587890625, 3.15594482421875, 3.2860107421875, 3.41607666015625, 3.546142578125, 3.67620849609375, 3.8062744140625, 3.93634033203125, 4.06640625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 7.0, 3.0, 15.0, 10.0, 19.0, 25.0, 47.0, 63.0, 91.0, 125.0, 194.0, 296.0, 433.0, 720.0, 1195.0, 1816.0, 2996.0, 4833.0, 8690.0, 14858.0, 26382.0, 46171.0, 79822.0, 125716.0, 170667.0, 180963.0, 147400.0, 97897.0, 58227.0, 33236.0, 18851.0, 10844.0, 6154.0, 3639.0, 2275.0, 1386.0, 882.0, 568.0, 342.0, 247.0, 144.0, 93.0, 73.0, 41.0, 29.0, 30.0, 19.0, 3.0, 4.0, 5.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0859375, -3.95501708984375, -3.8240966796875, -3.69317626953125, -3.562255859375, -3.43133544921875, -3.3004150390625, -3.16949462890625, -3.03857421875, -2.90765380859375, -2.7767333984375, -2.64581298828125, -2.514892578125, -2.38397216796875, -2.2530517578125, -2.12213134765625, -1.9912109375, -1.86029052734375, -1.7293701171875, -1.59844970703125, -1.467529296875, -1.33660888671875, -1.2056884765625, -1.07476806640625, -0.94384765625, -0.81292724609375, -0.6820068359375, -0.55108642578125, -0.420166015625, -0.28924560546875, -0.1583251953125, -0.02740478515625, 0.103515625, 0.23443603515625, 0.3653564453125, 0.49627685546875, 0.627197265625, 0.75811767578125, 0.8890380859375, 1.01995849609375, 1.15087890625, 1.28179931640625, 1.4127197265625, 1.54364013671875, 1.674560546875, 1.80548095703125, 1.9364013671875, 2.06732177734375, 2.1982421875, 2.32916259765625, 2.4600830078125, 2.59100341796875, 2.721923828125, 2.85284423828125, 2.9837646484375, 3.11468505859375, 3.24560546875, 3.37652587890625, 3.5074462890625, 3.63836669921875, 3.769287109375, 3.90020751953125, 4.0311279296875, 4.16204833984375, 4.29296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 3.0, 9.0, 13.0, 17.0, 14.0, 19.0, 36.0, 30.0, 47.0, 50.0, 61.0, 71.0, 86.0, 66.0, 60.0, 63.0, 68.0, 44.0, 38.0, 44.0, 21.0, 26.0, 17.0, 16.0, 12.0, 16.0, 8.0, 2.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005102157592773438, -0.0004954151809215546, -0.0004806146025657654, -0.0004658140242099762, -0.000451013445854187, -0.00043621286749839783, -0.00042141228914260864, -0.00040661171078681946, -0.0003918111324310303, -0.0003770105540752411, -0.0003622099757194519, -0.0003474093973636627, -0.00033260881900787354, -0.00031780824065208435, -0.00030300766229629517, -0.000288207083940506, -0.0002734065055847168, -0.0002586059272289276, -0.00024380534887313843, -0.00022900477051734924, -0.00021420419216156006, -0.00019940361380577087, -0.0001846030354499817, -0.0001698024570941925, -0.00015500187873840332, -0.00014020130038261414, -0.00012540072202682495, -0.00011060014367103577, -9.579956531524658e-05, -8.09989869594574e-05, -6.619840860366821e-05, -5.139783024787903e-05, -3.6597251892089844e-05, -2.179667353630066e-05, -6.996095180511475e-06, 7.80448317527771e-06, 2.2605061531066895e-05, 3.740563988685608e-05, 5.2206218242645264e-05, 6.700679659843445e-05, 8.180737495422363e-05, 9.660795331001282e-05, 0.000111408531665802, 0.0001262091100215912, 0.00014100968837738037, 0.00015581026673316956, 0.00017061084508895874, 0.00018541142344474792, 0.0002002120018005371, 0.0002150125801563263, 0.00022981315851211548, 0.00024461373686790466, 0.00025941431522369385, 0.00027421489357948303, 0.0002890154719352722, 0.0003038160502910614, 0.0003186166286468506, 0.00033341720700263977, 0.00034821778535842896, 0.00036301836371421814, 0.0003778189420700073, 0.0003926195204257965, 0.0004074200987815857, 0.0004222206771373749, 0.00043702125549316406]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 10.0, 14.0, 27.0, 50.0, 67.0, 81.0, 117.0, 170.0, 266.0, 431.0, 694.0, 1045.0, 1694.0, 2659.0, 4658.0, 7731.0, 13490.0, 24031.0, 42880.0, 76789.0, 124727.0, 174583.0, 188610.0, 151719.0, 98752.0, 57985.0, 32072.0, 17849.0, 10006.0, 5961.0, 3511.0, 2121.0, 1316.0, 819.0, 523.0, 368.0, 234.0, 142.0, 125.0, 74.0, 51.0, 28.0, 25.0, 16.0, 7.0, 4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.8359375, -4.69049072265625, -4.5450439453125, -4.39959716796875, -4.254150390625, -4.10870361328125, -3.9632568359375, -3.81781005859375, -3.67236328125, -3.52691650390625, -3.3814697265625, -3.23602294921875, -3.090576171875, -2.94512939453125, -2.7996826171875, -2.65423583984375, -2.5087890625, -2.36334228515625, -2.2178955078125, -2.07244873046875, -1.927001953125, -1.78155517578125, -1.6361083984375, -1.49066162109375, -1.34521484375, -1.19976806640625, -1.0543212890625, -0.90887451171875, -0.763427734375, -0.61798095703125, -0.4725341796875, -0.32708740234375, -0.181640625, -0.03619384765625, 0.1092529296875, 0.25469970703125, 0.400146484375, 0.54559326171875, 0.6910400390625, 0.83648681640625, 0.98193359375, 1.12738037109375, 1.2728271484375, 1.41827392578125, 1.563720703125, 1.70916748046875, 1.8546142578125, 2.00006103515625, 2.1455078125, 2.29095458984375, 2.4364013671875, 2.58184814453125, 2.727294921875, 2.87274169921875, 3.0181884765625, 3.16363525390625, 3.30908203125, 3.45452880859375, 3.5999755859375, 3.74542236328125, 3.890869140625, 4.03631591796875, 4.1817626953125, 4.32720947265625, 4.47265625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 9.0, 6.0, 4.0, 13.0, 12.0, 14.0, 13.0, 23.0, 26.0, 34.0, 42.0, 55.0, 54.0, 53.0, 68.0, 60.0, 66.0, 60.0, 65.0, 58.0, 56.0, 42.0, 20.0, 30.0, 21.0, 12.0, 15.0, 13.0, 15.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5048828125, -1.4627532958984375, -1.420623779296875, -1.3784942626953125, -1.33636474609375, -1.2942352294921875, -1.252105712890625, -1.2099761962890625, -1.1678466796875, -1.1257171630859375, -1.083587646484375, -1.0414581298828125, -0.99932861328125, -0.9571990966796875, -0.915069580078125, -0.8729400634765625, -0.830810546875, -0.7886810302734375, -0.746551513671875, -0.7044219970703125, -0.66229248046875, -0.6201629638671875, -0.578033447265625, -0.5359039306640625, -0.4937744140625, -0.4516448974609375, -0.409515380859375, -0.3673858642578125, -0.32525634765625, -0.2831268310546875, -0.240997314453125, -0.1988677978515625, -0.15673828125, -0.1146087646484375, -0.072479248046875, -0.0303497314453125, 0.01177978515625, 0.0539093017578125, 0.096038818359375, 0.1381683349609375, 0.1802978515625, 0.2224273681640625, 0.264556884765625, 0.3066864013671875, 0.34881591796875, 0.3909454345703125, 0.433074951171875, 0.4752044677734375, 0.517333984375, 0.5594635009765625, 0.601593017578125, 0.6437225341796875, 0.68585205078125, 0.7279815673828125, 0.770111083984375, 0.8122406005859375, 0.8543701171875, 0.8964996337890625, 0.938629150390625, 0.9807586669921875, 1.02288818359375, 1.0650177001953125, 1.107147216796875, 1.1492767333984375, 1.19140625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 8.0, 6.0, 8.0, 10.0, 12.0, 25.0, 14.0, 24.0, 34.0, 26.0, 36.0, 41.0, 55.0, 48.0, 42.0, 54.0, 55.0, 62.0, 65.0, 49.0, 51.0, 42.0, 46.0, 41.0, 34.0, 15.0, 21.0, 24.0, 12.0, 12.0, 6.0, 9.0, 1.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.650629043579102, -10.352104187011719, -10.053580284118652, -9.75505542755127, -9.456531524658203, -9.15800666809082, -8.859481811523438, -8.560957908630371, -8.262433052062988, -7.963908672332764, -7.665384292602539, -7.366859436035156, -7.068335056304932, -6.769810676574707, -6.471286296844482, -6.172761917114258, -5.874237537384033, -5.575713157653809, -5.277188777923584, -4.978664398193359, -4.680139541625977, -4.381615161895752, -4.083090782165527, -3.7845661640167236, -3.486041784286499, -3.1875174045562744, -2.8889927864074707, -2.590468406677246, -2.2919440269470215, -1.9934194087982178, -1.6948950290679932, -1.3963704109191895, -1.0978460311889648, -0.7993215322494507, -0.5007970929145813, -0.20227265357971191, 0.09625184535980225, 0.3947763442993164, 0.693300724029541, 0.9918253421783447, 1.2903497219085693, 1.5888742208480835, 1.8873987197875977, 2.1859230995178223, 2.484447479248047, 2.7829720973968506, 3.081496477127075, 3.380021095275879, 3.6785454750061035, 3.977069854736328, 4.275594234466553, 4.574118614196777, 4.87264347076416, 5.171167850494385, 5.469692230224609, 5.768217086791992, 6.066740989685059, 6.365265369415283, 6.663789749145508, 6.962314605712891, 7.260838985443115, 7.55936336517334, 7.8578877449035645, 8.156412124633789, 8.454936981201172]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 13.0, 12.0, 19.0, 19.0, 18.0, 26.0, 20.0, 26.0, 32.0, 34.0, 36.0, 37.0, 31.0, 43.0, 49.0, 50.0, 34.0, 37.0, 42.0, 37.0, 40.0, 30.0, 39.0, 37.0, 27.0, 25.0, 29.0, 23.0, 23.0, 16.0, 18.0, 10.0, 8.0, 13.0, 9.0, 9.0, 4.0, 5.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.264275074005127, -6.079763412475586, -5.895252227783203, -5.710740566253662, -5.526229381561279, -5.341717720031738, -5.1572065353393555, -4.9726948738098145, -4.788183689117432, -4.603672027587891, -4.419160842895508, -4.234649181365967, -4.050137996673584, -3.865626573562622, -3.68111515045166, -3.496603488922119, -3.3120920658111572, -3.1275806427001953, -2.9430692195892334, -2.7585577964782715, -2.5740463733673096, -2.3895349502563477, -2.2050232887268066, -2.020512104034424, -1.8360005617141724, -1.6514891386032104, -1.4669777154922485, -1.282466173171997, -1.0979547500610352, -0.913443386554718, -0.7289319038391113, -0.5444204807281494, -0.3599090576171875, -0.1753976196050644, 0.009113818407058716, 0.19362527132034302, 0.37813669443130493, 0.5626481175422668, 0.7471596002578735, 0.9316710233688354, 1.1161824464797974, 1.3006938695907593, 1.4852052927017212, 1.6697168350219727, 1.8542282581329346, 2.0387396812438965, 2.2232511043548584, 2.4077625274658203, 2.5922739505767822, 2.776785373687744, 2.961296796798706, 3.145808219909668, 3.33031964302063, 3.514831066131592, 3.699342727661133, 3.8838539123535156, 4.068365573883057, 4.252877235412598, 4.4373884201049805, 4.6219000816345215, 4.806411266326904, 4.990922927856445, 5.175434112548828, 5.359945774078369, 5.544456958770752]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 19.0, 22.0, 27.0, 37.0, 68.0, 103.0, 165.0, 216.0, 318.0, 554.0, 766.0, 1223.0, 1942.0, 3110.0, 5101.0, 8688.0, 15240.0, 27559.0, 51448.0, 101181.0, 207114.0, 427300.0, 767312.0, 963519.0, 758700.0, 424153.0, 209678.0, 103656.0, 52238.0, 27649.0, 14766.0, 8443.0, 4816.0, 2732.0, 1664.0, 1050.0, 610.0, 431.0, 248.0, 145.0, 83.0, 60.0, 41.0, 27.0, 19.0, 14.0, 9.0, 6.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.0078125, -9.7176513671875, -9.427490234375, -9.1373291015625, -8.84716796875, -8.5570068359375, -8.266845703125, -7.9766845703125, -7.6865234375, -7.3963623046875, -7.106201171875, -6.8160400390625, -6.52587890625, -6.2357177734375, -5.945556640625, -5.6553955078125, -5.365234375, -5.0750732421875, -4.784912109375, -4.4947509765625, -4.20458984375, -3.9144287109375, -3.624267578125, -3.3341064453125, -3.0439453125, -2.7537841796875, -2.463623046875, -2.1734619140625, -1.88330078125, -1.5931396484375, -1.302978515625, -1.0128173828125, -0.72265625, -0.4324951171875, -0.142333984375, 0.1478271484375, 0.43798828125, 0.7281494140625, 1.018310546875, 1.3084716796875, 1.5986328125, 1.8887939453125, 2.178955078125, 2.4691162109375, 2.75927734375, 3.0494384765625, 3.339599609375, 3.6297607421875, 3.919921875, 4.2100830078125, 4.500244140625, 4.7904052734375, 5.08056640625, 5.3707275390625, 5.660888671875, 5.9510498046875, 6.2412109375, 6.5313720703125, 6.821533203125, 7.1116943359375, 7.40185546875, 7.6920166015625, 7.982177734375, 8.2723388671875, 8.5625]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 9.0, 5.0, 7.0, 15.0, 11.0, 24.0, 14.0, 15.0, 22.0, 23.0, 32.0, 26.0, 35.0, 40.0, 41.0, 41.0, 43.0, 46.0, 49.0, 42.0, 35.0, 43.0, 31.0, 25.0, 40.0, 31.0, 35.0, 32.0, 29.0, 27.0, 25.0, 17.0, 15.0, 15.0, 11.0, 12.0, 4.0, 13.0, 4.0, 6.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.1875, -5.01556396484375, -4.8436279296875, -4.67169189453125, -4.499755859375, -4.32781982421875, -4.1558837890625, -3.98394775390625, -3.81201171875, -3.64007568359375, -3.4681396484375, -3.29620361328125, -3.124267578125, -2.95233154296875, -2.7803955078125, -2.60845947265625, -2.4365234375, -2.26458740234375, -2.0926513671875, -1.92071533203125, -1.748779296875, -1.57684326171875, -1.4049072265625, -1.23297119140625, -1.06103515625, -0.88909912109375, -0.7171630859375, -0.54522705078125, -0.373291015625, -0.20135498046875, -0.0294189453125, 0.14251708984375, 0.314453125, 0.48638916015625, 0.6583251953125, 0.83026123046875, 1.002197265625, 1.17413330078125, 1.3460693359375, 1.51800537109375, 1.68994140625, 1.86187744140625, 2.0338134765625, 2.20574951171875, 2.377685546875, 2.54962158203125, 2.7215576171875, 2.89349365234375, 3.0654296875, 3.23736572265625, 3.4093017578125, 3.58123779296875, 3.753173828125, 3.92510986328125, 4.0970458984375, 4.26898193359375, 4.44091796875, 4.61285400390625, 4.7847900390625, 4.95672607421875, 5.128662109375, 5.30059814453125, 5.4725341796875, 5.64447021484375, 5.81640625]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 4.0, 18.0, 19.0, 45.0, 47.0, 90.0, 114.0, 198.0, 253.0, 389.0, 617.0, 973.0, 1584.0, 2613.0, 4212.0, 7009.0, 11938.0, 20688.0, 35840.0, 64739.0, 117119.0, 211301.0, 371836.0, 594448.0, 776310.0, 736693.0, 522398.0, 312973.0, 175267.0, 97050.0, 54132.0, 30011.0, 17441.0, 10175.0, 5935.0, 3721.0, 2251.0, 1371.0, 844.0, 554.0, 383.0, 238.0, 149.0, 93.0, 52.0, 50.0, 29.0, 21.0, 8.0, 11.0, 6.0, 7.0, 0.0, 5.0, 3.0, 2.0, 2.0], "bins": [-10.359375, -10.0340576171875, -9.708740234375, -9.3834228515625, -9.05810546875, -8.7327880859375, -8.407470703125, -8.0821533203125, -7.7568359375, -7.4315185546875, -7.106201171875, -6.7808837890625, -6.45556640625, -6.1302490234375, -5.804931640625, -5.4796142578125, -5.154296875, -4.8289794921875, -4.503662109375, -4.1783447265625, -3.85302734375, -3.5277099609375, -3.202392578125, -2.8770751953125, -2.5517578125, -2.2264404296875, -1.901123046875, -1.5758056640625, -1.25048828125, -0.9251708984375, -0.599853515625, -0.2745361328125, 0.05078125, 0.3760986328125, 0.701416015625, 1.0267333984375, 1.35205078125, 1.6773681640625, 2.002685546875, 2.3280029296875, 2.6533203125, 2.9786376953125, 3.303955078125, 3.6292724609375, 3.95458984375, 4.2799072265625, 4.605224609375, 4.9305419921875, 5.255859375, 5.5811767578125, 5.906494140625, 6.2318115234375, 6.55712890625, 6.8824462890625, 7.207763671875, 7.5330810546875, 7.8583984375, 8.1837158203125, 8.509033203125, 8.8343505859375, 9.15966796875, 9.4849853515625, 9.810302734375, 10.1356201171875, 10.4609375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 17.0, 27.0, 37.0, 47.0, 50.0, 72.0, 70.0, 111.0, 158.0, 150.0, 181.0, 203.0, 264.0, 296.0, 276.0, 294.0, 287.0, 265.0, 241.0, 214.0, 188.0, 132.0, 105.0, 88.0, 71.0, 58.0, 38.0, 38.0, 28.0, 13.0, 17.0, 11.0, 3.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.73828125, -4.61676025390625, -4.4952392578125, -4.37371826171875, -4.252197265625, -4.13067626953125, -4.0091552734375, -3.88763427734375, -3.76611328125, -3.64459228515625, -3.5230712890625, -3.40155029296875, -3.280029296875, -3.15850830078125, -3.0369873046875, -2.91546630859375, -2.7939453125, -2.67242431640625, -2.5509033203125, -2.42938232421875, -2.307861328125, -2.18634033203125, -2.0648193359375, -1.94329833984375, -1.82177734375, -1.70025634765625, -1.5787353515625, -1.45721435546875, -1.335693359375, -1.21417236328125, -1.0926513671875, -0.97113037109375, -0.849609375, -0.72808837890625, -0.6065673828125, -0.48504638671875, -0.363525390625, -0.24200439453125, -0.1204833984375, 0.00103759765625, 0.12255859375, 0.24407958984375, 0.3656005859375, 0.48712158203125, 0.608642578125, 0.73016357421875, 0.8516845703125, 0.97320556640625, 1.0947265625, 1.21624755859375, 1.3377685546875, 1.45928955078125, 1.580810546875, 1.70233154296875, 1.8238525390625, 1.94537353515625, 2.06689453125, 2.18841552734375, 2.3099365234375, 2.43145751953125, 2.552978515625, 2.67449951171875, 2.7960205078125, 2.91754150390625, 3.0390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 8.0, 5.0, 6.0, 10.0, 10.0, 17.0, 14.0, 18.0, 32.0, 32.0, 30.0, 41.0, 42.0, 55.0, 56.0, 61.0, 65.0, 65.0, 50.0, 64.0, 46.0, 38.0, 43.0, 37.0, 31.0, 28.0, 24.0, 20.0, 14.0, 11.0, 9.0, 8.0, 3.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.759474754333496, -13.364616394042969, -12.969757080078125, -12.574898719787598, -12.18004035949707, -11.785181999206543, -11.390323638916016, -10.995464324951172, -10.600605964660645, -10.205747604370117, -9.810888290405273, -9.416029930114746, -9.021171569824219, -8.626313209533691, -8.231454849243164, -7.83659553527832, -7.441737174987793, -7.046878814697266, -6.65201997756958, -6.2571611404418945, -5.862302780151367, -5.46744441986084, -5.072585582733154, -4.677726745605469, -4.282868385314941, -3.888009786605835, -3.4931511878967285, -3.098292589187622, -2.7034339904785156, -2.308575391769409, -1.9137167930603027, -1.5188581943511963, -1.1240005493164062, -0.7291419506072998, -0.33428335189819336, 0.060575246810913086, 0.45543384552001953, 0.850292444229126, 1.2451510429382324, 1.6400096416473389, 2.0348682403564453, 2.4297268390655518, 2.824585437774658, 3.2194440364837646, 3.614302635192871, 4.009160995483398, 4.404019832611084, 4.7988786697387695, 5.193737030029297, 5.588595390319824, 5.98345422744751, 6.378313064575195, 6.773171424865723, 7.16802978515625, 7.5628886222839355, 7.957747459411621, 8.352605819702148, 8.747464179992676, 9.142322540283203, 9.537181854248047, 9.932040214538574, 10.326898574829102, 10.721757888793945, 11.116616249084473, 11.511474609375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 6.0, 10.0, 8.0, 16.0, 16.0, 14.0, 19.0, 20.0, 18.0, 27.0, 28.0, 13.0, 36.0, 34.0, 27.0, 50.0, 34.0, 40.0, 37.0, 38.0, 33.0, 42.0, 50.0, 34.0, 35.0, 33.0, 37.0, 28.0, 35.0, 21.0, 24.0, 23.0, 17.0, 18.0, 18.0, 7.0, 13.0, 13.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.569639205932617, -6.363455295562744, -6.157271385192871, -5.95108699798584, -5.744903087615967, -5.538719177246094, -5.332535266876221, -5.126351356506348, -4.920166969299316, -4.713983058929443, -4.50779914855957, -4.301614761352539, -4.095430850982666, -3.889246940612793, -3.68306303024292, -3.4768788814544678, -3.2706949710845947, -3.0645110607147217, -2.8583269119262695, -2.6521430015563965, -2.4459588527679443, -2.2397749423980713, -2.033590793609619, -1.827406883239746, -1.6212228536605835, -1.415038824081421, -1.2088547945022583, -1.0026707649230957, -0.7964867949485779, -0.5903028249740601, -0.38411879539489746, -0.17793476581573486, 0.028249263763427734, 0.23443327844142914, 0.44061729311943054, 0.6468012928962708, 0.8529853224754333, 1.0591692924499512, 1.2653533220291138, 1.4715373516082764, 1.677721381187439, 1.8839054107666016, 2.0900893211364746, 2.2962734699249268, 2.5024573802948, 2.708641529083252, 2.914825439453125, 3.121009349822998, 3.32719349861145, 3.5333774089813232, 3.7395615577697754, 3.9457454681396484, 4.1519293785095215, 4.3581132888793945, 4.564297676086426, 4.770481586456299, 4.976665496826172, 5.182849407196045, 5.389033317565918, 5.595217704772949, 5.801401615142822, 6.007585525512695, 6.213769435882568, 6.419953346252441, 6.626137733459473]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 9.0, 18.0, 23.0, 32.0, 60.0, 67.0, 128.0, 201.0, 292.0, 444.0, 774.0, 1144.0, 2008.0, 3053.0, 5206.0, 8671.0, 14477.0, 24862.0, 42141.0, 69471.0, 110331.0, 155324.0, 178288.0, 153745.0, 108365.0, 67847.0, 41207.0, 24246.0, 14281.0, 8375.0, 5058.0, 3184.0, 1971.0, 1200.0, 724.0, 485.0, 291.0, 183.0, 138.0, 76.0, 43.0, 33.0, 25.0, 13.0, 17.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.806640625, -0.7818069458007812, -0.7569732666015625, -0.7321395874023438, -0.707305908203125, -0.6824722290039062, -0.6576385498046875, -0.6328048706054688, -0.60797119140625, -0.5831375122070312, -0.5583038330078125, -0.5334701538085938, -0.508636474609375, -0.48380279541015625, -0.4589691162109375, -0.43413543701171875, -0.4093017578125, -0.38446807861328125, -0.3596343994140625, -0.33480072021484375, -0.309967041015625, -0.28513336181640625, -0.2602996826171875, -0.23546600341796875, -0.21063232421875, -0.18579864501953125, -0.1609649658203125, -0.13613128662109375, -0.111297607421875, -0.08646392822265625, -0.0616302490234375, -0.03679656982421875, -0.011962890625, 0.01287078857421875, 0.0377044677734375, 0.06253814697265625, 0.087371826171875, 0.11220550537109375, 0.1370391845703125, 0.16187286376953125, 0.18670654296875, 0.21154022216796875, 0.2363739013671875, 0.26120758056640625, 0.286041259765625, 0.31087493896484375, 0.3357086181640625, 0.36054229736328125, 0.3853759765625, 0.41020965576171875, 0.4350433349609375, 0.45987701416015625, 0.484710693359375, 0.5095443725585938, 0.5343780517578125, 0.5592117309570312, 0.58404541015625, 0.6088790893554688, 0.6337127685546875, 0.6585464477539062, 0.683380126953125, 0.7082138061523438, 0.7330474853515625, 0.7578811645507812, 0.78271484375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 6.0, 8.0, 12.0, 9.0, 10.0, 13.0, 13.0, 23.0, 21.0, 27.0, 34.0, 23.0, 28.0, 27.0, 34.0, 36.0, 36.0, 38.0, 47.0, 47.0, 47.0, 34.0, 29.0, 37.0, 34.0, 35.0, 33.0, 32.0, 28.0, 31.0, 27.0, 26.0, 26.0, 17.0, 12.0, 12.0, 7.0, 10.0, 7.0, 4.0, 7.0, 4.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.015625, -6.7830810546875, -6.550537109375, -6.3179931640625, -6.08544921875, -5.8529052734375, -5.620361328125, -5.3878173828125, -5.1552734375, -4.9227294921875, -4.690185546875, -4.4576416015625, -4.22509765625, -3.9925537109375, -3.760009765625, -3.5274658203125, -3.294921875, -3.0623779296875, -2.829833984375, -2.5972900390625, -2.36474609375, -2.1322021484375, -1.899658203125, -1.6671142578125, -1.4345703125, -1.2020263671875, -0.969482421875, -0.7369384765625, -0.50439453125, -0.2718505859375, -0.039306640625, 0.1932373046875, 0.42578125, 0.6583251953125, 0.890869140625, 1.1234130859375, 1.35595703125, 1.5885009765625, 1.821044921875, 2.0535888671875, 2.2861328125, 2.5186767578125, 2.751220703125, 2.9837646484375, 3.21630859375, 3.4488525390625, 3.681396484375, 3.9139404296875, 4.146484375, 4.3790283203125, 4.611572265625, 4.8441162109375, 5.07666015625, 5.3092041015625, 5.541748046875, 5.7742919921875, 6.0068359375, 6.2393798828125, 6.471923828125, 6.7044677734375, 6.93701171875, 7.1695556640625, 7.402099609375, 7.6346435546875, 7.8671875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 8.0, 8.0, 10.0, 18.0, 18.0, 24.0, 36.0, 51.0, 47.0, 99.0, 99.0, 133.0, 210.0, 290.0, 451.0, 741.0, 1117.0, 1722.0, 2954.0, 5358.0, 10455.0, 21488.0, 80016.0, 819859.0, 61323.0, 19788.0, 9534.0, 5093.0, 2824.0, 1635.0, 996.0, 647.0, 431.0, 307.0, 240.0, 135.0, 100.0, 77.0, 66.0, 49.0, 26.0, 19.0, 10.0, 16.0, 10.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.517578125, -2.4375, -2.357421875, -2.27734375, -2.197265625, -2.1171875, -2.037109375, -1.95703125, -1.876953125, -1.796875, -1.716796875, -1.63671875, -1.556640625, -1.4765625, -1.396484375, -1.31640625, -1.236328125, -1.15625, -1.076171875, -0.99609375, -0.916015625, -0.8359375, -0.755859375, -0.67578125, -0.595703125, -0.515625, -0.435546875, -0.35546875, -0.275390625, -0.1953125, -0.115234375, -0.03515625, 0.044921875, 0.125, 0.205078125, 0.28515625, 0.365234375, 0.4453125, 0.525390625, 0.60546875, 0.685546875, 0.765625, 0.845703125, 0.92578125, 1.005859375, 1.0859375, 1.166015625, 1.24609375, 1.326171875, 1.40625, 1.486328125, 1.56640625, 1.646484375, 1.7265625, 1.806640625, 1.88671875, 1.966796875, 2.046875, 2.126953125, 2.20703125, 2.287109375, 2.3671875, 2.447265625, 2.52734375, 2.607421875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 11.0, 11.0, 8.0, 14.0, 15.0, 25.0, 14.0, 12.0, 17.0, 24.0, 24.0, 26.0, 28.0, 37.0, 32.0, 36.0, 34.0, 29.0, 36.0, 30.0, 40.0, 34.0, 31.0, 35.0, 36.0, 29.0, 35.0, 31.0, 29.0, 29.0, 26.0, 18.0, 22.0, 17.0, 22.0, 14.0, 19.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.69140625, -4.5523681640625, -4.413330078125, -4.2742919921875, -4.13525390625, -3.9962158203125, -3.857177734375, -3.7181396484375, -3.5791015625, -3.4400634765625, -3.301025390625, -3.1619873046875, -3.02294921875, -2.8839111328125, -2.744873046875, -2.6058349609375, -2.466796875, -2.3277587890625, -2.188720703125, -2.0496826171875, -1.91064453125, -1.7716064453125, -1.632568359375, -1.4935302734375, -1.3544921875, -1.2154541015625, -1.076416015625, -0.9373779296875, -0.79833984375, -0.6593017578125, -0.520263671875, -0.3812255859375, -0.2421875, -0.1031494140625, 0.035888671875, 0.1749267578125, 0.31396484375, 0.4530029296875, 0.592041015625, 0.7310791015625, 0.8701171875, 1.0091552734375, 1.148193359375, 1.2872314453125, 1.42626953125, 1.5653076171875, 1.704345703125, 1.8433837890625, 1.982421875, 2.1214599609375, 2.260498046875, 2.3995361328125, 2.53857421875, 2.6776123046875, 2.816650390625, 2.9556884765625, 3.0947265625, 3.2337646484375, 3.372802734375, 3.5118408203125, 3.65087890625, 3.7899169921875, 3.928955078125, 4.0679931640625, 4.20703125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 16.0, 23.0, 28.0, 37.0, 45.0, 88.0, 101.0, 182.0, 284.0, 445.0, 776.0, 1356.0, 2425.0, 4539.0, 8823.0, 18025.0, 47365.0, 884669.0, 43601.0, 17247.0, 8395.0, 4345.0, 2357.0, 1328.0, 756.0, 460.0, 295.0, 185.0, 105.0, 75.0, 58.0, 33.0, 20.0, 19.0, 6.0, 8.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7001953125, -0.677947998046875, -0.65570068359375, -0.633453369140625, -0.6112060546875, -0.588958740234375, -0.56671142578125, -0.544464111328125, -0.522216796875, -0.499969482421875, -0.47772216796875, -0.455474853515625, -0.4332275390625, -0.410980224609375, -0.38873291015625, -0.366485595703125, -0.34423828125, -0.321990966796875, -0.29974365234375, -0.277496337890625, -0.2552490234375, -0.233001708984375, -0.21075439453125, -0.188507080078125, -0.166259765625, -0.144012451171875, -0.12176513671875, -0.099517822265625, -0.0772705078125, -0.055023193359375, -0.03277587890625, -0.010528564453125, 0.01171875, 0.033966064453125, 0.05621337890625, 0.078460693359375, 0.1007080078125, 0.122955322265625, 0.14520263671875, 0.167449951171875, 0.189697265625, 0.211944580078125, 0.23419189453125, 0.256439208984375, 0.2786865234375, 0.300933837890625, 0.32318115234375, 0.345428466796875, 0.36767578125, 0.389923095703125, 0.41217041015625, 0.434417724609375, 0.4566650390625, 0.478912353515625, 0.50115966796875, 0.523406982421875, 0.545654296875, 0.567901611328125, 0.59014892578125, 0.612396240234375, 0.6346435546875, 0.656890869140625, 0.67913818359375, 0.701385498046875, 0.7236328125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 1.0, 7.0, 6.0, 4.0, 6.0, 9.0, 8.0, 12.0, 7.0, 15.0, 20.0, 12.0, 19.0, 22.0, 24.0, 25.0, 36.0, 24.0, 33.0, 34.0, 44.0, 39.0, 40.0, 36.0, 31.0, 40.0, 30.0, 36.0, 29.0, 42.0, 34.0, 29.0, 34.0, 28.0, 25.0, 14.0, 18.0, 17.0, 17.0, 19.0, 14.0, 15.0, 5.0, 6.0, 3.0, 8.0, 8.0, 6.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.4616718292236328e-05, -2.3845583200454712e-05, -2.3074448108673096e-05, -2.230331301689148e-05, -2.1532177925109863e-05, -2.0761042833328247e-05, -1.998990774154663e-05, -1.9218772649765015e-05, -1.84476375579834e-05, -1.7676502466201782e-05, -1.6905367374420166e-05, -1.613423228263855e-05, -1.5363097190856934e-05, -1.4591962099075317e-05, -1.3820827007293701e-05, -1.3049691915512085e-05, -1.2278556823730469e-05, -1.1507421731948853e-05, -1.0736286640167236e-05, -9.96515154838562e-06, -9.194016456604004e-06, -8.422881364822388e-06, -7.651746273040771e-06, -6.880611181259155e-06, -6.109476089477539e-06, -5.338340997695923e-06, -4.567205905914307e-06, -3.7960708141326904e-06, -3.0249357223510742e-06, -2.253800630569458e-06, -1.4826655387878418e-06, -7.115304470062256e-07, 5.960464477539063e-08, 8.307397365570068e-07, 1.601874828338623e-06, 2.3730099201202393e-06, 3.1441450119018555e-06, 3.915280103683472e-06, 4.686415195465088e-06, 5.457550287246704e-06, 6.22868537902832e-06, 6.9998204708099365e-06, 7.770955562591553e-06, 8.542090654373169e-06, 9.313225746154785e-06, 1.0084360837936401e-05, 1.0855495929718018e-05, 1.1626631021499634e-05, 1.239776611328125e-05, 1.3168901205062866e-05, 1.3940036296844482e-05, 1.4711171388626099e-05, 1.5482306480407715e-05, 1.625344157218933e-05, 1.7024576663970947e-05, 1.7795711755752563e-05, 1.856684684753418e-05, 1.9337981939315796e-05, 2.0109117031097412e-05, 2.088025212287903e-05, 2.1651387214660645e-05, 2.242252230644226e-05, 2.3193657398223877e-05, 2.3964792490005493e-05, 2.473592758178711e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 16.0, 14.0, 20.0, 33.0, 40.0, 73.0, 91.0, 162.0, 199.0, 307.0, 508.0, 997.0, 1810.0, 3555.0, 7661.0, 17385.0, 41635.0, 103331.0, 235637.0, 317743.0, 184929.0, 76237.0, 30901.0, 13100.0, 5798.0, 2757.0, 1435.0, 836.0, 427.0, 282.0, 195.0, 112.0, 76.0, 62.0, 46.0, 33.0, 27.0, 22.0, 15.0, 12.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.3826026916503906, -0.36750030517578125, -0.3523979187011719, -0.3372955322265625, -0.3221931457519531, -0.30709075927734375, -0.2919883728027344, -0.276885986328125, -0.2617835998535156, -0.24668121337890625, -0.23157882690429688, -0.2164764404296875, -0.20137405395507812, -0.18627166748046875, -0.17116928100585938, -0.15606689453125, -0.14096450805664062, -0.12586212158203125, -0.11075973510742188, -0.0956573486328125, -0.08055496215820312, -0.06545257568359375, -0.050350189208984375, -0.035247802734375, -0.020145416259765625, -0.00504302978515625, 0.010059356689453125, 0.0251617431640625, 0.040264129638671875, 0.05536651611328125, 0.07046890258789062, 0.0855712890625, 0.10067367553710938, 0.11577606201171875, 0.13087844848632812, 0.1459808349609375, 0.16108322143554688, 0.17618560791015625, 0.19128799438476562, 0.206390380859375, 0.22149276733398438, 0.23659515380859375, 0.2516975402832031, 0.2667999267578125, 0.2819023132324219, 0.29700469970703125, 0.3121070861816406, 0.32720947265625, 0.3423118591308594, 0.35741424560546875, 0.3725166320800781, 0.3876190185546875, 0.4027214050292969, 0.41782379150390625, 0.4329261779785156, 0.448028564453125, 0.4631309509277344, 0.47823333740234375, 0.4933357238769531, 0.5084381103515625, 0.5235404968261719, 0.5386428833007812, 0.5537452697753906, 0.56884765625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 5.0, 8.0, 6.0, 13.0, 17.0, 20.0, 19.0, 23.0, 27.0, 34.0, 35.0, 46.0, 60.0, 53.0, 56.0, 59.0, 48.0, 57.0, 53.0, 55.0, 48.0, 37.0, 27.0, 29.0, 19.0, 31.0, 20.0, 24.0, 15.0, 11.0, 12.0, 9.0, 2.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.092529296875, -0.08972930908203125, -0.0869293212890625, -0.08412933349609375, -0.081329345703125, -0.07852935791015625, -0.0757293701171875, -0.07292938232421875, -0.07012939453125, -0.06732940673828125, -0.0645294189453125, -0.06172943115234375, -0.058929443359375, -0.05612945556640625, -0.0533294677734375, -0.05052947998046875, -0.0477294921875, -0.04492950439453125, -0.0421295166015625, -0.03932952880859375, -0.036529541015625, -0.03372955322265625, -0.0309295654296875, -0.02812957763671875, -0.02532958984375, -0.02252960205078125, -0.0197296142578125, -0.01692962646484375, -0.014129638671875, -0.01132965087890625, -0.0085296630859375, -0.00572967529296875, -0.0029296875, -0.00012969970703125, 0.0026702880859375, 0.00547027587890625, 0.008270263671875, 0.01107025146484375, 0.0138702392578125, 0.01667022705078125, 0.01947021484375, 0.02227020263671875, 0.0250701904296875, 0.02787017822265625, 0.030670166015625, 0.03347015380859375, 0.0362701416015625, 0.03907012939453125, 0.0418701171875, 0.04467010498046875, 0.0474700927734375, 0.05027008056640625, 0.053070068359375, 0.05587005615234375, 0.0586700439453125, 0.06147003173828125, 0.06427001953125, 0.06707000732421875, 0.0698699951171875, 0.07266998291015625, 0.075469970703125, 0.07826995849609375, 0.0810699462890625, 0.08386993408203125, 0.086669921875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 10.0, 14.0, 15.0, 16.0, 27.0, 30.0, 27.0, 41.0, 40.0, 44.0, 54.0, 55.0, 66.0, 58.0, 64.0, 49.0, 66.0, 43.0, 31.0, 49.0, 28.0, 35.0, 25.0, 25.0, 19.0, 13.0, 6.0, 10.0, 7.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.455452919006348, -13.064770698547363, -12.674088478088379, -12.283407211303711, -11.892724990844727, -11.502042770385742, -11.111360549926758, -10.720678329467773, -10.329996109008789, -9.939313888549805, -9.54863166809082, -9.157949447631836, -8.767268180847168, -8.376585960388184, -7.985903739929199, -7.595221519470215, -7.204539775848389, -6.813857555389404, -6.423175811767578, -6.032493591308594, -5.641811370849609, -5.251129150390625, -4.860447406768799, -4.4697651863098145, -4.079083442687988, -3.688401460647583, -3.2977192401885986, -2.9070372581481934, -2.516355037689209, -2.1256730556488037, -1.7349910736083984, -1.344308853149414, -0.9536266326904297, -0.5629445314407349, -0.17226248979568481, 0.21841955184936523, 0.6091016530990601, 0.9997837543487549, 1.3904657363891602, 1.7811479568481445, 2.17182993888855, 2.562511920928955, 2.9531941413879395, 3.3438761234283447, 3.73455810546875, 4.125240325927734, 4.515922546386719, 4.906604766845703, 5.297286510467529, 5.687968730926514, 6.07865047454834, 6.469332695007324, 6.860014915466309, 7.250697135925293, 7.641378879547119, 8.032060623168945, 8.42274284362793, 8.813425064086914, 9.204107284545898, 9.594789505004883, 9.98547077178955, 10.376152992248535, 10.76683521270752, 11.157517433166504, 11.548199653625488]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 7.0, 3.0, 13.0, 9.0, 17.0, 14.0, 14.0, 21.0, 18.0, 20.0, 28.0, 23.0, 17.0, 33.0, 36.0, 35.0, 38.0, 39.0, 40.0, 39.0, 36.0, 32.0, 46.0, 51.0, 27.0, 39.0, 32.0, 39.0, 29.0, 32.0, 20.0, 23.0, 25.0, 14.0, 17.0, 19.0, 6.0, 13.0, 13.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.5517683029174805, -6.345795631408691, -6.1398234367370605, -5.9338507652282715, -5.727878093719482, -5.521905899047852, -5.3159332275390625, -5.109960556030273, -4.903987884521484, -4.698015213012695, -4.4920430183410645, -4.286070346832275, -4.080097675323486, -3.8741252422332764, -3.6681528091430664, -3.4621801376342773, -3.2562079429626465, -3.0502355098724365, -2.8442628383636475, -2.6382904052734375, -2.4323177337646484, -2.2263453006744385, -2.0203728675842285, -1.814400315284729, -1.6084277629852295, -1.40245521068573, -1.1964826583862305, -0.9905102252960205, -0.784537672996521, -0.5785651206970215, -0.3725926876068115, -0.166620135307312, 0.0393519401550293, 0.24532446265220642, 0.45129698514938354, 0.6572694778442383, 0.8632420301437378, 1.0692145824432373, 1.2751870155334473, 1.4811595678329468, 1.6871321201324463, 1.8931046724319458, 2.0990772247314453, 2.3050496578216553, 2.5110220909118652, 2.7169947624206543, 2.9229671955108643, 3.128939628601074, 3.3349123001098633, 3.5408847332000732, 3.7468574047088623, 3.9528298377990723, 4.158802509307861, 4.364774703979492, 4.570747375488281, 4.77672004699707, 4.982692718505859, 5.188665390014648, 5.394637584686279, 5.600610256195068, 5.806582927703857, 6.012555122375488, 6.218527793884277, 6.424500465393066, 6.630472660064697]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 6.0, 9.0, 15.0, 28.0, 21.0, 30.0, 62.0, 76.0, 105.0, 192.0, 239.0, 348.0, 499.0, 773.0, 1181.0, 1806.0, 2907.0, 4703.0, 8132.0, 14097.0, 26150.0, 47564.0, 83948.0, 134435.0, 177946.0, 182407.0, 144607.0, 93684.0, 53896.0, 29445.0, 16049.0, 9009.0, 5171.0, 3129.0, 1947.0, 1312.0, 834.0, 565.0, 393.0, 263.0, 188.0, 114.0, 87.0, 54.0, 42.0, 20.0, 20.0, 16.0, 12.0, 11.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.8046875, -8.5303955078125, -8.256103515625, -7.9818115234375, -7.70751953125, -7.4332275390625, -7.158935546875, -6.8846435546875, -6.6103515625, -6.3360595703125, -6.061767578125, -5.7874755859375, -5.51318359375, -5.2388916015625, -4.964599609375, -4.6903076171875, -4.416015625, -4.1417236328125, -3.867431640625, -3.5931396484375, -3.31884765625, -3.0445556640625, -2.770263671875, -2.4959716796875, -2.2216796875, -1.9473876953125, -1.673095703125, -1.3988037109375, -1.12451171875, -0.8502197265625, -0.575927734375, -0.3016357421875, -0.02734375, 0.2469482421875, 0.521240234375, 0.7955322265625, 1.06982421875, 1.3441162109375, 1.618408203125, 1.8927001953125, 2.1669921875, 2.4412841796875, 2.715576171875, 2.9898681640625, 3.26416015625, 3.5384521484375, 3.812744140625, 4.0870361328125, 4.361328125, 4.6356201171875, 4.909912109375, 5.1842041015625, 5.45849609375, 5.7327880859375, 6.007080078125, 6.2813720703125, 6.5556640625, 6.8299560546875, 7.104248046875, 7.3785400390625, 7.65283203125, 7.9271240234375, 8.201416015625, 8.4757080078125, 8.75]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 12.0, 9.0, 14.0, 11.0, 14.0, 16.0, 24.0, 20.0, 24.0, 29.0, 29.0, 34.0, 32.0, 27.0, 29.0, 39.0, 41.0, 34.0, 39.0, 39.0, 36.0, 30.0, 34.0, 38.0, 43.0, 35.0, 33.0, 21.0, 29.0, 18.0, 21.0, 25.0, 16.0, 18.0, 21.0, 11.0, 13.0, 11.0, 10.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.73046875, -6.5091552734375, -6.287841796875, -6.0665283203125, -5.84521484375, -5.6239013671875, -5.402587890625, -5.1812744140625, -4.9599609375, -4.7386474609375, -4.517333984375, -4.2960205078125, -4.07470703125, -3.8533935546875, -3.632080078125, -3.4107666015625, -3.189453125, -2.9681396484375, -2.746826171875, -2.5255126953125, -2.30419921875, -2.0828857421875, -1.861572265625, -1.6402587890625, -1.4189453125, -1.1976318359375, -0.976318359375, -0.7550048828125, -0.53369140625, -0.3123779296875, -0.091064453125, 0.1302490234375, 0.3515625, 0.5728759765625, 0.794189453125, 1.0155029296875, 1.23681640625, 1.4581298828125, 1.679443359375, 1.9007568359375, 2.1220703125, 2.3433837890625, 2.564697265625, 2.7860107421875, 3.00732421875, 3.2286376953125, 3.449951171875, 3.6712646484375, 3.892578125, 4.1138916015625, 4.335205078125, 4.5565185546875, 4.77783203125, 4.9991455078125, 5.220458984375, 5.4417724609375, 5.6630859375, 5.8843994140625, 6.105712890625, 6.3270263671875, 6.54833984375, 6.7696533203125, 6.990966796875, 7.2122802734375, 7.43359375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 15.0, 22.0, 28.0, 36.0, 46.0, 67.0, 124.0, 162.0, 210.0, 358.0, 541.0, 844.0, 1308.0, 2122.0, 3337.0, 5762.0, 11154.0, 22845.0, 52159.0, 118479.0, 220413.0, 261365.0, 182233.0, 88098.0, 38327.0, 17188.0, 8820.0, 4715.0, 2860.0, 1749.0, 1069.0, 725.0, 427.0, 305.0, 192.0, 144.0, 99.0, 52.0, 55.0, 25.0, 24.0, 12.0, 10.0, 6.0, 6.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.34375, -14.8831787109375, -14.422607421875, -13.9620361328125, -13.50146484375, -13.0408935546875, -12.580322265625, -12.1197509765625, -11.6591796875, -11.1986083984375, -10.738037109375, -10.2774658203125, -9.81689453125, -9.3563232421875, -8.895751953125, -8.4351806640625, -7.974609375, -7.5140380859375, -7.053466796875, -6.5928955078125, -6.13232421875, -5.6717529296875, -5.211181640625, -4.7506103515625, -4.2900390625, -3.8294677734375, -3.368896484375, -2.9083251953125, -2.44775390625, -1.9871826171875, -1.526611328125, -1.0660400390625, -0.60546875, -0.1448974609375, 0.315673828125, 0.7762451171875, 1.23681640625, 1.6973876953125, 2.157958984375, 2.6185302734375, 3.0791015625, 3.5396728515625, 4.000244140625, 4.4608154296875, 4.92138671875, 5.3819580078125, 5.842529296875, 6.3031005859375, 6.763671875, 7.2242431640625, 7.684814453125, 8.1453857421875, 8.60595703125, 9.0665283203125, 9.527099609375, 9.9876708984375, 10.4482421875, 10.9088134765625, 11.369384765625, 11.8299560546875, 12.29052734375, 12.7510986328125, 13.211669921875, 13.6722412109375, 14.1328125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 10.0, 7.0, 6.0, 10.0, 19.0, 14.0, 23.0, 21.0, 18.0, 19.0, 18.0, 19.0, 26.0, 44.0, 27.0, 35.0, 44.0, 39.0, 41.0, 27.0, 53.0, 37.0, 39.0, 36.0, 37.0, 30.0, 31.0, 41.0, 36.0, 29.0, 24.0, 11.0, 18.0, 13.0, 20.0, 13.0, 12.0, 11.0, 8.0, 9.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.30078125, -5.1474609375, -4.994140625, -4.8408203125, -4.6875, -4.5341796875, -4.380859375, -4.2275390625, -4.07421875, -3.9208984375, -3.767578125, -3.6142578125, -3.4609375, -3.3076171875, -3.154296875, -3.0009765625, -2.84765625, -2.6943359375, -2.541015625, -2.3876953125, -2.234375, -2.0810546875, -1.927734375, -1.7744140625, -1.62109375, -1.4677734375, -1.314453125, -1.1611328125, -1.0078125, -0.8544921875, -0.701171875, -0.5478515625, -0.39453125, -0.2412109375, -0.087890625, 0.0654296875, 0.21875, 0.3720703125, 0.525390625, 0.6787109375, 0.83203125, 0.9853515625, 1.138671875, 1.2919921875, 1.4453125, 1.5986328125, 1.751953125, 1.9052734375, 2.05859375, 2.2119140625, 2.365234375, 2.5185546875, 2.671875, 2.8251953125, 2.978515625, 3.1318359375, 3.28515625, 3.4384765625, 3.591796875, 3.7451171875, 3.8984375, 4.0517578125, 4.205078125, 4.3583984375, 4.51171875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 6.0, 12.0, 15.0, 18.0, 47.0, 50.0, 92.0, 118.0, 209.0, 291.0, 446.0, 682.0, 964.0, 1487.0, 2279.0, 3673.0, 5540.0, 8893.0, 14221.0, 24116.0, 41475.0, 71925.0, 121726.0, 177615.0, 194099.0, 150739.0, 94222.0, 53590.0, 30876.0, 18253.0, 10935.0, 7003.0, 4451.0, 2928.0, 2001.0, 1236.0, 720.0, 513.0, 361.0, 232.0, 169.0, 113.0, 67.0, 50.0, 29.0, 27.0, 17.0, 6.0, 6.0, 4.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.6484375, -6.4285888671875, -6.208740234375, -5.9888916015625, -5.76904296875, -5.5491943359375, -5.329345703125, -5.1094970703125, -4.8896484375, -4.6697998046875, -4.449951171875, -4.2301025390625, -4.01025390625, -3.7904052734375, -3.570556640625, -3.3507080078125, -3.130859375, -2.9110107421875, -2.691162109375, -2.4713134765625, -2.25146484375, -2.0316162109375, -1.811767578125, -1.5919189453125, -1.3720703125, -1.1522216796875, -0.932373046875, -0.7125244140625, -0.49267578125, -0.2728271484375, -0.052978515625, 0.1668701171875, 0.38671875, 0.6065673828125, 0.826416015625, 1.0462646484375, 1.26611328125, 1.4859619140625, 1.705810546875, 1.9256591796875, 2.1455078125, 2.3653564453125, 2.585205078125, 2.8050537109375, 3.02490234375, 3.2447509765625, 3.464599609375, 3.6844482421875, 3.904296875, 4.1241455078125, 4.343994140625, 4.5638427734375, 4.78369140625, 5.0035400390625, 5.223388671875, 5.4432373046875, 5.6630859375, 5.8829345703125, 6.102783203125, 6.3226318359375, 6.54248046875, 6.7623291015625, 6.982177734375, 7.2020263671875, 7.421875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 15.0, 9.0, 14.0, 25.0, 30.0, 26.0, 28.0, 43.0, 49.0, 53.0, 64.0, 74.0, 65.0, 63.0, 66.0, 54.0, 41.0, 44.0, 39.0, 32.0, 30.0, 23.0, 18.0, 18.0, 7.0, 9.0, 6.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0006823539733886719, -0.0006618201732635498, -0.0006412863731384277, -0.0006207525730133057, -0.0006002187728881836, -0.0005796849727630615, -0.0005591511726379395, -0.0005386173725128174, -0.0005180835723876953, -0.0004975497722625732, -0.00047701597213745117, -0.0004564821720123291, -0.00043594837188720703, -0.00041541457176208496, -0.0003948807716369629, -0.0003743469715118408, -0.00035381317138671875, -0.0003332793712615967, -0.0003127455711364746, -0.00029221177101135254, -0.00027167797088623047, -0.0002511441707611084, -0.00023061037063598633, -0.00021007657051086426, -0.0001895427703857422, -0.00016900897026062012, -0.00014847517013549805, -0.00012794137001037598, -0.0001074075698852539, -8.687376976013184e-05, -6.633996963500977e-05, -4.5806169509887695e-05, -2.5272369384765625e-05, -4.738569259643555e-06, 1.5795230865478516e-05, 3.6329030990600586e-05, 5.6862831115722656e-05, 7.739663124084473e-05, 9.79304313659668e-05, 0.00011846423149108887, 0.00013899803161621094, 0.000159531831741333, 0.00018006563186645508, 0.00020059943199157715, 0.00022113323211669922, 0.0002416670322418213, 0.00026220083236694336, 0.00028273463249206543, 0.0003032684326171875, 0.00032380223274230957, 0.00034433603286743164, 0.0003648698329925537, 0.0003854036331176758, 0.00040593743324279785, 0.0004264712333679199, 0.000447005033493042, 0.00046753883361816406, 0.00048807263374328613, 0.0005086064338684082, 0.0005291402339935303, 0.0005496740341186523, 0.0005702078342437744, 0.0005907416343688965, 0.0006112754344940186, 0.0006318092346191406]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 20.0, 23.0, 30.0, 49.0, 80.0, 156.0, 198.0, 323.0, 447.0, 807.0, 1241.0, 1956.0, 3018.0, 5184.0, 8589.0, 14171.0, 24929.0, 43293.0, 76179.0, 129863.0, 188642.0, 197682.0, 144733.0, 87379.0, 50112.0, 28230.0, 16387.0, 9754.0, 5806.0, 3439.0, 2191.0, 1292.0, 810.0, 523.0, 355.0, 222.0, 160.0, 85.0, 64.0, 52.0, 30.0, 17.0, 13.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9921875, -6.7520751953125, -6.511962890625, -6.2718505859375, -6.03173828125, -5.7916259765625, -5.551513671875, -5.3114013671875, -5.0712890625, -4.8311767578125, -4.591064453125, -4.3509521484375, -4.11083984375, -3.8707275390625, -3.630615234375, -3.3905029296875, -3.150390625, -2.9102783203125, -2.670166015625, -2.4300537109375, -2.18994140625, -1.9498291015625, -1.709716796875, -1.4696044921875, -1.2294921875, -0.9893798828125, -0.749267578125, -0.5091552734375, -0.26904296875, -0.0289306640625, 0.211181640625, 0.4512939453125, 0.69140625, 0.9315185546875, 1.171630859375, 1.4117431640625, 1.65185546875, 1.8919677734375, 2.132080078125, 2.3721923828125, 2.6123046875, 2.8524169921875, 3.092529296875, 3.3326416015625, 3.57275390625, 3.8128662109375, 4.052978515625, 4.2930908203125, 4.533203125, 4.7733154296875, 5.013427734375, 5.2535400390625, 5.49365234375, 5.7337646484375, 5.973876953125, 6.2139892578125, 6.4541015625, 6.6942138671875, 6.934326171875, 7.1744384765625, 7.41455078125, 7.6546630859375, 7.894775390625, 8.1348876953125, 8.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 7.0, 3.0, 5.0, 11.0, 13.0, 14.0, 18.0, 28.0, 20.0, 26.0, 27.0, 46.0, 48.0, 53.0, 58.0, 67.0, 65.0, 62.0, 58.0, 54.0, 54.0, 54.0, 38.0, 30.0, 24.0, 17.0, 17.0, 19.0, 8.0, 11.0, 2.0, 9.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.99609375, -1.93450927734375, -1.8729248046875, -1.81134033203125, -1.749755859375, -1.68817138671875, -1.6265869140625, -1.56500244140625, -1.50341796875, -1.44183349609375, -1.3802490234375, -1.31866455078125, -1.257080078125, -1.19549560546875, -1.1339111328125, -1.07232666015625, -1.0107421875, -0.94915771484375, -0.8875732421875, -0.82598876953125, -0.764404296875, -0.70281982421875, -0.6412353515625, -0.57965087890625, -0.51806640625, -0.45648193359375, -0.3948974609375, -0.33331298828125, -0.271728515625, -0.21014404296875, -0.1485595703125, -0.08697509765625, -0.025390625, 0.03619384765625, 0.0977783203125, 0.15936279296875, 0.220947265625, 0.28253173828125, 0.3441162109375, 0.40570068359375, 0.46728515625, 0.52886962890625, 0.5904541015625, 0.65203857421875, 0.713623046875, 0.77520751953125, 0.8367919921875, 0.89837646484375, 0.9599609375, 1.02154541015625, 1.0831298828125, 1.14471435546875, 1.206298828125, 1.26788330078125, 1.3294677734375, 1.39105224609375, 1.45263671875, 1.51422119140625, 1.5758056640625, 1.63739013671875, 1.698974609375, 1.76055908203125, 1.8221435546875, 1.88372802734375, 1.9453125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 6.0, 5.0, 9.0, 11.0, 10.0, 15.0, 19.0, 24.0, 21.0, 20.0, 40.0, 27.0, 47.0, 49.0, 39.0, 47.0, 61.0, 49.0, 51.0, 60.0, 73.0, 31.0, 33.0, 48.0, 35.0, 31.0, 25.0, 19.0, 12.0, 11.0, 20.0, 17.0, 8.0, 13.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.122962951660156, -11.743892669677734, -11.364823341369629, -10.985753059387207, -10.606683731079102, -10.22761344909668, -9.848543167114258, -9.469472885131836, -9.09040355682373, -8.711333274841309, -8.332263946533203, -7.953193664550781, -7.574123859405518, -7.195054054260254, -6.815983772277832, -6.436913967132568, -6.057844161987305, -5.678774356842041, -5.299704551696777, -4.9206342697143555, -4.541564464569092, -4.162494659423828, -3.7834246158599854, -3.4043545722961426, -3.025284767150879, -2.6462149620056152, -2.2671449184417725, -1.8880749940872192, -1.509005069732666, -1.1299351453781128, -0.7508652210235596, -0.3717951774597168, 0.007274627685546875, 0.3863445520401001, 0.7654144763946533, 1.1444844007492065, 1.5235543251037598, 1.902624249458313, 2.281694173812866, 2.660764217376709, 3.0398340225219727, 3.4189038276672363, 3.797973871231079, 4.177043914794922, 4.5561137199401855, 4.935183525085449, 5.314253807067871, 5.693323612213135, 6.072393417358398, 6.451463222503662, 6.830533027648926, 7.209603309631348, 7.588673114776611, 7.967742919921875, 8.346813201904297, 8.725883483886719, 9.104952812194824, 9.484023094177246, 9.863092422485352, 10.242162704467773, 10.621232986450195, 11.0003023147583, 11.379372596740723, 11.758441925048828, 12.13751220703125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 13.0, 10.0, 11.0, 14.0, 21.0, 21.0, 13.0, 19.0, 24.0, 21.0, 40.0, 30.0, 38.0, 51.0, 43.0, 30.0, 46.0, 35.0, 39.0, 46.0, 30.0, 42.0, 41.0, 29.0, 22.0, 28.0, 27.0, 29.0, 31.0, 17.0, 20.0, 24.0, 11.0, 16.0, 15.0, 15.0, 8.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.735739707946777, -7.48982572555542, -7.2439117431640625, -6.997997760772705, -6.752083778381348, -6.50616979598999, -6.260255813598633, -6.014341831207275, -5.768427848815918, -5.5225138664245605, -5.276599884033203, -5.030685901641846, -4.784771919250488, -4.538857936859131, -4.292943954467773, -4.047029972076416, -3.8011162281036377, -3.5552022457122803, -3.309288263320923, -3.0633742809295654, -2.817460298538208, -2.5715465545654297, -2.3256325721740723, -2.079718589782715, -1.8338044881820679, -1.5878905057907104, -1.341976523399353, -1.0960626602172852, -0.850148618221283, -0.6042346954345703, -0.3583207130432129, -0.11240673065185547, 0.13350725173950195, 0.3794212341308594, 0.6253352165222168, 0.8712491393089294, 1.1171631813049316, 1.3630770444869995, 1.608991026878357, 1.8549050092697144, 2.1008191108703613, 2.3467330932617188, 2.592647075653076, 2.8385610580444336, 3.084475040435791, 3.3303890228271484, 3.576303005218506, 3.8222169876098633, 4.0681304931640625, 4.31404447555542, 4.559958457946777, 4.805872440338135, 5.051786422729492, 5.29770040512085, 5.543614387512207, 5.7895283699035645, 6.035442352294922, 6.281356334686279, 6.527270317077637, 6.773184299468994, 7.019098281860352, 7.265012264251709, 7.510926246643066, 7.756840229034424, 8.002754211425781]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [5.0, 4.0, 10.0, 7.0, 18.0, 28.0, 36.0, 69.0, 87.0, 150.0, 233.0, 367.0, 582.0, 850.0, 1477.0, 2163.0, 3567.0, 6069.0, 10181.0, 17147.0, 30263.0, 52705.0, 97186.0, 180228.0, 335413.0, 581254.0, 807711.0, 798423.0, 562165.0, 321863.0, 172463.0, 91872.0, 50666.0, 28436.0, 16379.0, 9590.0, 5677.0, 3495.0, 2082.0, 1280.0, 766.0, 446.0, 325.0, 183.0, 135.0, 90.0, 54.0, 45.0, 23.0, 11.0, 10.0, 7.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.73388671875, -8.3974609375, -8.06103515625, -7.724609375, -7.38818359375, -7.0517578125, -6.71533203125, -6.37890625, -6.04248046875, -5.7060546875, -5.36962890625, -5.033203125, -4.69677734375, -4.3603515625, -4.02392578125, -3.6875, -3.35107421875, -3.0146484375, -2.67822265625, -2.341796875, -2.00537109375, -1.6689453125, -1.33251953125, -0.99609375, -0.65966796875, -0.3232421875, 0.01318359375, 0.349609375, 0.68603515625, 1.0224609375, 1.35888671875, 1.6953125, 2.03173828125, 2.3681640625, 2.70458984375, 3.041015625, 3.37744140625, 3.7138671875, 4.05029296875, 4.38671875, 4.72314453125, 5.0595703125, 5.39599609375, 5.732421875, 6.06884765625, 6.4052734375, 6.74169921875, 7.078125, 7.41455078125, 7.7509765625, 8.08740234375, 8.423828125, 8.76025390625, 9.0966796875, 9.43310546875, 9.76953125, 10.10595703125, 10.4423828125, 10.77880859375, 11.115234375, 11.45166015625, 11.7880859375, 12.12451171875, 12.4609375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 11.0, 7.0, 10.0, 21.0, 11.0, 17.0, 21.0, 22.0, 31.0, 45.0, 27.0, 27.0, 30.0, 33.0, 43.0, 44.0, 43.0, 47.0, 36.0, 46.0, 42.0, 51.0, 36.0, 33.0, 34.0, 26.0, 31.0, 22.0, 32.0, 22.0, 16.0, 16.0, 12.0, 7.0, 10.0, 8.0, 6.0, 5.0, 8.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.80462646484375, -8.5389404296875, -8.27325439453125, -8.007568359375, -7.74188232421875, -7.4761962890625, -7.21051025390625, -6.94482421875, -6.67913818359375, -6.4134521484375, -6.14776611328125, -5.882080078125, -5.61639404296875, -5.3507080078125, -5.08502197265625, -4.8193359375, -4.55364990234375, -4.2879638671875, -4.02227783203125, -3.756591796875, -3.49090576171875, -3.2252197265625, -2.95953369140625, -2.69384765625, -2.42816162109375, -2.1624755859375, -1.89678955078125, -1.631103515625, -1.36541748046875, -1.0997314453125, -0.83404541015625, -0.568359375, -0.30267333984375, -0.0369873046875, 0.22869873046875, 0.494384765625, 0.76007080078125, 1.0257568359375, 1.29144287109375, 1.55712890625, 1.82281494140625, 2.0885009765625, 2.35418701171875, 2.619873046875, 2.88555908203125, 3.1512451171875, 3.41693115234375, 3.6826171875, 3.94830322265625, 4.2139892578125, 4.47967529296875, 4.745361328125, 5.01104736328125, 5.2767333984375, 5.54241943359375, 5.80810546875, 6.07379150390625, 6.3394775390625, 6.60516357421875, 6.870849609375, 7.13653564453125, 7.4022216796875, 7.66790771484375, 7.93359375]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 18.0, 19.0, 37.0, 34.0, 69.0, 96.0, 145.0, 276.0, 357.0, 558.0, 945.0, 1575.0, 2480.0, 3986.0, 6762.0, 11503.0, 20078.0, 35114.0, 64625.0, 118348.0, 219939.0, 399606.0, 654743.0, 843349.0, 738913.0, 477081.0, 269107.0, 145174.0, 78291.0, 42624.0, 24169.0, 13807.0, 8005.0, 4717.0, 2893.0, 1748.0, 1088.0, 673.0, 434.0, 334.0, 183.0, 145.0, 77.0, 53.0, 34.0, 24.0, 13.0, 11.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-16.125, -15.64599609375, -15.1669921875, -14.68798828125, -14.208984375, -13.72998046875, -13.2509765625, -12.77197265625, -12.29296875, -11.81396484375, -11.3349609375, -10.85595703125, -10.376953125, -9.89794921875, -9.4189453125, -8.93994140625, -8.4609375, -7.98193359375, -7.5029296875, -7.02392578125, -6.544921875, -6.06591796875, -5.5869140625, -5.10791015625, -4.62890625, -4.14990234375, -3.6708984375, -3.19189453125, -2.712890625, -2.23388671875, -1.7548828125, -1.27587890625, -0.796875, -0.31787109375, 0.1611328125, 0.64013671875, 1.119140625, 1.59814453125, 2.0771484375, 2.55615234375, 3.03515625, 3.51416015625, 3.9931640625, 4.47216796875, 4.951171875, 5.43017578125, 5.9091796875, 6.38818359375, 6.8671875, 7.34619140625, 7.8251953125, 8.30419921875, 8.783203125, 9.26220703125, 9.7412109375, 10.22021484375, 10.69921875, 11.17822265625, 11.6572265625, 12.13623046875, 12.615234375, 13.09423828125, 13.5732421875, 14.05224609375, 14.53125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 8.0, 17.0, 20.0, 20.0, 32.0, 38.0, 52.0, 58.0, 58.0, 72.0, 98.0, 137.0, 182.0, 192.0, 227.0, 251.0, 224.0, 255.0, 273.0, 298.0, 246.0, 199.0, 194.0, 186.0, 144.0, 140.0, 108.0, 81.0, 52.0, 49.0, 40.0, 43.0, 30.0, 13.0, 11.0, 4.0, 7.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.36590576171875, -4.2044677734375, -4.04302978515625, -3.881591796875, -3.72015380859375, -3.5587158203125, -3.39727783203125, -3.23583984375, -3.07440185546875, -2.9129638671875, -2.75152587890625, -2.590087890625, -2.42864990234375, -2.2672119140625, -2.10577392578125, -1.9443359375, -1.78289794921875, -1.6214599609375, -1.46002197265625, -1.298583984375, -1.13714599609375, -0.9757080078125, -0.81427001953125, -0.65283203125, -0.49139404296875, -0.3299560546875, -0.16851806640625, -0.007080078125, 0.15435791015625, 0.3157958984375, 0.47723388671875, 0.638671875, 0.80010986328125, 0.9615478515625, 1.12298583984375, 1.284423828125, 1.44586181640625, 1.6072998046875, 1.76873779296875, 1.93017578125, 2.09161376953125, 2.2530517578125, 2.41448974609375, 2.575927734375, 2.73736572265625, 2.8988037109375, 3.06024169921875, 3.2216796875, 3.38311767578125, 3.5445556640625, 3.70599365234375, 3.867431640625, 4.02886962890625, 4.1903076171875, 4.35174560546875, 4.51318359375, 4.67462158203125, 4.8360595703125, 4.99749755859375, 5.158935546875, 5.32037353515625, 5.4818115234375, 5.64324951171875, 5.8046875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 8.0, 5.0, 14.0, 10.0, 14.0, 20.0, 14.0, 27.0, 26.0, 40.0, 35.0, 35.0, 46.0, 54.0, 50.0, 52.0, 53.0, 54.0, 53.0, 47.0, 47.0, 47.0, 37.0, 23.0, 28.0, 39.0, 25.0, 20.0, 14.0, 12.0, 12.0, 4.0, 5.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.755992889404297, -17.209001541137695, -16.662010192871094, -16.115018844604492, -15.56802749633789, -15.021036148071289, -14.474045753479004, -13.927054405212402, -13.3800630569458, -12.8330717086792, -12.286080360412598, -11.739089012145996, -11.192098617553711, -10.64510726928711, -10.098115921020508, -9.551124572753906, -9.004133224487305, -8.457141876220703, -7.910150527954102, -7.363159656524658, -6.816168308258057, -6.269176959991455, -5.722186088562012, -5.17519474029541, -4.628203392028809, -4.081212043762207, -3.5342209339141846, -2.987229824066162, -2.4402384757995605, -1.893247127532959, -1.3462560176849365, -0.7992649078369141, -0.2522735595703125, 0.2947176694869995, 0.8417088985443115, 1.3887001276016235, 1.9356913566589355, 2.482682704925537, 3.0296738147735596, 3.576664924621582, 4.123656272888184, 4.670647621154785, 5.217638969421387, 5.76462984085083, 6.311621189117432, 6.858612537384033, 7.405603408813477, 7.952594757080078, 8.49958610534668, 9.046577453613281, 9.593568801879883, 10.140560150146484, 10.687551498413086, 11.234542846679688, 11.781533241271973, 12.328524589538574, 12.875515937805176, 13.422507286071777, 13.969498634338379, 14.51648998260498, 15.063480377197266, 15.610471725463867, 16.15746307373047, 16.70445442199707, 17.251445770263672]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 11.0, 11.0, 10.0, 14.0, 19.0, 19.0, 19.0, 25.0, 18.0, 25.0, 35.0, 27.0, 28.0, 30.0, 43.0, 33.0, 32.0, 38.0, 27.0, 38.0, 38.0, 34.0, 32.0, 34.0, 25.0, 32.0, 23.0, 30.0, 35.0, 26.0, 19.0, 18.0, 16.0, 17.0, 18.0, 16.0, 19.0, 6.0, 11.0, 8.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-9.7020845413208, -9.396124839782715, -9.090165138244629, -8.78420639038086, -8.478246688842773, -8.172286987304688, -7.866327285766602, -7.560368061065674, -7.254408836364746, -6.94844913482666, -6.642489910125732, -6.3365302085876465, -6.030570983886719, -5.724611282348633, -5.418651580810547, -5.112692356109619, -4.806732654571533, -4.500772953033447, -4.1948137283325195, -3.8888540267944336, -3.582894802093506, -3.27693510055542, -2.970975637435913, -2.6650161743164062, -2.3590567111968994, -2.0530972480773926, -1.7471377849578857, -1.4411782026290894, -1.1352187395095825, -0.8292592763900757, -0.5232996940612793, -0.21734023094177246, 0.08861923217773438, 0.3945787250995636, 0.7005382180213928, 1.0064977407455444, 1.3124572038650513, 1.618416666984558, 1.9243762493133545, 2.2303357124328613, 2.536295175552368, 2.842254638671875, 3.148214101791382, 3.4541735649108887, 3.7601332664489746, 4.066092491149902, 4.372052192687988, 4.678011894226074, 4.983971118927002, 5.289930820465088, 5.595890045166016, 5.901849746704102, 6.207808971405029, 6.513768672943115, 6.819727897644043, 7.125687599182129, 7.431647300720215, 7.737607002258301, 8.043566703796387, 8.349525451660156, 8.655485153198242, 8.961444854736328, 9.267404556274414, 9.5733642578125, 9.87932300567627]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 9.0, 11.0, 27.0, 27.0, 69.0, 91.0, 125.0, 232.0, 364.0, 584.0, 996.0, 1530.0, 2577.0, 4309.0, 7073.0, 11893.0, 20196.0, 34496.0, 59493.0, 98685.0, 150991.0, 188987.0, 170730.0, 117805.0, 73009.0, 42597.0, 25169.0, 14509.0, 8687.0, 5158.0, 3199.0, 1912.0, 1131.0, 690.0, 431.0, 269.0, 159.0, 94.0, 79.0, 48.0, 30.0, 20.0, 15.0, 10.0, 4.0, 7.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0], "bins": [-1.4033203125, -1.3603973388671875, -1.317474365234375, -1.2745513916015625, -1.23162841796875, -1.1887054443359375, -1.145782470703125, -1.1028594970703125, -1.0599365234375, -1.0170135498046875, -0.974090576171875, -0.9311676025390625, -0.88824462890625, -0.8453216552734375, -0.802398681640625, -0.7594757080078125, -0.716552734375, -0.6736297607421875, -0.630706787109375, -0.5877838134765625, -0.54486083984375, -0.5019378662109375, -0.459014892578125, -0.4160919189453125, -0.3731689453125, -0.3302459716796875, -0.287322998046875, -0.2444000244140625, -0.20147705078125, -0.1585540771484375, -0.115631103515625, -0.0727081298828125, -0.02978515625, 0.0131378173828125, 0.056060791015625, 0.0989837646484375, 0.14190673828125, 0.1848297119140625, 0.227752685546875, 0.2706756591796875, 0.3135986328125, 0.3565216064453125, 0.399444580078125, 0.4423675537109375, 0.48529052734375, 0.5282135009765625, 0.571136474609375, 0.6140594482421875, 0.656982421875, 0.6999053955078125, 0.742828369140625, 0.7857513427734375, 0.82867431640625, 0.8715972900390625, 0.914520263671875, 0.9574432373046875, 1.0003662109375, 1.0432891845703125, 1.086212158203125, 1.1291351318359375, 1.17205810546875, 1.2149810791015625, 1.257904052734375, 1.3008270263671875, 1.34375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 6.0, 7.0, 4.0, 7.0, 10.0, 8.0, 15.0, 12.0, 15.0, 17.0, 21.0, 31.0, 27.0, 30.0, 34.0, 27.0, 38.0, 36.0, 35.0, 44.0, 44.0, 49.0, 30.0, 32.0, 37.0, 33.0, 32.0, 38.0, 33.0, 32.0, 26.0, 34.0, 24.0, 18.0, 18.0, 18.0, 18.0, 12.0, 12.0, 9.0, 5.0, 8.0, 4.0, 0.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.4921875, -12.1234130859375, -11.754638671875, -11.3858642578125, -11.01708984375, -10.6483154296875, -10.279541015625, -9.9107666015625, -9.5419921875, -9.1732177734375, -8.804443359375, -8.4356689453125, -8.06689453125, -7.6981201171875, -7.329345703125, -6.9605712890625, -6.591796875, -6.2230224609375, -5.854248046875, -5.4854736328125, -5.11669921875, -4.7479248046875, -4.379150390625, -4.0103759765625, -3.6416015625, -3.2728271484375, -2.904052734375, -2.5352783203125, -2.16650390625, -1.7977294921875, -1.428955078125, -1.0601806640625, -0.69140625, -0.3226318359375, 0.046142578125, 0.4149169921875, 0.78369140625, 1.1524658203125, 1.521240234375, 1.8900146484375, 2.2587890625, 2.6275634765625, 2.996337890625, 3.3651123046875, 3.73388671875, 4.1026611328125, 4.471435546875, 4.8402099609375, 5.208984375, 5.5777587890625, 5.946533203125, 6.3153076171875, 6.68408203125, 7.0528564453125, 7.421630859375, 7.7904052734375, 8.1591796875, 8.5279541015625, 8.896728515625, 9.2655029296875, 9.63427734375, 10.0030517578125, 10.371826171875, 10.7406005859375, 11.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 2.0, 7.0, 8.0, 11.0, 20.0, 35.0, 33.0, 46.0, 78.0, 104.0, 118.0, 214.0, 298.0, 435.0, 776.0, 1276.0, 2116.0, 3972.0, 7776.0, 16320.0, 42024.0, 786443.0, 137701.0, 24650.0, 11268.0, 5604.0, 2917.0, 1628.0, 981.0, 580.0, 362.0, 221.0, 175.0, 114.0, 80.0, 43.0, 41.0, 21.0, 16.0, 12.0, 11.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.849609375, -3.715728759765625, -3.58184814453125, -3.447967529296875, -3.3140869140625, -3.180206298828125, -3.04632568359375, -2.912445068359375, -2.778564453125, -2.644683837890625, -2.51080322265625, -2.376922607421875, -2.2430419921875, -2.109161376953125, -1.97528076171875, -1.841400146484375, -1.70751953125, -1.573638916015625, -1.43975830078125, -1.305877685546875, -1.1719970703125, -1.038116455078125, -0.90423583984375, -0.770355224609375, -0.636474609375, -0.502593994140625, -0.36871337890625, -0.234832763671875, -0.1009521484375, 0.032928466796875, 0.16680908203125, 0.300689697265625, 0.4345703125, 0.568450927734375, 0.70233154296875, 0.836212158203125, 0.9700927734375, 1.103973388671875, 1.23785400390625, 1.371734619140625, 1.505615234375, 1.639495849609375, 1.77337646484375, 1.907257080078125, 2.0411376953125, 2.175018310546875, 2.30889892578125, 2.442779541015625, 2.57666015625, 2.710540771484375, 2.84442138671875, 2.978302001953125, 3.1121826171875, 3.246063232421875, 3.37994384765625, 3.513824462890625, 3.647705078125, 3.781585693359375, 3.91546630859375, 4.049346923828125, 4.1832275390625, 4.317108154296875, 4.45098876953125, 4.584869384765625, 4.71875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 7.0, 5.0, 12.0, 15.0, 16.0, 20.0, 23.0, 18.0, 27.0, 25.0, 28.0, 26.0, 30.0, 37.0, 38.0, 36.0, 40.0, 33.0, 38.0, 41.0, 41.0, 45.0, 37.0, 40.0, 39.0, 48.0, 28.0, 29.0, 22.0, 29.0, 24.0, 20.0, 20.0, 16.0, 6.0, 7.0, 5.0, 4.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.7265625, -7.4775390625, -7.228515625, -6.9794921875, -6.73046875, -6.4814453125, -6.232421875, -5.9833984375, -5.734375, -5.4853515625, -5.236328125, -4.9873046875, -4.73828125, -4.4892578125, -4.240234375, -3.9912109375, -3.7421875, -3.4931640625, -3.244140625, -2.9951171875, -2.74609375, -2.4970703125, -2.248046875, -1.9990234375, -1.75, -1.5009765625, -1.251953125, -1.0029296875, -0.75390625, -0.5048828125, -0.255859375, -0.0068359375, 0.2421875, 0.4912109375, 0.740234375, 0.9892578125, 1.23828125, 1.4873046875, 1.736328125, 1.9853515625, 2.234375, 2.4833984375, 2.732421875, 2.9814453125, 3.23046875, 3.4794921875, 3.728515625, 3.9775390625, 4.2265625, 4.4755859375, 4.724609375, 4.9736328125, 5.22265625, 5.4716796875, 5.720703125, 5.9697265625, 6.21875, 6.4677734375, 6.716796875, 6.9658203125, 7.21484375, 7.4638671875, 7.712890625, 7.9619140625, 8.2109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 9.0, 5.0, 17.0, 15.0, 25.0, 30.0, 49.0, 57.0, 96.0, 129.0, 170.0, 254.0, 382.0, 517.0, 836.0, 1167.0, 1884.0, 2714.0, 4381.0, 7050.0, 11797.0, 22009.0, 73907.0, 841025.0, 36589.0, 17271.0, 9673.0, 5833.0, 3620.0, 2292.0, 1498.0, 989.0, 617.0, 484.0, 378.0, 243.0, 170.0, 101.0, 81.0, 63.0, 32.0, 30.0, 23.0, 14.0, 12.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8271484375, -0.79986572265625, -0.7725830078125, -0.74530029296875, -0.718017578125, -0.69073486328125, -0.6634521484375, -0.63616943359375, -0.60888671875, -0.58160400390625, -0.5543212890625, -0.52703857421875, -0.499755859375, -0.47247314453125, -0.4451904296875, -0.41790771484375, -0.390625, -0.36334228515625, -0.3360595703125, -0.30877685546875, -0.281494140625, -0.25421142578125, -0.2269287109375, -0.19964599609375, -0.17236328125, -0.14508056640625, -0.1177978515625, -0.09051513671875, -0.063232421875, -0.03594970703125, -0.0086669921875, 0.01861572265625, 0.0458984375, 0.07318115234375, 0.1004638671875, 0.12774658203125, 0.155029296875, 0.18231201171875, 0.2095947265625, 0.23687744140625, 0.26416015625, 0.29144287109375, 0.3187255859375, 0.34600830078125, 0.373291015625, 0.40057373046875, 0.4278564453125, 0.45513916015625, 0.482421875, 0.50970458984375, 0.5369873046875, 0.56427001953125, 0.591552734375, 0.61883544921875, 0.6461181640625, 0.67340087890625, 0.70068359375, 0.72796630859375, 0.7552490234375, 0.78253173828125, 0.809814453125, 0.83709716796875, 0.8643798828125, 0.89166259765625, 0.9189453125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 5.0, 1.0, 8.0, 8.0, 7.0, 5.0, 19.0, 20.0, 12.0, 11.0, 18.0, 24.0, 21.0, 26.0, 37.0, 34.0, 36.0, 41.0, 58.0, 48.0, 30.0, 54.0, 54.0, 47.0, 36.0, 39.0, 36.0, 40.0, 27.0, 32.0, 35.0, 27.0, 21.0, 9.0, 11.0, 18.0, 11.0, 8.0, 8.0, 7.0, 9.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.5762786865234375e-05, -3.473460674285889e-05, -3.37064266204834e-05, -3.267824649810791e-05, -3.165006637573242e-05, -3.0621886253356934e-05, -2.9593706130981445e-05, -2.8565526008605957e-05, -2.753734588623047e-05, -2.650916576385498e-05, -2.5480985641479492e-05, -2.4452805519104004e-05, -2.3424625396728516e-05, -2.2396445274353027e-05, -2.136826515197754e-05, -2.034008502960205e-05, -1.9311904907226562e-05, -1.8283724784851074e-05, -1.7255544662475586e-05, -1.6227364540100098e-05, -1.519918441772461e-05, -1.4171004295349121e-05, -1.3142824172973633e-05, -1.2114644050598145e-05, -1.1086463928222656e-05, -1.0058283805847168e-05, -9.03010368347168e-06, -8.001923561096191e-06, -6.973743438720703e-06, -5.945563316345215e-06, -4.9173831939697266e-06, -3.889203071594238e-06, -2.86102294921875e-06, -1.8328428268432617e-06, -8.046627044677734e-07, 2.2351741790771484e-07, 1.2516975402832031e-06, 2.2798776626586914e-06, 3.3080577850341797e-06, 4.336237907409668e-06, 5.364418029785156e-06, 6.3925981521606445e-06, 7.420778274536133e-06, 8.448958396911621e-06, 9.47713851928711e-06, 1.0505318641662598e-05, 1.1533498764038086e-05, 1.2561678886413574e-05, 1.3589859008789062e-05, 1.461803913116455e-05, 1.564621925354004e-05, 1.6674399375915527e-05, 1.7702579498291016e-05, 1.8730759620666504e-05, 1.9758939743041992e-05, 2.078711986541748e-05, 2.181529998779297e-05, 2.2843480110168457e-05, 2.3871660232543945e-05, 2.4899840354919434e-05, 2.5928020477294922e-05, 2.695620059967041e-05, 2.79843807220459e-05, 2.9012560844421387e-05, 3.0040740966796875e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 10.0, 5.0, 14.0, 21.0, 30.0, 30.0, 61.0, 102.0, 148.0, 265.0, 351.0, 525.0, 790.0, 1276.0, 2000.0, 3231.0, 5389.0, 8569.0, 14668.0, 25077.0, 42856.0, 73323.0, 121559.0, 179500.0, 195575.0, 147362.0, 92709.0, 54384.0, 31865.0, 18355.0, 10925.0, 6657.0, 4012.0, 2469.0, 1560.0, 1006.0, 661.0, 404.0, 287.0, 200.0, 119.0, 76.0, 46.0, 31.0, 21.0, 20.0, 8.0, 6.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54150390625, -0.5256805419921875, -0.509857177734375, -0.4940338134765625, -0.47821044921875, -0.4623870849609375, -0.446563720703125, -0.4307403564453125, -0.4149169921875, -0.3990936279296875, -0.383270263671875, -0.3674468994140625, -0.35162353515625, -0.3358001708984375, -0.319976806640625, -0.3041534423828125, -0.288330078125, -0.2725067138671875, -0.256683349609375, -0.2408599853515625, -0.22503662109375, -0.2092132568359375, -0.193389892578125, -0.1775665283203125, -0.1617431640625, -0.1459197998046875, -0.130096435546875, -0.1142730712890625, -0.09844970703125, -0.0826263427734375, -0.066802978515625, -0.0509796142578125, -0.03515625, -0.0193328857421875, -0.003509521484375, 0.0123138427734375, 0.02813720703125, 0.0439605712890625, 0.059783935546875, 0.0756072998046875, 0.0914306640625, 0.1072540283203125, 0.123077392578125, 0.1389007568359375, 0.15472412109375, 0.1705474853515625, 0.186370849609375, 0.2021942138671875, 0.218017578125, 0.2338409423828125, 0.249664306640625, 0.2654876708984375, 0.28131103515625, 0.2971343994140625, 0.312957763671875, 0.3287811279296875, 0.3446044921875, 0.3604278564453125, 0.376251220703125, 0.3920745849609375, 0.40789794921875, 0.4237213134765625, 0.439544677734375, 0.4553680419921875, 0.47119140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 14.0, 13.0, 8.0, 18.0, 16.0, 15.0, 19.0, 39.0, 39.0, 47.0, 55.0, 55.0, 64.0, 68.0, 64.0, 72.0, 55.0, 65.0, 52.0, 41.0, 21.0, 23.0, 29.0, 19.0, 19.0, 13.0, 9.0, 4.0, 6.0, 9.0, 6.0, 2.0, 1.0, 5.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.193115234375, -0.18789291381835938, -0.18267059326171875, -0.17744827270507812, -0.1722259521484375, -0.16700363159179688, -0.16178131103515625, -0.15655899047851562, -0.151336669921875, -0.14611434936523438, -0.14089202880859375, -0.13566970825195312, -0.1304473876953125, -0.12522506713867188, -0.12000274658203125, -0.11478042602539062, -0.10955810546875, -0.10433578491210938, -0.09911346435546875, -0.09389114379882812, -0.0886688232421875, -0.08344650268554688, -0.07822418212890625, -0.07300186157226562, -0.067779541015625, -0.06255722045898438, -0.05733489990234375, -0.052112579345703125, -0.0468902587890625, -0.041667938232421875, -0.03644561767578125, -0.031223297119140625, -0.0260009765625, -0.020778656005859375, -0.01555633544921875, -0.010334014892578125, -0.0051116943359375, 0.000110626220703125, 0.00533294677734375, 0.010555267333984375, 0.015777587890625, 0.020999908447265625, 0.02622222900390625, 0.031444549560546875, 0.0366668701171875, 0.041889190673828125, 0.04711151123046875, 0.052333831787109375, 0.05755615234375, 0.06277847290039062, 0.06800079345703125, 0.07322311401367188, 0.0784454345703125, 0.08366775512695312, 0.08889007568359375, 0.09411239624023438, 0.099334716796875, 0.10455703735351562, 0.10977935791015625, 0.11500167846679688, 0.1202239990234375, 0.12544631958007812, 0.13066864013671875, 0.13589096069335938, 0.14111328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 14.0, 11.0, 13.0, 20.0, 15.0, 19.0, 26.0, 37.0, 37.0, 36.0, 44.0, 47.0, 55.0, 50.0, 54.0, 48.0, 47.0, 54.0, 41.0, 49.0, 42.0, 30.0, 26.0, 35.0, 30.0, 19.0, 18.0, 16.0, 8.0, 7.0, 7.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.071125030517578, -16.5330867767334, -15.995046615600586, -15.457008361816406, -14.91896915435791, -14.380929946899414, -13.842891693115234, -13.304852485656738, -12.766813278198242, -12.228774070739746, -11.69073486328125, -11.15269660949707, -10.614657402038574, -10.076618194580078, -9.538579940795898, -9.000540733337402, -8.462501525878906, -7.92446231842041, -7.386423587799072, -6.848384857177734, -6.310345649719238, -5.772306442260742, -5.234267711639404, -4.696228981018066, -4.15818977355957, -3.6201508045196533, -3.0821118354797363, -2.5440728664398193, -2.0060338973999023, -1.4679949283599854, -0.9299559593200684, -0.39191699028015137, 0.14612388610839844, 0.6841628551483154, 1.2222018241882324, 1.7602407932281494, 2.2982797622680664, 2.8363187313079834, 3.3743577003479004, 3.9123966693878174, 4.450435638427734, 4.9884748458862305, 5.526513576507568, 6.064552307128906, 6.602591514587402, 7.140630722045898, 7.678669452667236, 8.216708183288574, 8.75474739074707, 9.292786598205566, 9.830825805664062, 10.368864059448242, 10.906903266906738, 11.444942474365234, 11.982980728149414, 12.52101993560791, 13.059059143066406, 13.597098350524902, 14.135137557983398, 14.673175811767578, 15.211215019226074, 15.74925422668457, 16.28729248046875, 16.825332641601562, 17.363370895385742]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 7.0, 4.0, 6.0, 5.0, 6.0, 13.0, 10.0, 10.0, 13.0, 19.0, 18.0, 18.0, 27.0, 18.0, 25.0, 32.0, 31.0, 27.0, 29.0, 46.0, 32.0, 31.0, 37.0, 35.0, 33.0, 37.0, 36.0, 28.0, 37.0, 24.0, 34.0, 25.0, 28.0, 34.0, 26.0, 19.0, 16.0, 18.0, 18.0, 16.0, 15.0, 19.0, 7.0, 11.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.865306854248047, -9.556503295898438, -9.247699737548828, -8.938896179199219, -8.63009262084961, -8.321290016174316, -8.012486457824707, -7.703682899475098, -7.394879341125488, -7.086075782775879, -6.7772722244262695, -6.468469142913818, -6.159665584564209, -5.8508620262146, -5.542058944702148, -5.233255386352539, -4.92445182800293, -4.61564826965332, -4.306844711303711, -3.9980416297912598, -3.6892380714416504, -3.380434513092041, -3.0716311931610107, -2.7628278732299805, -2.454024314880371, -2.1452207565307617, -1.8364174365997314, -1.5276139974594116, -1.2188105583190918, -0.910007119178772, -0.6012036800384521, -0.2924003601074219, 0.016402244567871094, 0.3252056837081909, 0.6340091228485107, 0.9428125619888306, 1.2516160011291504, 1.5604194402694702, 1.86922287940979, 2.1780261993408203, 2.4868297576904297, 2.795633316040039, 3.1044366359710693, 3.4132399559020996, 3.722043514251709, 4.030847072601318, 4.3396501541137695, 4.648453712463379, 4.957257270812988, 5.266060829162598, 5.574864387512207, 5.883667469024658, 6.192471027374268, 6.501274585723877, 6.810077667236328, 7.1188812255859375, 7.427684783935547, 7.736488342285156, 8.045291900634766, 8.354095458984375, 8.662899017333984, 8.971701622009277, 9.280505180358887, 9.589308738708496, 9.898112297058105]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 9.0, 16.0, 15.0, 24.0, 33.0, 70.0, 83.0, 162.0, 247.0, 390.0, 630.0, 1089.0, 1913.0, 3379.0, 6409.0, 11348.0, 21308.0, 38771.0, 68895.0, 113305.0, 161112.0, 184051.0, 162827.0, 114693.0, 70139.0, 39483.0, 21756.0, 11647.0, 6384.0, 3496.0, 1967.0, 1159.0, 662.0, 416.0, 230.0, 162.0, 92.0, 59.0, 36.0, 28.0, 18.0, 8.0, 15.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-12.015625, -11.6461181640625, -11.276611328125, -10.9071044921875, -10.53759765625, -10.1680908203125, -9.798583984375, -9.4290771484375, -9.0595703125, -8.6900634765625, -8.320556640625, -7.9510498046875, -7.58154296875, -7.2120361328125, -6.842529296875, -6.4730224609375, -6.103515625, -5.7340087890625, -5.364501953125, -4.9949951171875, -4.62548828125, -4.2559814453125, -3.886474609375, -3.5169677734375, -3.1474609375, -2.7779541015625, -2.408447265625, -2.0389404296875, -1.66943359375, -1.2999267578125, -0.930419921875, -0.5609130859375, -0.19140625, 0.1781005859375, 0.547607421875, 0.9171142578125, 1.28662109375, 1.6561279296875, 2.025634765625, 2.3951416015625, 2.7646484375, 3.1341552734375, 3.503662109375, 3.8731689453125, 4.24267578125, 4.6121826171875, 4.981689453125, 5.3511962890625, 5.720703125, 6.0902099609375, 6.459716796875, 6.8292236328125, 7.19873046875, 7.5682373046875, 7.937744140625, 8.3072509765625, 8.6767578125, 9.0462646484375, 9.415771484375, 9.7852783203125, 10.15478515625, 10.5242919921875, 10.893798828125, 11.2633056640625, 11.6328125]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 8.0, 9.0, 10.0, 16.0, 9.0, 18.0, 23.0, 27.0, 23.0, 36.0, 24.0, 25.0, 40.0, 43.0, 39.0, 38.0, 45.0, 47.0, 46.0, 46.0, 40.0, 44.0, 34.0, 37.0, 43.0, 26.0, 28.0, 36.0, 28.0, 14.0, 23.0, 17.0, 12.0, 13.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.0390625, -12.6461181640625, -12.253173828125, -11.8602294921875, -11.46728515625, -11.0743408203125, -10.681396484375, -10.2884521484375, -9.8955078125, -9.5025634765625, -9.109619140625, -8.7166748046875, -8.32373046875, -7.9307861328125, -7.537841796875, -7.1448974609375, -6.751953125, -6.3590087890625, -5.966064453125, -5.5731201171875, -5.18017578125, -4.7872314453125, -4.394287109375, -4.0013427734375, -3.6083984375, -3.2154541015625, -2.822509765625, -2.4295654296875, -2.03662109375, -1.6436767578125, -1.250732421875, -0.8577880859375, -0.46484375, -0.0718994140625, 0.321044921875, 0.7139892578125, 1.10693359375, 1.4998779296875, 1.892822265625, 2.2857666015625, 2.6787109375, 3.0716552734375, 3.464599609375, 3.8575439453125, 4.25048828125, 4.6434326171875, 5.036376953125, 5.4293212890625, 5.822265625, 6.2152099609375, 6.608154296875, 7.0010986328125, 7.39404296875, 7.7869873046875, 8.179931640625, 8.5728759765625, 8.9658203125, 9.3587646484375, 9.751708984375, 10.1446533203125, 10.53759765625, 10.9305419921875, 11.323486328125, 11.7164306640625, 12.109375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 19.0, 21.0, 37.0, 48.0, 74.0, 107.0, 169.0, 247.0, 374.0, 612.0, 1005.0, 1660.0, 2869.0, 4783.0, 8542.0, 15858.0, 29247.0, 56062.0, 103252.0, 172553.0, 217229.0, 183935.0, 114379.0, 62566.0, 32618.0, 17423.0, 9641.0, 5345.0, 3053.0, 1798.0, 1060.0, 679.0, 458.0, 270.0, 174.0, 108.0, 83.0, 55.0, 43.0, 31.0, 17.0, 15.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-19.125, -18.5380859375, -17.951171875, -17.3642578125, -16.77734375, -16.1904296875, -15.603515625, -15.0166015625, -14.4296875, -13.8427734375, -13.255859375, -12.6689453125, -12.08203125, -11.4951171875, -10.908203125, -10.3212890625, -9.734375, -9.1474609375, -8.560546875, -7.9736328125, -7.38671875, -6.7998046875, -6.212890625, -5.6259765625, -5.0390625, -4.4521484375, -3.865234375, -3.2783203125, -2.69140625, -2.1044921875, -1.517578125, -0.9306640625, -0.34375, 0.2431640625, 0.830078125, 1.4169921875, 2.00390625, 2.5908203125, 3.177734375, 3.7646484375, 4.3515625, 4.9384765625, 5.525390625, 6.1123046875, 6.69921875, 7.2861328125, 7.873046875, 8.4599609375, 9.046875, 9.6337890625, 10.220703125, 10.8076171875, 11.39453125, 11.9814453125, 12.568359375, 13.1552734375, 13.7421875, 14.3291015625, 14.916015625, 15.5029296875, 16.08984375, 16.6767578125, 17.263671875, 17.8505859375, 18.4375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 6.0, 8.0, 13.0, 12.0, 10.0, 16.0, 18.0, 17.0, 13.0, 20.0, 33.0, 21.0, 30.0, 38.0, 42.0, 44.0, 44.0, 48.0, 43.0, 37.0, 47.0, 48.0, 44.0, 47.0, 35.0, 33.0, 24.0, 32.0, 15.0, 33.0, 21.0, 27.0, 18.0, 10.0, 10.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9375, -6.701904296875, -6.46630859375, -6.230712890625, -5.9951171875, -5.759521484375, -5.52392578125, -5.288330078125, -5.052734375, -4.817138671875, -4.58154296875, -4.345947265625, -4.1103515625, -3.874755859375, -3.63916015625, -3.403564453125, -3.16796875, -2.932373046875, -2.69677734375, -2.461181640625, -2.2255859375, -1.989990234375, -1.75439453125, -1.518798828125, -1.283203125, -1.047607421875, -0.81201171875, -0.576416015625, -0.3408203125, -0.105224609375, 0.13037109375, 0.365966796875, 0.6015625, 0.837158203125, 1.07275390625, 1.308349609375, 1.5439453125, 1.779541015625, 2.01513671875, 2.250732421875, 2.486328125, 2.721923828125, 2.95751953125, 3.193115234375, 3.4287109375, 3.664306640625, 3.89990234375, 4.135498046875, 4.37109375, 4.606689453125, 4.84228515625, 5.077880859375, 5.3134765625, 5.549072265625, 5.78466796875, 6.020263671875, 6.255859375, 6.491455078125, 6.72705078125, 6.962646484375, 7.1982421875, 7.433837890625, 7.66943359375, 7.905029296875, 8.140625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 5.0, 9.0, 11.0, 26.0, 31.0, 45.0, 53.0, 89.0, 134.0, 175.0, 230.0, 340.0, 515.0, 681.0, 947.0, 1463.0, 2214.0, 3277.0, 5222.0, 8441.0, 13862.0, 23301.0, 39998.0, 68952.0, 112389.0, 161351.0, 182344.0, 156916.0, 106713.0, 64578.0, 37127.0, 21955.0, 12818.0, 7762.0, 4865.0, 3041.0, 2000.0, 1394.0, 954.0, 705.0, 477.0, 336.0, 221.0, 168.0, 104.0, 79.0, 77.0, 46.0, 34.0, 22.0, 25.0, 8.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0], "bins": [-9.578125, -9.2828369140625, -8.987548828125, -8.6922607421875, -8.39697265625, -8.1016845703125, -7.806396484375, -7.5111083984375, -7.2158203125, -6.9205322265625, -6.625244140625, -6.3299560546875, -6.03466796875, -5.7393798828125, -5.444091796875, -5.1488037109375, -4.853515625, -4.5582275390625, -4.262939453125, -3.9676513671875, -3.67236328125, -3.3770751953125, -3.081787109375, -2.7864990234375, -2.4912109375, -2.1959228515625, -1.900634765625, -1.6053466796875, -1.31005859375, -1.0147705078125, -0.719482421875, -0.4241943359375, -0.12890625, 0.1663818359375, 0.461669921875, 0.7569580078125, 1.05224609375, 1.3475341796875, 1.642822265625, 1.9381103515625, 2.2333984375, 2.5286865234375, 2.823974609375, 3.1192626953125, 3.41455078125, 3.7098388671875, 4.005126953125, 4.3004150390625, 4.595703125, 4.8909912109375, 5.186279296875, 5.4815673828125, 5.77685546875, 6.0721435546875, 6.367431640625, 6.6627197265625, 6.9580078125, 7.2532958984375, 7.548583984375, 7.8438720703125, 8.13916015625, 8.4344482421875, 8.729736328125, 9.0250244140625, 9.3203125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 8.0, 7.0, 11.0, 10.0, 13.0, 22.0, 16.0, 22.0, 38.0, 52.0, 55.0, 46.0, 69.0, 80.0, 81.0, 66.0, 69.0, 71.0, 43.0, 48.0, 38.0, 27.0, 24.0, 17.0, 13.0, 13.0, 7.0, 7.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.0016374588012695312, -0.0015962719917297363, -0.0015550851821899414, -0.0015138983726501465, -0.0014727115631103516, -0.0014315247535705566, -0.0013903379440307617, -0.0013491511344909668, -0.0013079643249511719, -0.001266777515411377, -0.001225590705871582, -0.0011844038963317871, -0.0011432170867919922, -0.0011020302772521973, -0.0010608434677124023, -0.0010196566581726074, -0.0009784698486328125, -0.0009372830390930176, -0.0008960962295532227, -0.0008549094200134277, -0.0008137226104736328, -0.0007725358009338379, -0.000731348991394043, -0.000690162181854248, -0.0006489753723144531, -0.0006077885627746582, -0.0005666017532348633, -0.0005254149436950684, -0.00048422813415527344, -0.0004430413246154785, -0.0004018545150756836, -0.00036066770553588867, -0.00031948089599609375, -0.00027829408645629883, -0.0002371072769165039, -0.00019592046737670898, -0.00015473365783691406, -0.00011354684829711914, -7.236003875732422e-05, -3.11732292175293e-05, 1.0013580322265625e-05, 5.120038986206055e-05, 9.238719940185547e-05, 0.0001335740089416504, 0.0001747608184814453, 0.00021594762802124023, 0.00025713443756103516, 0.0002983212471008301, 0.000339508056640625, 0.0003806948661804199, 0.00042188167572021484, 0.00046306848526000977, 0.0005042552947998047, 0.0005454421043395996, 0.0005866289138793945, 0.0006278157234191895, 0.0006690025329589844, 0.0007101893424987793, 0.0007513761520385742, 0.0007925629615783691, 0.0008337497711181641, 0.000874936580657959, 0.0009161233901977539, 0.0009573101997375488, 0.0009984970092773438]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 6.0, 10.0, 22.0, 27.0, 36.0, 61.0, 76.0, 107.0, 143.0, 228.0, 354.0, 479.0, 786.0, 1113.0, 1630.0, 2717.0, 4018.0, 6463.0, 10238.0, 17417.0, 29917.0, 51659.0, 87266.0, 137393.0, 178373.0, 176341.0, 133329.0, 84709.0, 49992.0, 28935.0, 16909.0, 10116.0, 6105.0, 4069.0, 2532.0, 1671.0, 1074.0, 738.0, 482.0, 311.0, 214.0, 141.0, 119.0, 72.0, 47.0, 31.0, 36.0, 15.0, 6.0, 4.0, 10.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.578125, -9.296142578125, -9.01416015625, -8.732177734375, -8.4501953125, -8.168212890625, -7.88623046875, -7.604248046875, -7.322265625, -7.040283203125, -6.75830078125, -6.476318359375, -6.1943359375, -5.912353515625, -5.63037109375, -5.348388671875, -5.06640625, -4.784423828125, -4.50244140625, -4.220458984375, -3.9384765625, -3.656494140625, -3.37451171875, -3.092529296875, -2.810546875, -2.528564453125, -2.24658203125, -1.964599609375, -1.6826171875, -1.400634765625, -1.11865234375, -0.836669921875, -0.5546875, -0.272705078125, 0.00927734375, 0.291259765625, 0.5732421875, 0.855224609375, 1.13720703125, 1.419189453125, 1.701171875, 1.983154296875, 2.26513671875, 2.547119140625, 2.8291015625, 3.111083984375, 3.39306640625, 3.675048828125, 3.95703125, 4.239013671875, 4.52099609375, 4.802978515625, 5.0849609375, 5.366943359375, 5.64892578125, 5.930908203125, 6.212890625, 6.494873046875, 6.77685546875, 7.058837890625, 7.3408203125, 7.622802734375, 7.90478515625, 8.186767578125, 8.46875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 4.0, 7.0, 6.0, 6.0, 8.0, 11.0, 20.0, 21.0, 24.0, 24.0, 38.0, 36.0, 52.0, 61.0, 71.0, 65.0, 72.0, 51.0, 55.0, 56.0, 48.0, 41.0, 45.0, 28.0, 25.0, 16.0, 16.0, 12.0, 15.0, 15.0, 9.0, 6.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.455078125, -2.377197265625, -2.29931640625, -2.221435546875, -2.1435546875, -2.065673828125, -1.98779296875, -1.909912109375, -1.83203125, -1.754150390625, -1.67626953125, -1.598388671875, -1.5205078125, -1.442626953125, -1.36474609375, -1.286865234375, -1.208984375, -1.131103515625, -1.05322265625, -0.975341796875, -0.8974609375, -0.819580078125, -0.74169921875, -0.663818359375, -0.5859375, -0.508056640625, -0.43017578125, -0.352294921875, -0.2744140625, -0.196533203125, -0.11865234375, -0.040771484375, 0.037109375, 0.114990234375, 0.19287109375, 0.270751953125, 0.3486328125, 0.426513671875, 0.50439453125, 0.582275390625, 0.66015625, 0.738037109375, 0.81591796875, 0.893798828125, 0.9716796875, 1.049560546875, 1.12744140625, 1.205322265625, 1.283203125, 1.361083984375, 1.43896484375, 1.516845703125, 1.5947265625, 1.672607421875, 1.75048828125, 1.828369140625, 1.90625, 1.984130859375, 2.06201171875, 2.139892578125, 2.2177734375, 2.295654296875, 2.37353515625, 2.451416015625, 2.529296875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 5.0, 3.0, 3.0, 8.0, 8.0, 8.0, 17.0, 16.0, 21.0, 23.0, 23.0, 26.0, 36.0, 42.0, 41.0, 31.0, 52.0, 52.0, 53.0, 67.0, 49.0, 54.0, 49.0, 52.0, 37.0, 36.0, 31.0, 30.0, 28.0, 19.0, 17.0, 13.0, 11.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.077926635742188, -20.463621139526367, -19.849315643310547, -19.235010147094727, -18.620704650878906, -18.006399154663086, -17.392093658447266, -16.777786254882812, -16.163482666015625, -15.549177169799805, -14.934871673583984, -14.320566177368164, -13.706260681152344, -13.091955184936523, -12.477648735046387, -11.863343238830566, -11.24903678894043, -10.63473129272461, -10.020425796508789, -9.406120300292969, -8.791814804077148, -8.177509307861328, -7.563202857971191, -6.948897361755371, -6.334591865539551, -5.7202863693237305, -5.10598087310791, -4.491674900054932, -3.8773694038391113, -3.263063907623291, -2.6487581729888916, -2.034452438354492, -1.4201488494873047, -0.8058432340621948, -0.19153761863708496, 0.4227679967880249, 1.0370736122131348, 1.651379108428955, 2.2656848430633545, 2.879990577697754, 3.494296073913574, 4.1086015701293945, 4.722907066345215, 5.337213039398193, 5.951518535614014, 6.565824031829834, 7.1801300048828125, 7.794435501098633, 8.408740997314453, 9.023046493530273, 9.637351989746094, 10.251657485961914, 10.865962982177734, 11.480268478393555, 12.094574928283691, 12.708880424499512, 13.323185920715332, 13.937491416931152, 14.551796913146973, 15.166102409362793, 15.78040885925293, 16.39471435546875, 17.00901985168457, 17.62332534790039, 18.23763084411621]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 4.0, 11.0, 7.0, 10.0, 15.0, 17.0, 12.0, 10.0, 15.0, 21.0, 19.0, 33.0, 29.0, 26.0, 34.0, 33.0, 37.0, 47.0, 34.0, 38.0, 39.0, 40.0, 55.0, 27.0, 31.0, 34.0, 27.0, 36.0, 36.0, 27.0, 29.0, 23.0, 27.0, 12.0, 13.0, 13.0, 7.0, 18.0, 7.0, 7.0, 5.0, 7.0, 5.0, 8.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.295456886291504, -12.856975555419922, -12.41849422454834, -11.980012893676758, -11.541531562805176, -11.103050231933594, -10.664569854736328, -10.22608757019043, -9.787607192993164, -9.349125862121582, -8.91064453125, -8.472163200378418, -8.033681869506836, -7.595200538635254, -7.15671968460083, -6.718238353729248, -6.279756546020508, -5.841275215148926, -5.402793884277344, -4.964312553405762, -4.52583122253418, -4.087349891662598, -3.648869037628174, -3.210387706756592, -2.7719063758850098, -2.3334250450134277, -1.8949438333511353, -1.4564626216888428, -1.0179812908172607, -0.5794999599456787, -0.14101886749267578, 0.29746246337890625, 0.7359437942504883, 1.1744251251220703, 1.6129063367843628, 2.0513875484466553, 2.4898688793182373, 2.9283502101898193, 3.3668313026428223, 3.8053126335144043, 4.243793964385986, 4.682275295257568, 5.12075662612915, 5.559237480163574, 5.997718811035156, 6.436200141906738, 6.87468147277832, 7.313162803649902, 7.751644134521484, 8.190125465393066, 8.628606796264648, 9.06708812713623, 9.505569458007812, 9.944050788879395, 10.382532119750977, 10.821012496948242, 11.25949478149414, 11.697976112365723, 12.136457443237305, 12.574938774108887, 13.013420104980469, 13.45190143585205, 13.890382766723633, 14.328863143920898, 14.76734447479248]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 7.0, 4.0, 6.0, 13.0, 8.0, 23.0, 24.0, 29.0, 42.0, 49.0, 74.0, 90.0, 130.0, 185.0, 258.0, 410.0, 593.0, 1104.0, 1882.0, 4602.0, 496139.0, 10543.0, 3664.0, 1690.0, 909.0, 598.0, 325.0, 210.0, 174.0, 121.0, 111.0, 64.0, 33.0, 30.0, 28.0, 22.0, 25.0, 16.0, 9.0, 5.0, 7.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.6606140136719, -263.2204895019531, -253.78036499023438, -244.34024047851562, -234.90011596679688, -225.45999145507812, -216.0198516845703, -206.57972717285156, -197.1396026611328, -187.69947814941406, -178.2593536376953, -168.81922912597656, -159.37908935546875, -149.93896484375, -140.49884033203125, -131.0587158203125, -121.61859130859375, -112.178466796875, -102.73834228515625, -93.29821014404297, -83.85808563232422, -74.41796112060547, -64.97782897949219, -55.53770446777344, -46.09757995605469, -36.65745544433594, -27.217327117919922, -17.77720069885254, -8.337074279785156, 1.1030502319335938, 10.54317855834961, 19.983306884765625, 29.423431396484375, 38.863555908203125, 48.30368423461914, 57.743812561035156, 67.1839370727539, 76.62406158447266, 86.06419372558594, 95.50431823730469, 104.94444274902344, 114.38456726074219, 123.82469177246094, 133.2648162841797, 142.7049560546875, 152.14508056640625, 161.585205078125, 171.02532958984375, 180.4654541015625, 189.90557861328125, 199.345703125, 208.78582763671875, 218.2259521484375, 227.66607666015625, 237.10621643066406, 246.5463409423828, 255.98646545410156, 265.4266052246094, 274.8667297363281, 284.3068542480469, 293.7469787597656, 303.1871032714844, 312.6272277832031, 322.0673522949219, 331.5074768066406]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 4.0, 7.0, 10.0, 12.0, 14.0, 18.0, 14.0, 6.0, 19.0, 18.0, 22.0, 30.0, 31.0, 27.0, 39.0, 31.0, 39.0, 40.0, 33.0, 32.0, 43.0, 1076.0, 44.0, 31.0, 28.0, 37.0, 26.0, 37.0, 30.0, 33.0, 21.0, 29.0, 19.0, 20.0, 9.0, 17.0, 10.0, 15.0, 4.0, 8.0, 4.0, 7.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-412.3919372558594, -398.66351318359375, -384.93511962890625, -371.20672607421875, -357.4783020019531, -343.7498779296875, -330.021484375, -316.2930908203125, -302.5646667480469, -288.83624267578125, -275.10784912109375, -261.37945556640625, -247.65103149414062, -233.92262268066406, -220.1942138671875, -206.46580505371094, -192.73739624023438, -179.0089874267578, -165.28057861328125, -151.5521697998047, -137.82376098632812, -124.09535217285156, -110.366943359375, -96.63853454589844, -82.91012573242188, -69.18171691894531, -55.45330810546875, -41.72489929199219, -27.996490478515625, -14.268081665039062, -0.5396728515625, 13.188735961914062, 26.917144775390625, 40.64555358886719, 54.37396240234375, 68.10237121582031, 81.83078002929688, 95.55918884277344, 109.28759765625, 123.01600646972656, 136.74441528320312, 150.4728240966797, 164.20123291015625, 177.9296417236328, 191.65805053710938, 205.38645935058594, 219.1148681640625, 232.84327697753906, 246.57168579101562, 260.30010986328125, 274.02850341796875, 287.75689697265625, 301.4853210449219, 315.2137451171875, 328.942138671875, 342.6705322265625, 356.3989562988281, 370.12738037109375, 383.85577392578125, 397.58416748046875, 411.3125915527344, 425.041015625, 438.7694091796875, 452.497802734375, 466.2262268066406]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 5.0, 6.0, 4.0, 9.0, 12.0, 6.0, 11.0, 10.0, 15.0, 26.0, 31.0, 28.0, 35.0, 50.0, 83.0, 110.0, 157.0, 258.0, 328.0, 512.0, 690.0, 926.0, 1171.0, 1581.0, 2182.0, 3398.0, 4810.0, 11404.0, 31146528.0, 52135.0, 10468.0, 7266.0, 6639.0, 1471.0, 632.0, 417.0, 279.0, 247.0, 168.0, 126.0, 108.0, 85.0, 41.0, 22.0, 8.0, 7.0, 0.0, 0.0, 1.0], "bins": [-690.6199951171875, -674.8472900390625, -659.0745849609375, -643.3018798828125, -627.5291137695312, -611.7564086914062, -595.9837036132812, -580.2109985351562, -564.4382934570312, -548.6655883789062, -532.8928833007812, -517.1201171875, -501.3474426269531, -485.57470703125, -469.802001953125, -454.029296875, -438.2565612792969, -422.4838562011719, -406.71112060546875, -390.93841552734375, -375.16571044921875, -359.39300537109375, -343.6202697753906, -327.8475646972656, -312.0748291015625, -296.3021240234375, -280.5293884277344, -264.7566833496094, -248.98397827148438, -233.2112579345703, -217.43853759765625, -201.66583251953125, -185.89309692382812, -170.12037658691406, -154.34767150878906, -138.574951171875, -122.80223846435547, -107.02952575683594, -91.25680541992188, -75.48409271240234, -59.71138000488281, -43.93866729736328, -28.165950775146484, -12.393234252929688, 3.3794784545898438, 19.152191162109375, 34.92491149902344, 50.69762420654297, 66.4703369140625, 82.24304962158203, 98.01576232910156, 113.78848266601562, 129.56118774414062, 145.3339080810547, 161.10662841796875, 176.87933349609375, 192.6520538330078, 208.42477416992188, 224.19747924804688, 239.97019958496094, 255.742919921875, 271.515625, 287.288330078125, 303.0610656738281, 318.8337707519531]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 20.0, 23.0, 20.0, 40.0, 43.0, 57.0, 62.0, 93.0, 99.0, 88.0, 80.0, 83.0, 54.0, 51.0, 33.0, 34.0, 17.0, 20.0, 17.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-550.7784423828125, -535.5905151367188, -520.402587890625, -505.21466064453125, -490.0267028808594, -474.8387756347656, -459.6508483886719, -444.4629211425781, -429.27496337890625, -414.0870361328125, -398.89910888671875, -383.711181640625, -368.5232238769531, -353.3352966308594, -338.1473693847656, -322.9594421386719, -307.7715148925781, -292.5835876464844, -277.3956604003906, -262.20770263671875, -247.019775390625, -231.83184814453125, -216.6439208984375, -201.45599365234375, -186.26805114746094, -171.0801239013672, -155.89218139648438, -140.70425415039062, -125.51631927490234, -110.32838439941406, -95.14045715332031, -79.95252227783203, -64.76458740234375, -49.57665252685547, -34.38872146606445, -19.200790405273438, -4.012855529785156, 11.175079345703125, 26.363006591796875, 41.550941467285156, 56.73887634277344, 71.92681121826172, 87.11474609375, 102.30267333984375, 117.49060821533203, 132.6785430908203, 147.86647033691406, 163.05441284179688, 178.24234008789062, 193.43026733398438, 208.6182098388672, 223.80613708496094, 238.99407958984375, 254.1820068359375, 269.36993408203125, 284.557861328125, 299.74578857421875, 314.9337158203125, 330.12164306640625, 345.3095703125, 360.4975280761719, 375.6854553222656, 390.8733825683594, 406.0613098144531, 421.249267578125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 7.0, 4.0, 13.0, 11.0, 12.0, 16.0, 15.0, 7.0, 23.0, 21.0, 30.0, 30.0, 35.0, 49.0, 58.0, 71.0, 85.0, 69.0, 77.0, 55.0, 37.0, 36.0, 31.0, 28.0, 22.0, 28.0, 15.0, 13.0, 13.0, 9.0, 9.0, 20.0, 3.0, 5.0, 4.0, 3.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-474.1795654296875, -460.4901428222656, -446.80072021484375, -433.111328125, -419.4219055175781, -405.73248291015625, -392.0430908203125, -378.3536682128906, -364.66424560546875, -350.9748229980469, -337.285400390625, -323.59600830078125, -309.9065856933594, -296.2171630859375, -282.52777099609375, -268.8383483886719, -255.14892578125, -241.45950317382812, -227.7700958251953, -214.0806884765625, -200.39126586914062, -186.70184326171875, -173.01243591308594, -159.32302856445312, -145.63360595703125, -131.94418334960938, -118.25477600097656, -104.56536102294922, -90.87594604492188, -77.18653106689453, -63.49711608886719, -49.807701110839844, -36.118255615234375, -22.42884063720703, -8.739425659179688, 4.949989318847656, 18.639404296875, 32.328819274902344, 46.01823425292969, 59.70764923095703, 73.39706420898438, 87.08647918701172, 100.77589416503906, 114.4653091430664, 128.15472412109375, 141.84414672851562, 155.53355407714844, 169.22296142578125, 182.91238403320312, 196.601806640625, 210.2912139892578, 223.98062133789062, 237.6700439453125, 251.35946655273438, 265.04888916015625, 278.73828125, 292.4277038574219, 306.11712646484375, 319.8065185546875, 333.4959411621094, 347.18536376953125, 360.8747863769531, 374.564208984375, 388.25360107421875, 401.9430236816406]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 12.0, 12.0, 27.0, 39.0, 63.0, 91.0, 125.0, 198.0, 280.0, 422.0, 666.0, 972.0, 1409.0, 2289.0, 3595.0, 5950.0, 9764.0, 17205.0, 31923.0, 61449.0, 123836.0, 264246.0, 607553.0, 1620773.0, 789513.0, 336472.0, 153290.0, 74528.0, 38695.0, 20849.0, 11672.0, 6685.0, 3998.0, 2374.0, 1374.0, 784.0, 444.0, 283.0, 178.0, 91.0, 51.0, 47.0, 26.0, 13.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.313232421875, -9.00927734375, -8.705322265625, -8.4013671875, -8.097412109375, -7.79345703125, -7.489501953125, -7.185546875, -6.881591796875, -6.57763671875, -6.273681640625, -5.9697265625, -5.665771484375, -5.36181640625, -5.057861328125, -4.75390625, -4.449951171875, -4.14599609375, -3.842041015625, -3.5380859375, -3.234130859375, -2.93017578125, -2.626220703125, -2.322265625, -2.018310546875, -1.71435546875, -1.410400390625, -1.1064453125, -0.802490234375, -0.49853515625, -0.194580078125, 0.109375, 0.413330078125, 0.71728515625, 1.021240234375, 1.3251953125, 1.629150390625, 1.93310546875, 2.237060546875, 2.541015625, 2.844970703125, 3.14892578125, 3.452880859375, 3.7568359375, 4.060791015625, 4.36474609375, 4.668701171875, 4.97265625, 5.276611328125, 5.58056640625, 5.884521484375, 6.1884765625, 6.492431640625, 6.79638671875, 7.100341796875, 7.404296875, 7.708251953125, 8.01220703125, 8.316162109375, 8.6201171875, 8.924072265625, 9.22802734375, 9.531982421875, 9.8359375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 4.0, 7.0, 3.0, 13.0, 18.0, 7.0, 19.0, 13.0, 20.0, 26.0, 40.0, 54.0, 44.0, 41.0, 59.0, 62.0, 64.0, 62.0, 65.0, 60.0, 62.0, 38.0, 46.0, 25.0, 24.0, 24.0, 19.0, 16.0, 8.0, 9.0, 6.0, 6.0, 7.0, 2.0, 5.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88037109375, -0.8542861938476562, -0.8282012939453125, -0.8021163940429688, -0.776031494140625, -0.7499465942382812, -0.7238616943359375, -0.6977767944335938, -0.67169189453125, -0.6456069946289062, -0.6195220947265625, -0.5934371948242188, -0.567352294921875, -0.5412673950195312, -0.5151824951171875, -0.48909759521484375, -0.4630126953125, -0.43692779541015625, -0.4108428955078125, -0.38475799560546875, -0.358673095703125, -0.33258819580078125, -0.3065032958984375, -0.28041839599609375, -0.25433349609375, -0.22824859619140625, -0.2021636962890625, -0.17607879638671875, -0.149993896484375, -0.12390899658203125, -0.0978240966796875, -0.07173919677734375, -0.045654296875, -0.01956939697265625, 0.0065155029296875, 0.03260040283203125, 0.058685302734375, 0.08477020263671875, 0.1108551025390625, 0.13694000244140625, 0.16302490234375, 0.18910980224609375, 0.2151947021484375, 0.24127960205078125, 0.267364501953125, 0.29344940185546875, 0.3195343017578125, 0.34561920166015625, 0.3717041015625, 0.39778900146484375, 0.4238739013671875, 0.44995880126953125, 0.476043701171875, 0.5021286010742188, 0.5282135009765625, 0.5542984008789062, 0.58038330078125, 0.6064682006835938, 0.6325531005859375, 0.6586380004882812, 0.684722900390625, 0.7108078002929688, 0.7368927001953125, 0.7629776000976562, 0.7890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 1.0, 5.0, 15.0, 19.0, 19.0, 27.0, 48.0, 47.0, 92.0, 133.0, 199.0, 337.0, 635.0, 1200.0, 2583.0, 6389.0, 17607.0, 55745.0, 199260.0, 735735.0, 1958032.0, 877025.0, 239232.0, 66075.0, 20448.0, 7354.0, 2967.0, 1358.0, 690.0, 371.0, 217.0, 124.0, 93.0, 55.0, 37.0, 24.0, 10.0, 13.0, 11.0, 10.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-10.7890625, -10.4857177734375, -10.182373046875, -9.8790283203125, -9.57568359375, -9.2723388671875, -8.968994140625, -8.6656494140625, -8.3623046875, -8.0589599609375, -7.755615234375, -7.4522705078125, -7.14892578125, -6.8455810546875, -6.542236328125, -6.2388916015625, -5.935546875, -5.6322021484375, -5.328857421875, -5.0255126953125, -4.72216796875, -4.4188232421875, -4.115478515625, -3.8121337890625, -3.5087890625, -3.2054443359375, -2.902099609375, -2.5987548828125, -2.29541015625, -1.9920654296875, -1.688720703125, -1.3853759765625, -1.08203125, -0.7786865234375, -0.475341796875, -0.1719970703125, 0.13134765625, 0.4346923828125, 0.738037109375, 1.0413818359375, 1.3447265625, 1.6480712890625, 1.951416015625, 2.2547607421875, 2.55810546875, 2.8614501953125, 3.164794921875, 3.4681396484375, 3.771484375, 4.0748291015625, 4.378173828125, 4.6815185546875, 4.98486328125, 5.2882080078125, 5.591552734375, 5.8948974609375, 6.1982421875, 6.5015869140625, 6.804931640625, 7.1082763671875, 7.41162109375, 7.7149658203125, 8.018310546875, 8.3216552734375, 8.625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 17.0, 34.0, 46.0, 45.0, 81.0, 91.0, 104.0, 115.0, 180.0, 194.0, 282.0, 289.0, 417.0, 485.0, 322.0, 266.0, 235.0, 189.0, 144.0, 114.0, 86.0, 83.0, 61.0, 33.0, 42.0, 16.0, 15.0, 19.0, 10.0, 7.0, 5.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.408966064453125, -2.31988525390625, -2.230804443359375, -2.1417236328125, -2.052642822265625, -1.96356201171875, -1.874481201171875, -1.785400390625, -1.696319580078125, -1.60723876953125, -1.518157958984375, -1.4290771484375, -1.339996337890625, -1.25091552734375, -1.161834716796875, -1.07275390625, -0.983673095703125, -0.89459228515625, -0.805511474609375, -0.7164306640625, -0.627349853515625, -0.53826904296875, -0.449188232421875, -0.360107421875, -0.271026611328125, -0.18194580078125, -0.092864990234375, -0.0037841796875, 0.085296630859375, 0.17437744140625, 0.263458251953125, 0.3525390625, 0.441619873046875, 0.53070068359375, 0.619781494140625, 0.7088623046875, 0.797943115234375, 0.88702392578125, 0.976104736328125, 1.065185546875, 1.154266357421875, 1.24334716796875, 1.332427978515625, 1.4215087890625, 1.510589599609375, 1.59967041015625, 1.688751220703125, 1.77783203125, 1.866912841796875, 1.95599365234375, 2.045074462890625, 2.1341552734375, 2.223236083984375, 2.31231689453125, 2.401397705078125, 2.490478515625, 2.579559326171875, 2.66864013671875, 2.757720947265625, 2.8468017578125, 2.935882568359375, 3.02496337890625, 3.114044189453125, 3.203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 6.0, 5.0, 11.0, 9.0, 12.0, 19.0, 22.0, 35.0, 40.0, 53.0, 65.0, 64.0, 65.0, 67.0, 87.0, 65.0, 80.0, 62.0, 60.0, 41.0, 37.0, 16.0, 15.0, 13.0, 9.0, 9.0, 6.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.275325775146484, -27.48114585876465, -26.686967849731445, -25.89278793334961, -25.098608016967773, -24.30443000793457, -23.510250091552734, -22.71607208251953, -21.921892166137695, -21.12771224975586, -20.333534240722656, -19.53935432434082, -18.745174407958984, -17.95099639892578, -17.156816482543945, -16.36263656616211, -15.56845760345459, -14.77427864074707, -13.980098724365234, -13.185919761657715, -12.391740798950195, -11.59756088256836, -10.80338191986084, -10.00920295715332, -9.215023040771484, -8.420844078063965, -7.626664638519287, -6.832485198974609, -6.03830623626709, -5.244126796722412, -4.449947357177734, -3.655768394470215, -2.8615894317626953, -2.0674102306365967, -1.2732309103012085, -0.4790515899658203, 0.3151276111602783, 1.109306812286377, 1.9034862518310547, 2.697665214538574, 3.491844654083252, 4.28602409362793, 5.080203056335449, 5.874382495880127, 6.668561935424805, 7.462740898132324, 8.256919860839844, 9.05109977722168, 9.8452787399292, 10.639457702636719, 11.433637619018555, 12.227816581726074, 13.021995544433594, 13.81617546081543, 14.61035442352295, 15.404533386230469, 16.198713302612305, 16.99289321899414, 17.787071228027344, 18.58125114440918, 19.375431060791016, 20.16960906982422, 20.963788986206055, 21.75796890258789, 22.552146911621094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 5.0, 8.0, 14.0, 12.0, 7.0, 20.0, 16.0, 13.0, 22.0, 30.0, 37.0, 33.0, 40.0, 36.0, 40.0, 40.0, 44.0, 54.0, 40.0, 39.0, 33.0, 28.0, 35.0, 46.0, 39.0, 39.0, 32.0, 15.0, 22.0, 34.0, 13.0, 18.0, 14.0, 5.0, 10.0, 7.0, 5.0, 12.0, 5.0, 3.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0], "bins": [-16.215167999267578, -15.719022750854492, -15.222877502441406, -14.72673225402832, -14.230587005615234, -13.734441757202148, -13.238296508789062, -12.742151260375977, -12.24600601196289, -11.749860763549805, -11.253715515136719, -10.757570266723633, -10.261425018310547, -9.765279769897461, -9.269134521484375, -8.772989273071289, -8.276844024658203, -7.780698776245117, -7.284553527832031, -6.788408279418945, -6.292263031005859, -5.796117782592773, -5.2999725341796875, -4.803827285766602, -4.307682037353516, -3.8115367889404297, -3.3153915405273438, -2.819246292114258, -2.323101043701172, -1.826955795288086, -1.330810546875, -0.8346652984619141, -0.3385200500488281, 0.1576251983642578, 0.6537704467773438, 1.1499156951904297, 1.6460609436035156, 2.1422061920166016, 2.6383514404296875, 3.1344966888427734, 3.6306419372558594, 4.126787185668945, 4.622932434082031, 5.119077682495117, 5.615222930908203, 6.111368179321289, 6.607513427734375, 7.103658676147461, 7.599803924560547, 8.095949172973633, 8.592094421386719, 9.088239669799805, 9.58438491821289, 10.080530166625977, 10.576675415039062, 11.072820663452148, 11.568965911865234, 12.06511116027832, 12.561256408691406, 13.057401657104492, 13.553546905517578, 14.049692153930664, 14.54583740234375, 15.041982650756836, 15.538127899169922]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 7.0, 2.0, 4.0, 8.0, 9.0, 9.0, 22.0, 32.0, 33.0, 53.0, 73.0, 127.0, 150.0, 233.0, 371.0, 507.0, 845.0, 1300.0, 2082.0, 3552.0, 6047.0, 10742.0, 20464.0, 40791.0, 86796.0, 187705.0, 304868.0, 198050.0, 91642.0, 42811.0, 21433.0, 11550.0, 6435.0, 3712.0, 2208.0, 1355.0, 886.0, 554.0, 363.0, 205.0, 155.0, 112.0, 70.0, 49.0, 33.0, 27.0, 25.0, 17.0, 11.0, 4.0, 9.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-5.91796875, -5.736083984375, -5.55419921875, -5.372314453125, -5.1904296875, -5.008544921875, -4.82666015625, -4.644775390625, -4.462890625, -4.281005859375, -4.09912109375, -3.917236328125, -3.7353515625, -3.553466796875, -3.37158203125, -3.189697265625, -3.0078125, -2.825927734375, -2.64404296875, -2.462158203125, -2.2802734375, -2.098388671875, -1.91650390625, -1.734619140625, -1.552734375, -1.370849609375, -1.18896484375, -1.007080078125, -0.8251953125, -0.643310546875, -0.46142578125, -0.279541015625, -0.09765625, 0.084228515625, 0.26611328125, 0.447998046875, 0.6298828125, 0.811767578125, 0.99365234375, 1.175537109375, 1.357421875, 1.539306640625, 1.72119140625, 1.903076171875, 2.0849609375, 2.266845703125, 2.44873046875, 2.630615234375, 2.8125, 2.994384765625, 3.17626953125, 3.358154296875, 3.5400390625, 3.721923828125, 3.90380859375, 4.085693359375, 4.267578125, 4.449462890625, 4.63134765625, 4.813232421875, 4.9951171875, 5.177001953125, 5.35888671875, 5.540771484375, 5.72265625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 0.0, 2.0, 4.0, 3.0, 7.0, 3.0, 10.0, 8.0, 10.0, 22.0, 18.0, 18.0, 26.0, 36.0, 31.0, 36.0, 64.0, 55.0, 53.0, 47.0, 55.0, 61.0, 57.0, 59.0, 44.0, 32.0, 37.0, 48.0, 26.0, 21.0, 19.0, 19.0, 15.0, 13.0, 8.0, 4.0, 9.0, 6.0, 4.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0234375, -0.9931640625, -0.962890625, -0.9326171875, -0.90234375, -0.8720703125, -0.841796875, -0.8115234375, -0.78125, -0.7509765625, -0.720703125, -0.6904296875, -0.66015625, -0.6298828125, -0.599609375, -0.5693359375, -0.5390625, -0.5087890625, -0.478515625, -0.4482421875, -0.41796875, -0.3876953125, -0.357421875, -0.3271484375, -0.296875, -0.2666015625, -0.236328125, -0.2060546875, -0.17578125, -0.1455078125, -0.115234375, -0.0849609375, -0.0546875, -0.0244140625, 0.005859375, 0.0361328125, 0.06640625, 0.0966796875, 0.126953125, 0.1572265625, 0.1875, 0.2177734375, 0.248046875, 0.2783203125, 0.30859375, 0.3388671875, 0.369140625, 0.3994140625, 0.4296875, 0.4599609375, 0.490234375, 0.5205078125, 0.55078125, 0.5810546875, 0.611328125, 0.6416015625, 0.671875, 0.7021484375, 0.732421875, 0.7626953125, 0.79296875, 0.8232421875, 0.853515625, 0.8837890625, 0.9140625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 12.0, 8.0, 8.0, 16.0, 25.0, 24.0, 44.0, 69.0, 100.0, 200.0, 357.0, 641.0, 1296.0, 2770.0, 6974.0, 20730.0, 84097.0, 496751.0, 348553.0, 59587.0, 15989.0, 5595.0, 2295.0, 1076.0, 544.0, 300.0, 176.0, 108.0, 66.0, 35.0, 23.0, 21.0, 9.0, 6.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.99609375, -7.73724365234375, -7.4783935546875, -7.21954345703125, -6.960693359375, -6.70184326171875, -6.4429931640625, -6.18414306640625, -5.92529296875, -5.66644287109375, -5.4075927734375, -5.14874267578125, -4.889892578125, -4.63104248046875, -4.3721923828125, -4.11334228515625, -3.8544921875, -3.59564208984375, -3.3367919921875, -3.07794189453125, -2.819091796875, -2.56024169921875, -2.3013916015625, -2.04254150390625, -1.78369140625, -1.52484130859375, -1.2659912109375, -1.00714111328125, -0.748291015625, -0.48944091796875, -0.2305908203125, 0.02825927734375, 0.287109375, 0.54595947265625, 0.8048095703125, 1.06365966796875, 1.322509765625, 1.58135986328125, 1.8402099609375, 2.09906005859375, 2.35791015625, 2.61676025390625, 2.8756103515625, 3.13446044921875, 3.393310546875, 3.65216064453125, 3.9110107421875, 4.16986083984375, 4.4287109375, 4.68756103515625, 4.9464111328125, 5.20526123046875, 5.464111328125, 5.72296142578125, 5.9818115234375, 6.24066162109375, 6.49951171875, 6.75836181640625, 7.0172119140625, 7.27606201171875, 7.534912109375, 7.79376220703125, 8.0526123046875, 8.31146240234375, 8.5703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 10.0, 10.0, 14.0, 19.0, 13.0, 11.0, 15.0, 21.0, 30.0, 21.0, 36.0, 28.0, 27.0, 36.0, 28.0, 38.0, 38.0, 39.0, 32.0, 41.0, 35.0, 32.0, 43.0, 27.0, 29.0, 41.0, 38.0, 27.0, 20.0, 27.0, 22.0, 23.0, 17.0, 17.0, 8.0, 6.0, 7.0, 7.0, 7.0, 6.0, 9.0, 3.0, 6.0, 4.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.763671875, -3.645416259765625, -3.52716064453125, -3.408905029296875, -3.2906494140625, -3.172393798828125, -3.05413818359375, -2.935882568359375, -2.817626953125, -2.699371337890625, -2.58111572265625, -2.462860107421875, -2.3446044921875, -2.226348876953125, -2.10809326171875, -1.989837646484375, -1.87158203125, -1.753326416015625, -1.63507080078125, -1.516815185546875, -1.3985595703125, -1.280303955078125, -1.16204833984375, -1.043792724609375, -0.925537109375, -0.807281494140625, -0.68902587890625, -0.570770263671875, -0.4525146484375, -0.334259033203125, -0.21600341796875, -0.097747802734375, 0.0205078125, 0.138763427734375, 0.25701904296875, 0.375274658203125, 0.4935302734375, 0.611785888671875, 0.73004150390625, 0.848297119140625, 0.966552734375, 1.084808349609375, 1.20306396484375, 1.321319580078125, 1.4395751953125, 1.557830810546875, 1.67608642578125, 1.794342041015625, 1.91259765625, 2.030853271484375, 2.14910888671875, 2.267364501953125, 2.3856201171875, 2.503875732421875, 2.62213134765625, 2.740386962890625, 2.858642578125, 2.976898193359375, 3.09515380859375, 3.213409423828125, 3.3316650390625, 3.449920654296875, 3.56817626953125, 3.686431884765625, 3.8046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 3.0, 7.0, 7.0, 15.0, 38.0, 73.0, 133.0, 322.0, 1689.0, 38011.0, 1000172.0, 6875.0, 762.0, 252.0, 89.0, 36.0, 24.0, 12.0, 12.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -63.69140625, -62.0703125, -60.44921875, -58.828125, -57.20703125, -55.5859375, -53.96484375, -52.34375, -50.72265625, -49.1015625, -47.48046875, -45.859375, -44.23828125, -42.6171875, -40.99609375, -39.375, -37.75390625, -36.1328125, -34.51171875, -32.890625, -31.26953125, -29.6484375, -28.02734375, -26.40625, -24.78515625, -23.1640625, -21.54296875, -19.921875, -18.30078125, -16.6796875, -15.05859375, -13.4375, -11.81640625, -10.1953125, -8.57421875, -6.953125, -5.33203125, -3.7109375, -2.08984375, -0.46875, 1.15234375, 2.7734375, 4.39453125, 6.015625, 7.63671875, 9.2578125, 10.87890625, 12.5, 14.12109375, 15.7421875, 17.36328125, 18.984375, 20.60546875, 22.2265625, 23.84765625, 25.46875, 27.08984375, 28.7109375, 30.33203125, 31.953125, 33.57421875, 35.1953125, 36.81640625, 38.4375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 10.0, 15.0, 20.0, 30.0, 51.0, 50.0, 58.0, 78.0, 91.0, 89.0, 96.0, 95.0, 74.0, 49.0, 34.0, 29.0, 34.0, 13.0, 18.0, 10.0, 10.0, 6.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042724609375, -0.0004123672842979431, -0.00039748847484588623, -0.00038260966539382935, -0.00036773085594177246, -0.0003528520464897156, -0.0003379732370376587, -0.0003230944275856018, -0.0003082156181335449, -0.00029333680868148804, -0.00027845799922943115, -0.00026357918977737427, -0.0002487003803253174, -0.0002338215708732605, -0.0002189427614212036, -0.00020406395196914673, -0.00018918514251708984, -0.00017430633306503296, -0.00015942752361297607, -0.0001445487141609192, -0.0001296699047088623, -0.00011479109525680542, -9.991228580474854e-05, -8.503347635269165e-05, -7.015466690063477e-05, -5.527585744857788e-05, -4.0397047996520996e-05, -2.551823854446411e-05, -1.0639429092407227e-05, 4.239380359649658e-06, 1.9118189811706543e-05, 3.399699926376343e-05, 4.887580871582031e-05, 6.37546181678772e-05, 7.863342761993408e-05, 9.351223707199097e-05, 0.00010839104652404785, 0.00012326985597610474, 0.00013814866542816162, 0.0001530274748802185, 0.0001679062843322754, 0.00018278509378433228, 0.00019766390323638916, 0.00021254271268844604, 0.00022742152214050293, 0.00024230033159255981, 0.0002571791410446167, 0.0002720579504966736, 0.00028693675994873047, 0.00030181556940078735, 0.00031669437885284424, 0.0003315731883049011, 0.000346451997756958, 0.0003613308072090149, 0.0003762096166610718, 0.00039108842611312866, 0.00040596723556518555, 0.00042084604501724243, 0.0004357248544692993, 0.0004506036639213562, 0.0004654824733734131, 0.00048036128282546997, 0.0004952400922775269, 0.0005101189017295837, 0.0005249977111816406]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 5.0, 13.0, 21.0, 14.0, 23.0, 41.0, 46.0, 68.0, 108.0, 143.0, 223.0, 422.0, 706.0, 1335.0, 2847.0, 6937.0, 21371.0, 101802.0, 614353.0, 241318.0, 37880.0, 10630.0, 4083.0, 1885.0, 871.0, 512.0, 284.0, 182.0, 125.0, 84.0, 47.0, 40.0, 34.0, 26.0, 13.0, 15.0, 6.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.03125, -8.7166748046875, -8.402099609375, -8.0875244140625, -7.77294921875, -7.4583740234375, -7.143798828125, -6.8292236328125, -6.5146484375, -6.2000732421875, -5.885498046875, -5.5709228515625, -5.25634765625, -4.9417724609375, -4.627197265625, -4.3126220703125, -3.998046875, -3.6834716796875, -3.368896484375, -3.0543212890625, -2.73974609375, -2.4251708984375, -2.110595703125, -1.7960205078125, -1.4814453125, -1.1668701171875, -0.852294921875, -0.5377197265625, -0.22314453125, 0.0914306640625, 0.406005859375, 0.7205810546875, 1.03515625, 1.3497314453125, 1.664306640625, 1.9788818359375, 2.29345703125, 2.6080322265625, 2.922607421875, 3.2371826171875, 3.5517578125, 3.8663330078125, 4.180908203125, 4.4954833984375, 4.81005859375, 5.1246337890625, 5.439208984375, 5.7537841796875, 6.068359375, 6.3829345703125, 6.697509765625, 7.0120849609375, 7.32666015625, 7.6412353515625, 7.955810546875, 8.2703857421875, 8.5849609375, 8.8995361328125, 9.214111328125, 9.5286865234375, 9.84326171875, 10.1578369140625, 10.472412109375, 10.7869873046875, 11.1015625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 18.0, 28.0, 37.0, 52.0, 112.0, 154.0, 184.0, 166.0, 98.0, 44.0, 30.0, 21.0, 7.0, 6.0, 7.0, 6.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.46875, -9.20721435546875, -8.9456787109375, -8.68414306640625, -8.422607421875, -8.16107177734375, -7.8995361328125, -7.63800048828125, -7.37646484375, -7.11492919921875, -6.8533935546875, -6.59185791015625, -6.330322265625, -6.06878662109375, -5.8072509765625, -5.54571533203125, -5.2841796875, -5.02264404296875, -4.7611083984375, -4.49957275390625, -4.238037109375, -3.97650146484375, -3.7149658203125, -3.45343017578125, -3.19189453125, -2.93035888671875, -2.6688232421875, -2.40728759765625, -2.145751953125, -1.88421630859375, -1.6226806640625, -1.36114501953125, -1.099609375, -0.83807373046875, -0.5765380859375, -0.31500244140625, -0.053466796875, 0.20806884765625, 0.4696044921875, 0.73114013671875, 0.99267578125, 1.25421142578125, 1.5157470703125, 1.77728271484375, 2.038818359375, 2.30035400390625, 2.5618896484375, 2.82342529296875, 3.0849609375, 3.34649658203125, 3.6080322265625, 3.86956787109375, 4.131103515625, 4.39263916015625, 4.6541748046875, 4.91571044921875, 5.17724609375, 5.43878173828125, 5.7003173828125, 5.96185302734375, 6.223388671875, 6.48492431640625, 6.7464599609375, 7.00799560546875, 7.26953125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 9.0, 14.0, 18.0, 62.0, 248.0, 390.0, 163.0, 63.0, 18.0, 7.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.04808807373047, -68.29481506347656, -63.54153823852539, -58.788265228271484, -54.03498840332031, -49.281715393066406, -44.5284423828125, -39.77516555786133, -35.02189254760742, -30.268617630004883, -25.515342712402344, -20.762069702148438, -16.0087947845459, -11.25551986694336, -6.502246856689453, -1.7489700317382812, 3.004302978515625, 7.757577419281006, 12.510851860046387, 17.26412582397461, 22.01740074157715, 26.770675659179688, 31.523948669433594, 36.277225494384766, 41.03049850463867, 45.78377151489258, 50.53704833984375, 55.290321350097656, 60.04359436035156, 64.796875, 69.55014038085938, 74.30342102050781, 79.05668640136719, 83.8099594116211, 88.563232421875, 93.31651306152344, 98.06978607177734, 102.82305908203125, 107.57633209228516, 112.32960510253906, 117.0828857421875, 121.8361587524414, 126.58943176269531, 131.34271240234375, 136.09597778320312, 140.84925842285156, 145.6025390625, 150.35580444335938, 155.10906982421875, 159.8623504638672, 164.61561584472656, 169.368896484375, 174.12216186523438, 178.8754425048828, 183.62872314453125, 188.38198852539062, 193.13526916503906, 197.8885498046875, 202.64181518554688, 207.3950958251953, 212.1483612060547, 216.90164184570312, 221.6549072265625, 226.40818786621094, 231.16146850585938]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 6.0, 10.0, 15.0, 24.0, 27.0, 45.0, 64.0, 102.0, 134.0, 141.0, 132.0, 94.0, 74.0, 42.0, 28.0, 8.0, 13.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.29398345947266, -88.3702392578125, -85.44650268554688, -82.52275848388672, -79.59901428222656, -76.67527770996094, -73.75153350830078, -70.82778930664062, -67.904052734375, -64.98030853271484, -62.05657196044922, -59.13282775878906, -56.20908737182617, -53.28534698486328, -50.361602783203125, -47.437862396240234, -44.514122009277344, -41.59038162231445, -38.66664123535156, -35.742897033691406, -32.819156646728516, -29.895416259765625, -26.9716739654541, -24.047931671142578, -21.124191284179688, -18.200450897216797, -15.276708602905273, -12.352967262268066, -9.42922592163086, -6.505484580993652, -3.5817432403564453, -0.6580009460449219, 2.2657318115234375, 5.1894731521606445, 8.113214492797852, 11.036955833435059, 13.960697174072266, 16.884437561035156, 19.80817985534668, 22.731922149658203, 25.655662536621094, 28.579402923583984, 31.503145217895508, 34.42688751220703, 37.35062789916992, 40.27436828613281, 43.19811248779297, 46.12185287475586, 49.04559326171875, 51.96933364868164, 54.89307403564453, 57.81681823730469, 60.74055862426758, 63.66429901123047, 66.58804321289062, 69.51177978515625, 72.4355239868164, 75.35926818847656, 78.28300476074219, 81.20674896240234, 84.1304931640625, 87.05422973632812, 89.97797393798828, 92.90171813964844, 95.82545471191406]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 12.0, 9.0, 12.0, 17.0, 31.0, 47.0, 76.0, 105.0, 214.0, 358.0, 579.0, 1131.0, 2268.0, 4944.0, 11589.0, 30242.0, 94326.0, 424416.0, 3273166.0, 244358.0, 66140.0, 22919.0, 9320.0, 4120.0, 1868.0, 890.0, 490.0, 219.0, 168.0, 83.0, 48.0, 39.0, 25.0, 21.0, 12.0, 7.0, 8.0, 3.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.5625, -22.810791015625, -22.05908203125, -21.307373046875, -20.5556640625, -19.803955078125, -19.05224609375, -18.300537109375, -17.548828125, -16.797119140625, -16.04541015625, -15.293701171875, -14.5419921875, -13.790283203125, -13.03857421875, -12.286865234375, -11.53515625, -10.783447265625, -10.03173828125, -9.280029296875, -8.5283203125, -7.776611328125, -7.02490234375, -6.273193359375, -5.521484375, -4.769775390625, -4.01806640625, -3.266357421875, -2.5146484375, -1.762939453125, -1.01123046875, -0.259521484375, 0.4921875, 1.243896484375, 1.99560546875, 2.747314453125, 3.4990234375, 4.250732421875, 5.00244140625, 5.754150390625, 6.505859375, 7.257568359375, 8.00927734375, 8.760986328125, 9.5126953125, 10.264404296875, 11.01611328125, 11.767822265625, 12.51953125, 13.271240234375, 14.02294921875, 14.774658203125, 15.5263671875, 16.278076171875, 17.02978515625, 17.781494140625, 18.533203125, 19.284912109375, 20.03662109375, 20.788330078125, 21.5400390625, 22.291748046875, 23.04345703125, 23.795166015625, 24.546875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 8.0, 11.0, 19.0, 17.0, 27.0, 30.0, 28.0, 45.0, 54.0, 67.0, 55.0, 74.0, 70.0, 66.0, 56.0, 57.0, 66.0, 44.0, 39.0, 37.0, 26.0, 22.0, 14.0, 13.0, 7.0, 10.0, 5.0, 8.0, 8.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9886627197265625, -0.949005126953125, -0.9093475341796875, -0.86968994140625, -0.8300323486328125, -0.790374755859375, -0.7507171630859375, -0.7110595703125, -0.6714019775390625, -0.631744384765625, -0.5920867919921875, -0.55242919921875, -0.5127716064453125, -0.473114013671875, -0.4334564208984375, -0.393798828125, -0.3541412353515625, -0.314483642578125, -0.2748260498046875, -0.23516845703125, -0.1955108642578125, -0.155853271484375, -0.1161956787109375, -0.0765380859375, -0.0368804931640625, 0.002777099609375, 0.0424346923828125, 0.08209228515625, 0.1217498779296875, 0.161407470703125, 0.2010650634765625, 0.24072265625, 0.2803802490234375, 0.320037841796875, 0.3596954345703125, 0.39935302734375, 0.4390106201171875, 0.478668212890625, 0.5183258056640625, 0.5579833984375, 0.5976409912109375, 0.637298583984375, 0.6769561767578125, 0.71661376953125, 0.7562713623046875, 0.795928955078125, 0.8355865478515625, 0.875244140625, 0.9149017333984375, 0.954559326171875, 0.9942169189453125, 1.03387451171875, 1.0735321044921875, 1.113189697265625, 1.1528472900390625, 1.1925048828125, 1.2321624755859375, 1.271820068359375, 1.3114776611328125, 1.35113525390625, 1.3907928466796875, 1.430450439453125, 1.4701080322265625, 1.509765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 8.0, 13.0, 24.0, 27.0, 48.0, 57.0, 80.0, 135.0, 201.0, 305.0, 535.0, 891.0, 1513.0, 2807.0, 5225.0, 10036.0, 20916.0, 44031.0, 100203.0, 256582.0, 1094945.0, 2180721.0, 278093.0, 106710.0, 46070.0, 21353.0, 10510.0, 5333.0, 2782.0, 1620.0, 930.0, 574.0, 370.0, 235.0, 132.0, 88.0, 54.0, 27.0, 23.0, 17.0, 17.0, 17.0, 12.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.8828125, -14.432373046875, -13.98193359375, -13.531494140625, -13.0810546875, -12.630615234375, -12.18017578125, -11.729736328125, -11.279296875, -10.828857421875, -10.37841796875, -9.927978515625, -9.4775390625, -9.027099609375, -8.57666015625, -8.126220703125, -7.67578125, -7.225341796875, -6.77490234375, -6.324462890625, -5.8740234375, -5.423583984375, -4.97314453125, -4.522705078125, -4.072265625, -3.621826171875, -3.17138671875, -2.720947265625, -2.2705078125, -1.820068359375, -1.36962890625, -0.919189453125, -0.46875, -0.018310546875, 0.43212890625, 0.882568359375, 1.3330078125, 1.783447265625, 2.23388671875, 2.684326171875, 3.134765625, 3.585205078125, 4.03564453125, 4.486083984375, 4.9365234375, 5.386962890625, 5.83740234375, 6.287841796875, 6.73828125, 7.188720703125, 7.63916015625, 8.089599609375, 8.5400390625, 8.990478515625, 9.44091796875, 9.891357421875, 10.341796875, 10.792236328125, 11.24267578125, 11.693115234375, 12.1435546875, 12.593994140625, 13.04443359375, 13.494873046875, 13.9453125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 6.0, 7.0, 19.0, 22.0, 28.0, 30.0, 45.0, 57.0, 65.0, 66.0, 107.0, 119.0, 153.0, 267.0, 557.0, 1416.0, 326.0, 184.0, 156.0, 107.0, 67.0, 64.0, 44.0, 46.0, 29.0, 23.0, 16.0, 12.0, 6.0, 1.0, 6.0, 1.0, 7.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.12109375, -3.026947021484375, -2.93280029296875, -2.838653564453125, -2.7445068359375, -2.650360107421875, -2.55621337890625, -2.462066650390625, -2.367919921875, -2.273773193359375, -2.17962646484375, -2.085479736328125, -1.9913330078125, -1.897186279296875, -1.80303955078125, -1.708892822265625, -1.61474609375, -1.520599365234375, -1.42645263671875, -1.332305908203125, -1.2381591796875, -1.144012451171875, -1.04986572265625, -0.955718994140625, -0.861572265625, -0.767425537109375, -0.67327880859375, -0.579132080078125, -0.4849853515625, -0.390838623046875, -0.29669189453125, -0.202545166015625, -0.1083984375, -0.014251708984375, 0.07989501953125, 0.174041748046875, 0.2681884765625, 0.362335205078125, 0.45648193359375, 0.550628662109375, 0.644775390625, 0.738922119140625, 0.83306884765625, 0.927215576171875, 1.0213623046875, 1.115509033203125, 1.20965576171875, 1.303802490234375, 1.39794921875, 1.492095947265625, 1.58624267578125, 1.680389404296875, 1.7745361328125, 1.868682861328125, 1.96282958984375, 2.056976318359375, 2.151123046875, 2.245269775390625, 2.33941650390625, 2.433563232421875, 2.5277099609375, 2.621856689453125, 2.71600341796875, 2.810150146484375, 2.904296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 3.0, 6.0, 10.0, 10.0, 6.0, 25.0, 21.0, 47.0, 67.0, 96.0, 120.0, 139.0, 113.0, 95.0, 78.0, 46.0, 39.0, 24.0, 11.0, 8.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.469757080078125, -22.664220809936523, -21.858684539794922, -21.05314826965332, -20.24761199951172, -19.442075729370117, -18.636539459228516, -17.831003189086914, -17.025466918945312, -16.21993064880371, -15.41439437866211, -14.608858108520508, -13.803321838378906, -12.997785568237305, -12.192249298095703, -11.386713027954102, -10.581177711486816, -9.775641441345215, -8.970105171203613, -8.164568901062012, -7.35903263092041, -6.553496837615967, -5.747960567474365, -4.942424297332764, -4.136888027191162, -3.3313517570495605, -2.525815486907959, -1.7202794551849365, -0.914743185043335, -0.1092071533203125, 0.6963291168212891, 1.5018653869628906, 2.307401657104492, 3.1129379272460938, 3.9184741973876953, 4.724010467529297, 5.529546737670898, 6.335082530975342, 7.140618801116943, 7.946155071258545, 8.751691818237305, 9.557228088378906, 10.362764358520508, 11.16830062866211, 11.973836898803711, 12.779373168945312, 13.584909439086914, 14.390445709228516, 15.1959810256958, 16.001516342163086, 16.807052612304688, 17.61258888244629, 18.41812515258789, 19.223661422729492, 20.029197692871094, 20.834733963012695, 21.640270233154297, 22.4458065032959, 23.2513427734375, 24.0568790435791, 24.862415313720703, 25.667951583862305, 26.473487854003906, 27.279024124145508, 28.08456039428711]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 5.0, 4.0, 9.0, 11.0, 10.0, 22.0, 26.0, 28.0, 20.0, 33.0, 26.0, 45.0, 45.0, 52.0, 43.0, 67.0, 47.0, 52.0, 68.0, 52.0, 49.0, 41.0, 46.0, 33.0, 23.0, 29.0, 29.0, 16.0, 11.0, 9.0, 7.0, 11.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.70572566986084, -13.225020408630371, -12.744315147399902, -12.263609886169434, -11.782905578613281, -11.302200317382812, -10.821495056152344, -10.340789794921875, -9.860084533691406, -9.379379272460938, -8.898674011230469, -8.41796875, -7.9372639656066895, -7.456558704376221, -6.97585391998291, -6.495148658752441, -6.014443397521973, -5.533738136291504, -5.053032875061035, -4.572328090667725, -4.091622829437256, -3.610917568206787, -3.1302125453948975, -2.649507522583008, -2.168802261352539, -1.6880971193313599, -1.2073919773101807, -0.7266868352890015, -0.24598169326782227, 0.23472356796264648, 0.7154285907745361, 1.1961336135864258, 1.6768379211425781, 2.157543182373047, 2.6382482051849365, 3.118953227996826, 3.599658489227295, 4.080363750457764, 4.561068534851074, 5.041773796081543, 5.522479057312012, 6.0031843185424805, 6.483889579772949, 6.96459436416626, 7.4452996253967285, 7.926004886627197, 8.406709671020508, 8.887414932250977, 9.368120193481445, 9.848825454711914, 10.329530715942383, 10.810235977172852, 11.29094123840332, 11.771646499633789, 12.252350807189941, 12.73305606842041, 13.213761329650879, 13.694466590881348, 14.175171852111816, 14.655877113342285, 15.136581420898438, 15.617286682128906, 16.097991943359375, 16.578697204589844, 17.059402465820312]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 6.0, 9.0, 6.0, 8.0, 30.0, 37.0, 49.0, 94.0, 120.0, 229.0, 383.0, 678.0, 1350.0, 2630.0, 5040.0, 11658.0, 30493.0, 110833.0, 552842.0, 246600.0, 52898.0, 17690.0, 7391.0, 3464.0, 1811.0, 928.0, 521.0, 282.0, 177.0, 100.0, 56.0, 53.0, 19.0, 17.0, 12.0, 10.0, 5.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.734375, -21.090087890625, -20.44580078125, -19.801513671875, -19.1572265625, -18.512939453125, -17.86865234375, -17.224365234375, -16.580078125, -15.935791015625, -15.29150390625, -14.647216796875, -14.0029296875, -13.358642578125, -12.71435546875, -12.070068359375, -11.42578125, -10.781494140625, -10.13720703125, -9.492919921875, -8.8486328125, -8.204345703125, -7.56005859375, -6.915771484375, -6.271484375, -5.627197265625, -4.98291015625, -4.338623046875, -3.6943359375, -3.050048828125, -2.40576171875, -1.761474609375, -1.1171875, -0.472900390625, 0.17138671875, 0.815673828125, 1.4599609375, 2.104248046875, 2.74853515625, 3.392822265625, 4.037109375, 4.681396484375, 5.32568359375, 5.969970703125, 6.6142578125, 7.258544921875, 7.90283203125, 8.547119140625, 9.19140625, 9.835693359375, 10.47998046875, 11.124267578125, 11.7685546875, 12.412841796875, 13.05712890625, 13.701416015625, 14.345703125, 14.989990234375, 15.63427734375, 16.278564453125, 16.9228515625, 17.567138671875, 18.21142578125, 18.855712890625, 19.5]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 7.0, 12.0, 9.0, 14.0, 13.0, 25.0, 25.0, 23.0, 40.0, 35.0, 51.0, 51.0, 45.0, 51.0, 61.0, 39.0, 53.0, 59.0, 59.0, 52.0, 39.0, 40.0, 44.0, 25.0, 23.0, 19.0, 14.0, 10.0, 15.0, 13.0, 9.0, 3.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2275390625, -1.1898345947265625, -1.152130126953125, -1.1144256591796875, -1.07672119140625, -1.0390167236328125, -1.001312255859375, -0.9636077880859375, -0.9259033203125, -0.8881988525390625, -0.850494384765625, -0.8127899169921875, -0.77508544921875, -0.7373809814453125, -0.699676513671875, -0.6619720458984375, -0.624267578125, -0.5865631103515625, -0.548858642578125, -0.5111541748046875, -0.47344970703125, -0.4357452392578125, -0.398040771484375, -0.3603363037109375, -0.3226318359375, -0.2849273681640625, -0.247222900390625, -0.2095184326171875, -0.17181396484375, -0.1341094970703125, -0.096405029296875, -0.0587005615234375, -0.02099609375, 0.0167083740234375, 0.054412841796875, 0.0921173095703125, 0.12982177734375, 0.1675262451171875, 0.205230712890625, 0.2429351806640625, 0.2806396484375, 0.3183441162109375, 0.356048583984375, 0.3937530517578125, 0.43145751953125, 0.4691619873046875, 0.506866455078125, 0.5445709228515625, 0.582275390625, 0.6199798583984375, 0.657684326171875, 0.6953887939453125, 0.73309326171875, 0.7707977294921875, 0.808502197265625, 0.8462066650390625, 0.8839111328125, 0.9216156005859375, 0.959320068359375, 0.9970245361328125, 1.03472900390625, 1.0724334716796875, 1.110137939453125, 1.1478424072265625, 1.185546875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 9.0, 4.0, 11.0, 26.0, 47.0, 290.0, 3531.0, 504185.0, 536521.0, 3451.0, 281.0, 44.0, 15.0, 14.0, 10.0, 13.0, 7.0, 5.0, 6.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.3125, -59.123046875, -56.93359375, -54.744140625, -52.5546875, -50.365234375, -48.17578125, -45.986328125, -43.796875, -41.607421875, -39.41796875, -37.228515625, -35.0390625, -32.849609375, -30.66015625, -28.470703125, -26.28125, -24.091796875, -21.90234375, -19.712890625, -17.5234375, -15.333984375, -13.14453125, -10.955078125, -8.765625, -6.576171875, -4.38671875, -2.197265625, -0.0078125, 2.181640625, 4.37109375, 6.560546875, 8.75, 10.939453125, 13.12890625, 15.318359375, 17.5078125, 19.697265625, 21.88671875, 24.076171875, 26.265625, 28.455078125, 30.64453125, 32.833984375, 35.0234375, 37.212890625, 39.40234375, 41.591796875, 43.78125, 45.970703125, 48.16015625, 50.349609375, 52.5390625, 54.728515625, 56.91796875, 59.107421875, 61.296875, 63.486328125, 65.67578125, 67.865234375, 70.0546875, 72.244140625, 74.43359375, 76.623046875, 78.8125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 5.0, 10.0, 2.0, 9.0, 7.0, 17.0, 13.0, 18.0, 20.0, 23.0, 23.0, 24.0, 31.0, 46.0, 38.0, 31.0, 47.0, 32.0, 40.0, 36.0, 48.0, 45.0, 48.0, 44.0, 38.0, 43.0, 37.0, 29.0, 27.0, 34.0, 18.0, 22.0, 10.0, 13.0, 14.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.4453125, -5.28094482421875, -5.1165771484375, -4.95220947265625, -4.787841796875, -4.62347412109375, -4.4591064453125, -4.29473876953125, -4.13037109375, -3.96600341796875, -3.8016357421875, -3.63726806640625, -3.472900390625, -3.30853271484375, -3.1441650390625, -2.97979736328125, -2.8154296875, -2.65106201171875, -2.4866943359375, -2.32232666015625, -2.157958984375, -1.99359130859375, -1.8292236328125, -1.66485595703125, -1.50048828125, -1.33612060546875, -1.1717529296875, -1.00738525390625, -0.843017578125, -0.67864990234375, -0.5142822265625, -0.34991455078125, -0.185546875, -0.02117919921875, 0.1431884765625, 0.30755615234375, 0.471923828125, 0.63629150390625, 0.8006591796875, 0.96502685546875, 1.12939453125, 1.29376220703125, 1.4581298828125, 1.62249755859375, 1.786865234375, 1.95123291015625, 2.1156005859375, 2.27996826171875, 2.4443359375, 2.60870361328125, 2.7730712890625, 2.93743896484375, 3.101806640625, 3.26617431640625, 3.4305419921875, 3.59490966796875, 3.75927734375, 3.92364501953125, 4.0880126953125, 4.25238037109375, 4.416748046875, 4.58111572265625, 4.7454833984375, 4.90985107421875, 5.07421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0, 4.0, 0.0, 5.0, 11.0, 7.0, 11.0, 10.0, 13.0, 37.0, 122.0, 514.0, 14516.0, 1029814.0, 3027.0, 286.0, 74.0, 22.0, 20.0, 12.0, 5.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-106.6875, -103.4873046875, -100.287109375, -97.0869140625, -93.88671875, -90.6865234375, -87.486328125, -84.2861328125, -81.0859375, -77.8857421875, -74.685546875, -71.4853515625, -68.28515625, -65.0849609375, -61.884765625, -58.6845703125, -55.484375, -52.2841796875, -49.083984375, -45.8837890625, -42.68359375, -39.4833984375, -36.283203125, -33.0830078125, -29.8828125, -26.6826171875, -23.482421875, -20.2822265625, -17.08203125, -13.8818359375, -10.681640625, -7.4814453125, -4.28125, -1.0810546875, 2.119140625, 5.3193359375, 8.51953125, 11.7197265625, 14.919921875, 18.1201171875, 21.3203125, 24.5205078125, 27.720703125, 30.9208984375, 34.12109375, 37.3212890625, 40.521484375, 43.7216796875, 46.921875, 50.1220703125, 53.322265625, 56.5224609375, 59.72265625, 62.9228515625, 66.123046875, 69.3232421875, 72.5234375, 75.7236328125, 78.923828125, 82.1240234375, 85.32421875, 88.5244140625, 91.724609375, 94.9248046875, 98.125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 10.0, 14.0, 33.0, 34.0, 64.0, 105.0, 172.0, 173.0, 145.0, 81.0, 55.0, 36.0, 19.0, 8.0, 13.0, 9.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0010538101196289062, -0.0010282471776008606, -0.001002684235572815, -0.0009771212935447693, -0.0009515583515167236, -0.000925995409488678, -0.0009004324674606323, -0.0008748695254325867, -0.000849306583404541, -0.0008237436413764954, -0.0007981806993484497, -0.000772617757320404, -0.0007470548152923584, -0.0007214918732643127, -0.0006959289312362671, -0.0006703659892082214, -0.0006448030471801758, -0.0006192401051521301, -0.0005936771631240845, -0.0005681142210960388, -0.0005425512790679932, -0.0005169883370399475, -0.0004914253950119019, -0.0004658624529838562, -0.00044029951095581055, -0.0004147365689277649, -0.00038917362689971924, -0.0003636106848716736, -0.00033804774284362793, -0.0003124848008155823, -0.0002869218587875366, -0.00026135891675949097, -0.0002357959747314453, -0.00021023303270339966, -0.000184670090675354, -0.00015910714864730835, -0.0001335442066192627, -0.00010798126459121704, -8.241832256317139e-05, -5.685538053512573e-05, -3.129243850708008e-05, -5.729496479034424e-06, 1.983344554901123e-05, 4.5396387577056885e-05, 7.095932960510254e-05, 9.65222716331482e-05, 0.00012208521366119385, 0.0001476481556892395, 0.00017321109771728516, 0.0001987740397453308, 0.00022433698177337646, 0.0002498999238014221, 0.0002754628658294678, 0.00030102580785751343, 0.0003265887498855591, 0.00035215169191360474, 0.0003777146339416504, 0.00040327757596969604, 0.0004288405179977417, 0.00045440346002578735, 0.000479966402053833, 0.0005055293440818787, 0.0005310922861099243, 0.00055665522813797, 0.0005822181701660156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 6.0, 2.0, 3.0, 6.0, 13.0, 9.0, 22.0, 36.0, 62.0, 83.0, 111.0, 196.0, 349.0, 557.0, 1004.0, 2134.0, 5179.0, 16617.0, 143552.0, 807262.0, 54095.0, 10036.0, 3595.0, 1627.0, 833.0, 455.0, 276.0, 150.0, 100.0, 63.0, 43.0, 33.0, 16.0, 12.0, 10.0, 6.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34375, -34.21533203125, -33.0869140625, -31.95849609375, -30.830078125, -29.70166015625, -28.5732421875, -27.44482421875, -26.31640625, -25.18798828125, -24.0595703125, -22.93115234375, -21.802734375, -20.67431640625, -19.5458984375, -18.41748046875, -17.2890625, -16.16064453125, -15.0322265625, -13.90380859375, -12.775390625, -11.64697265625, -10.5185546875, -9.39013671875, -8.26171875, -7.13330078125, -6.0048828125, -4.87646484375, -3.748046875, -2.61962890625, -1.4912109375, -0.36279296875, 0.765625, 1.89404296875, 3.0224609375, 4.15087890625, 5.279296875, 6.40771484375, 7.5361328125, 8.66455078125, 9.79296875, 10.92138671875, 12.0498046875, 13.17822265625, 14.306640625, 15.43505859375, 16.5634765625, 17.69189453125, 18.8203125, 19.94873046875, 21.0771484375, 22.20556640625, 23.333984375, 24.46240234375, 25.5908203125, 26.71923828125, 27.84765625, 28.97607421875, 30.1044921875, 31.23291015625, 32.361328125, 33.48974609375, 34.6181640625, 35.74658203125, 36.875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 3.0, 5.0, 4.0, 10.0, 9.0, 11.0, 9.0, 22.0, 27.0, 28.0, 29.0, 56.0, 72.0, 92.0, 142.0, 89.0, 92.0, 64.0, 62.0, 46.0, 33.0, 24.0, 17.0, 13.0, 16.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.734375, -9.47772216796875, -9.2210693359375, -8.96441650390625, -8.707763671875, -8.45111083984375, -8.1944580078125, -7.93780517578125, -7.68115234375, -7.42449951171875, -7.1678466796875, -6.91119384765625, -6.654541015625, -6.39788818359375, -6.1412353515625, -5.88458251953125, -5.6279296875, -5.37127685546875, -5.1146240234375, -4.85797119140625, -4.601318359375, -4.34466552734375, -4.0880126953125, -3.83135986328125, -3.57470703125, -3.31805419921875, -3.0614013671875, -2.80474853515625, -2.548095703125, -2.29144287109375, -2.0347900390625, -1.77813720703125, -1.521484375, -1.26483154296875, -1.0081787109375, -0.75152587890625, -0.494873046875, -0.23822021484375, 0.0184326171875, 0.27508544921875, 0.53173828125, 0.78839111328125, 1.0450439453125, 1.30169677734375, 1.558349609375, 1.81500244140625, 2.0716552734375, 2.32830810546875, 2.5849609375, 2.84161376953125, 3.0982666015625, 3.35491943359375, 3.611572265625, 3.86822509765625, 4.1248779296875, 4.38153076171875, 4.63818359375, 4.89483642578125, 5.1514892578125, 5.40814208984375, 5.664794921875, 5.92144775390625, 6.1781005859375, 6.43475341796875, 6.69140625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 10.0, 20.0, 36.0, 62.0, 119.0, 166.0, 172.0, 178.0, 94.0, 61.0, 30.0, 18.0, 13.0, 9.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.8785400390625, -99.69815063476562, -96.51775360107422, -93.33736419677734, -90.15696716308594, -86.97657775878906, -83.79618835449219, -80.61579895019531, -77.4354019165039, -74.25501251220703, -71.07461547851562, -67.89422607421875, -64.71383666992188, -61.53343963623047, -58.353050231933594, -55.17265701293945, -51.99226379394531, -48.81187057495117, -45.63147735595703, -42.451087951660156, -39.270694732666016, -36.090301513671875, -32.909912109375, -29.72951889038086, -26.54912567138672, -23.368732452392578, -20.18834114074707, -17.007949829101562, -13.827556610107422, -10.647164344787598, -7.466772079467773, -4.286380767822266, -1.105987548828125, 2.074404716491699, 5.254796981811523, 8.435189247131348, 11.615581512451172, 14.795973777770996, 17.97636604309082, 21.156757354736328, 24.33715057373047, 27.51754379272461, 30.697935104370117, 33.878326416015625, 37.058719635009766, 40.239112854003906, 43.41950225830078, 46.59989547729492, 49.78028869628906, 52.9606819152832, 56.141075134277344, 59.32146453857422, 62.50185775756836, 65.6822509765625, 68.86264038085938, 72.04302978515625, 75.22342681884766, 78.40381622314453, 81.58421325683594, 84.76460266113281, 87.94499206542969, 91.1253890991211, 94.30577850341797, 97.48617553710938, 100.66656494140625]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 3.0, 6.0, 4.0, 8.0, 10.0, 18.0, 10.0, 8.0, 16.0, 20.0, 20.0, 30.0, 35.0, 42.0, 45.0, 41.0, 52.0, 49.0, 62.0, 60.0, 58.0, 60.0, 40.0, 34.0, 32.0, 41.0, 30.0, 26.0, 27.0, 22.0, 21.0, 11.0, 13.0, 8.0, 9.0, 4.0, 10.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.935176849365234, -40.591121673583984, -39.247066497802734, -37.903011322021484, -36.558956146240234, -35.21490478515625, -33.870849609375, -32.52679443359375, -31.1827392578125, -29.83868408203125, -28.49462890625, -27.15057373046875, -25.806520462036133, -24.462465286254883, -23.118410110473633, -21.774356842041016, -20.430299758911133, -19.086244583129883, -17.742189407348633, -16.398136138916016, -15.054080963134766, -13.710025787353516, -12.365970611572266, -11.021916389465332, -9.677861213684082, -8.333806037902832, -6.989751815795898, -5.645696640014648, -4.301641941070557, -2.957587242126465, -1.6135320663452148, -0.26947784423828125, 1.0745773315429688, 2.4186320304870605, 3.7626869678497314, 5.106741905212402, 6.450796604156494, 7.794851303100586, 9.138906478881836, 10.48296070098877, 11.82701587677002, 13.17107105255127, 14.515125274658203, 15.859180450439453, 17.203235626220703, 18.547290802001953, 19.891345977783203, 21.23539924621582, 22.57945442199707, 23.92350959777832, 25.26756477355957, 26.611618041992188, 27.955673217773438, 29.299728393554688, 30.643783569335938, 31.987838745117188, 33.33189392089844, 34.67594909667969, 36.02000427246094, 37.36405944824219, 38.70811462402344, 40.05216979980469, 41.39622497558594, 42.74027633666992, 44.08433151245117]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 11.0, 14.0, 15.0, 25.0, 44.0, 52.0, 77.0, 134.0, 182.0, 280.0, 472.0, 870.0, 1637.0, 3189.0, 7330.0, 18273.0, 60448.0, 408501.0, 3539880.0, 105648.0, 28027.0, 10079.0, 4295.0, 2085.0, 1125.0, 647.0, 372.0, 198.0, 141.0, 67.0, 38.0, 27.0, 21.0, 16.0, 11.0, 7.0, 0.0, 2.0, 5.0], "bins": [-48.3125, -47.19384765625, -46.0751953125, -44.95654296875, -43.837890625, -42.71923828125, -41.6005859375, -40.48193359375, -39.36328125, -38.24462890625, -37.1259765625, -36.00732421875, -34.888671875, -33.77001953125, -32.6513671875, -31.53271484375, -30.4140625, -29.29541015625, -28.1767578125, -27.05810546875, -25.939453125, -24.82080078125, -23.7021484375, -22.58349609375, -21.46484375, -20.34619140625, -19.2275390625, -18.10888671875, -16.990234375, -15.87158203125, -14.7529296875, -13.63427734375, -12.515625, -11.39697265625, -10.2783203125, -9.15966796875, -8.041015625, -6.92236328125, -5.8037109375, -4.68505859375, -3.56640625, -2.44775390625, -1.3291015625, -0.21044921875, 0.908203125, 2.02685546875, 3.1455078125, 4.26416015625, 5.3828125, 6.50146484375, 7.6201171875, 8.73876953125, 9.857421875, 10.97607421875, 12.0947265625, 13.21337890625, 14.33203125, 15.45068359375, 16.5693359375, 17.68798828125, 18.806640625, 19.92529296875, 21.0439453125, 22.16259765625, 23.28125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 13.0, 10.0, 14.0, 18.0, 24.0, 30.0, 43.0, 42.0, 34.0, 39.0, 41.0, 44.0, 44.0, 37.0, 48.0, 53.0, 55.0, 53.0, 53.0, 43.0, 26.0, 29.0, 29.0, 31.0, 16.0, 22.0, 19.0, 13.0, 8.0, 11.0, 5.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.04296875, -1.0087890625, -0.974609375, -0.9404296875, -0.90625, -0.8720703125, -0.837890625, -0.8037109375, -0.76953125, -0.7353515625, -0.701171875, -0.6669921875, -0.6328125, -0.5986328125, -0.564453125, -0.5302734375, -0.49609375, -0.4619140625, -0.427734375, -0.3935546875, -0.359375, -0.3251953125, -0.291015625, -0.2568359375, -0.22265625, -0.1884765625, -0.154296875, -0.1201171875, -0.0859375, -0.0517578125, -0.017578125, 0.0166015625, 0.05078125, 0.0849609375, 0.119140625, 0.1533203125, 0.1875, 0.2216796875, 0.255859375, 0.2900390625, 0.32421875, 0.3583984375, 0.392578125, 0.4267578125, 0.4609375, 0.4951171875, 0.529296875, 0.5634765625, 0.59765625, 0.6318359375, 0.666015625, 0.7001953125, 0.734375, 0.7685546875, 0.802734375, 0.8369140625, 0.87109375, 0.9052734375, 0.939453125, 0.9736328125, 1.0078125, 1.0419921875, 1.076171875, 1.1103515625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 19.0, 15.0, 32.0, 38.0, 55.0, 94.0, 197.0, 1091.0, 27140.0, 4054593.0, 108060.0, 2324.0, 302.0, 107.0, 55.0, 46.0, 27.0, 21.0, 25.0, 12.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.625, -141.5400390625, -137.455078125, -133.3701171875, -129.28515625, -125.2001953125, -121.115234375, -117.0302734375, -112.9453125, -108.8603515625, -104.775390625, -100.6904296875, -96.60546875, -92.5205078125, -88.435546875, -84.3505859375, -80.265625, -76.1806640625, -72.095703125, -68.0107421875, -63.92578125, -59.8408203125, -55.755859375, -51.6708984375, -47.5859375, -43.5009765625, -39.416015625, -35.3310546875, -31.24609375, -27.1611328125, -23.076171875, -18.9912109375, -14.90625, -10.8212890625, -6.736328125, -2.6513671875, 1.43359375, 5.5185546875, 9.603515625, 13.6884765625, 17.7734375, 21.8583984375, 25.943359375, 30.0283203125, 34.11328125, 38.1982421875, 42.283203125, 46.3681640625, 50.453125, 54.5380859375, 58.623046875, 62.7080078125, 66.79296875, 70.8779296875, 74.962890625, 79.0478515625, 83.1328125, 87.2177734375, 91.302734375, 95.3876953125, 99.47265625, 103.5576171875, 107.642578125, 111.7275390625, 115.8125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 16.0, 15.0, 12.0, 12.0, 27.0, 43.0, 40.0, 55.0, 68.0, 107.0, 152.0, 297.0, 1835.0, 572.0, 225.0, 149.0, 104.0, 75.0, 56.0, 35.0, 38.0, 28.0, 25.0, 15.0, 11.0, 6.0, 5.0, 6.0, 7.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0390625, -3.919677734375, -3.80029296875, -3.680908203125, -3.5615234375, -3.442138671875, -3.32275390625, -3.203369140625, -3.083984375, -2.964599609375, -2.84521484375, -2.725830078125, -2.6064453125, -2.487060546875, -2.36767578125, -2.248291015625, -2.12890625, -2.009521484375, -1.89013671875, -1.770751953125, -1.6513671875, -1.531982421875, -1.41259765625, -1.293212890625, -1.173828125, -1.054443359375, -0.93505859375, -0.815673828125, -0.6962890625, -0.576904296875, -0.45751953125, -0.338134765625, -0.21875, -0.099365234375, 0.02001953125, 0.139404296875, 0.2587890625, 0.378173828125, 0.49755859375, 0.616943359375, 0.736328125, 0.855712890625, 0.97509765625, 1.094482421875, 1.2138671875, 1.333251953125, 1.45263671875, 1.572021484375, 1.69140625, 1.810791015625, 1.93017578125, 2.049560546875, 2.1689453125, 2.288330078125, 2.40771484375, 2.527099609375, 2.646484375, 2.765869140625, 2.88525390625, 3.004638671875, 3.1240234375, 3.243408203125, 3.36279296875, 3.482177734375, 3.6015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 33.0, 94.0, 219.0, 252.0, 230.0, 97.0, 39.0, 19.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.35034942626953, -114.00067901611328, -111.65100860595703, -109.30133819580078, -106.95167541503906, -104.60200500488281, -102.25233459472656, -99.90266418457031, -97.55299377441406, -95.20332336425781, -92.85365295410156, -90.50398254394531, -88.15431213378906, -85.80464935302734, -83.4549789428711, -81.10530853271484, -78.7556381225586, -76.40596771240234, -74.0562973022461, -71.70662689208984, -69.35696411132812, -67.00729370117188, -64.65762329101562, -62.307952880859375, -59.958282470703125, -57.608612060546875, -55.258941650390625, -52.90927505493164, -50.55960464477539, -48.20993423461914, -45.860267639160156, -43.510597229003906, -41.16092300415039, -38.81125259399414, -36.461585998535156, -34.111915588378906, -31.762245178222656, -29.412574768066406, -27.06290626525879, -24.713237762451172, -22.363567352294922, -20.013896942138672, -17.664228439331055, -15.314558982849121, -12.964889526367188, -10.615220069885254, -8.26555061340332, -5.915882110595703, -3.566211700439453, -1.2165422439575195, 1.133127212524414, 3.4827966690063477, 5.832466125488281, 8.182135581970215, 10.531805038452148, 12.881473541259766, 15.231143951416016, 17.580814361572266, 19.930482864379883, 22.2801513671875, 24.62982177734375, 26.9794921875, 29.329160690307617, 31.678829193115234, 34.028499603271484]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 3.0, 9.0, 7.0, 6.0, 13.0, 12.0, 18.0, 14.0, 20.0, 26.0, 20.0, 39.0, 40.0, 41.0, 46.0, 47.0, 59.0, 48.0, 59.0, 48.0, 56.0, 49.0, 49.0, 35.0, 44.0, 34.0, 33.0, 34.0, 13.0, 21.0, 12.0, 17.0, 6.0, 6.0, 4.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.313941955566406, -19.796260833740234, -19.278579711914062, -18.76089859008789, -18.24321746826172, -17.72553825378418, -17.207857131958008, -16.690176010131836, -16.172494888305664, -15.654813766479492, -15.13713264465332, -14.619452476501465, -14.101771354675293, -13.584090232849121, -13.066410064697266, -12.548728942871094, -12.031047821044922, -11.51336669921875, -10.995685577392578, -10.478005409240723, -9.96032428741455, -9.442643165588379, -8.924962997436523, -8.407281875610352, -7.88960075378418, -7.371919631958008, -6.854238986968994, -6.3365583419799805, -5.818877220153809, -5.301196098327637, -4.783515453338623, -4.265834808349609, -3.7481517791748047, -3.230470895767212, -2.712790012359619, -2.1951091289520264, -1.6774282455444336, -1.1597473621368408, -0.642066478729248, -0.12438559532165527, 0.3932952880859375, 0.9109761714935303, 1.428657054901123, 1.9463379383087158, 2.4640188217163086, 2.9816997051239014, 3.499380588531494, 4.017061233520508, 4.53474235534668, 5.052423477172852, 5.570104122161865, 6.087784767150879, 6.605465888977051, 7.123147010803223, 7.640827655792236, 8.15850830078125, 8.676189422607422, 9.193870544433594, 9.711551666259766, 10.229231834411621, 10.746912956237793, 11.264594078063965, 11.78227424621582, 12.299955368041992, 12.817636489868164]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 9.0, 6.0, 12.0, 15.0, 27.0, 36.0, 45.0, 74.0, 122.0, 201.0, 399.0, 772.0, 1826.0, 4183.0, 10409.0, 27349.0, 72314.0, 181080.0, 328241.0, 247460.0, 106891.0, 40813.0, 15424.0, 5996.0, 2545.0, 1136.0, 510.0, 260.0, 136.0, 81.0, 51.0, 31.0, 18.0, 24.0, 18.0, 9.0, 5.0, 6.0, 2.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.9954833984375, -15.490966796875, -14.9864501953125, -14.48193359375, -13.9774169921875, -13.472900390625, -12.9683837890625, -12.4638671875, -11.9593505859375, -11.454833984375, -10.9503173828125, -10.44580078125, -9.9412841796875, -9.436767578125, -8.9322509765625, -8.427734375, -7.9232177734375, -7.418701171875, -6.9141845703125, -6.40966796875, -5.9051513671875, -5.400634765625, -4.8961181640625, -4.3916015625, -3.8870849609375, -3.382568359375, -2.8780517578125, -2.37353515625, -1.8690185546875, -1.364501953125, -0.8599853515625, -0.35546875, 0.1490478515625, 0.653564453125, 1.1580810546875, 1.66259765625, 2.1671142578125, 2.671630859375, 3.1761474609375, 3.6806640625, 4.1851806640625, 4.689697265625, 5.1942138671875, 5.69873046875, 6.2032470703125, 6.707763671875, 7.2122802734375, 7.716796875, 8.2213134765625, 8.725830078125, 9.2303466796875, 9.73486328125, 10.2393798828125, 10.743896484375, 11.2484130859375, 11.7529296875, 12.2574462890625, 12.761962890625, 13.2664794921875, 13.77099609375, 14.2755126953125, 14.780029296875, 15.2845458984375, 15.7890625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 10.0, 19.0, 22.0, 26.0, 34.0, 42.0, 40.0, 47.0, 60.0, 58.0, 78.0, 72.0, 64.0, 66.0, 70.0, 50.0, 43.0, 36.0, 33.0, 28.0, 24.0, 20.0, 8.0, 13.0, 6.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0322265625, -0.9848175048828125, -0.937408447265625, -0.8899993896484375, -0.84259033203125, -0.7951812744140625, -0.747772216796875, -0.7003631591796875, -0.6529541015625, -0.6055450439453125, -0.558135986328125, -0.5107269287109375, -0.46331787109375, -0.4159088134765625, -0.368499755859375, -0.3210906982421875, -0.273681640625, -0.2262725830078125, -0.178863525390625, -0.1314544677734375, -0.08404541015625, -0.0366363525390625, 0.010772705078125, 0.0581817626953125, 0.1055908203125, 0.1529998779296875, 0.200408935546875, 0.2478179931640625, 0.29522705078125, 0.3426361083984375, 0.390045166015625, 0.4374542236328125, 0.48486328125, 0.5322723388671875, 0.579681396484375, 0.6270904541015625, 0.67449951171875, 0.7219085693359375, 0.769317626953125, 0.8167266845703125, 0.8641357421875, 0.9115447998046875, 0.958953857421875, 1.0063629150390625, 1.05377197265625, 1.1011810302734375, 1.148590087890625, 1.1959991455078125, 1.243408203125, 1.2908172607421875, 1.338226318359375, 1.3856353759765625, 1.43304443359375, 1.4804534912109375, 1.527862548828125, 1.5752716064453125, 1.6226806640625, 1.6700897216796875, 1.717498779296875, 1.7649078369140625, 1.81231689453125, 1.8597259521484375, 1.907135009765625, 1.9545440673828125, 2.001953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 7.0, 7.0, 11.0, 23.0, 22.0, 34.0, 47.0, 66.0, 99.0, 121.0, 176.0, 223.0, 294.0, 465.0, 695.0, 1155.0, 1915.0, 2974.0, 5253.0, 10005.0, 19032.0, 37685.0, 76001.0, 145713.0, 234711.0, 227561.0, 137425.0, 71082.0, 35463.0, 17946.0, 9463.0, 5082.0, 2887.0, 1702.0, 1052.0, 655.0, 459.0, 268.0, 191.0, 150.0, 116.0, 71.0, 73.0, 43.0, 46.0, 22.0, 13.0, 11.0, 13.0, 11.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-11.703125, -11.3369140625, -10.970703125, -10.6044921875, -10.23828125, -9.8720703125, -9.505859375, -9.1396484375, -8.7734375, -8.4072265625, -8.041015625, -7.6748046875, -7.30859375, -6.9423828125, -6.576171875, -6.2099609375, -5.84375, -5.4775390625, -5.111328125, -4.7451171875, -4.37890625, -4.0126953125, -3.646484375, -3.2802734375, -2.9140625, -2.5478515625, -2.181640625, -1.8154296875, -1.44921875, -1.0830078125, -0.716796875, -0.3505859375, 0.015625, 0.3818359375, 0.748046875, 1.1142578125, 1.48046875, 1.8466796875, 2.212890625, 2.5791015625, 2.9453125, 3.3115234375, 3.677734375, 4.0439453125, 4.41015625, 4.7763671875, 5.142578125, 5.5087890625, 5.875, 6.2412109375, 6.607421875, 6.9736328125, 7.33984375, 7.7060546875, 8.072265625, 8.4384765625, 8.8046875, 9.1708984375, 9.537109375, 9.9033203125, 10.26953125, 10.6357421875, 11.001953125, 11.3681640625, 11.734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 6.0, 3.0, 10.0, 15.0, 14.0, 16.0, 19.0, 18.0, 17.0, 20.0, 25.0, 34.0, 30.0, 38.0, 28.0, 47.0, 50.0, 44.0, 38.0, 38.0, 38.0, 47.0, 38.0, 39.0, 39.0, 42.0, 31.0, 33.0, 29.0, 19.0, 25.0, 31.0, 14.0, 11.0, 3.0, 11.0, 7.0, 3.0, 7.0, 3.0, 3.0, 2.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.23046875, -7.01580810546875, -6.8011474609375, -6.58648681640625, -6.371826171875, -6.15716552734375, -5.9425048828125, -5.72784423828125, -5.51318359375, -5.29852294921875, -5.0838623046875, -4.86920166015625, -4.654541015625, -4.43988037109375, -4.2252197265625, -4.01055908203125, -3.7958984375, -3.58123779296875, -3.3665771484375, -3.15191650390625, -2.937255859375, -2.72259521484375, -2.5079345703125, -2.29327392578125, -2.07861328125, -1.86395263671875, -1.6492919921875, -1.43463134765625, -1.219970703125, -1.00531005859375, -0.7906494140625, -0.57598876953125, -0.361328125, -0.14666748046875, 0.0679931640625, 0.28265380859375, 0.497314453125, 0.71197509765625, 0.9266357421875, 1.14129638671875, 1.35595703125, 1.57061767578125, 1.7852783203125, 1.99993896484375, 2.214599609375, 2.42926025390625, 2.6439208984375, 2.85858154296875, 3.0732421875, 3.28790283203125, 3.5025634765625, 3.71722412109375, 3.931884765625, 4.14654541015625, 4.3612060546875, 4.57586669921875, 4.79052734375, 5.00518798828125, 5.2198486328125, 5.43450927734375, 5.649169921875, 5.86383056640625, 6.0784912109375, 6.29315185546875, 6.5078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 20.0, 17.0, 41.0, 33.0, 50.0, 101.0, 124.0, 190.0, 265.0, 431.0, 685.0, 1198.0, 2165.0, 4552.0, 9781.0, 23252.0, 64868.0, 184044.0, 358032.0, 249316.0, 91650.0, 32524.0, 12905.0, 5672.0, 2761.0, 1455.0, 886.0, 524.0, 307.0, 197.0, 126.0, 92.0, 71.0, 58.0, 34.0, 26.0, 18.0, 12.0, 12.0, 7.0, 6.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.140625, -9.8302001953125, -9.519775390625, -9.2093505859375, -8.89892578125, -8.5885009765625, -8.278076171875, -7.9676513671875, -7.6572265625, -7.3468017578125, -7.036376953125, -6.7259521484375, -6.41552734375, -6.1051025390625, -5.794677734375, -5.4842529296875, -5.173828125, -4.8634033203125, -4.552978515625, -4.2425537109375, -3.93212890625, -3.6217041015625, -3.311279296875, -3.0008544921875, -2.6904296875, -2.3800048828125, -2.069580078125, -1.7591552734375, -1.44873046875, -1.1383056640625, -0.827880859375, -0.5174560546875, -0.20703125, 0.1033935546875, 0.413818359375, 0.7242431640625, 1.03466796875, 1.3450927734375, 1.655517578125, 1.9659423828125, 2.2763671875, 2.5867919921875, 2.897216796875, 3.2076416015625, 3.51806640625, 3.8284912109375, 4.138916015625, 4.4493408203125, 4.759765625, 5.0701904296875, 5.380615234375, 5.6910400390625, 6.00146484375, 6.3118896484375, 6.622314453125, 6.9327392578125, 7.2431640625, 7.5535888671875, 7.864013671875, 8.1744384765625, 8.48486328125, 8.7952880859375, 9.105712890625, 9.4161376953125, 9.7265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 3.0, 8.0, 15.0, 14.0, 16.0, 25.0, 36.0, 41.0, 49.0, 53.0, 64.0, 68.0, 65.0, 80.0, 79.0, 75.0, 45.0, 65.0, 42.0, 28.0, 25.0, 24.0, 13.0, 11.0, 12.0, 6.0, 4.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00141143798828125, -0.0013714134693145752, -0.0013313889503479004, -0.0012913644313812256, -0.0012513399124145508, -0.001211315393447876, -0.0011712908744812012, -0.0011312663555145264, -0.0010912418365478516, -0.0010512173175811768, -0.001011192798614502, -0.0009711682796478271, -0.0009311437606811523, -0.0008911192417144775, -0.0008510947227478027, -0.0008110702037811279, -0.0007710456848144531, -0.0007310211658477783, -0.0006909966468811035, -0.0006509721279144287, -0.0006109476089477539, -0.0005709230899810791, -0.0005308985710144043, -0.0004908740520477295, -0.0004508495330810547, -0.0004108250141143799, -0.0003708004951477051, -0.0003307759761810303, -0.00029075145721435547, -0.00025072693824768066, -0.00021070241928100586, -0.00017067790031433105, -0.00013065338134765625, -9.062886238098145e-05, -5.060434341430664e-05, -1.0579824447631836e-05, 2.944469451904297e-05, 6.946921348571777e-05, 0.00010949373245239258, 0.00014951825141906738, 0.0001895427703857422, 0.000229567289352417, 0.0002695918083190918, 0.0003096163272857666, 0.0003496408462524414, 0.0003896653652191162, 0.000429689884185791, 0.0004697144031524658, 0.0005097389221191406, 0.0005497634410858154, 0.0005897879600524902, 0.000629812479019165, 0.0006698369979858398, 0.0007098615169525146, 0.0007498860359191895, 0.0007899105548858643, 0.0008299350738525391, 0.0008699595928192139, 0.0009099841117858887, 0.0009500086307525635, 0.0009900331497192383, 0.001030057668685913, 0.0010700821876525879, 0.0011101067066192627, 0.0011501312255859375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 7.0, 1.0, 4.0, 7.0, 8.0, 13.0, 15.0, 27.0, 34.0, 45.0, 64.0, 96.0, 155.0, 249.0, 422.0, 665.0, 1121.0, 2201.0, 4000.0, 8237.0, 19262.0, 52741.0, 161113.0, 378570.0, 272310.0, 90992.0, 30996.0, 12442.0, 5902.0, 2900.0, 1625.0, 866.0, 528.0, 329.0, 202.0, 120.0, 103.0, 55.0, 43.0, 21.0, 20.0, 9.0, 8.0, 6.0, 5.0, 6.0, 2.0, 4.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-11.078125, -10.7398681640625, -10.401611328125, -10.0633544921875, -9.72509765625, -9.3868408203125, -9.048583984375, -8.7103271484375, -8.3720703125, -8.0338134765625, -7.695556640625, -7.3572998046875, -7.01904296875, -6.6807861328125, -6.342529296875, -6.0042724609375, -5.666015625, -5.3277587890625, -4.989501953125, -4.6512451171875, -4.31298828125, -3.9747314453125, -3.636474609375, -3.2982177734375, -2.9599609375, -2.6217041015625, -2.283447265625, -1.9451904296875, -1.60693359375, -1.2686767578125, -0.930419921875, -0.5921630859375, -0.25390625, 0.0843505859375, 0.422607421875, 0.7608642578125, 1.09912109375, 1.4373779296875, 1.775634765625, 2.1138916015625, 2.4521484375, 2.7904052734375, 3.128662109375, 3.4669189453125, 3.80517578125, 4.1434326171875, 4.481689453125, 4.8199462890625, 5.158203125, 5.4964599609375, 5.834716796875, 6.1729736328125, 6.51123046875, 6.8494873046875, 7.187744140625, 7.5260009765625, 7.8642578125, 8.2025146484375, 8.540771484375, 8.8790283203125, 9.21728515625, 9.5555419921875, 9.893798828125, 10.2320556640625, 10.5703125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 4.0, 7.0, 10.0, 14.0, 13.0, 20.0, 22.0, 30.0, 22.0, 45.0, 45.0, 57.0, 48.0, 53.0, 64.0, 72.0, 72.0, 60.0, 59.0, 39.0, 42.0, 39.0, 23.0, 31.0, 21.0, 19.0, 9.0, 11.0, 12.0, 6.0, 9.0, 6.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.83502197265625, -4.6856689453125, -4.53631591796875, -4.386962890625, -4.23760986328125, -4.0882568359375, -3.93890380859375, -3.78955078125, -3.64019775390625, -3.4908447265625, -3.34149169921875, -3.192138671875, -3.04278564453125, -2.8934326171875, -2.74407958984375, -2.5947265625, -2.44537353515625, -2.2960205078125, -2.14666748046875, -1.997314453125, -1.84796142578125, -1.6986083984375, -1.54925537109375, -1.39990234375, -1.25054931640625, -1.1011962890625, -0.95184326171875, -0.802490234375, -0.65313720703125, -0.5037841796875, -0.35443115234375, -0.205078125, -0.05572509765625, 0.0936279296875, 0.24298095703125, 0.392333984375, 0.54168701171875, 0.6910400390625, 0.84039306640625, 0.98974609375, 1.13909912109375, 1.2884521484375, 1.43780517578125, 1.587158203125, 1.73651123046875, 1.8858642578125, 2.03521728515625, 2.1845703125, 2.33392333984375, 2.4832763671875, 2.63262939453125, 2.781982421875, 2.93133544921875, 3.0806884765625, 3.23004150390625, 3.37939453125, 3.52874755859375, 3.6781005859375, 3.82745361328125, 3.976806640625, 4.12615966796875, 4.2755126953125, 4.42486572265625, 4.57421875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 1.0, 3.0, 10.0, 7.0, 12.0, 10.0, 25.0, 34.0, 55.0, 78.0, 103.0, 114.0, 128.0, 121.0, 78.0, 69.0, 57.0, 23.0, 21.0, 20.0, 7.0, 12.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.85691833496094, -89.43411254882812, -86.01130676269531, -82.5885009765625, -79.16569519042969, -75.74288940429688, -72.32007598876953, -68.89727020263672, -65.4744644165039, -62.051658630371094, -58.62885284423828, -55.2060432434082, -51.78323745727539, -48.36043167114258, -44.9376220703125, -41.51481628417969, -38.092010498046875, -34.66920471191406, -31.246397018432617, -27.823589324951172, -24.40078353881836, -20.977977752685547, -17.5551700592041, -14.132362365722656, -10.709556579589844, -7.286749839782715, -3.863943099975586, -0.44113636016845703, 2.981670379638672, 6.404476165771484, 9.82728385925293, 13.250091552734375, 16.672897338867188, 20.095703125, 23.518510818481445, 26.94131851196289, 30.364124298095703, 33.786930084228516, 37.209739685058594, 40.632545471191406, 44.05535125732422, 47.47815704345703, 50.900962829589844, 54.32377243041992, 57.746578216552734, 61.16938400268555, 64.59219360351562, 68.01499938964844, 71.43780517578125, 74.86061096191406, 78.28341674804688, 81.70622253417969, 85.1290283203125, 88.55183410644531, 91.97464752197266, 95.39745330810547, 98.82025909423828, 102.2430648803711, 105.6658706665039, 109.08867645263672, 112.51148986816406, 115.93429565429688, 119.35710144042969, 122.7799072265625, 126.20271301269531]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 12.0, 9.0, 17.0, 10.0, 38.0, 33.0, 40.0, 49.0, 75.0, 74.0, 56.0, 76.0, 70.0, 77.0, 66.0, 60.0, 45.0, 37.0, 39.0, 23.0, 25.0, 19.0, 12.0, 11.0, 3.0, 8.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.665313720703125, -58.071136474609375, -55.47695541381836, -52.882774353027344, -50.288597106933594, -47.694419860839844, -45.10023880004883, -42.50605773925781, -39.91188049316406, -37.31770324707031, -34.7235221862793, -32.12934112548828, -29.53516387939453, -26.94098472595215, -24.346805572509766, -21.752626419067383, -19.158447265625, -16.564268112182617, -13.970088958740234, -11.375909805297852, -8.781730651855469, -6.187551498413086, -3.593372344970703, -0.9991931915283203, 1.5949859619140625, 4.189165115356445, 6.783344268798828, 9.377523422241211, 11.971702575683594, 14.565881729125977, 17.16006088256836, 19.754240036010742, 22.348426818847656, 24.94260597229004, 27.536785125732422, 30.130964279174805, 32.72514343261719, 35.31932067871094, 37.91350173950195, 40.50768280029297, 43.10186004638672, 45.69603729248047, 48.290218353271484, 50.8843994140625, 53.47857666015625, 56.07275390625, 58.666934967041016, 61.26111602783203, 63.85529327392578, 66.44947052001953, 69.04365539550781, 71.63783264160156, 74.23200988769531, 76.82618713378906, 79.42036437988281, 82.0145492553711, 84.60872650146484, 87.2029037475586, 89.79708862304688, 92.39126586914062, 94.98544311523438, 97.57962036132812, 100.17379760742188, 102.76798248291016, 105.3621597290039]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 11.0, 16.0, 32.0, 41.0, 63.0, 139.0, 260.0, 769.0, 4390.0, 49761.0, 3927023.0, 195983.0, 12674.0, 2039.0, 586.0, 227.0, 97.0, 64.0, 46.0, 21.0, 14.0, 10.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.9375, -90.548828125, -87.16015625, -83.771484375, -80.3828125, -76.994140625, -73.60546875, -70.216796875, -66.828125, -63.439453125, -60.05078125, -56.662109375, -53.2734375, -49.884765625, -46.49609375, -43.107421875, -39.71875, -36.330078125, -32.94140625, -29.552734375, -26.1640625, -22.775390625, -19.38671875, -15.998046875, -12.609375, -9.220703125, -5.83203125, -2.443359375, 0.9453125, 4.333984375, 7.72265625, 11.111328125, 14.5, 17.888671875, 21.27734375, 24.666015625, 28.0546875, 31.443359375, 34.83203125, 38.220703125, 41.609375, 44.998046875, 48.38671875, 51.775390625, 55.1640625, 58.552734375, 61.94140625, 65.330078125, 68.71875, 72.107421875, 75.49609375, 78.884765625, 82.2734375, 85.662109375, 89.05078125, 92.439453125, 95.828125, 99.216796875, 102.60546875, 105.994140625, 109.3828125, 112.771484375, 116.16015625, 119.548828125, 122.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 13.0, 27.0, 24.0, 38.0, 53.0, 66.0, 57.0, 70.0, 84.0, 105.0, 87.0, 71.0, 65.0, 49.0, 53.0, 43.0, 29.0, 20.0, 12.0, 4.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.9500732421875, -1.870849609375, -1.7916259765625, -1.71240234375, -1.6331787109375, -1.553955078125, -1.4747314453125, -1.3955078125, -1.3162841796875, -1.237060546875, -1.1578369140625, -1.07861328125, -0.9993896484375, -0.920166015625, -0.8409423828125, -0.76171875, -0.6824951171875, -0.603271484375, -0.5240478515625, -0.44482421875, -0.3656005859375, -0.286376953125, -0.2071533203125, -0.1279296875, -0.0487060546875, 0.030517578125, 0.1097412109375, 0.18896484375, 0.2681884765625, 0.347412109375, 0.4266357421875, 0.505859375, 0.5850830078125, 0.664306640625, 0.7435302734375, 0.82275390625, 0.9019775390625, 0.981201171875, 1.0604248046875, 1.1396484375, 1.2188720703125, 1.298095703125, 1.3773193359375, 1.45654296875, 1.5357666015625, 1.614990234375, 1.6942138671875, 1.7734375, 1.8526611328125, 1.931884765625, 2.0111083984375, 2.09033203125, 2.1695556640625, 2.248779296875, 2.3280029296875, 2.4072265625, 2.4864501953125, 2.565673828125, 2.6448974609375, 2.72412109375, 2.8033447265625, 2.882568359375, 2.9617919921875, 3.041015625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 31.0, 24.0, 57.0, 92.0, 163.0, 380.0, 1082.0, 3551.0, 14766.0, 80039.0, 961414.0, 3007361.0, 101362.0, 17732.0, 4256.0, 1163.0, 384.0, 191.0, 84.0, 60.0, 31.0, 12.0, 15.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.96875, -52.173828125, -50.37890625, -48.583984375, -46.7890625, -44.994140625, -43.19921875, -41.404296875, -39.609375, -37.814453125, -36.01953125, -34.224609375, -32.4296875, -30.634765625, -28.83984375, -27.044921875, -25.25, -23.455078125, -21.66015625, -19.865234375, -18.0703125, -16.275390625, -14.48046875, -12.685546875, -10.890625, -9.095703125, -7.30078125, -5.505859375, -3.7109375, -1.916015625, -0.12109375, 1.673828125, 3.46875, 5.263671875, 7.05859375, 8.853515625, 10.6484375, 12.443359375, 14.23828125, 16.033203125, 17.828125, 19.623046875, 21.41796875, 23.212890625, 25.0078125, 26.802734375, 28.59765625, 30.392578125, 32.1875, 33.982421875, 35.77734375, 37.572265625, 39.3671875, 41.162109375, 42.95703125, 44.751953125, 46.546875, 48.341796875, 50.13671875, 51.931640625, 53.7265625, 55.521484375, 57.31640625, 59.111328125, 60.90625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 8.0, 11.0, 6.0, 14.0, 13.0, 19.0, 39.0, 43.0, 56.0, 90.0, 90.0, 126.0, 206.0, 494.0, 1862.0, 365.0, 210.0, 106.0, 83.0, 75.0, 35.0, 29.0, 16.0, 19.0, 15.0, 17.0, 8.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -6.02227783203125, -5.8101806640625, -5.59808349609375, -5.385986328125, -5.17388916015625, -4.9617919921875, -4.74969482421875, -4.53759765625, -4.32550048828125, -4.1134033203125, -3.90130615234375, -3.689208984375, -3.47711181640625, -3.2650146484375, -3.05291748046875, -2.8408203125, -2.62872314453125, -2.4166259765625, -2.20452880859375, -1.992431640625, -1.78033447265625, -1.5682373046875, -1.35614013671875, -1.14404296875, -0.93194580078125, -0.7198486328125, -0.50775146484375, -0.295654296875, -0.08355712890625, 0.1285400390625, 0.34063720703125, 0.552734375, 0.76483154296875, 0.9769287109375, 1.18902587890625, 1.401123046875, 1.61322021484375, 1.8253173828125, 2.03741455078125, 2.24951171875, 2.46160888671875, 2.6737060546875, 2.88580322265625, 3.097900390625, 3.30999755859375, 3.5220947265625, 3.73419189453125, 3.9462890625, 4.15838623046875, 4.3704833984375, 4.58258056640625, 4.794677734375, 5.00677490234375, 5.2188720703125, 5.43096923828125, 5.64306640625, 5.85516357421875, 6.0672607421875, 6.27935791015625, 6.491455078125, 6.70355224609375, 6.9156494140625, 7.12774658203125, 7.33984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 2.0, 16.0, 14.0, 27.0, 35.0, 51.0, 73.0, 103.0, 129.0, 119.0, 116.0, 106.0, 74.0, 41.0, 26.0, 15.0, 20.0, 6.0, 4.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.21955108642578, -30.569355010986328, -28.919158935546875, -27.268962860107422, -25.6187686920166, -23.96857261657715, -22.318376541137695, -20.668182373046875, -19.017986297607422, -17.36779022216797, -15.717595100402832, -14.067399024963379, -12.417203903198242, -10.767007827758789, -9.116811752319336, -7.466616630554199, -5.81641960144043, -4.166224002838135, -2.5160281658172607, -0.8658323287963867, 0.7843632698059082, 2.434558868408203, 4.084754943847656, 5.734950065612793, 7.385146141052246, 9.0353422164917, 10.685537338256836, 12.335733413696289, 13.985929489135742, 15.636124610900879, 17.286319732666016, 18.93651580810547, 20.586711883544922, 22.236907958984375, 23.887104034423828, 25.53730010986328, 27.1874942779541, 28.837690353393555, 30.487886428833008, 32.13808059692383, 33.78827667236328, 35.438472747802734, 37.08866882324219, 38.73886489868164, 40.389060974121094, 42.03925323486328, 43.689453125, 45.33964538574219, 46.989845275878906, 48.64004135131836, 50.29023742675781, 51.940433502197266, 53.59062957763672, 55.240821838378906, 56.891021728515625, 58.54121398925781, 60.191410064697266, 61.84160614013672, 63.49180221557617, 65.14199829101562, 66.79219055175781, 68.44239044189453, 70.09258270263672, 71.74278259277344, 73.39297485351562]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 4.0, 9.0, 10.0, 11.0, 15.0, 19.0, 19.0, 16.0, 26.0, 28.0, 29.0, 38.0, 29.0, 38.0, 42.0, 43.0, 36.0, 57.0, 50.0, 65.0, 53.0, 48.0, 38.0, 37.0, 37.0, 33.0, 29.0, 21.0, 19.0, 17.0, 27.0, 8.0, 10.0, 4.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0], "bins": [-31.966903686523438, -31.10605812072754, -30.245210647583008, -29.38436508178711, -28.52351951599121, -27.662673950195312, -26.80182647705078, -25.940980911254883, -25.080135345458984, -24.219289779663086, -23.358442306518555, -22.497596740722656, -21.636751174926758, -20.77590560913086, -19.915058135986328, -19.05421257019043, -18.19336700439453, -17.332521438598633, -16.4716739654541, -15.610828399658203, -14.749982833862305, -13.88913631439209, -13.028289794921875, -12.167444229125977, -11.306596755981445, -10.44575023651123, -9.584904670715332, -8.724058151245117, -7.863212585449219, -7.002366065979004, -6.141520023345947, -5.280673980712891, -4.419828414916992, -3.5589823722839355, -2.698136329650879, -1.8372900485992432, -0.9764440059661865, -0.11559772491455078, 0.7452483177185059, 1.6060943603515625, 2.466940402984619, 3.327786445617676, 4.188632488250732, 5.049478530883789, 5.910325050354004, 6.7711710929870605, 7.632017135620117, 8.492862701416016, 9.35370922088623, 10.214555740356445, 11.075401306152344, 11.936247825622559, 12.797093391418457, 13.657939910888672, 14.51878547668457, 15.379631996154785, 16.240478515625, 17.1013240814209, 17.96217155456543, 18.823017120361328, 19.683862686157227, 20.544708251953125, 21.405555725097656, 22.266401290893555, 23.127246856689453]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 9.0, 2.0, 9.0, 11.0, 12.0, 21.0, 35.0, 32.0, 47.0, 80.0, 87.0, 174.0, 246.0, 442.0, 711.0, 1556.0, 3586.0, 10875.0, 39895.0, 161917.0, 476233.0, 260279.0, 65422.0, 17127.0, 5375.0, 2068.0, 914.0, 481.0, 290.0, 180.0, 126.0, 83.0, 64.0, 38.0, 36.0, 24.0, 15.0, 7.0, 12.0, 12.0, 5.0, 4.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0], "bins": [-27.578125, -26.80517578125, -26.0322265625, -25.25927734375, -24.486328125, -23.71337890625, -22.9404296875, -22.16748046875, -21.39453125, -20.62158203125, -19.8486328125, -19.07568359375, -18.302734375, -17.52978515625, -16.7568359375, -15.98388671875, -15.2109375, -14.43798828125, -13.6650390625, -12.89208984375, -12.119140625, -11.34619140625, -10.5732421875, -9.80029296875, -9.02734375, -8.25439453125, -7.4814453125, -6.70849609375, -5.935546875, -5.16259765625, -4.3896484375, -3.61669921875, -2.84375, -2.07080078125, -1.2978515625, -0.52490234375, 0.248046875, 1.02099609375, 1.7939453125, 2.56689453125, 3.33984375, 4.11279296875, 4.8857421875, 5.65869140625, 6.431640625, 7.20458984375, 7.9775390625, 8.75048828125, 9.5234375, 10.29638671875, 11.0693359375, 11.84228515625, 12.615234375, 13.38818359375, 14.1611328125, 14.93408203125, 15.70703125, 16.47998046875, 17.2529296875, 18.02587890625, 18.798828125, 19.57177734375, 20.3447265625, 21.11767578125, 21.890625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 11.0, 27.0, 42.0, 60.0, 58.0, 105.0, 121.0, 109.0, 110.0, 94.0, 72.0, 62.0, 37.0, 40.0, 13.0, 13.0, 4.0, 7.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.429168701171875, -3.30950927734375, -3.189849853515625, -3.0701904296875, -2.950531005859375, -2.83087158203125, -2.711212158203125, -2.591552734375, -2.471893310546875, -2.35223388671875, -2.232574462890625, -2.1129150390625, -1.993255615234375, -1.87359619140625, -1.753936767578125, -1.63427734375, -1.514617919921875, -1.39495849609375, -1.275299072265625, -1.1556396484375, -1.035980224609375, -0.91632080078125, -0.796661376953125, -0.677001953125, -0.557342529296875, -0.43768310546875, -0.318023681640625, -0.1983642578125, -0.078704833984375, 0.04095458984375, 0.160614013671875, 0.2802734375, 0.399932861328125, 0.51959228515625, 0.639251708984375, 0.7589111328125, 0.878570556640625, 0.99822998046875, 1.117889404296875, 1.237548828125, 1.357208251953125, 1.47686767578125, 1.596527099609375, 1.7161865234375, 1.835845947265625, 1.95550537109375, 2.075164794921875, 2.19482421875, 2.314483642578125, 2.43414306640625, 2.553802490234375, 2.6734619140625, 2.793121337890625, 2.91278076171875, 3.032440185546875, 3.152099609375, 3.271759033203125, 3.39141845703125, 3.511077880859375, 3.6307373046875, 3.750396728515625, 3.87005615234375, 3.989715576171875, 4.109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 5.0, 4.0, 7.0, 19.0, 16.0, 24.0, 33.0, 46.0, 75.0, 118.0, 167.0, 245.0, 404.0, 721.0, 1397.0, 2684.0, 5500.0, 14358.0, 40619.0, 127652.0, 383418.0, 314377.0, 101647.0, 33104.0, 11827.0, 4702.0, 2365.0, 1187.0, 644.0, 410.0, 273.0, 156.0, 100.0, 75.0, 54.0, 37.0, 20.0, 17.0, 12.0, 17.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-20.484375, -19.880126953125, -19.27587890625, -18.671630859375, -18.0673828125, -17.463134765625, -16.85888671875, -16.254638671875, -15.650390625, -15.046142578125, -14.44189453125, -13.837646484375, -13.2333984375, -12.629150390625, -12.02490234375, -11.420654296875, -10.81640625, -10.212158203125, -9.60791015625, -9.003662109375, -8.3994140625, -7.795166015625, -7.19091796875, -6.586669921875, -5.982421875, -5.378173828125, -4.77392578125, -4.169677734375, -3.5654296875, -2.961181640625, -2.35693359375, -1.752685546875, -1.1484375, -0.544189453125, 0.06005859375, 0.664306640625, 1.2685546875, 1.872802734375, 2.47705078125, 3.081298828125, 3.685546875, 4.289794921875, 4.89404296875, 5.498291015625, 6.1025390625, 6.706787109375, 7.31103515625, 7.915283203125, 8.51953125, 9.123779296875, 9.72802734375, 10.332275390625, 10.9365234375, 11.540771484375, 12.14501953125, 12.749267578125, 13.353515625, 13.957763671875, 14.56201171875, 15.166259765625, 15.7705078125, 16.374755859375, 16.97900390625, 17.583251953125, 18.1875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 7.0, 10.0, 23.0, 20.0, 15.0, 33.0, 28.0, 33.0, 43.0, 41.0, 36.0, 42.0, 46.0, 46.0, 53.0, 50.0, 44.0, 48.0, 44.0, 45.0, 41.0, 32.0, 28.0, 18.0, 22.0, 23.0, 20.0, 14.0, 18.0, 10.0, 7.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.3702392578125, -9.045166015625, -8.7200927734375, -8.39501953125, -8.0699462890625, -7.744873046875, -7.4197998046875, -7.0947265625, -6.7696533203125, -6.444580078125, -6.1195068359375, -5.79443359375, -5.4693603515625, -5.144287109375, -4.8192138671875, -4.494140625, -4.1690673828125, -3.843994140625, -3.5189208984375, -3.19384765625, -2.8687744140625, -2.543701171875, -2.2186279296875, -1.8935546875, -1.5684814453125, -1.243408203125, -0.9183349609375, -0.59326171875, -0.2681884765625, 0.056884765625, 0.3819580078125, 0.70703125, 1.0321044921875, 1.357177734375, 1.6822509765625, 2.00732421875, 2.3323974609375, 2.657470703125, 2.9825439453125, 3.3076171875, 3.6326904296875, 3.957763671875, 4.2828369140625, 4.60791015625, 4.9329833984375, 5.258056640625, 5.5831298828125, 5.908203125, 6.2332763671875, 6.558349609375, 6.8834228515625, 7.20849609375, 7.5335693359375, 7.858642578125, 8.1837158203125, 8.5087890625, 8.8338623046875, 9.158935546875, 9.4840087890625, 9.80908203125, 10.1341552734375, 10.459228515625, 10.7843017578125, 11.109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 7.0, 6.0, 8.0, 15.0, 8.0, 30.0, 46.0, 60.0, 161.0, 298.0, 755.0, 2100.0, 8755.0, 55960.0, 504636.0, 419797.0, 45333.0, 7437.0, 1956.0, 611.0, 270.0, 129.0, 63.0, 44.0, 19.0, 16.0, 17.0, 11.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.761474609375, -17.14794921875, -16.534423828125, -15.9208984375, -15.307373046875, -14.69384765625, -14.080322265625, -13.466796875, -12.853271484375, -12.23974609375, -11.626220703125, -11.0126953125, -10.399169921875, -9.78564453125, -9.172119140625, -8.55859375, -7.945068359375, -7.33154296875, -6.718017578125, -6.1044921875, -5.490966796875, -4.87744140625, -4.263916015625, -3.650390625, -3.036865234375, -2.42333984375, -1.809814453125, -1.1962890625, -0.582763671875, 0.03076171875, 0.644287109375, 1.2578125, 1.871337890625, 2.48486328125, 3.098388671875, 3.7119140625, 4.325439453125, 4.93896484375, 5.552490234375, 6.166015625, 6.779541015625, 7.39306640625, 8.006591796875, 8.6201171875, 9.233642578125, 9.84716796875, 10.460693359375, 11.07421875, 11.687744140625, 12.30126953125, 12.914794921875, 13.5283203125, 14.141845703125, 14.75537109375, 15.368896484375, 15.982421875, 16.595947265625, 17.20947265625, 17.822998046875, 18.4365234375, 19.050048828125, 19.66357421875, 20.277099609375, 20.890625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 4.0, 4.0, 7.0, 16.0, 13.0, 21.0, 17.0, 22.0, 34.0, 38.0, 39.0, 52.0, 70.0, 96.0, 83.0, 91.0, 74.0, 56.0, 49.0, 30.0, 40.0, 30.0, 23.0, 17.0, 13.0, 6.0, 4.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0014314651489257812, -0.0013904869556427002, -0.0013495087623596191, -0.001308530569076538, -0.001267552375793457, -0.001226574182510376, -0.001185595989227295, -0.0011446177959442139, -0.0011036396026611328, -0.0010626614093780518, -0.0010216832160949707, -0.0009807050228118896, -0.0009397268295288086, -0.0008987486362457275, -0.0008577704429626465, -0.0008167922496795654, -0.0007758140563964844, -0.0007348358631134033, -0.0006938576698303223, -0.0006528794765472412, -0.0006119012832641602, -0.0005709230899810791, -0.000529944896697998, -0.000488966703414917, -0.00044798851013183594, -0.0004070103168487549, -0.00036603212356567383, -0.0003250539302825928, -0.0002840757369995117, -0.00024309754371643066, -0.0002021193504333496, -0.00016114115715026855, -0.0001201629638671875, -7.918477058410645e-05, -3.820657730102539e-05, 2.771615982055664e-06, 4.374980926513672e-05, 8.472800254821777e-05, 0.00012570619583129883, 0.00016668438911437988, 0.00020766258239746094, 0.000248640775680542, 0.00028961896896362305, 0.0003305971622467041, 0.00037157535552978516, 0.0004125535488128662, 0.00045353174209594727, 0.0004945099353790283, 0.0005354881286621094, 0.0005764663219451904, 0.0006174445152282715, 0.0006584227085113525, 0.0006994009017944336, 0.0007403790950775146, 0.0007813572883605957, 0.0008223354816436768, 0.0008633136749267578, 0.0009042918682098389, 0.0009452700614929199, 0.000986248254776001, 0.001027226448059082, 0.001068204641342163, 0.0011091828346252441, 0.0011501610279083252, 0.0011911392211914062]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 9.0, 17.0, 19.0, 43.0, 52.0, 87.0, 118.0, 221.0, 469.0, 1142.0, 3407.0, 13912.0, 98625.0, 694438.0, 204978.0, 23367.0, 4960.0, 1506.0, 554.0, 263.0, 125.0, 73.0, 63.0, 31.0, 20.0, 12.0, 6.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.2177734375, -23.498046875, -22.7783203125, -22.05859375, -21.3388671875, -20.619140625, -19.8994140625, -19.1796875, -18.4599609375, -17.740234375, -17.0205078125, -16.30078125, -15.5810546875, -14.861328125, -14.1416015625, -13.421875, -12.7021484375, -11.982421875, -11.2626953125, -10.54296875, -9.8232421875, -9.103515625, -8.3837890625, -7.6640625, -6.9443359375, -6.224609375, -5.5048828125, -4.78515625, -4.0654296875, -3.345703125, -2.6259765625, -1.90625, -1.1865234375, -0.466796875, 0.2529296875, 0.97265625, 1.6923828125, 2.412109375, 3.1318359375, 3.8515625, 4.5712890625, 5.291015625, 6.0107421875, 6.73046875, 7.4501953125, 8.169921875, 8.8896484375, 9.609375, 10.3291015625, 11.048828125, 11.7685546875, 12.48828125, 13.2080078125, 13.927734375, 14.6474609375, 15.3671875, 16.0869140625, 16.806640625, 17.5263671875, 18.24609375, 18.9658203125, 19.685546875, 20.4052734375, 21.125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 26.0, 38.0, 66.0, 97.0, 126.0, 132.0, 131.0, 115.0, 74.0, 63.0, 41.0, 26.0, 13.0, 13.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-16.71875, -16.36932373046875, -16.0198974609375, -15.67047119140625, -15.321044921875, -14.97161865234375, -14.6221923828125, -14.27276611328125, -13.92333984375, -13.57391357421875, -13.2244873046875, -12.87506103515625, -12.525634765625, -12.17620849609375, -11.8267822265625, -11.47735595703125, -11.1279296875, -10.77850341796875, -10.4290771484375, -10.07965087890625, -9.730224609375, -9.38079833984375, -9.0313720703125, -8.68194580078125, -8.33251953125, -7.98309326171875, -7.6336669921875, -7.28424072265625, -6.934814453125, -6.58538818359375, -6.2359619140625, -5.88653564453125, -5.537109375, -5.18768310546875, -4.8382568359375, -4.48883056640625, -4.139404296875, -3.78997802734375, -3.4405517578125, -3.09112548828125, -2.74169921875, -2.39227294921875, -2.0428466796875, -1.69342041015625, -1.343994140625, -0.99456787109375, -0.6451416015625, -0.29571533203125, 0.0537109375, 0.40313720703125, 0.7525634765625, 1.10198974609375, 1.451416015625, 1.80084228515625, 2.1502685546875, 2.49969482421875, 2.84912109375, 3.19854736328125, 3.5479736328125, 3.89739990234375, 4.246826171875, 4.59625244140625, 4.9456787109375, 5.29510498046875, 5.64453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 16.0, 27.0, 77.0, 220.0, 328.0, 215.0, 86.0, 31.0, 6.0, 5.0, 2.0, 1.0, 1.0], "bins": [-496.0281982421875, -487.0992431640625, -478.1703186035156, -469.2413635253906, -460.31243896484375, -451.38348388671875, -442.45452880859375, -433.5256042480469, -424.5966491699219, -415.6676940917969, -406.73876953125, -397.809814453125, -388.880859375, -379.9519348144531, -371.0229797363281, -362.09405517578125, -353.16510009765625, -344.23614501953125, -335.3072204589844, -326.3782653808594, -317.4493408203125, -308.5203857421875, -299.5914306640625, -290.6625061035156, -281.7335510253906, -272.8045959472656, -263.87567138671875, -254.94671630859375, -246.0177764892578, -237.08883666992188, -228.15988159179688, -219.23094177246094, -210.30198669433594, -201.373046875, -192.444091796875, -183.51515197753906, -174.58621215820312, -165.6572723388672, -156.72833251953125, -147.79937744140625, -138.8704376220703, -129.94149780273438, -121.0125503540039, -112.08360290527344, -103.1546630859375, -94.22572326660156, -85.2967758178711, -76.36782836914062, -67.43888854980469, -58.509944915771484, -49.58100128173828, -40.65205764770508, -31.723114013671875, -22.794170379638672, -13.865226745605469, -4.936283111572266, 3.9926605224609375, 12.92160415649414, 21.850547790527344, 30.779491424560547, 39.70843505859375, 48.63737869262695, 57.566322326660156, 66.49526977539062, 75.42420959472656]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 9.0, 10.0, 7.0, 10.0, 12.0, 19.0, 20.0, 18.0, 16.0, 26.0, 40.0, 44.0, 41.0, 52.0, 45.0, 49.0, 62.0, 51.0, 51.0, 51.0, 47.0, 36.0, 39.0, 37.0, 43.0, 28.0, 22.0, 22.0, 9.0, 14.0, 15.0, 14.0, 9.0, 4.0, 3.0, 9.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-84.17637634277344, -81.90940856933594, -79.64244842529297, -77.37548065185547, -75.10851287841797, -72.841552734375, -70.5745849609375, -68.3076171875, -66.0406494140625, -63.773685455322266, -61.506717681884766, -59.23975372314453, -56.97278594970703, -54.7058219909668, -52.43885803222656, -50.17189025878906, -47.904930114746094, -45.63796615600586, -43.37099838256836, -41.104034423828125, -38.837066650390625, -36.57010269165039, -34.303138732910156, -32.036170959472656, -29.769207000732422, -27.502241134643555, -25.235275268554688, -22.968311309814453, -20.701345443725586, -18.43437957763672, -16.167415618896484, -13.900449752807617, -11.633476257324219, -9.366510391235352, -7.099545478820801, -4.832580089569092, -2.565614700317383, -0.2986488342285156, 1.9683160781860352, 4.235280990600586, 6.502246856689453, 8.76921272277832, 11.036177635192871, 13.303142547607422, 15.570108413696289, 17.837074279785156, 20.10403823852539, 22.371004104614258, 24.637969970703125, 26.904935836791992, 29.17190170288086, 31.438865661621094, 33.705833435058594, 35.97279739379883, 38.23976135253906, 40.50672912597656, 42.7736930847168, 45.04065704345703, 47.30762481689453, 49.574588775634766, 51.841552734375, 54.1085205078125, 56.375484466552734, 58.64244842529297, 60.90941619873047]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 0.0, 5.0, 4.0, 16.0, 22.0, 31.0, 49.0, 70.0, 130.0, 255.0, 560.0, 1527.0, 5085.0, 25281.0, 387373.0, 3708611.0, 52843.0, 8640.0, 2189.0, 779.0, 346.0, 173.0, 105.0, 60.0, 43.0, 36.0, 12.0, 15.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-60.0625, -58.072265625, -56.08203125, -54.091796875, -52.1015625, -50.111328125, -48.12109375, -46.130859375, -44.140625, -42.150390625, -40.16015625, -38.169921875, -36.1796875, -34.189453125, -32.19921875, -30.208984375, -28.21875, -26.228515625, -24.23828125, -22.248046875, -20.2578125, -18.267578125, -16.27734375, -14.287109375, -12.296875, -10.306640625, -8.31640625, -6.326171875, -4.3359375, -2.345703125, -0.35546875, 1.634765625, 3.625, 5.615234375, 7.60546875, 9.595703125, 11.5859375, 13.576171875, 15.56640625, 17.556640625, 19.546875, 21.537109375, 23.52734375, 25.517578125, 27.5078125, 29.498046875, 31.48828125, 33.478515625, 35.46875, 37.458984375, 39.44921875, 41.439453125, 43.4296875, 45.419921875, 47.41015625, 49.400390625, 51.390625, 53.380859375, 55.37109375, 57.361328125, 59.3515625, 61.341796875, 63.33203125, 65.322265625, 67.3125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 3.0, 2.0, 2.0, 7.0, 10.0, 11.0, 11.0, 26.0, 16.0, 49.0, 39.0, 48.0, 58.0, 66.0, 72.0, 67.0, 65.0, 84.0, 69.0, 69.0, 50.0, 51.0, 27.0, 19.0, 18.0, 11.0, 14.0, 16.0, 6.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.962890625, -2.875946044921875, -2.78900146484375, -2.702056884765625, -2.6151123046875, -2.528167724609375, -2.44122314453125, -2.354278564453125, -2.267333984375, -2.180389404296875, -2.09344482421875, -2.006500244140625, -1.9195556640625, -1.832611083984375, -1.74566650390625, -1.658721923828125, -1.57177734375, -1.484832763671875, -1.39788818359375, -1.310943603515625, -1.2239990234375, -1.137054443359375, -1.05010986328125, -0.963165283203125, -0.876220703125, -0.789276123046875, -0.70233154296875, -0.615386962890625, -0.5284423828125, -0.441497802734375, -0.35455322265625, -0.267608642578125, -0.1806640625, -0.093719482421875, -0.00677490234375, 0.080169677734375, 0.1671142578125, 0.254058837890625, 0.34100341796875, 0.427947998046875, 0.514892578125, 0.601837158203125, 0.68878173828125, 0.775726318359375, 0.8626708984375, 0.949615478515625, 1.03656005859375, 1.123504638671875, 1.21044921875, 1.297393798828125, 1.38433837890625, 1.471282958984375, 1.5582275390625, 1.645172119140625, 1.73211669921875, 1.819061279296875, 1.906005859375, 1.992950439453125, 2.07989501953125, 2.166839599609375, 2.2537841796875, 2.340728759765625, 2.42767333984375, 2.514617919921875, 2.6015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 8.0, 14.0, 20.0, 37.0, 61.0, 94.0, 177.0, 366.0, 769.0, 1862.0, 4734.0, 16425.0, 83836.0, 1416119.0, 2548224.0, 94046.0, 18358.0, 5359.0, 2012.0, 861.0, 406.0, 204.0, 115.0, 85.0, 39.0, 25.0, 16.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.46875, -42.19140625, -40.9140625, -39.63671875, -38.359375, -37.08203125, -35.8046875, -34.52734375, -33.25, -31.97265625, -30.6953125, -29.41796875, -28.140625, -26.86328125, -25.5859375, -24.30859375, -23.03125, -21.75390625, -20.4765625, -19.19921875, -17.921875, -16.64453125, -15.3671875, -14.08984375, -12.8125, -11.53515625, -10.2578125, -8.98046875, -7.703125, -6.42578125, -5.1484375, -3.87109375, -2.59375, -1.31640625, -0.0390625, 1.23828125, 2.515625, 3.79296875, 5.0703125, 6.34765625, 7.625, 8.90234375, 10.1796875, 11.45703125, 12.734375, 14.01171875, 15.2890625, 16.56640625, 17.84375, 19.12109375, 20.3984375, 21.67578125, 22.953125, 24.23046875, 25.5078125, 26.78515625, 28.0625, 29.33984375, 30.6171875, 31.89453125, 33.171875, 34.44921875, 35.7265625, 37.00390625, 38.28125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 1.0, 3.0, 4.0, 12.0, 12.0, 20.0, 25.0, 37.0, 81.0, 125.0, 293.0, 753.0, 1874.0, 412.0, 156.0, 100.0, 54.0, 45.0, 14.0, 17.0, 12.0, 8.0, 3.0, 8.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.4552001953125, -9.152587890625, -8.8499755859375, -8.54736328125, -8.2447509765625, -7.942138671875, -7.6395263671875, -7.3369140625, -7.0343017578125, -6.731689453125, -6.4290771484375, -6.12646484375, -5.8238525390625, -5.521240234375, -5.2186279296875, -4.916015625, -4.6134033203125, -4.310791015625, -4.0081787109375, -3.70556640625, -3.4029541015625, -3.100341796875, -2.7977294921875, -2.4951171875, -2.1925048828125, -1.889892578125, -1.5872802734375, -1.28466796875, -0.9820556640625, -0.679443359375, -0.3768310546875, -0.07421875, 0.2283935546875, 0.531005859375, 0.8336181640625, 1.13623046875, 1.4388427734375, 1.741455078125, 2.0440673828125, 2.3466796875, 2.6492919921875, 2.951904296875, 3.2545166015625, 3.55712890625, 3.8597412109375, 4.162353515625, 4.4649658203125, 4.767578125, 5.0701904296875, 5.372802734375, 5.6754150390625, 5.97802734375, 6.2806396484375, 6.583251953125, 6.8858642578125, 7.1884765625, 7.4910888671875, 7.793701171875, 8.0963134765625, 8.39892578125, 8.7015380859375, 9.004150390625, 9.3067626953125, 9.609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 14.0, 17.0, 28.0, 51.0, 70.0, 118.0, 163.0, 167.0, 132.0, 112.0, 53.0, 31.0, 23.0, 11.0, 8.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.6428451538086, -69.5374755859375, -67.4321060180664, -65.32673645019531, -63.22136306762695, -61.11599349975586, -59.010623931884766, -56.90525436401367, -54.79988098144531, -52.69451141357422, -50.589141845703125, -48.48377227783203, -46.37839889526367, -44.27302932739258, -42.167659759521484, -40.06229019165039, -37.9569206237793, -35.8515510559082, -33.74618148803711, -31.640810012817383, -29.535438537597656, -27.430068969726562, -25.32469940185547, -23.219329833984375, -21.11395835876465, -19.008588790893555, -16.903217315673828, -14.797847747802734, -12.692477226257324, -10.587106704711914, -8.48173713684082, -6.37636661529541, -4.270992279052734, -2.1656219959259033, -0.060251712799072266, 2.0451183319091797, 4.15048885345459, 6.255859375, 8.361228942871094, 10.466599464416504, 12.571969985961914, 14.677340507507324, 16.782711029052734, 18.888080596923828, 20.993450164794922, 23.09882164001465, 25.204191207885742, 27.30956268310547, 29.414932250976562, 31.520301818847656, 33.62567138671875, 35.731040954589844, 37.8364143371582, 39.9417839050293, 42.04715347290039, 44.152523040771484, 46.257896423339844, 48.36326599121094, 50.46863555908203, 52.574005126953125, 54.679378509521484, 56.78474807739258, 58.89011764526367, 60.995487213134766, 63.10085678100586]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 14.0, 6.0, 18.0, 37.0, 30.0, 43.0, 73.0, 71.0, 98.0, 83.0, 94.0, 98.0, 74.0, 59.0, 57.0, 39.0, 42.0, 27.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.262306213378906, -30.87497329711914, -29.487640380859375, -28.100309371948242, -26.712976455688477, -25.32564353942871, -23.938312530517578, -22.550979614257812, -21.163646697998047, -19.77631378173828, -18.388980865478516, -17.001649856567383, -15.614316940307617, -14.226984024047852, -12.839652061462402, -11.452320098876953, -10.064987182617188, -8.677654266357422, -7.290322303771973, -5.902989864349365, -4.515657424926758, -3.1283249855041504, -1.740992546081543, -0.35366058349609375, 1.0336723327636719, 2.4210047721862793, 3.8083372116088867, 5.195669651031494, 6.583002090454102, 7.970334529876709, 9.357666969299316, 10.744998931884766, 12.132331848144531, 13.519664764404297, 14.906996726989746, 16.294328689575195, 17.68166160583496, 19.068994522094727, 20.45632553100586, 21.843658447265625, 23.23099136352539, 24.618324279785156, 26.005657196044922, 27.392988204956055, 28.78032112121582, 30.167654037475586, 31.55498504638672, 32.942317962646484, 34.32965087890625, 35.716983795166016, 37.10431671142578, 38.49164962768555, 39.87898254394531, 41.26631164550781, 42.65364456176758, 44.040977478027344, 45.42831039428711, 46.815643310546875, 48.20297622680664, 49.590309143066406, 50.977638244628906, 52.36497116088867, 53.75230407714844, 55.1396369934082, 56.52696990966797]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 8.0, 7.0, 16.0, 16.0, 21.0, 35.0, 29.0, 56.0, 71.0, 96.0, 163.0, 219.0, 364.0, 643.0, 1160.0, 2351.0, 5808.0, 19027.0, 71520.0, 265729.0, 447576.0, 169658.0, 43502.0, 12206.0, 4087.0, 1781.0, 966.0, 503.0, 335.0, 187.0, 126.0, 77.0, 51.0, 40.0, 32.0, 19.0, 16.0, 16.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.375, -20.713623046875, -20.05224609375, -19.390869140625, -18.7294921875, -18.068115234375, -17.40673828125, -16.745361328125, -16.083984375, -15.422607421875, -14.76123046875, -14.099853515625, -13.4384765625, -12.777099609375, -12.11572265625, -11.454345703125, -10.79296875, -10.131591796875, -9.47021484375, -8.808837890625, -8.1474609375, -7.486083984375, -6.82470703125, -6.163330078125, -5.501953125, -4.840576171875, -4.17919921875, -3.517822265625, -2.8564453125, -2.195068359375, -1.53369140625, -0.872314453125, -0.2109375, 0.450439453125, 1.11181640625, 1.773193359375, 2.4345703125, 3.095947265625, 3.75732421875, 4.418701171875, 5.080078125, 5.741455078125, 6.40283203125, 7.064208984375, 7.7255859375, 8.386962890625, 9.04833984375, 9.709716796875, 10.37109375, 11.032470703125, 11.69384765625, 12.355224609375, 13.0166015625, 13.677978515625, 14.33935546875, 15.000732421875, 15.662109375, 16.323486328125, 16.98486328125, 17.646240234375, 18.3076171875, 18.968994140625, 19.63037109375, 20.291748046875, 20.953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 1.0, 5.0, 7.0, 14.0, 18.0, 22.0, 53.0, 43.0, 70.0, 80.0, 100.0, 98.0, 102.0, 95.0, 77.0, 52.0, 47.0, 40.0, 23.0, 18.0, 12.0, 8.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.822265625, -2.703460693359375, -2.58465576171875, -2.465850830078125, -2.3470458984375, -2.228240966796875, -2.10943603515625, -1.990631103515625, -1.871826171875, -1.753021240234375, -1.63421630859375, -1.515411376953125, -1.3966064453125, -1.277801513671875, -1.15899658203125, -1.040191650390625, -0.92138671875, -0.802581787109375, -0.68377685546875, -0.564971923828125, -0.4461669921875, -0.327362060546875, -0.20855712890625, -0.089752197265625, 0.029052734375, 0.147857666015625, 0.26666259765625, 0.385467529296875, 0.5042724609375, 0.623077392578125, 0.74188232421875, 0.860687255859375, 0.9794921875, 1.098297119140625, 1.21710205078125, 1.335906982421875, 1.4547119140625, 1.573516845703125, 1.69232177734375, 1.811126708984375, 1.929931640625, 2.048736572265625, 2.16754150390625, 2.286346435546875, 2.4051513671875, 2.523956298828125, 2.64276123046875, 2.761566162109375, 2.88037109375, 2.999176025390625, 3.11798095703125, 3.236785888671875, 3.3555908203125, 3.474395751953125, 3.59320068359375, 3.712005615234375, 3.830810546875, 3.949615478515625, 4.06842041015625, 4.187225341796875, 4.3060302734375, 4.424835205078125, 4.54364013671875, 4.662445068359375, 4.78125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 10.0, 12.0, 4.0, 8.0, 21.0, 22.0, 28.0, 43.0, 63.0, 68.0, 117.0, 163.0, 238.0, 338.0, 482.0, 821.0, 1497.0, 2928.0, 6018.0, 13807.0, 32886.0, 80919.0, 184810.0, 298212.0, 233529.0, 111256.0, 45316.0, 18408.0, 7966.0, 3731.0, 1870.0, 1024.0, 621.0, 381.0, 256.0, 213.0, 125.0, 93.0, 57.0, 52.0, 33.0, 33.0, 20.0, 16.0, 16.0, 11.0, 4.0, 4.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.44091796875, -10.1005859375, -9.76025390625, -9.419921875, -9.07958984375, -8.7392578125, -8.39892578125, -8.05859375, -7.71826171875, -7.3779296875, -7.03759765625, -6.697265625, -6.35693359375, -6.0166015625, -5.67626953125, -5.3359375, -4.99560546875, -4.6552734375, -4.31494140625, -3.974609375, -3.63427734375, -3.2939453125, -2.95361328125, -2.61328125, -2.27294921875, -1.9326171875, -1.59228515625, -1.251953125, -0.91162109375, -0.5712890625, -0.23095703125, 0.109375, 0.44970703125, 0.7900390625, 1.13037109375, 1.470703125, 1.81103515625, 2.1513671875, 2.49169921875, 2.83203125, 3.17236328125, 3.5126953125, 3.85302734375, 4.193359375, 4.53369140625, 4.8740234375, 5.21435546875, 5.5546875, 5.89501953125, 6.2353515625, 6.57568359375, 6.916015625, 7.25634765625, 7.5966796875, 7.93701171875, 8.27734375, 8.61767578125, 8.9580078125, 9.29833984375, 9.638671875, 9.97900390625, 10.3193359375, 10.65966796875, 11.0]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 6.0, 14.0, 11.0, 11.0, 17.0, 16.0, 34.0, 30.0, 29.0, 42.0, 30.0, 37.0, 40.0, 42.0, 49.0, 47.0, 44.0, 38.0, 43.0, 36.0, 34.0, 33.0, 47.0, 49.0, 27.0, 30.0, 24.0, 27.0, 25.0, 9.0, 8.0, 8.0, 10.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-9.0703125, -8.8079833984375, -8.545654296875, -8.2833251953125, -8.02099609375, -7.7586669921875, -7.496337890625, -7.2340087890625, -6.9716796875, -6.7093505859375, -6.447021484375, -6.1846923828125, -5.92236328125, -5.6600341796875, -5.397705078125, -5.1353759765625, -4.873046875, -4.6107177734375, -4.348388671875, -4.0860595703125, -3.82373046875, -3.5614013671875, -3.299072265625, -3.0367431640625, -2.7744140625, -2.5120849609375, -2.249755859375, -1.9874267578125, -1.72509765625, -1.4627685546875, -1.200439453125, -0.9381103515625, -0.67578125, -0.4134521484375, -0.151123046875, 0.1112060546875, 0.37353515625, 0.6358642578125, 0.898193359375, 1.1605224609375, 1.4228515625, 1.6851806640625, 1.947509765625, 2.2098388671875, 2.47216796875, 2.7344970703125, 2.996826171875, 3.2591552734375, 3.521484375, 3.7838134765625, 4.046142578125, 4.3084716796875, 4.57080078125, 4.8331298828125, 5.095458984375, 5.3577880859375, 5.6201171875, 5.8824462890625, 6.144775390625, 6.4071044921875, 6.66943359375, 6.9317626953125, 7.194091796875, 7.4564208984375, 7.71875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 14.0, 15.0, 13.0, 19.0, 31.0, 72.0, 104.0, 155.0, 210.0, 351.0, 641.0, 1199.0, 2685.0, 6208.0, 16692.0, 46269.0, 126360.0, 277033.0, 312074.0, 161155.0, 60854.0, 21627.0, 8199.0, 3138.0, 1522.0, 756.0, 394.0, 242.0, 158.0, 103.0, 72.0, 42.0, 43.0, 31.0, 10.0, 13.0, 11.0, 6.0, 6.0, 8.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.45306396484375, -4.2889404296875, -4.12481689453125, -3.960693359375, -3.79656982421875, -3.6324462890625, -3.46832275390625, -3.30419921875, -3.14007568359375, -2.9759521484375, -2.81182861328125, -2.647705078125, -2.48358154296875, -2.3194580078125, -2.15533447265625, -1.9912109375, -1.82708740234375, -1.6629638671875, -1.49884033203125, -1.334716796875, -1.17059326171875, -1.0064697265625, -0.84234619140625, -0.67822265625, -0.51409912109375, -0.3499755859375, -0.18585205078125, -0.021728515625, 0.14239501953125, 0.3065185546875, 0.47064208984375, 0.634765625, 0.79888916015625, 0.9630126953125, 1.12713623046875, 1.291259765625, 1.45538330078125, 1.6195068359375, 1.78363037109375, 1.94775390625, 2.11187744140625, 2.2760009765625, 2.44012451171875, 2.604248046875, 2.76837158203125, 2.9324951171875, 3.09661865234375, 3.2607421875, 3.42486572265625, 3.5889892578125, 3.75311279296875, 3.917236328125, 4.08135986328125, 4.2454833984375, 4.40960693359375, 4.57373046875, 4.73785400390625, 4.9019775390625, 5.06610107421875, 5.230224609375, 5.39434814453125, 5.5584716796875, 5.72259521484375, 5.88671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 5.0, 5.0, 9.0, 6.0, 7.0, 8.0, 15.0, 14.0, 21.0, 25.0, 29.0, 47.0, 56.0, 67.0, 67.0, 93.0, 105.0, 77.0, 71.0, 38.0, 54.0, 36.0, 24.0, 21.0, 21.0, 12.0, 10.0, 17.0, 8.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009593963623046875, -0.0009296610951423645, -0.0008999258279800415, -0.0008701905608177185, -0.0008404552936553955, -0.0008107200264930725, -0.0007809847593307495, -0.0007512494921684265, -0.0007215142250061035, -0.0006917789578437805, -0.0006620436906814575, -0.0006323084235191345, -0.0006025731563568115, -0.0005728378891944885, -0.0005431026220321655, -0.0005133673548698425, -0.00048363208770751953, -0.00045389682054519653, -0.00042416155338287354, -0.00039442628622055054, -0.00036469101905822754, -0.00033495575189590454, -0.00030522048473358154, -0.00027548521757125854, -0.00024574995040893555, -0.00021601468324661255, -0.00018627941608428955, -0.00015654414892196655, -0.00012680888175964355, -9.707361459732056e-05, -6.733834743499756e-05, -3.760308027267456e-05, -7.867813110351562e-06, 2.1867454051971436e-05, 5.1602721214294434e-05, 8.133798837661743e-05, 0.00011107325553894043, 0.00014080852270126343, 0.00017054378986358643, 0.00020027905702590942, 0.00023001432418823242, 0.0002597495913505554, 0.0002894848585128784, 0.0003192201256752014, 0.0003489553928375244, 0.0003786906599998474, 0.0004084259271621704, 0.0004381611943244934, 0.0004678964614868164, 0.0004976317286491394, 0.0005273669958114624, 0.0005571022629737854, 0.0005868375301361084, 0.0006165727972984314, 0.0006463080644607544, 0.0006760433316230774, 0.0007057785987854004, 0.0007355138659477234, 0.0007652491331100464, 0.0007949844002723694, 0.0008247196674346924, 0.0008544549345970154, 0.0008841902017593384, 0.0009139254689216614, 0.0009436607360839844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 8.0, 5.0, 13.0, 15.0, 19.0, 27.0, 30.0, 54.0, 67.0, 95.0, 153.0, 186.0, 309.0, 477.0, 812.0, 1501.0, 2830.0, 5980.0, 13732.0, 35468.0, 95553.0, 232597.0, 326363.0, 201221.0, 79209.0, 29236.0, 11534.0, 5031.0, 2453.0, 1363.0, 788.0, 469.0, 299.0, 173.0, 141.0, 123.0, 54.0, 48.0, 27.0, 21.0, 17.0, 14.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 5.0, 0.0, 1.0, 1.0], "bins": [-5.33203125, -5.16748046875, -5.0029296875, -4.83837890625, -4.673828125, -4.50927734375, -4.3447265625, -4.18017578125, -4.015625, -3.85107421875, -3.6865234375, -3.52197265625, -3.357421875, -3.19287109375, -3.0283203125, -2.86376953125, -2.69921875, -2.53466796875, -2.3701171875, -2.20556640625, -2.041015625, -1.87646484375, -1.7119140625, -1.54736328125, -1.3828125, -1.21826171875, -1.0537109375, -0.88916015625, -0.724609375, -0.56005859375, -0.3955078125, -0.23095703125, -0.06640625, 0.09814453125, 0.2626953125, 0.42724609375, 0.591796875, 0.75634765625, 0.9208984375, 1.08544921875, 1.25, 1.41455078125, 1.5791015625, 1.74365234375, 1.908203125, 2.07275390625, 2.2373046875, 2.40185546875, 2.56640625, 2.73095703125, 2.8955078125, 3.06005859375, 3.224609375, 3.38916015625, 3.5537109375, 3.71826171875, 3.8828125, 4.04736328125, 4.2119140625, 4.37646484375, 4.541015625, 4.70556640625, 4.8701171875, 5.03466796875, 5.19921875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 8.0, 13.0, 7.0, 17.0, 14.0, 21.0, 21.0, 35.0, 27.0, 34.0, 33.0, 35.0, 48.0, 50.0, 60.0, 76.0, 68.0, 57.0, 54.0, 55.0, 54.0, 48.0, 20.0, 26.0, 26.0, 13.0, 18.0, 17.0, 13.0, 4.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.48046875, -3.374359130859375, -3.26824951171875, -3.162139892578125, -3.0560302734375, -2.949920654296875, -2.84381103515625, -2.737701416015625, -2.631591796875, -2.525482177734375, -2.41937255859375, -2.313262939453125, -2.2071533203125, -2.101043701171875, -1.99493408203125, -1.888824462890625, -1.78271484375, -1.676605224609375, -1.57049560546875, -1.464385986328125, -1.3582763671875, -1.252166748046875, -1.14605712890625, -1.039947509765625, -0.933837890625, -0.827728271484375, -0.72161865234375, -0.615509033203125, -0.5093994140625, -0.403289794921875, -0.29718017578125, -0.191070556640625, -0.0849609375, 0.021148681640625, 0.12725830078125, 0.233367919921875, 0.3394775390625, 0.445587158203125, 0.55169677734375, 0.657806396484375, 0.763916015625, 0.870025634765625, 0.97613525390625, 1.082244873046875, 1.1883544921875, 1.294464111328125, 1.40057373046875, 1.506683349609375, 1.61279296875, 1.718902587890625, 1.82501220703125, 1.931121826171875, 2.0372314453125, 2.143341064453125, 2.24945068359375, 2.355560302734375, 2.461669921875, 2.567779541015625, 2.67388916015625, 2.779998779296875, 2.8861083984375, 2.992218017578125, 3.09832763671875, 3.204437255859375, 3.310546875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 16.0, 33.0, 50.0, 59.0, 130.0, 128.0, 143.0, 133.0, 98.0, 73.0, 47.0, 27.0, 21.0, 17.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.74972534179688, -70.46208190917969, -67.1744384765625, -63.88679885864258, -60.599159240722656, -57.31151580810547, -54.02387237548828, -50.736228942871094, -47.44858932495117, -44.160945892333984, -40.87330627441406, -37.585662841796875, -34.29801940917969, -31.010379791259766, -27.722736358642578, -24.435094833374023, -21.14745330810547, -17.859811782836914, -14.572169303894043, -11.284526824951172, -7.996885299682617, -4.7092437744140625, -1.421600341796875, 1.8660411834716797, 5.153682708740234, 8.441324234008789, 11.72896671295166, 15.016609191894531, 18.304250717163086, 21.59189224243164, 24.879535675048828, 28.167177200317383, 31.454818725585938, 34.742462158203125, 38.03010177612305, 41.317745208740234, 44.605384826660156, 47.893028259277344, 51.18067169189453, 54.46831512451172, 57.75595474243164, 61.04359817504883, 64.33123779296875, 67.61888122558594, 70.90652465820312, 74.19416809082031, 77.4818115234375, 80.76944732666016, 84.05709075927734, 87.34473419189453, 90.63237762451172, 93.92001342773438, 97.20765686035156, 100.49530029296875, 103.78294372558594, 107.07058715820312, 110.35823059082031, 113.6458740234375, 116.93351745605469, 120.22116088867188, 123.50879669189453, 126.79644012451172, 130.08407592773438, 133.37171936035156, 136.65936279296875]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 7.0, 14.0, 21.0, 23.0, 22.0, 38.0, 23.0, 41.0, 40.0, 46.0, 63.0, 59.0, 66.0, 71.0, 70.0, 42.0, 51.0, 49.0, 54.0, 42.0, 29.0, 30.0, 22.0, 19.0, 13.0, 12.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.11974334716797, -67.11236572265625, -65.10498046875, -63.09760284423828, -61.0902214050293, -59.08283996582031, -57.075462341308594, -55.06808090209961, -53.060699462890625, -51.05331802368164, -49.04594039916992, -47.03855895996094, -45.03117752075195, -43.02379608154297, -41.01641845703125, -39.009037017822266, -37.00165939331055, -34.99427795410156, -32.986900329589844, -30.97951889038086, -28.972137451171875, -26.964757919311523, -24.957378387451172, -22.949996948242188, -20.942617416381836, -18.935237884521484, -16.9278564453125, -14.920476913452148, -12.91309642791748, -10.905715942382812, -8.898336410522461, -6.890955924987793, -4.883579254150391, -2.8761990070343018, -0.8688187599182129, 1.1385612487792969, 3.145941734313965, 5.153322219848633, 7.160701751708984, 9.168082237243652, 11.17546272277832, 13.182843208312988, 15.190223693847656, 17.197603225708008, 19.20498275756836, 21.212364196777344, 23.219743728637695, 25.227123260498047, 27.23450469970703, 29.241884231567383, 31.249265670776367, 33.25664520263672, 35.2640266418457, 37.27140808105469, 39.278785705566406, 41.28616714477539, 43.293548583984375, 45.30093002319336, 47.30830764770508, 49.31568908691406, 51.32307052612305, 53.33045196533203, 55.33782958984375, 57.345211029052734, 59.35258865356445]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 14.0, 21.0, 24.0, 42.0, 52.0, 90.0, 138.0, 182.0, 343.0, 653.0, 1317.0, 3203.0, 9775.0, 41473.0, 537638.0, 3511248.0, 67167.0, 13597.0, 3940.0, 1550.0, 692.0, 397.0, 248.0, 130.0, 87.0, 49.0, 61.0, 30.0, 13.0, 29.0, 13.0, 10.0, 8.0, 13.0, 4.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-32.0625, -30.9619140625, -29.861328125, -28.7607421875, -27.66015625, -26.5595703125, -25.458984375, -24.3583984375, -23.2578125, -22.1572265625, -21.056640625, -19.9560546875, -18.85546875, -17.7548828125, -16.654296875, -15.5537109375, -14.453125, -13.3525390625, -12.251953125, -11.1513671875, -10.05078125, -8.9501953125, -7.849609375, -6.7490234375, -5.6484375, -4.5478515625, -3.447265625, -2.3466796875, -1.24609375, -0.1455078125, 0.955078125, 2.0556640625, 3.15625, 4.2568359375, 5.357421875, 6.4580078125, 7.55859375, 8.6591796875, 9.759765625, 10.8603515625, 11.9609375, 13.0615234375, 14.162109375, 15.2626953125, 16.36328125, 17.4638671875, 18.564453125, 19.6650390625, 20.765625, 21.8662109375, 22.966796875, 24.0673828125, 25.16796875, 26.2685546875, 27.369140625, 28.4697265625, 29.5703125, 30.6708984375, 31.771484375, 32.8720703125, 33.97265625, 35.0732421875, 36.173828125, 37.2744140625, 38.375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 12.0, 15.0, 19.0, 19.0, 32.0, 47.0, 47.0, 53.0, 61.0, 72.0, 73.0, 76.0, 82.0, 66.0, 64.0, 58.0, 56.0, 35.0, 32.0, 16.0, 16.0, 12.0, 8.0, 5.0, 1.0, 1.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.50079345703125, -2.4019775390625, -2.30316162109375, -2.204345703125, -2.10552978515625, -2.0067138671875, -1.90789794921875, -1.80908203125, -1.71026611328125, -1.6114501953125, -1.51263427734375, -1.413818359375, -1.31500244140625, -1.2161865234375, -1.11737060546875, -1.0185546875, -0.91973876953125, -0.8209228515625, -0.72210693359375, -0.623291015625, -0.52447509765625, -0.4256591796875, -0.32684326171875, -0.22802734375, -0.12921142578125, -0.0303955078125, 0.06842041015625, 0.167236328125, 0.26605224609375, 0.3648681640625, 0.46368408203125, 0.5625, 0.66131591796875, 0.7601318359375, 0.85894775390625, 0.957763671875, 1.05657958984375, 1.1553955078125, 1.25421142578125, 1.35302734375, 1.45184326171875, 1.5506591796875, 1.64947509765625, 1.748291015625, 1.84710693359375, 1.9459228515625, 2.04473876953125, 2.1435546875, 2.24237060546875, 2.3411865234375, 2.44000244140625, 2.538818359375, 2.63763427734375, 2.7364501953125, 2.83526611328125, 2.93408203125, 3.03289794921875, 3.1317138671875, 3.23052978515625, 3.329345703125, 3.42816162109375, 3.5269775390625, 3.62579345703125, 3.724609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 9.0, 6.0, 10.0, 11.0, 25.0, 21.0, 41.0, 42.0, 80.0, 88.0, 127.0, 177.0, 292.0, 532.0, 936.0, 1788.0, 3959.0, 10021.0, 32929.0, 144125.0, 2583833.0, 1250510.0, 120739.0, 28459.0, 8825.0, 3380.0, 1503.0, 709.0, 389.0, 223.0, 157.0, 107.0, 75.0, 38.0, 38.0, 20.0, 22.0, 10.0, 9.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.53125, -18.8564453125, -18.181640625, -17.5068359375, -16.83203125, -16.1572265625, -15.482421875, -14.8076171875, -14.1328125, -13.4580078125, -12.783203125, -12.1083984375, -11.43359375, -10.7587890625, -10.083984375, -9.4091796875, -8.734375, -8.0595703125, -7.384765625, -6.7099609375, -6.03515625, -5.3603515625, -4.685546875, -4.0107421875, -3.3359375, -2.6611328125, -1.986328125, -1.3115234375, -0.63671875, 0.0380859375, 0.712890625, 1.3876953125, 2.0625, 2.7373046875, 3.412109375, 4.0869140625, 4.76171875, 5.4365234375, 6.111328125, 6.7861328125, 7.4609375, 8.1357421875, 8.810546875, 9.4853515625, 10.16015625, 10.8349609375, 11.509765625, 12.1845703125, 12.859375, 13.5341796875, 14.208984375, 14.8837890625, 15.55859375, 16.2333984375, 16.908203125, 17.5830078125, 18.2578125, 18.9326171875, 19.607421875, 20.2822265625, 20.95703125, 21.6318359375, 22.306640625, 22.9814453125, 23.65625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 8.0, 17.0, 20.0, 32.0, 50.0, 91.0, 175.0, 399.0, 1880.0, 791.0, 264.0, 139.0, 79.0, 54.0, 28.0, 22.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.21063232421875, -9.9603271484375, -9.71002197265625, -9.459716796875, -9.20941162109375, -8.9591064453125, -8.70880126953125, -8.45849609375, -8.20819091796875, -7.9578857421875, -7.70758056640625, -7.457275390625, -7.20697021484375, -6.9566650390625, -6.70635986328125, -6.4560546875, -6.20574951171875, -5.9554443359375, -5.70513916015625, -5.454833984375, -5.20452880859375, -4.9542236328125, -4.70391845703125, -4.45361328125, -4.20330810546875, -3.9530029296875, -3.70269775390625, -3.452392578125, -3.20208740234375, -2.9517822265625, -2.70147705078125, -2.451171875, -2.20086669921875, -1.9505615234375, -1.70025634765625, -1.449951171875, -1.19964599609375, -0.9493408203125, -0.69903564453125, -0.44873046875, -0.19842529296875, 0.0518798828125, 0.30218505859375, 0.552490234375, 0.80279541015625, 1.0531005859375, 1.30340576171875, 1.5537109375, 1.80401611328125, 2.0543212890625, 2.30462646484375, 2.554931640625, 2.80523681640625, 3.0555419921875, 3.30584716796875, 3.55615234375, 3.80645751953125, 4.0567626953125, 4.30706787109375, 4.557373046875, 4.80767822265625, 5.0579833984375, 5.30828857421875, 5.55859375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 7.0, 18.0, 11.0, 29.0, 25.0, 43.0, 46.0, 93.0, 100.0, 117.0, 105.0, 97.0, 100.0, 65.0, 47.0, 39.0, 21.0, 11.0, 11.0, 4.0, 3.0, 0.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.752973556518555, -27.701313018798828, -26.649654388427734, -25.597993850708008, -24.54633331298828, -23.494674682617188, -22.44301414489746, -21.391353607177734, -20.33969497680664, -19.288034439086914, -18.23637580871582, -17.184715270996094, -16.133054733276367, -15.081395149230957, -14.029735565185547, -12.97807502746582, -11.926414489746094, -10.874754905700684, -9.823094367980957, -8.771434783935547, -7.7197747230529785, -6.66811466217041, -5.616455078125, -4.564795017242432, -3.5131349563598633, -2.461474895477295, -1.4098150730133057, -0.3581552505493164, 0.693504810333252, 1.7451648712158203, 2.7968244552612305, 3.848484516143799, 4.900142669677734, 5.951802730560303, 7.003462791442871, 8.055122375488281, 9.106782913208008, 10.158442497253418, 11.210102081298828, 12.261762619018555, 13.313422203063965, 14.365081787109375, 15.416742324829102, 16.468402862548828, 17.520061492919922, 18.57172203063965, 19.623382568359375, 20.67504119873047, 21.726701736450195, 22.778362274169922, 23.830020904541016, 24.881681442260742, 25.93334197998047, 26.985000610351562, 28.03666114807129, 29.088321685791016, 30.13998031616211, 31.191640853881836, 32.24330139160156, 33.294960021972656, 34.34661865234375, 35.39828109741211, 36.4499397277832, 37.5015983581543, 38.553260803222656]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 14.0, 5.0, 12.0, 8.0, 14.0, 11.0, 12.0, 13.0, 10.0, 12.0, 20.0, 22.0, 16.0, 34.0, 36.0, 23.0, 18.0, 33.0, 40.0, 26.0, 33.0, 54.0, 41.0, 37.0, 30.0, 42.0, 38.0, 30.0, 31.0, 29.0, 30.0, 23.0, 31.0, 41.0, 15.0, 16.0, 16.0, 16.0, 12.0, 13.0, 10.0, 7.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.96296501159668, -15.47378921508789, -14.984614372253418, -14.495438575744629, -14.00626277923584, -13.517087936401367, -13.027912139892578, -12.538736343383789, -12.049560546875, -11.560384750366211, -11.071209907531738, -10.58203411102295, -10.09285831451416, -9.603683471679688, -9.114507675170898, -8.62533187866211, -8.136157035827637, -7.646981716156006, -7.157805919647217, -6.668630599975586, -6.179454803466797, -5.690279483795166, -5.201104164123535, -4.711928367614746, -4.222753047943115, -3.7335774898529053, -3.2444019317626953, -2.7552266120910645, -2.2660510540008545, -1.7768754959106445, -1.2877001762390137, -0.7985246181488037, -0.30934810638427734, 0.17982739210128784, 0.669002890586853, 1.1581783294677734, 1.6473538875579834, 2.1365294456481934, 2.625704765319824, 3.114880323410034, 3.604055881500244, 4.093231201171875, 4.582406997680664, 5.071582317352295, 5.560757637023926, 6.049933433532715, 6.539108753204346, 7.028284072875977, 7.517459869384766, 8.006635665893555, 8.495810508728027, 8.984986305236816, 9.474162101745605, 9.963336944580078, 10.452512741088867, 10.941688537597656, 11.430864334106445, 11.920040130615234, 12.409214973449707, 12.898390769958496, 13.387566566467285, 13.876741409301758, 14.365917205810547, 14.855093002319336, 15.344267845153809]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 13.0, 14.0, 24.0, 29.0, 29.0, 40.0, 48.0, 53.0, 97.0, 137.0, 221.0, 329.0, 596.0, 1049.0, 2310.0, 5913.0, 18109.0, 67582.0, 271669.0, 469183.0, 153685.0, 38502.0, 11209.0, 3882.0, 1663.0, 803.0, 439.0, 285.0, 205.0, 117.0, 83.0, 52.0, 41.0, 33.0, 33.0, 22.0, 14.0, 7.0, 7.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.056640625, -19.39453125, -18.732421875, -18.0703125, -17.408203125, -16.74609375, -16.083984375, -15.421875, -14.759765625, -14.09765625, -13.435546875, -12.7734375, -12.111328125, -11.44921875, -10.787109375, -10.125, -9.462890625, -8.80078125, -8.138671875, -7.4765625, -6.814453125, -6.15234375, -5.490234375, -4.828125, -4.166015625, -3.50390625, -2.841796875, -2.1796875, -1.517578125, -0.85546875, -0.193359375, 0.46875, 1.130859375, 1.79296875, 2.455078125, 3.1171875, 3.779296875, 4.44140625, 5.103515625, 5.765625, 6.427734375, 7.08984375, 7.751953125, 8.4140625, 9.076171875, 9.73828125, 10.400390625, 11.0625, 11.724609375, 12.38671875, 13.048828125, 13.7109375, 14.373046875, 15.03515625, 15.697265625, 16.359375, 17.021484375, 17.68359375, 18.345703125, 19.0078125, 19.669921875, 20.33203125, 20.994140625, 21.65625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 19.0, 19.0, 19.0, 41.0, 51.0, 51.0, 47.0, 71.0, 89.0, 83.0, 86.0, 79.0, 72.0, 78.0, 46.0, 35.0, 35.0, 24.0, 19.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.330078125, -3.21856689453125, -3.1070556640625, -2.99554443359375, -2.884033203125, -2.77252197265625, -2.6610107421875, -2.54949951171875, -2.43798828125, -2.32647705078125, -2.2149658203125, -2.10345458984375, -1.991943359375, -1.88043212890625, -1.7689208984375, -1.65740966796875, -1.5458984375, -1.43438720703125, -1.3228759765625, -1.21136474609375, -1.099853515625, -0.98834228515625, -0.8768310546875, -0.76531982421875, -0.65380859375, -0.54229736328125, -0.4307861328125, -0.31927490234375, -0.207763671875, -0.09625244140625, 0.0152587890625, 0.12677001953125, 0.23828125, 0.34979248046875, 0.4613037109375, 0.57281494140625, 0.684326171875, 0.79583740234375, 0.9073486328125, 1.01885986328125, 1.13037109375, 1.24188232421875, 1.3533935546875, 1.46490478515625, 1.576416015625, 1.68792724609375, 1.7994384765625, 1.91094970703125, 2.0224609375, 2.13397216796875, 2.2454833984375, 2.35699462890625, 2.468505859375, 2.58001708984375, 2.6915283203125, 2.80303955078125, 2.91455078125, 3.02606201171875, 3.1375732421875, 3.24908447265625, 3.360595703125, 3.47210693359375, 3.5836181640625, 3.69512939453125, 3.806640625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 12.0, 11.0, 11.0, 19.0, 33.0, 42.0, 60.0, 68.0, 111.0, 167.0, 232.0, 338.0, 482.0, 760.0, 1352.0, 2387.0, 4731.0, 9774.0, 22522.0, 52419.0, 122348.0, 246607.0, 291300.0, 161688.0, 73082.0, 30936.0, 13238.0, 6180.0, 3110.0, 1647.0, 1010.0, 647.0, 399.0, 254.0, 153.0, 105.0, 81.0, 72.0, 42.0, 39.0, 23.0, 18.0, 9.0, 5.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-9.421875, -9.129150390625, -8.83642578125, -8.543701171875, -8.2509765625, -7.958251953125, -7.66552734375, -7.372802734375, -7.080078125, -6.787353515625, -6.49462890625, -6.201904296875, -5.9091796875, -5.616455078125, -5.32373046875, -5.031005859375, -4.73828125, -4.445556640625, -4.15283203125, -3.860107421875, -3.5673828125, -3.274658203125, -2.98193359375, -2.689208984375, -2.396484375, -2.103759765625, -1.81103515625, -1.518310546875, -1.2255859375, -0.932861328125, -0.64013671875, -0.347412109375, -0.0546875, 0.238037109375, 0.53076171875, 0.823486328125, 1.1162109375, 1.408935546875, 1.70166015625, 1.994384765625, 2.287109375, 2.579833984375, 2.87255859375, 3.165283203125, 3.4580078125, 3.750732421875, 4.04345703125, 4.336181640625, 4.62890625, 4.921630859375, 5.21435546875, 5.507080078125, 5.7998046875, 6.092529296875, 6.38525390625, 6.677978515625, 6.970703125, 7.263427734375, 7.55615234375, 7.848876953125, 8.1416015625, 8.434326171875, 8.72705078125, 9.019775390625, 9.3125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 9.0, 9.0, 7.0, 10.0, 9.0, 12.0, 22.0, 21.0, 22.0, 25.0, 27.0, 41.0, 36.0, 38.0, 35.0, 46.0, 35.0, 40.0, 47.0, 39.0, 47.0, 39.0, 36.0, 33.0, 37.0, 38.0, 35.0, 26.0, 30.0, 20.0, 20.0, 15.0, 14.0, 13.0, 14.0, 12.0, 8.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.4453125, -8.185791015625, -7.92626953125, -7.666748046875, -7.4072265625, -7.147705078125, -6.88818359375, -6.628662109375, -6.369140625, -6.109619140625, -5.85009765625, -5.590576171875, -5.3310546875, -5.071533203125, -4.81201171875, -4.552490234375, -4.29296875, -4.033447265625, -3.77392578125, -3.514404296875, -3.2548828125, -2.995361328125, -2.73583984375, -2.476318359375, -2.216796875, -1.957275390625, -1.69775390625, -1.438232421875, -1.1787109375, -0.919189453125, -0.65966796875, -0.400146484375, -0.140625, 0.118896484375, 0.37841796875, 0.637939453125, 0.8974609375, 1.156982421875, 1.41650390625, 1.676025390625, 1.935546875, 2.195068359375, 2.45458984375, 2.714111328125, 2.9736328125, 3.233154296875, 3.49267578125, 3.752197265625, 4.01171875, 4.271240234375, 4.53076171875, 4.790283203125, 5.0498046875, 5.309326171875, 5.56884765625, 5.828369140625, 6.087890625, 6.347412109375, 6.60693359375, 6.866455078125, 7.1259765625, 7.385498046875, 7.64501953125, 7.904541015625, 8.1640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 8.0, 11.0, 9.0, 14.0, 16.0, 29.0, 45.0, 74.0, 67.0, 158.0, 216.0, 449.0, 874.0, 2170.0, 6025.0, 20871.0, 83151.0, 336391.0, 430040.0, 124660.0, 29780.0, 8454.0, 2808.0, 1081.0, 471.0, 282.0, 144.0, 89.0, 61.0, 32.0, 26.0, 25.0, 11.0, 9.0, 7.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.6015625, -8.38177490234375, -8.1619873046875, -7.94219970703125, -7.722412109375, -7.50262451171875, -7.2828369140625, -7.06304931640625, -6.84326171875, -6.62347412109375, -6.4036865234375, -6.18389892578125, -5.964111328125, -5.74432373046875, -5.5245361328125, -5.30474853515625, -5.0849609375, -4.86517333984375, -4.6453857421875, -4.42559814453125, -4.205810546875, -3.98602294921875, -3.7662353515625, -3.54644775390625, -3.32666015625, -3.10687255859375, -2.8870849609375, -2.66729736328125, -2.447509765625, -2.22772216796875, -2.0079345703125, -1.78814697265625, -1.568359375, -1.34857177734375, -1.1287841796875, -0.90899658203125, -0.689208984375, -0.46942138671875, -0.2496337890625, -0.02984619140625, 0.18994140625, 0.40972900390625, 0.6295166015625, 0.84930419921875, 1.069091796875, 1.28887939453125, 1.5086669921875, 1.72845458984375, 1.9482421875, 2.16802978515625, 2.3878173828125, 2.60760498046875, 2.827392578125, 3.04718017578125, 3.2669677734375, 3.48675537109375, 3.70654296875, 3.92633056640625, 4.1461181640625, 4.36590576171875, 4.585693359375, 4.80548095703125, 5.0252685546875, 5.24505615234375, 5.46484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 8.0, 7.0, 6.0, 8.0, 12.0, 8.0, 25.0, 29.0, 25.0, 33.0, 35.0, 42.0, 64.0, 68.0, 91.0, 88.0, 92.0, 66.0, 65.0, 51.0, 33.0, 25.0, 20.0, 17.0, 15.0, 7.0, 12.0, 7.0, 2.0, 12.0, 6.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007719993591308594, -0.0007464438676834106, -0.0007208883762359619, -0.0006953328847885132, -0.0006697773933410645, -0.0006442219018936157, -0.000618666410446167, -0.0005931109189987183, -0.0005675554275512695, -0.0005419999361038208, -0.0005164444446563721, -0.0004908889532089233, -0.0004653334617614746, -0.0004397779703140259, -0.00041422247886657715, -0.0003886669874191284, -0.0003631114959716797, -0.00033755600452423096, -0.0003120005130767822, -0.0002864450216293335, -0.00026088953018188477, -0.00023533403873443604, -0.0002097785472869873, -0.00018422305583953857, -0.00015866756439208984, -0.0001331120729446411, -0.00010755658149719238, -8.200109004974365e-05, -5.644559860229492e-05, -3.089010715484619e-05, -5.334615707397461e-06, 2.022087574005127e-05, 4.57763671875e-05, 7.133185863494873e-05, 9.688735008239746e-05, 0.0001224428415298462, 0.00014799833297729492, 0.00017355382442474365, 0.00019910931587219238, 0.0002246648073196411, 0.00025022029876708984, 0.0002757757902145386, 0.0003013312816619873, 0.00032688677310943604, 0.00035244226455688477, 0.0003779977560043335, 0.0004035532474517822, 0.00042910873889923096, 0.0004546642303466797, 0.0004802197217941284, 0.0005057752132415771, 0.0005313307046890259, 0.0005568861961364746, 0.0005824416875839233, 0.0006079971790313721, 0.0006335526704788208, 0.0006591081619262695, 0.0006846636533737183, 0.000710219144821167, 0.0007357746362686157, 0.0007613301277160645, 0.0007868856191635132, 0.0008124411106109619, 0.0008379966020584106, 0.0008635520935058594]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 17.0, 28.0, 31.0, 58.0, 80.0, 119.0, 221.0, 439.0, 868.0, 1743.0, 3902.0, 10818.0, 36629.0, 139531.0, 434858.0, 304301.0, 80124.0, 22091.0, 7180.0, 2800.0, 1266.0, 635.0, 327.0, 167.0, 102.0, 65.0, 49.0, 27.0, 21.0, 15.0, 9.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.08856201171875, -6.8724365234375, -6.65631103515625, -6.440185546875, -6.22406005859375, -6.0079345703125, -5.79180908203125, -5.57568359375, -5.35955810546875, -5.1434326171875, -4.92730712890625, -4.711181640625, -4.49505615234375, -4.2789306640625, -4.06280517578125, -3.8466796875, -3.63055419921875, -3.4144287109375, -3.19830322265625, -2.982177734375, -2.76605224609375, -2.5499267578125, -2.33380126953125, -2.11767578125, -1.90155029296875, -1.6854248046875, -1.46929931640625, -1.253173828125, -1.03704833984375, -0.8209228515625, -0.60479736328125, -0.388671875, -0.17254638671875, 0.0435791015625, 0.25970458984375, 0.475830078125, 0.69195556640625, 0.9080810546875, 1.12420654296875, 1.34033203125, 1.55645751953125, 1.7725830078125, 1.98870849609375, 2.204833984375, 2.42095947265625, 2.6370849609375, 2.85321044921875, 3.0693359375, 3.28546142578125, 3.5015869140625, 3.71771240234375, 3.933837890625, 4.14996337890625, 4.3660888671875, 4.58221435546875, 4.79833984375, 5.01446533203125, 5.2305908203125, 5.44671630859375, 5.662841796875, 5.87896728515625, 6.0950927734375, 6.31121826171875, 6.52734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 10.0, 8.0, 16.0, 11.0, 14.0, 14.0, 21.0, 33.0, 21.0, 31.0, 38.0, 48.0, 33.0, 52.0, 59.0, 35.0, 69.0, 61.0, 64.0, 48.0, 41.0, 32.0, 37.0, 40.0, 26.0, 23.0, 18.0, 22.0, 12.0, 8.0, 7.0, 8.0, 9.0, 2.0, 6.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.470703125, -3.369415283203125, -3.26812744140625, -3.166839599609375, -3.0655517578125, -2.964263916015625, -2.86297607421875, -2.761688232421875, -2.660400390625, -2.559112548828125, -2.45782470703125, -2.356536865234375, -2.2552490234375, -2.153961181640625, -2.05267333984375, -1.951385498046875, -1.85009765625, -1.748809814453125, -1.64752197265625, -1.546234130859375, -1.4449462890625, -1.343658447265625, -1.24237060546875, -1.141082763671875, -1.039794921875, -0.938507080078125, -0.83721923828125, -0.735931396484375, -0.6346435546875, -0.533355712890625, -0.43206787109375, -0.330780029296875, -0.2294921875, -0.128204345703125, -0.02691650390625, 0.074371337890625, 0.1756591796875, 0.276947021484375, 0.37823486328125, 0.479522705078125, 0.580810546875, 0.682098388671875, 0.78338623046875, 0.884674072265625, 0.9859619140625, 1.087249755859375, 1.18853759765625, 1.289825439453125, 1.39111328125, 1.492401123046875, 1.59368896484375, 1.694976806640625, 1.7962646484375, 1.897552490234375, 1.99884033203125, 2.100128173828125, 2.201416015625, 2.302703857421875, 2.40399169921875, 2.505279541015625, 2.6065673828125, 2.707855224609375, 2.80914306640625, 2.910430908203125, 3.01171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 7.0, 8.0, 13.0, 14.0, 31.0, 47.0, 56.0, 63.0, 106.0, 114.0, 109.0, 107.0, 93.0, 77.0, 51.0, 31.0, 17.0, 17.0, 13.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.70713806152344, -79.26144409179688, -76.81575012207031, -74.37005615234375, -71.92436218261719, -69.47866821289062, -67.03297424316406, -64.5872802734375, -62.14158248901367, -59.69588851928711, -57.25019454956055, -54.804500579833984, -52.358802795410156, -49.913108825683594, -47.46741485595703, -45.02172088623047, -42.576026916503906, -40.130332946777344, -37.68463897705078, -35.23894500732422, -32.793251037597656, -30.34755516052246, -27.901859283447266, -25.456165313720703, -23.01047134399414, -20.564777374267578, -18.119083404541016, -15.67338752746582, -13.227693557739258, -10.781999588012695, -8.336304664611816, -5.8906097412109375, -3.444915771484375, -0.9992213249206543, 1.4464731216430664, 3.892167568206787, 6.337862014770508, 8.78355598449707, 11.22925090789795, 13.674945831298828, 16.12063980102539, 18.566333770751953, 21.012027740478516, 23.45772361755371, 25.903417587280273, 28.349111557006836, 30.79480743408203, 33.240501403808594, 35.686195373535156, 38.13188934326172, 40.57758331298828, 43.023277282714844, 45.468971252441406, 47.91466522216797, 50.3603630065918, 52.80605697631836, 55.25175094604492, 57.697444915771484, 60.14313888549805, 62.58883285522461, 65.03453063964844, 67.480224609375, 69.92591857910156, 72.37161254882812, 74.81730651855469]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 3.0, 7.0, 10.0, 13.0, 15.0, 17.0, 17.0, 24.0, 29.0, 26.0, 39.0, 39.0, 46.0, 45.0, 42.0, 46.0, 46.0, 52.0, 49.0, 44.0, 41.0, 36.0, 41.0, 34.0, 47.0, 27.0, 22.0, 16.0, 16.0, 21.0, 18.0, 12.0, 18.0, 11.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.153602600097656, -57.57966613769531, -56.00572967529297, -54.431793212890625, -52.85785675048828, -51.2839241027832, -49.70998764038086, -48.136051177978516, -46.56211471557617, -44.98817825317383, -43.414241790771484, -41.84030532836914, -40.26637268066406, -38.69243621826172, -37.118499755859375, -35.54456329345703, -33.97062683105469, -32.396690368652344, -30.82275390625, -29.24881935119629, -27.674882888793945, -26.1009464263916, -24.52701187133789, -22.953075408935547, -21.379138946533203, -19.80520248413086, -18.231266021728516, -16.657331466674805, -15.083395004272461, -13.509458541870117, -11.93552303314209, -10.361587524414062, -8.787651062011719, -7.213715076446533, -5.639779090881348, -4.065843105316162, -2.4919071197509766, -0.917971134185791, 0.6559648513793945, 2.229900360107422, 3.8038368225097656, 5.377772808074951, 6.951708793640137, 8.525644302368164, 10.099580764770508, 11.673517227172852, 13.247452735900879, 14.821388244628906, 16.39532470703125, 17.969261169433594, 19.543197631835938, 21.11713218688965, 22.691068649291992, 24.265005111694336, 25.838939666748047, 27.41287612915039, 28.986812591552734, 30.560749053955078, 32.13468551635742, 33.708621978759766, 35.282554626464844, 36.85649108886719, 38.43042755126953, 40.004364013671875, 41.57830047607422]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 8.0, 9.0, 20.0, 16.0, 31.0, 52.0, 72.0, 137.0, 256.0, 557.0, 1218.0, 2986.0, 10728.0, 63543.0, 3406484.0, 657788.0, 38821.0, 7337.0, 2242.0, 918.0, 379.0, 215.0, 164.0, 84.0, 57.0, 42.0, 28.0, 16.0, 24.0, 15.0, 11.0, 2.0, 2.0, 6.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.984375, -28.728759765625, -27.47314453125, -26.217529296875, -24.9619140625, -23.706298828125, -22.45068359375, -21.195068359375, -19.939453125, -18.683837890625, -17.42822265625, -16.172607421875, -14.9169921875, -13.661376953125, -12.40576171875, -11.150146484375, -9.89453125, -8.638916015625, -7.38330078125, -6.127685546875, -4.8720703125, -3.616455078125, -2.36083984375, -1.105224609375, 0.150390625, 1.406005859375, 2.66162109375, 3.917236328125, 5.1728515625, 6.428466796875, 7.68408203125, 8.939697265625, 10.1953125, 11.450927734375, 12.70654296875, 13.962158203125, 15.2177734375, 16.473388671875, 17.72900390625, 18.984619140625, 20.240234375, 21.495849609375, 22.75146484375, 24.007080078125, 25.2626953125, 26.518310546875, 27.77392578125, 29.029541015625, 30.28515625, 31.540771484375, 32.79638671875, 34.052001953125, 35.3076171875, 36.563232421875, 37.81884765625, 39.074462890625, 40.330078125, 41.585693359375, 42.84130859375, 44.096923828125, 45.3525390625, 46.608154296875, 47.86376953125, 49.119384765625, 50.375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 7.0, 5.0, 17.0, 20.0, 31.0, 30.0, 37.0, 54.0, 60.0, 69.0, 78.0, 76.0, 86.0, 80.0, 75.0, 55.0, 56.0, 35.0, 33.0, 25.0, 26.0, 13.0, 8.0, 12.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.958984375, -2.857086181640625, -2.75518798828125, -2.653289794921875, -2.5513916015625, -2.449493408203125, -2.34759521484375, -2.245697021484375, -2.143798828125, -2.041900634765625, -1.94000244140625, -1.838104248046875, -1.7362060546875, -1.634307861328125, -1.53240966796875, -1.430511474609375, -1.32861328125, -1.226715087890625, -1.12481689453125, -1.022918701171875, -0.9210205078125, -0.819122314453125, -0.71722412109375, -0.615325927734375, -0.513427734375, -0.411529541015625, -0.30963134765625, -0.207733154296875, -0.1058349609375, -0.003936767578125, 0.09796142578125, 0.199859619140625, 0.3017578125, 0.403656005859375, 0.50555419921875, 0.607452392578125, 0.7093505859375, 0.811248779296875, 0.91314697265625, 1.015045166015625, 1.116943359375, 1.218841552734375, 1.32073974609375, 1.422637939453125, 1.5245361328125, 1.626434326171875, 1.72833251953125, 1.830230712890625, 1.93212890625, 2.034027099609375, 2.13592529296875, 2.237823486328125, 2.3397216796875, 2.441619873046875, 2.54351806640625, 2.645416259765625, 2.747314453125, 2.849212646484375, 2.95111083984375, 3.053009033203125, 3.1549072265625, 3.256805419921875, 3.35870361328125, 3.460601806640625, 3.5625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 12.0, 16.0, 24.0, 42.0, 50.0, 93.0, 127.0, 213.0, 327.0, 661.0, 1194.0, 2791.0, 8953.0, 58016.0, 3097091.0, 976754.0, 35987.0, 6850.0, 2478.0, 1124.0, 601.0, 343.0, 206.0, 120.0, 66.0, 44.0, 29.0, 19.0, 16.0, 11.0, 5.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.90625, -36.71826171875, -35.5302734375, -34.34228515625, -33.154296875, -31.96630859375, -30.7783203125, -29.59033203125, -28.40234375, -27.21435546875, -26.0263671875, -24.83837890625, -23.650390625, -22.46240234375, -21.2744140625, -20.08642578125, -18.8984375, -17.71044921875, -16.5224609375, -15.33447265625, -14.146484375, -12.95849609375, -11.7705078125, -10.58251953125, -9.39453125, -8.20654296875, -7.0185546875, -5.83056640625, -4.642578125, -3.45458984375, -2.2666015625, -1.07861328125, 0.109375, 1.29736328125, 2.4853515625, 3.67333984375, 4.861328125, 6.04931640625, 7.2373046875, 8.42529296875, 9.61328125, 10.80126953125, 11.9892578125, 13.17724609375, 14.365234375, 15.55322265625, 16.7412109375, 17.92919921875, 19.1171875, 20.30517578125, 21.4931640625, 22.68115234375, 23.869140625, 25.05712890625, 26.2451171875, 27.43310546875, 28.62109375, 29.80908203125, 30.9970703125, 32.18505859375, 33.373046875, 34.56103515625, 35.7490234375, 36.93701171875, 38.125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 9.0, 7.0, 13.0, 23.0, 49.0, 81.0, 191.0, 508.0, 2026.0, 737.0, 242.0, 92.0, 47.0, 16.0, 15.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.828125, -12.3802490234375, -11.932373046875, -11.4844970703125, -11.03662109375, -10.5887451171875, -10.140869140625, -9.6929931640625, -9.2451171875, -8.7972412109375, -8.349365234375, -7.9014892578125, -7.45361328125, -7.0057373046875, -6.557861328125, -6.1099853515625, -5.662109375, -5.2142333984375, -4.766357421875, -4.3184814453125, -3.87060546875, -3.4227294921875, -2.974853515625, -2.5269775390625, -2.0791015625, -1.6312255859375, -1.183349609375, -0.7354736328125, -0.28759765625, 0.1602783203125, 0.608154296875, 1.0560302734375, 1.50390625, 1.9517822265625, 2.399658203125, 2.8475341796875, 3.29541015625, 3.7432861328125, 4.191162109375, 4.6390380859375, 5.0869140625, 5.5347900390625, 5.982666015625, 6.4305419921875, 6.87841796875, 7.3262939453125, 7.774169921875, 8.2220458984375, 8.669921875, 9.1177978515625, 9.565673828125, 10.0135498046875, 10.46142578125, 10.9093017578125, 11.357177734375, 11.8050537109375, 12.2529296875, 12.7008056640625, 13.148681640625, 13.5965576171875, 14.04443359375, 14.4923095703125, 14.940185546875, 15.3880615234375, 15.8359375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 15.0, 37.0, 63.0, 97.0, 172.0, 220.0, 158.0, 117.0, 59.0, 28.0, 15.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.96316528320312, -104.12205505371094, -101.28095245361328, -98.43984985351562, -95.59873962402344, -92.75762939453125, -89.9165267944336, -87.07542419433594, -84.23431396484375, -81.39320373535156, -78.5521011352539, -75.71099853515625, -72.86988830566406, -70.02877807617188, -67.18767547607422, -64.34657287597656, -61.505462646484375, -58.66435623168945, -55.82324981689453, -52.98214340209961, -50.14103698730469, -47.299930572509766, -44.458824157714844, -41.61771774291992, -38.776611328125, -35.93550491333008, -33.094398498535156, -30.253292083740234, -27.412185668945312, -24.57107925415039, -21.72997283935547, -18.888866424560547, -16.047767639160156, -13.206661224365234, -10.365554809570312, -7.524448394775391, -4.683341979980469, -1.8422355651855469, 0.998870849609375, 3.839977264404297, 6.681083679199219, 9.52219009399414, 12.363296508789062, 15.204402923583984, 18.045509338378906, 20.886615753173828, 23.72772216796875, 26.568828582763672, 29.409934997558594, 32.251041412353516, 35.09214782714844, 37.93325424194336, 40.77436065673828, 43.6154670715332, 46.456573486328125, 49.29767990112305, 52.13878631591797, 54.97989273071289, 57.82099914550781, 60.662105560302734, 63.503211975097656, 66.34431457519531, 69.1854248046875, 72.02653503417969, 74.86763763427734]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 10.0, 18.0, 36.0, 31.0, 48.0, 73.0, 66.0, 69.0, 88.0, 97.0, 71.0, 86.0, 83.0, 67.0, 47.0, 30.0, 38.0, 15.0, 13.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.20011901855469, -30.490598678588867, -28.781078338623047, -27.07155990600586, -25.36203956604004, -23.65251922607422, -21.9429988861084, -20.233478546142578, -18.52396011352539, -16.81443977355957, -15.104920387268066, -13.395400047302246, -11.685880661010742, -9.976360321044922, -8.266839981079102, -6.557320594787598, -4.847799301147461, -3.138279438018799, -1.4287593364715576, 0.2807607650756836, 1.9902806282043457, 3.699800491333008, 5.409320831298828, 7.118840217590332, 8.828360557556152, 10.537880897521973, 12.247400283813477, 13.956920623779297, 15.666440963745117, 17.375961303710938, 19.085479736328125, 20.795000076293945, 22.504520416259766, 24.214040756225586, 25.923561096191406, 27.633079528808594, 29.342599868774414, 31.052120208740234, 32.76164245605469, 34.471160888671875, 36.18067932128906, 37.89019775390625, 39.5997200012207, 41.30923843383789, 43.018760681152344, 44.72827911376953, 46.43779754638672, 48.14731979370117, 49.856842041015625, 51.56636047363281, 53.275882720947266, 54.98540115356445, 56.694923400878906, 58.404441833496094, 60.11396026611328, 61.823482513427734, 63.53300094604492, 65.24252319335938, 66.95204162597656, 68.66156005859375, 70.37107849121094, 72.08059692382812, 73.79012298583984, 75.49964141845703, 77.20915985107422]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 10.0, 15.0, 25.0, 21.0, 41.0, 59.0, 114.0, 212.0, 425.0, 973.0, 3205.0, 30011.0, 741554.0, 256363.0, 12023.0, 2043.0, 745.0, 311.0, 168.0, 87.0, 58.0, 34.0, 23.0, 13.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.6875, -65.01318359375, -63.3388671875, -61.66455078125, -59.990234375, -58.31591796875, -56.6416015625, -54.96728515625, -53.29296875, -51.61865234375, -49.9443359375, -48.27001953125, -46.595703125, -44.92138671875, -43.2470703125, -41.57275390625, -39.8984375, -38.22412109375, -36.5498046875, -34.87548828125, -33.201171875, -31.52685546875, -29.8525390625, -28.17822265625, -26.50390625, -24.82958984375, -23.1552734375, -21.48095703125, -19.806640625, -18.13232421875, -16.4580078125, -14.78369140625, -13.109375, -11.43505859375, -9.7607421875, -8.08642578125, -6.412109375, -4.73779296875, -3.0634765625, -1.38916015625, 0.28515625, 1.95947265625, 3.6337890625, 5.30810546875, 6.982421875, 8.65673828125, 10.3310546875, 12.00537109375, 13.6796875, 15.35400390625, 17.0283203125, 18.70263671875, 20.376953125, 22.05126953125, 23.7255859375, 25.39990234375, 27.07421875, 28.74853515625, 30.4228515625, 32.09716796875, 33.771484375, 35.44580078125, 37.1201171875, 38.79443359375, 40.46875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 11.0, 13.0, 22.0, 30.0, 53.0, 67.0, 78.0, 114.0, 124.0, 134.0, 96.0, 75.0, 64.0, 46.0, 32.0, 22.0, 12.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.24609375, -3.0904541015625, -2.934814453125, -2.7791748046875, -2.62353515625, -2.4678955078125, -2.312255859375, -2.1566162109375, -2.0009765625, -1.8453369140625, -1.689697265625, -1.5340576171875, -1.37841796875, -1.2227783203125, -1.067138671875, -0.9114990234375, -0.755859375, -0.6002197265625, -0.444580078125, -0.2889404296875, -0.13330078125, 0.0223388671875, 0.177978515625, 0.3336181640625, 0.4892578125, 0.6448974609375, 0.800537109375, 0.9561767578125, 1.11181640625, 1.2674560546875, 1.423095703125, 1.5787353515625, 1.734375, 1.8900146484375, 2.045654296875, 2.2012939453125, 2.35693359375, 2.5125732421875, 2.668212890625, 2.8238525390625, 2.9794921875, 3.1351318359375, 3.290771484375, 3.4464111328125, 3.60205078125, 3.7576904296875, 3.913330078125, 4.0689697265625, 4.224609375, 4.3802490234375, 4.535888671875, 4.6915283203125, 4.84716796875, 5.0028076171875, 5.158447265625, 5.3140869140625, 5.4697265625, 5.6253662109375, 5.781005859375, 5.9366455078125, 6.09228515625, 6.2479248046875, 6.403564453125, 6.5592041015625, 6.71484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 4.0, 7.0, 12.0, 21.0, 14.0, 38.0, 52.0, 76.0, 125.0, 190.0, 302.0, 471.0, 879.0, 1545.0, 2941.0, 6225.0, 13440.0, 30479.0, 70720.0, 167880.0, 357604.0, 226558.0, 94085.0, 40650.0, 18049.0, 7946.0, 3707.0, 1914.0, 1022.0, 585.0, 326.0, 234.0, 171.0, 82.0, 55.0, 41.0, 35.0, 18.0, 13.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.8189697265625, -7.536376953125, -7.2537841796875, -6.97119140625, -6.6885986328125, -6.406005859375, -6.1234130859375, -5.8408203125, -5.5582275390625, -5.275634765625, -4.9930419921875, -4.71044921875, -4.4278564453125, -4.145263671875, -3.8626708984375, -3.580078125, -3.2974853515625, -3.014892578125, -2.7322998046875, -2.44970703125, -2.1671142578125, -1.884521484375, -1.6019287109375, -1.3193359375, -1.0367431640625, -0.754150390625, -0.4715576171875, -0.18896484375, 0.0936279296875, 0.376220703125, 0.6588134765625, 0.94140625, 1.2239990234375, 1.506591796875, 1.7891845703125, 2.07177734375, 2.3543701171875, 2.636962890625, 2.9195556640625, 3.2021484375, 3.4847412109375, 3.767333984375, 4.0499267578125, 4.33251953125, 4.6151123046875, 4.897705078125, 5.1802978515625, 5.462890625, 5.7454833984375, 6.028076171875, 6.3106689453125, 6.59326171875, 6.8758544921875, 7.158447265625, 7.4410400390625, 7.7236328125, 8.0062255859375, 8.288818359375, 8.5714111328125, 8.85400390625, 9.1365966796875, 9.419189453125, 9.7017822265625, 9.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 9.0, 10.0, 8.0, 12.0, 24.0, 26.0, 24.0, 22.0, 40.0, 44.0, 47.0, 48.0, 44.0, 45.0, 43.0, 55.0, 49.0, 48.0, 57.0, 49.0, 47.0, 45.0, 36.0, 35.0, 20.0, 26.0, 17.0, 17.0, 15.0, 7.0, 8.0, 4.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.34765625, -10.03125, -9.71484375, -9.3984375, -9.08203125, -8.765625, -8.44921875, -8.1328125, -7.81640625, -7.5, -7.18359375, -6.8671875, -6.55078125, -6.234375, -5.91796875, -5.6015625, -5.28515625, -4.96875, -4.65234375, -4.3359375, -4.01953125, -3.703125, -3.38671875, -3.0703125, -2.75390625, -2.4375, -2.12109375, -1.8046875, -1.48828125, -1.171875, -0.85546875, -0.5390625, -0.22265625, 0.09375, 0.41015625, 0.7265625, 1.04296875, 1.359375, 1.67578125, 1.9921875, 2.30859375, 2.625, 2.94140625, 3.2578125, 3.57421875, 3.890625, 4.20703125, 4.5234375, 4.83984375, 5.15625, 5.47265625, 5.7890625, 6.10546875, 6.421875, 6.73828125, 7.0546875, 7.37109375, 7.6875, 8.00390625, 8.3203125, 8.63671875, 8.953125, 9.26953125, 9.5859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 11.0, 12.0, 9.0, 21.0, 24.0, 31.0, 48.0, 75.0, 111.0, 194.0, 326.0, 565.0, 945.0, 1996.0, 4202.0, 9942.0, 26958.0, 84111.0, 283441.0, 426617.0, 139135.0, 43043.0, 15067.0, 5907.0, 2652.0, 1343.0, 693.0, 395.0, 232.0, 152.0, 90.0, 62.0, 49.0, 25.0, 15.0, 10.0, 6.0, 10.0, 6.0, 7.0, 0.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.30126953125, -5.1064453125, -4.91162109375, -4.716796875, -4.52197265625, -4.3271484375, -4.13232421875, -3.9375, -3.74267578125, -3.5478515625, -3.35302734375, -3.158203125, -2.96337890625, -2.7685546875, -2.57373046875, -2.37890625, -2.18408203125, -1.9892578125, -1.79443359375, -1.599609375, -1.40478515625, -1.2099609375, -1.01513671875, -0.8203125, -0.62548828125, -0.4306640625, -0.23583984375, -0.041015625, 0.15380859375, 0.3486328125, 0.54345703125, 0.73828125, 0.93310546875, 1.1279296875, 1.32275390625, 1.517578125, 1.71240234375, 1.9072265625, 2.10205078125, 2.296875, 2.49169921875, 2.6865234375, 2.88134765625, 3.076171875, 3.27099609375, 3.4658203125, 3.66064453125, 3.85546875, 4.05029296875, 4.2451171875, 4.43994140625, 4.634765625, 4.82958984375, 5.0244140625, 5.21923828125, 5.4140625, 5.60888671875, 5.8037109375, 5.99853515625, 6.193359375, 6.38818359375, 6.5830078125, 6.77783203125, 6.97265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 9.0, 9.0, 8.0, 23.0, 16.0, 26.0, 41.0, 52.0, 73.0, 108.0, 150.0, 144.0, 105.0, 67.0, 40.0, 38.0, 28.0, 18.0, 11.0, 12.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001331329345703125, -0.0012942701578140259, -0.0012572109699249268, -0.0012201517820358276, -0.0011830925941467285, -0.0011460334062576294, -0.0011089742183685303, -0.0010719150304794312, -0.001034855842590332, -0.000997796654701233, -0.0009607374668121338, -0.0009236782789230347, -0.0008866190910339355, -0.0008495599031448364, -0.0008125007152557373, -0.0007754415273666382, -0.0007383823394775391, -0.0007013231515884399, -0.0006642639636993408, -0.0006272047758102417, -0.0005901455879211426, -0.0005530864000320435, -0.0005160272121429443, -0.0004789680242538452, -0.0004419088363647461, -0.00040484964847564697, -0.00036779046058654785, -0.00033073127269744873, -0.0002936720848083496, -0.0002566128969192505, -0.00021955370903015137, -0.00018249452114105225, -0.00014543533325195312, -0.000108376145362854, -7.131695747375488e-05, -3.425776958465576e-05, 2.8014183044433594e-06, 3.986060619354248e-05, 7.69197940826416e-05, 0.00011397898197174072, 0.00015103816986083984, 0.00018809735774993896, 0.00022515654563903809, 0.0002622157335281372, 0.00029927492141723633, 0.00033633410930633545, 0.00037339329719543457, 0.0004104524850845337, 0.0004475116729736328, 0.00048457086086273193, 0.0005216300487518311, 0.0005586892366409302, 0.0005957484245300293, 0.0006328076124191284, 0.0006698668003082275, 0.0007069259881973267, 0.0007439851760864258, 0.0007810443639755249, 0.000818103551864624, 0.0008551627397537231, 0.0008922219276428223, 0.0009292811155319214, 0.0009663403034210205, 0.0010033994913101196, 0.0010404586791992188]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 6.0, 7.0, 5.0, 12.0, 7.0, 19.0, 26.0, 40.0, 53.0, 73.0, 112.0, 167.0, 246.0, 373.0, 652.0, 1023.0, 1702.0, 2960.0, 5713.0, 11757.0, 27466.0, 72430.0, 210120.0, 408758.0, 190725.0, 65431.0, 25233.0, 10876.0, 5503.0, 2854.0, 1589.0, 952.0, 588.0, 350.0, 249.0, 157.0, 102.0, 64.0, 51.0, 36.0, 23.0, 12.0, 15.0, 9.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.62109375, -5.4423828125, -5.263671875, -5.0849609375, -4.90625, -4.7275390625, -4.548828125, -4.3701171875, -4.19140625, -4.0126953125, -3.833984375, -3.6552734375, -3.4765625, -3.2978515625, -3.119140625, -2.9404296875, -2.76171875, -2.5830078125, -2.404296875, -2.2255859375, -2.046875, -1.8681640625, -1.689453125, -1.5107421875, -1.33203125, -1.1533203125, -0.974609375, -0.7958984375, -0.6171875, -0.4384765625, -0.259765625, -0.0810546875, 0.09765625, 0.2763671875, 0.455078125, 0.6337890625, 0.8125, 0.9912109375, 1.169921875, 1.3486328125, 1.52734375, 1.7060546875, 1.884765625, 2.0634765625, 2.2421875, 2.4208984375, 2.599609375, 2.7783203125, 2.95703125, 3.1357421875, 3.314453125, 3.4931640625, 3.671875, 3.8505859375, 4.029296875, 4.2080078125, 4.38671875, 4.5654296875, 4.744140625, 4.9228515625, 5.1015625, 5.2802734375, 5.458984375, 5.6376953125, 5.81640625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 9.0, 9.0, 16.0, 16.0, 21.0, 32.0, 34.0, 47.0, 77.0, 91.0, 83.0, 77.0, 100.0, 62.0, 80.0, 59.0, 44.0, 24.0, 19.0, 17.0, 13.0, 14.0, 12.0, 8.0, 1.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.30517578125, -5.1416015625, -4.97802734375, -4.814453125, -4.65087890625, -4.4873046875, -4.32373046875, -4.16015625, -3.99658203125, -3.8330078125, -3.66943359375, -3.505859375, -3.34228515625, -3.1787109375, -3.01513671875, -2.8515625, -2.68798828125, -2.5244140625, -2.36083984375, -2.197265625, -2.03369140625, -1.8701171875, -1.70654296875, -1.54296875, -1.37939453125, -1.2158203125, -1.05224609375, -0.888671875, -0.72509765625, -0.5615234375, -0.39794921875, -0.234375, -0.07080078125, 0.0927734375, 0.25634765625, 0.419921875, 0.58349609375, 0.7470703125, 0.91064453125, 1.07421875, 1.23779296875, 1.4013671875, 1.56494140625, 1.728515625, 1.89208984375, 2.0556640625, 2.21923828125, 2.3828125, 2.54638671875, 2.7099609375, 2.87353515625, 3.037109375, 3.20068359375, 3.3642578125, 3.52783203125, 3.69140625, 3.85498046875, 4.0185546875, 4.18212890625, 4.345703125, 4.50927734375, 4.6728515625, 4.83642578125, 5.0]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 17.0, 37.0, 64.0, 163.0, 239.0, 226.0, 140.0, 66.0, 26.0, 13.0, 8.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.753631591796875, -51.51547622680664, -46.27731704711914, -41.039161682128906, -35.801002502441406, -30.562847137451172, -25.324691772460938, -20.086532592773438, -14.848377227783203, -9.610219955444336, -4.372063636779785, 0.8660926818847656, 6.104249954223633, 11.3424072265625, 16.580562591552734, 21.818721771240234, 27.05687713623047, 32.2950325012207, 37.5331916809082, 42.77134704589844, 48.00950622558594, 53.24766159057617, 58.485816955566406, 63.723976135253906, 68.96212768554688, 74.20028686523438, 79.43843841552734, 84.67659759521484, 89.91475677490234, 95.15290832519531, 100.39106750488281, 105.62922668457031, 110.86738586425781, 116.10554504394531, 121.34369659423828, 126.58185577392578, 131.82000732421875, 137.05816650390625, 142.29632568359375, 147.53448486328125, 152.77264404296875, 158.01080322265625, 163.24896240234375, 168.48712158203125, 173.7252655029297, 178.9634246826172, 184.2015838623047, 189.4397430419922, 194.67788696289062, 199.91604614257812, 205.15420532226562, 210.39236450195312, 215.63050842285156, 220.86866760253906, 226.10682678222656, 231.34498596191406, 236.58314514160156, 241.82130432128906, 247.05946350097656, 252.297607421875, 257.5357666015625, 262.77392578125, 268.0120849609375, 273.250244140625, 278.4884033203125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 3.0, 10.0, 7.0, 3.0, 11.0, 13.0, 9.0, 20.0, 16.0, 19.0, 14.0, 20.0, 35.0, 27.0, 26.0, 36.0, 39.0, 35.0, 43.0, 40.0, 26.0, 49.0, 49.0, 58.0, 41.0, 43.0, 29.0, 33.0, 33.0, 25.0, 26.0, 26.0, 27.0, 12.0, 17.0, 13.0, 19.0, 15.0, 8.0, 5.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.838951110839844, -43.33690643310547, -41.83486557006836, -40.332820892333984, -38.83077621459961, -37.3287353515625, -35.826690673828125, -34.32464599609375, -32.82260513305664, -31.3205623626709, -29.818517684936523, -28.31647491455078, -26.81443214416504, -25.312389373779297, -23.810344696044922, -22.30830192565918, -20.806257247924805, -19.304214477539062, -17.802169799804688, -16.300127029418945, -14.798084259033203, -13.296040534973145, -11.793996810913086, -10.291954040527344, -8.789910316467285, -7.287867069244385, -5.785823822021484, -4.283780097961426, -2.7817368507385254, -1.279693603515625, 0.2223501205444336, 1.7243928909301758, 3.2264366149902344, 4.728479862213135, 6.230523109436035, 7.732566833496094, 9.234609603881836, 10.736653327941895, 12.238697052001953, 13.740739822387695, 15.242783546447754, 16.744827270507812, 18.246870040893555, 19.748912811279297, 21.250957489013672, 22.753000259399414, 24.255043029785156, 25.75708770751953, 27.259130477905273, 28.761173248291016, 30.26321792602539, 31.765260696411133, 33.267303466796875, 34.76934814453125, 36.271392822265625, 37.773433685302734, 39.27547836303711, 40.777523040771484, 42.279563903808594, 43.78160858154297, 45.283653259277344, 46.78569412231445, 48.28773880004883, 49.78977966308594, 51.29182434082031]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 13.0, 13.0, 29.0, 49.0, 117.0, 237.0, 568.0, 1943.0, 12872.0, 3396902.0, 768697.0, 10079.0, 1632.0, 574.0, 240.0, 130.0, 57.0, 46.0, 28.0, 14.0, 7.0, 6.0, 8.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.25, -56.005859375, -53.76171875, -51.517578125, -49.2734375, -47.029296875, -44.78515625, -42.541015625, -40.296875, -38.052734375, -35.80859375, -33.564453125, -31.3203125, -29.076171875, -26.83203125, -24.587890625, -22.34375, -20.099609375, -17.85546875, -15.611328125, -13.3671875, -11.123046875, -8.87890625, -6.634765625, -4.390625, -2.146484375, 0.09765625, 2.341796875, 4.5859375, 6.830078125, 9.07421875, 11.318359375, 13.5625, 15.806640625, 18.05078125, 20.294921875, 22.5390625, 24.783203125, 27.02734375, 29.271484375, 31.515625, 33.759765625, 36.00390625, 38.248046875, 40.4921875, 42.736328125, 44.98046875, 47.224609375, 49.46875, 51.712890625, 53.95703125, 56.201171875, 58.4453125, 60.689453125, 62.93359375, 65.177734375, 67.421875, 69.666015625, 71.91015625, 74.154296875, 76.3984375, 78.642578125, 80.88671875, 83.130859375, 85.375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 24.0, 41.0, 46.0, 47.0, 80.0, 110.0, 131.0, 124.0, 98.0, 79.0, 72.0, 44.0, 33.0, 28.0, 13.0, 6.0, 9.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3203125, -3.163330078125, -3.00634765625, -2.849365234375, -2.6923828125, -2.535400390625, -2.37841796875, -2.221435546875, -2.064453125, -1.907470703125, -1.75048828125, -1.593505859375, -1.4365234375, -1.279541015625, -1.12255859375, -0.965576171875, -0.80859375, -0.651611328125, -0.49462890625, -0.337646484375, -0.1806640625, -0.023681640625, 0.13330078125, 0.290283203125, 0.447265625, 0.604248046875, 0.76123046875, 0.918212890625, 1.0751953125, 1.232177734375, 1.38916015625, 1.546142578125, 1.703125, 1.860107421875, 2.01708984375, 2.174072265625, 2.3310546875, 2.488037109375, 2.64501953125, 2.802001953125, 2.958984375, 3.115966796875, 3.27294921875, 3.429931640625, 3.5869140625, 3.743896484375, 3.90087890625, 4.057861328125, 4.21484375, 4.371826171875, 4.52880859375, 4.685791015625, 4.8427734375, 4.999755859375, 5.15673828125, 5.313720703125, 5.470703125, 5.627685546875, 5.78466796875, 5.941650390625, 6.0986328125, 6.255615234375, 6.41259765625, 6.569580078125, 6.7265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 5.0, 8.0, 10.0, 15.0, 14.0, 35.0, 38.0, 33.0, 70.0, 81.0, 128.0, 189.0, 337.0, 570.0, 1106.0, 2347.0, 5389.0, 13391.0, 38067.0, 125194.0, 625981.0, 2956726.0, 305452.0, 76445.0, 25501.0, 9269.0, 3926.0, 1832.0, 862.0, 487.0, 246.0, 164.0, 97.0, 71.0, 54.0, 31.0, 27.0, 21.0, 12.0, 16.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-13.5234375, -13.0772705078125, -12.631103515625, -12.1849365234375, -11.73876953125, -11.2926025390625, -10.846435546875, -10.4002685546875, -9.9541015625, -9.5079345703125, -9.061767578125, -8.6156005859375, -8.16943359375, -7.7232666015625, -7.277099609375, -6.8309326171875, -6.384765625, -5.9385986328125, -5.492431640625, -5.0462646484375, -4.60009765625, -4.1539306640625, -3.707763671875, -3.2615966796875, -2.8154296875, -2.3692626953125, -1.923095703125, -1.4769287109375, -1.03076171875, -0.5845947265625, -0.138427734375, 0.3077392578125, 0.75390625, 1.2000732421875, 1.646240234375, 2.0924072265625, 2.53857421875, 2.9847412109375, 3.430908203125, 3.8770751953125, 4.3232421875, 4.7694091796875, 5.215576171875, 5.6617431640625, 6.10791015625, 6.5540771484375, 7.000244140625, 7.4464111328125, 7.892578125, 8.3387451171875, 8.784912109375, 9.2310791015625, 9.67724609375, 10.1234130859375, 10.569580078125, 11.0157470703125, 11.4619140625, 11.9080810546875, 12.354248046875, 12.8004150390625, 13.24658203125, 13.6927490234375, 14.138916015625, 14.5850830078125, 15.03125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 5.0, 10.0, 22.0, 28.0, 37.0, 56.0, 93.0, 156.0, 272.0, 622.0, 1663.0, 528.0, 225.0, 129.0, 86.0, 47.0, 29.0, 21.0, 9.0, 10.0, 8.0, 6.0, 7.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.078125, -8.847900390625, -8.61767578125, -8.387451171875, -8.1572265625, -7.927001953125, -7.69677734375, -7.466552734375, -7.236328125, -7.006103515625, -6.77587890625, -6.545654296875, -6.3154296875, -6.085205078125, -5.85498046875, -5.624755859375, -5.39453125, -5.164306640625, -4.93408203125, -4.703857421875, -4.4736328125, -4.243408203125, -4.01318359375, -3.782958984375, -3.552734375, -3.322509765625, -3.09228515625, -2.862060546875, -2.6318359375, -2.401611328125, -2.17138671875, -1.941162109375, -1.7109375, -1.480712890625, -1.25048828125, -1.020263671875, -0.7900390625, -0.559814453125, -0.32958984375, -0.099365234375, 0.130859375, 0.361083984375, 0.59130859375, 0.821533203125, 1.0517578125, 1.281982421875, 1.51220703125, 1.742431640625, 1.97265625, 2.202880859375, 2.43310546875, 2.663330078125, 2.8935546875, 3.123779296875, 3.35400390625, 3.584228515625, 3.814453125, 4.044677734375, 4.27490234375, 4.505126953125, 4.7353515625, 4.965576171875, 5.19580078125, 5.426025390625, 5.65625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 13.0, 14.0, 29.0, 45.0, 63.0, 85.0, 72.0, 96.0, 85.0, 104.0, 104.0, 76.0, 68.0, 43.0, 33.0, 32.0, 7.0, 5.0, 3.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.733978271484375, -38.596065521240234, -37.458152770996094, -36.32024002075195, -35.18232727050781, -34.04441452026367, -32.90650177001953, -31.76858901977539, -30.63067626953125, -29.49276351928711, -28.35485076904297, -27.216938018798828, -26.079025268554688, -24.941112518310547, -23.803199768066406, -22.665287017822266, -21.527372360229492, -20.38945960998535, -19.25154685974121, -18.11363410949707, -16.97572135925293, -15.837808609008789, -14.699894905090332, -13.561982154846191, -12.42406940460205, -11.28615665435791, -10.14824390411377, -9.010330200195312, -7.87241792678833, -6.7345051765441895, -5.596591949462891, -4.45867919921875, -3.3207664489746094, -2.1828536987304688, -1.044940710067749, 0.0929722785949707, 1.2308850288391113, 2.368797779083252, 3.506711006164551, 4.644623756408691, 5.782536506652832, 6.920449256896973, 8.058362007141113, 9.19627571105957, 10.334188461303711, 11.472101211547852, 12.610013961791992, 13.747926712036133, 14.885839462280273, 16.023752212524414, 17.161664962768555, 18.299577713012695, 19.437490463256836, 20.575403213500977, 21.71331787109375, 22.85123062133789, 23.98914337158203, 25.127056121826172, 26.264968872070312, 27.402881622314453, 28.540794372558594, 29.678707122802734, 30.816619873046875, 31.954532623291016, 33.092445373535156]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 10.0, 16.0, 13.0, 13.0, 16.0, 20.0, 24.0, 25.0, 32.0, 29.0, 37.0, 37.0, 37.0, 42.0, 50.0, 49.0, 46.0, 51.0, 49.0, 43.0, 51.0, 43.0, 37.0, 38.0, 36.0, 30.0, 16.0, 20.0, 11.0, 16.0, 12.0, 20.0, 7.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.554555892944336, -17.885683059692383, -17.21681022644043, -16.54793930053711, -15.879066467285156, -15.210193634033203, -14.54132080078125, -13.872447967529297, -13.20357608795166, -12.534703254699707, -11.86583137512207, -11.196958541870117, -10.528085708618164, -9.859213829040527, -9.190340995788574, -8.521469116210938, -7.852596282958984, -7.1837239265441895, -6.5148515701293945, -5.845978736877441, -5.1771063804626465, -4.508234024047852, -3.8393611907958984, -3.1704888343811035, -2.5016164779663086, -1.8327440023422241, -1.1638715267181396, -0.4949989318847656, 0.1738734245300293, 0.8427457809448242, 1.5116186141967773, 2.1804909706115723, 2.849363327026367, 3.518235683441162, 4.187108039855957, 4.85598087310791, 5.524853229522705, 6.1937255859375, 6.862598419189453, 7.531470775604248, 8.200343132019043, 8.869215965270996, 9.538087844848633, 10.206960678100586, 10.875833511352539, 11.544705390930176, 12.213578224182129, 12.882450103759766, 13.551322937011719, 14.220195770263672, 14.889067649841309, 15.557940483093262, 16.2268123626709, 16.89568519592285, 17.564558029174805, 18.233430862426758, 18.902301788330078, 19.57117462158203, 20.240047454833984, 20.908920288085938, 21.577791213989258, 22.24666404724121, 22.915536880493164, 23.584409713745117, 24.25328254699707]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 13.0, 4.0, 13.0, 18.0, 26.0, 52.0, 63.0, 93.0, 185.0, 338.0, 666.0, 1585.0, 5447.0, 37278.0, 441513.0, 509324.0, 42764.0, 5981.0, 1639.0, 704.0, 292.0, 194.0, 126.0, 70.0, 50.0, 30.0, 32.0, 13.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0], "bins": [-50.65625, -49.421630859375, -48.18701171875, -46.952392578125, -45.7177734375, -44.483154296875, -43.24853515625, -42.013916015625, -40.779296875, -39.544677734375, -38.31005859375, -37.075439453125, -35.8408203125, -34.606201171875, -33.37158203125, -32.136962890625, -30.90234375, -29.667724609375, -28.43310546875, -27.198486328125, -25.9638671875, -24.729248046875, -23.49462890625, -22.260009765625, -21.025390625, -19.790771484375, -18.55615234375, -17.321533203125, -16.0869140625, -14.852294921875, -13.61767578125, -12.383056640625, -11.1484375, -9.913818359375, -8.67919921875, -7.444580078125, -6.2099609375, -4.975341796875, -3.74072265625, -2.506103515625, -1.271484375, -0.036865234375, 1.19775390625, 2.432373046875, 3.6669921875, 4.901611328125, 6.13623046875, 7.370849609375, 8.60546875, 9.840087890625, 11.07470703125, 12.309326171875, 13.5439453125, 14.778564453125, 16.01318359375, 17.247802734375, 18.482421875, 19.717041015625, 20.95166015625, 22.186279296875, 23.4208984375, 24.655517578125, 25.89013671875, 27.124755859375, 28.359375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 17.0, 20.0, 42.0, 37.0, 61.0, 91.0, 129.0, 111.0, 114.0, 87.0, 87.0, 59.0, 51.0, 35.0, 23.0, 11.0, 9.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.186248779296875, -3.02679443359375, -2.867340087890625, -2.7078857421875, -2.548431396484375, -2.38897705078125, -2.229522705078125, -2.070068359375, -1.910614013671875, -1.75115966796875, -1.591705322265625, -1.4322509765625, -1.272796630859375, -1.11334228515625, -0.953887939453125, -0.79443359375, -0.634979248046875, -0.47552490234375, -0.316070556640625, -0.1566162109375, 0.002838134765625, 0.16229248046875, 0.321746826171875, 0.481201171875, 0.640655517578125, 0.80010986328125, 0.959564208984375, 1.1190185546875, 1.278472900390625, 1.43792724609375, 1.597381591796875, 1.7568359375, 1.916290283203125, 2.07574462890625, 2.235198974609375, 2.3946533203125, 2.554107666015625, 2.71356201171875, 2.873016357421875, 3.032470703125, 3.191925048828125, 3.35137939453125, 3.510833740234375, 3.6702880859375, 3.829742431640625, 3.98919677734375, 4.148651123046875, 4.30810546875, 4.467559814453125, 4.62701416015625, 4.786468505859375, 4.9459228515625, 5.105377197265625, 5.26483154296875, 5.424285888671875, 5.583740234375, 5.743194580078125, 5.90264892578125, 6.062103271484375, 6.2215576171875, 6.381011962890625, 6.54046630859375, 6.699920654296875, 6.859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 8.0, 5.0, 7.0, 7.0, 14.0, 23.0, 38.0, 62.0, 84.0, 91.0, 167.0, 234.0, 343.0, 587.0, 1180.0, 2756.0, 7887.0, 26492.0, 96854.0, 328316.0, 402681.0, 128377.0, 35601.0, 10078.0, 3421.0, 1393.0, 669.0, 425.0, 241.0, 178.0, 119.0, 68.0, 43.0, 43.0, 24.0, 7.0, 13.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.66943359375, -11.2685546875, -10.86767578125, -10.466796875, -10.06591796875, -9.6650390625, -9.26416015625, -8.86328125, -8.46240234375, -8.0615234375, -7.66064453125, -7.259765625, -6.85888671875, -6.4580078125, -6.05712890625, -5.65625, -5.25537109375, -4.8544921875, -4.45361328125, -4.052734375, -3.65185546875, -3.2509765625, -2.85009765625, -2.44921875, -2.04833984375, -1.6474609375, -1.24658203125, -0.845703125, -0.44482421875, -0.0439453125, 0.35693359375, 0.7578125, 1.15869140625, 1.5595703125, 1.96044921875, 2.361328125, 2.76220703125, 3.1630859375, 3.56396484375, 3.96484375, 4.36572265625, 4.7666015625, 5.16748046875, 5.568359375, 5.96923828125, 6.3701171875, 6.77099609375, 7.171875, 7.57275390625, 7.9736328125, 8.37451171875, 8.775390625, 9.17626953125, 9.5771484375, 9.97802734375, 10.37890625, 10.77978515625, 11.1806640625, 11.58154296875, 11.982421875, 12.38330078125, 12.7841796875, 13.18505859375, 13.5859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 3.0, 9.0, 9.0, 11.0, 13.0, 10.0, 15.0, 20.0, 21.0, 29.0, 31.0, 25.0, 20.0, 30.0, 31.0, 37.0, 29.0, 44.0, 32.0, 31.0, 28.0, 38.0, 34.0, 53.0, 28.0, 31.0, 33.0, 30.0, 25.0, 41.0, 22.0, 22.0, 18.0, 17.0, 20.0, 19.0, 11.0, 19.0, 7.0, 14.0, 2.0, 4.0, 11.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.72265625, -6.495849609375, -6.26904296875, -6.042236328125, -5.8154296875, -5.588623046875, -5.36181640625, -5.135009765625, -4.908203125, -4.681396484375, -4.45458984375, -4.227783203125, -4.0009765625, -3.774169921875, -3.54736328125, -3.320556640625, -3.09375, -2.866943359375, -2.64013671875, -2.413330078125, -2.1865234375, -1.959716796875, -1.73291015625, -1.506103515625, -1.279296875, -1.052490234375, -0.82568359375, -0.598876953125, -0.3720703125, -0.145263671875, 0.08154296875, 0.308349609375, 0.53515625, 0.761962890625, 0.98876953125, 1.215576171875, 1.4423828125, 1.669189453125, 1.89599609375, 2.122802734375, 2.349609375, 2.576416015625, 2.80322265625, 3.030029296875, 3.2568359375, 3.483642578125, 3.71044921875, 3.937255859375, 4.1640625, 4.390869140625, 4.61767578125, 4.844482421875, 5.0712890625, 5.298095703125, 5.52490234375, 5.751708984375, 5.978515625, 6.205322265625, 6.43212890625, 6.658935546875, 6.8857421875, 7.112548828125, 7.33935546875, 7.566162109375, 7.79296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 12.0, 20.0, 14.0, 28.0, 45.0, 70.0, 113.0, 260.0, 557.0, 1748.0, 6195.0, 28932.0, 221458.0, 675841.0, 92545.0, 15163.0, 3688.0, 1066.0, 399.0, 173.0, 78.0, 54.0, 22.0, 23.0, 16.0, 17.0, 11.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.8270263671875, -13.411865234375, -12.9967041015625, -12.58154296875, -12.1663818359375, -11.751220703125, -11.3360595703125, -10.9208984375, -10.5057373046875, -10.090576171875, -9.6754150390625, -9.26025390625, -8.8450927734375, -8.429931640625, -8.0147705078125, -7.599609375, -7.1844482421875, -6.769287109375, -6.3541259765625, -5.93896484375, -5.5238037109375, -5.108642578125, -4.6934814453125, -4.2783203125, -3.8631591796875, -3.447998046875, -3.0328369140625, -2.61767578125, -2.2025146484375, -1.787353515625, -1.3721923828125, -0.95703125, -0.5418701171875, -0.126708984375, 0.2884521484375, 0.70361328125, 1.1187744140625, 1.533935546875, 1.9490966796875, 2.3642578125, 2.7794189453125, 3.194580078125, 3.6097412109375, 4.02490234375, 4.4400634765625, 4.855224609375, 5.2703857421875, 5.685546875, 6.1007080078125, 6.515869140625, 6.9310302734375, 7.34619140625, 7.7613525390625, 8.176513671875, 8.5916748046875, 9.0068359375, 9.4219970703125, 9.837158203125, 10.2523193359375, 10.66748046875, 11.0826416015625, 11.497802734375, 11.9129638671875, 12.328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 5.0, 11.0, 18.0, 20.0, 22.0, 29.0, 47.0, 61.0, 97.0, 156.0, 155.0, 108.0, 71.0, 41.0, 34.0, 29.0, 15.0, 20.0, 12.0, 6.0, 12.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016269683837890625, -0.0015861988067626953, -0.0015454292297363281, -0.001504659652709961, -0.0014638900756835938, -0.0014231204986572266, -0.0013823509216308594, -0.0013415813446044922, -0.001300811767578125, -0.0012600421905517578, -0.0012192726135253906, -0.0011785030364990234, -0.0011377334594726562, -0.001096963882446289, -0.0010561943054199219, -0.0010154247283935547, -0.0009746551513671875, -0.0009338855743408203, -0.0008931159973144531, -0.0008523464202880859, -0.0008115768432617188, -0.0007708072662353516, -0.0007300376892089844, -0.0006892681121826172, -0.00064849853515625, -0.0006077289581298828, -0.0005669593811035156, -0.0005261898040771484, -0.00048542022705078125, -0.00044465065002441406, -0.0004038810729980469, -0.0003631114959716797, -0.0003223419189453125, -0.0002815723419189453, -0.00024080276489257812, -0.00020003318786621094, -0.00015926361083984375, -0.00011849403381347656, -7.772445678710938e-05, -3.695487976074219e-05, 3.814697265625e-06, 4.458427429199219e-05, 8.535385131835938e-05, 0.00012612342834472656, 0.00016689300537109375, 0.00020766258239746094, 0.0002484321594238281, 0.0002892017364501953, 0.0003299713134765625, 0.0003707408905029297, 0.0004115104675292969, 0.00045228004455566406, 0.0004930496215820312, 0.0005338191986083984, 0.0005745887756347656, 0.0006153583526611328, 0.0006561279296875, 0.0006968975067138672, 0.0007376670837402344, 0.0007784366607666016, 0.0008192062377929688, 0.0008599758148193359, 0.0009007453918457031, 0.0009415149688720703, 0.0009822845458984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 18.0, 22.0, 23.0, 53.0, 75.0, 119.0, 232.0, 562.0, 1678.0, 6554.0, 35321.0, 407865.0, 540351.0, 44605.0, 7754.0, 1991.0, 670.0, 281.0, 154.0, 75.0, 59.0, 32.0, 16.0, 13.0, 5.0, 6.0, 5.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.6875, -17.1829833984375, -16.678466796875, -16.1739501953125, -15.66943359375, -15.1649169921875, -14.660400390625, -14.1558837890625, -13.6513671875, -13.1468505859375, -12.642333984375, -12.1378173828125, -11.63330078125, -11.1287841796875, -10.624267578125, -10.1197509765625, -9.615234375, -9.1107177734375, -8.606201171875, -8.1016845703125, -7.59716796875, -7.0926513671875, -6.588134765625, -6.0836181640625, -5.5791015625, -5.0745849609375, -4.570068359375, -4.0655517578125, -3.56103515625, -3.0565185546875, -2.552001953125, -2.0474853515625, -1.54296875, -1.0384521484375, -0.533935546875, -0.0294189453125, 0.47509765625, 0.9796142578125, 1.484130859375, 1.9886474609375, 2.4931640625, 2.9976806640625, 3.502197265625, 4.0067138671875, 4.51123046875, 5.0157470703125, 5.520263671875, 6.0247802734375, 6.529296875, 7.0338134765625, 7.538330078125, 8.0428466796875, 8.54736328125, 9.0518798828125, 9.556396484375, 10.0609130859375, 10.5654296875, 11.0699462890625, 11.574462890625, 12.0789794921875, 12.58349609375, 13.0880126953125, 13.592529296875, 14.0970458984375, 14.6015625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 5.0, 4.0, 13.0, 6.0, 13.0, 12.0, 25.0, 31.0, 42.0, 51.0, 65.0, 86.0, 122.0, 126.0, 85.0, 89.0, 53.0, 43.0, 35.0, 18.0, 22.0, 9.0, 15.0, 7.0, 8.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -4.98333740234375, -4.7674560546875, -4.55157470703125, -4.335693359375, -4.11981201171875, -3.9039306640625, -3.68804931640625, -3.47216796875, -3.25628662109375, -3.0404052734375, -2.82452392578125, -2.608642578125, -2.39276123046875, -2.1768798828125, -1.96099853515625, -1.7451171875, -1.52923583984375, -1.3133544921875, -1.09747314453125, -0.881591796875, -0.66571044921875, -0.4498291015625, -0.23394775390625, -0.01806640625, 0.19781494140625, 0.4136962890625, 0.62957763671875, 0.845458984375, 1.06134033203125, 1.2772216796875, 1.49310302734375, 1.708984375, 1.92486572265625, 2.1407470703125, 2.35662841796875, 2.572509765625, 2.78839111328125, 3.0042724609375, 3.22015380859375, 3.43603515625, 3.65191650390625, 3.8677978515625, 4.08367919921875, 4.299560546875, 4.51544189453125, 4.7313232421875, 4.94720458984375, 5.1630859375, 5.37896728515625, 5.5948486328125, 5.81072998046875, 6.026611328125, 6.24249267578125, 6.4583740234375, 6.67425537109375, 6.89013671875, 7.10601806640625, 7.3218994140625, 7.53778076171875, 7.753662109375, 7.96954345703125, 8.1854248046875, 8.40130615234375, 8.6171875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 8.0, 12.0, 27.0, 41.0, 66.0, 108.0, 129.0, 162.0, 157.0, 117.0, 71.0, 49.0, 22.0, 15.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.517333984375, -57.0521354675293, -53.586936950683594, -50.121742248535156, -46.65654373168945, -43.19134521484375, -39.72614669799805, -36.260948181152344, -32.795753479003906, -29.330554962158203, -25.865358352661133, -22.40015983581543, -18.93496322631836, -15.469764709472656, -12.004566192626953, -8.539369583129883, -5.074169158935547, -1.608971357345581, 1.8562264442443848, 5.32142448425293, 8.786622047424316, 12.251819610595703, 15.717018127441406, 19.182214736938477, 22.64741325378418, 26.112611770629883, 29.577808380126953, 33.043006896972656, 36.50820541381836, 39.97340393066406, 43.4385986328125, 46.9037971496582, 50.368995666503906, 53.83419418334961, 57.29939270019531, 60.76458740234375, 64.22978973388672, 67.69498443603516, 71.16018676757812, 74.62538146972656, 78.090576171875, 81.55577087402344, 85.0209732055664, 88.48616790771484, 91.95137023925781, 95.41656494140625, 98.88175964355469, 102.34696197509766, 105.81216430664062, 109.27735900878906, 112.74256134033203, 116.20775604248047, 119.67295837402344, 123.13815307617188, 126.60334777832031, 130.06854248046875, 133.5337371826172, 136.99893188476562, 140.46412658691406, 143.92933654785156, 147.39453125, 150.85972595214844, 154.32492065429688, 157.7901153564453, 161.2553253173828]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 6.0, 7.0, 6.0, 10.0, 10.0, 21.0, 17.0, 24.0, 22.0, 22.0, 25.0, 31.0, 26.0, 32.0, 34.0, 33.0, 46.0, 33.0, 29.0, 38.0, 36.0, 43.0, 48.0, 37.0, 35.0, 27.0, 38.0, 36.0, 30.0, 17.0, 28.0, 12.0, 21.0, 15.0, 15.0, 14.0, 5.0, 10.0, 8.0, 5.0, 7.0, 4.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-41.34233093261719, -40.033485412597656, -38.72464370727539, -37.41579818725586, -36.106956481933594, -34.79811096191406, -33.48926544189453, -32.180423736572266, -30.871578216552734, -29.562734603881836, -28.253890991210938, -26.945045471191406, -25.636201858520508, -24.32735824584961, -23.01851463317871, -21.709671020507812, -20.400827407836914, -19.091983795166016, -17.783140182495117, -16.47429656982422, -15.165451049804688, -13.856607437133789, -12.54776382446289, -11.238919258117676, -9.930075645446777, -8.621232032775879, -7.312387466430664, -6.003543853759766, -4.694699764251709, -3.3858556747436523, -2.077012062072754, -0.7681674957275391, 0.5406761169433594, 1.8495200872421265, 3.1583640575408936, 4.467207908630371, 5.776051998138428, 7.084896087646484, 8.393739700317383, 9.702584266662598, 11.011427879333496, 12.320271492004395, 13.62911605834961, 14.937959671020508, 16.246803283691406, 17.555648803710938, 18.864490509033203, 20.173336029052734, 21.482179641723633, 22.79102325439453, 24.09986686706543, 25.408710479736328, 26.71755599975586, 28.026399612426758, 29.335243225097656, 30.644088745117188, 31.952930450439453, 33.261775970458984, 34.57061767578125, 35.87946319580078, 37.18830490112305, 38.49715042114258, 39.805992126464844, 41.114837646484375, 42.423683166503906]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 16.0, 11.0, 8.0, 41.0, 49.0, 73.0, 105.0, 204.0, 355.0, 751.0, 1644.0, 4582.0, 20646.0, 210670.0, 3787669.0, 144107.0, 16275.0, 3984.0, 1392.0, 651.0, 324.0, 216.0, 145.0, 92.0, 67.0, 58.0, 28.0, 17.0, 21.0, 16.0, 6.0, 7.0, 9.0, 3.0, 5.0, 6.0, 3.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.8125, -30.455078125, -29.09765625, -27.740234375, -26.3828125, -25.025390625, -23.66796875, -22.310546875, -20.953125, -19.595703125, -18.23828125, -16.880859375, -15.5234375, -14.166015625, -12.80859375, -11.451171875, -10.09375, -8.736328125, -7.37890625, -6.021484375, -4.6640625, -3.306640625, -1.94921875, -0.591796875, 0.765625, 2.123046875, 3.48046875, 4.837890625, 6.1953125, 7.552734375, 8.91015625, 10.267578125, 11.625, 12.982421875, 14.33984375, 15.697265625, 17.0546875, 18.412109375, 19.76953125, 21.126953125, 22.484375, 23.841796875, 25.19921875, 26.556640625, 27.9140625, 29.271484375, 30.62890625, 31.986328125, 33.34375, 34.701171875, 36.05859375, 37.416015625, 38.7734375, 40.130859375, 41.48828125, 42.845703125, 44.203125, 45.560546875, 46.91796875, 48.275390625, 49.6328125, 50.990234375, 52.34765625, 53.705078125, 55.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 19.0, 23.0, 33.0, 41.0, 68.0, 79.0, 116.0, 125.0, 103.0, 90.0, 95.0, 65.0, 55.0, 32.0, 22.0, 8.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37890625, -3.21807861328125, -3.0572509765625, -2.89642333984375, -2.735595703125, -2.57476806640625, -2.4139404296875, -2.25311279296875, -2.09228515625, -1.93145751953125, -1.7706298828125, -1.60980224609375, -1.448974609375, -1.28814697265625, -1.1273193359375, -0.96649169921875, -0.8056640625, -0.64483642578125, -0.4840087890625, -0.32318115234375, -0.162353515625, -0.00152587890625, 0.1593017578125, 0.32012939453125, 0.48095703125, 0.64178466796875, 0.8026123046875, 0.96343994140625, 1.124267578125, 1.28509521484375, 1.4459228515625, 1.60675048828125, 1.767578125, 1.92840576171875, 2.0892333984375, 2.25006103515625, 2.410888671875, 2.57171630859375, 2.7325439453125, 2.89337158203125, 3.05419921875, 3.21502685546875, 3.3758544921875, 3.53668212890625, 3.697509765625, 3.85833740234375, 4.0191650390625, 4.17999267578125, 4.3408203125, 4.50164794921875, 4.6624755859375, 4.82330322265625, 4.984130859375, 5.14495849609375, 5.3057861328125, 5.46661376953125, 5.62744140625, 5.78826904296875, 5.9490966796875, 6.10992431640625, 6.270751953125, 6.43157958984375, 6.5924072265625, 6.75323486328125, 6.9140625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 5.0, 9.0, 6.0, 20.0, 18.0, 18.0, 19.0, 43.0, 63.0, 108.0, 131.0, 270.0, 519.0, 1108.0, 3176.0, 11418.0, 53983.0, 415936.0, 3319884.0, 327402.0, 45297.0, 9771.0, 2831.0, 1067.0, 446.0, 245.0, 146.0, 97.0, 73.0, 48.0, 36.0, 24.0, 18.0, 11.0, 10.0, 11.0, 5.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.953125, -26.2333984375, -25.513671875, -24.7939453125, -24.07421875, -23.3544921875, -22.634765625, -21.9150390625, -21.1953125, -20.4755859375, -19.755859375, -19.0361328125, -18.31640625, -17.5966796875, -16.876953125, -16.1572265625, -15.4375, -14.7177734375, -13.998046875, -13.2783203125, -12.55859375, -11.8388671875, -11.119140625, -10.3994140625, -9.6796875, -8.9599609375, -8.240234375, -7.5205078125, -6.80078125, -6.0810546875, -5.361328125, -4.6416015625, -3.921875, -3.2021484375, -2.482421875, -1.7626953125, -1.04296875, -0.3232421875, 0.396484375, 1.1162109375, 1.8359375, 2.5556640625, 3.275390625, 3.9951171875, 4.71484375, 5.4345703125, 6.154296875, 6.8740234375, 7.59375, 8.3134765625, 9.033203125, 9.7529296875, 10.47265625, 11.1923828125, 11.912109375, 12.6318359375, 13.3515625, 14.0712890625, 14.791015625, 15.5107421875, 16.23046875, 16.9501953125, 17.669921875, 18.3896484375, 19.109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 9.0, 9.0, 17.0, 32.0, 35.0, 81.0, 115.0, 243.0, 466.0, 1363.0, 889.0, 358.0, 191.0, 123.0, 55.0, 36.0, 15.0, 19.0, 7.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.42327880859375, -5.1004638671875, -4.77764892578125, -4.454833984375, -4.13201904296875, -3.8092041015625, -3.48638916015625, -3.16357421875, -2.84075927734375, -2.5179443359375, -2.19512939453125, -1.872314453125, -1.54949951171875, -1.2266845703125, -0.90386962890625, -0.5810546875, -0.25823974609375, 0.0645751953125, 0.38739013671875, 0.710205078125, 1.03302001953125, 1.3558349609375, 1.67864990234375, 2.00146484375, 2.32427978515625, 2.6470947265625, 2.96990966796875, 3.292724609375, 3.61553955078125, 3.9383544921875, 4.26116943359375, 4.583984375, 4.90679931640625, 5.2296142578125, 5.55242919921875, 5.875244140625, 6.19805908203125, 6.5208740234375, 6.84368896484375, 7.16650390625, 7.48931884765625, 7.8121337890625, 8.13494873046875, 8.457763671875, 8.78057861328125, 9.1033935546875, 9.42620849609375, 9.7490234375, 10.07183837890625, 10.3946533203125, 10.71746826171875, 11.040283203125, 11.36309814453125, 11.6859130859375, 12.00872802734375, 12.33154296875, 12.65435791015625, 12.9771728515625, 13.29998779296875, 13.622802734375, 13.94561767578125, 14.2684326171875, 14.59124755859375, 14.9140625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 1.0, 7.0, 2.0, 12.0, 10.0, 19.0, 19.0, 24.0, 38.0, 47.0, 59.0, 70.0, 84.0, 79.0, 94.0, 86.0, 89.0, 79.0, 61.0, 40.0, 22.0, 20.0, 15.0, 12.0, 8.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.11328887939453, -33.76093673706055, -32.40858840942383, -31.056236267089844, -29.70388412475586, -28.351533889770508, -26.999183654785156, -25.646831512451172, -24.29448127746582, -22.94213104248047, -21.589778900146484, -20.237428665161133, -18.88507843017578, -17.532726287841797, -16.180376052856445, -14.828024864196777, -13.47567367553711, -12.123322486877441, -10.770971298217773, -9.418621063232422, -8.066269874572754, -6.713918685913086, -5.361568450927734, -4.009217262268066, -2.6568660736083984, -1.3045151233673096, 0.0478358268737793, 1.400186538696289, 2.752537727355957, 4.104888916015625, 5.457239151000977, 6.8095903396606445, 8.161941528320312, 9.51429271697998, 10.866643905639648, 12.218994140625, 13.571345329284668, 14.923696517944336, 16.276046752929688, 17.628398895263672, 18.980749130249023, 20.333099365234375, 21.68545150756836, 23.03780174255371, 24.390151977539062, 25.742504119873047, 27.0948543548584, 28.44720458984375, 29.799556732177734, 31.151906967163086, 32.50425720214844, 33.85660934448242, 35.208961486816406, 36.561309814453125, 37.91366195678711, 39.266014099121094, 40.61836242675781, 41.9707145690918, 43.323062896728516, 44.6754150390625, 46.027767181396484, 47.38011932373047, 48.73246765136719, 50.08481979370117, 51.437171936035156]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 9.0, 6.0, 14.0, 17.0, 14.0, 21.0, 22.0, 27.0, 29.0, 40.0, 47.0, 32.0, 45.0, 44.0, 40.0, 56.0, 37.0, 38.0, 48.0, 39.0, 37.0, 42.0, 38.0, 46.0, 32.0, 27.0, 22.0, 16.0, 21.0, 9.0, 15.0, 10.0, 9.0, 11.0, 10.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.292917251586914, -22.46396255493164, -21.635007858276367, -20.806053161621094, -19.977100372314453, -19.148143768310547, -18.319190979003906, -17.490236282348633, -16.66128158569336, -15.832326889038086, -15.003372192382812, -14.174418449401855, -13.345463752746582, -12.516509056091309, -11.687555313110352, -10.858600616455078, -10.029645919799805, -9.200691223144531, -8.371736526489258, -7.542782783508301, -6.713828086853027, -5.884873390197754, -5.055919170379639, -4.226964950561523, -3.39801025390625, -2.5690557956695557, -1.7401013374328613, -0.911146879196167, -0.08219242095947266, 0.7467622756958008, 1.575716495513916, 2.4046707153320312, 3.233623504638672, 4.062578201293945, 4.8915324211120605, 5.720486640930176, 6.549441337585449, 7.378396034240723, 8.20734977722168, 9.036304473876953, 9.865259170532227, 10.6942138671875, 11.523168563842773, 12.35212230682373, 13.181077003479004, 14.010031700134277, 14.838985443115234, 15.667940139770508, 16.49689483642578, 17.325849533081055, 18.154804229736328, 18.9837589263916, 19.812713623046875, 20.641666412353516, 21.47062110900879, 22.299575805664062, 23.128530502319336, 23.95748519897461, 24.786439895629883, 25.615394592285156, 26.444347381591797, 27.273303985595703, 28.102256774902344, 28.931211471557617, 29.76016616821289]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 9.0, 12.0, 18.0, 36.0, 52.0, 67.0, 105.0, 196.0, 377.0, 786.0, 2151.0, 10022.0, 88933.0, 831478.0, 99485.0, 10835.0, 2286.0, 797.0, 375.0, 215.0, 109.0, 66.0, 31.0, 34.0, 22.0, 8.0, 17.0, 3.0, 2.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.125, -39.73193359375, -38.3388671875, -36.94580078125, -35.552734375, -34.15966796875, -32.7666015625, -31.37353515625, -29.98046875, -28.58740234375, -27.1943359375, -25.80126953125, -24.408203125, -23.01513671875, -21.6220703125, -20.22900390625, -18.8359375, -17.44287109375, -16.0498046875, -14.65673828125, -13.263671875, -11.87060546875, -10.4775390625, -9.08447265625, -7.69140625, -6.29833984375, -4.9052734375, -3.51220703125, -2.119140625, -0.72607421875, 0.6669921875, 2.06005859375, 3.453125, 4.84619140625, 6.2392578125, 7.63232421875, 9.025390625, 10.41845703125, 11.8115234375, 13.20458984375, 14.59765625, 15.99072265625, 17.3837890625, 18.77685546875, 20.169921875, 21.56298828125, 22.9560546875, 24.34912109375, 25.7421875, 27.13525390625, 28.5283203125, 29.92138671875, 31.314453125, 32.70751953125, 34.1005859375, 35.49365234375, 36.88671875, 38.27978515625, 39.6728515625, 41.06591796875, 42.458984375, 43.85205078125, 45.2451171875, 46.63818359375, 48.03125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 18.0, 20.0, 38.0, 55.0, 62.0, 97.0, 107.0, 113.0, 123.0, 105.0, 76.0, 69.0, 43.0, 32.0, 6.0, 12.0, 11.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.880859375, -3.710357666015625, -3.53985595703125, -3.369354248046875, -3.1988525390625, -3.028350830078125, -2.85784912109375, -2.687347412109375, -2.516845703125, -2.346343994140625, -2.17584228515625, -2.005340576171875, -1.8348388671875, -1.664337158203125, -1.49383544921875, -1.323333740234375, -1.15283203125, -0.982330322265625, -0.81182861328125, -0.641326904296875, -0.4708251953125, -0.300323486328125, -0.12982177734375, 0.040679931640625, 0.211181640625, 0.381683349609375, 0.55218505859375, 0.722686767578125, 0.8931884765625, 1.063690185546875, 1.23419189453125, 1.404693603515625, 1.5751953125, 1.745697021484375, 1.91619873046875, 2.086700439453125, 2.2572021484375, 2.427703857421875, 2.59820556640625, 2.768707275390625, 2.939208984375, 3.109710693359375, 3.28021240234375, 3.450714111328125, 3.6212158203125, 3.791717529296875, 3.96221923828125, 4.132720947265625, 4.30322265625, 4.473724365234375, 4.64422607421875, 4.814727783203125, 4.9852294921875, 5.155731201171875, 5.32623291015625, 5.496734619140625, 5.667236328125, 5.837738037109375, 6.00823974609375, 6.178741455078125, 6.3492431640625, 6.519744873046875, 6.69024658203125, 6.860748291015625, 7.03125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 5.0, 5.0, 7.0, 11.0, 10.0, 15.0, 19.0, 37.0, 42.0, 61.0, 80.0, 100.0, 148.0, 193.0, 326.0, 498.0, 855.0, 1573.0, 3618.0, 8902.0, 23910.0, 69676.0, 250168.0, 504110.0, 119490.0, 39920.0, 13931.0, 5548.0, 2350.0, 1063.0, 660.0, 337.0, 252.0, 160.0, 150.0, 87.0, 66.0, 50.0, 43.0, 25.0, 22.0, 8.0, 9.0, 8.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25, -11.8699951171875, -11.489990234375, -11.1099853515625, -10.72998046875, -10.3499755859375, -9.969970703125, -9.5899658203125, -9.2099609375, -8.8299560546875, -8.449951171875, -8.0699462890625, -7.68994140625, -7.3099365234375, -6.929931640625, -6.5499267578125, -6.169921875, -5.7899169921875, -5.409912109375, -5.0299072265625, -4.64990234375, -4.2698974609375, -3.889892578125, -3.5098876953125, -3.1298828125, -2.7498779296875, -2.369873046875, -1.9898681640625, -1.60986328125, -1.2298583984375, -0.849853515625, -0.4698486328125, -0.08984375, 0.2901611328125, 0.670166015625, 1.0501708984375, 1.43017578125, 1.8101806640625, 2.190185546875, 2.5701904296875, 2.9501953125, 3.3302001953125, 3.710205078125, 4.0902099609375, 4.47021484375, 4.8502197265625, 5.230224609375, 5.6102294921875, 5.990234375, 6.3702392578125, 6.750244140625, 7.1302490234375, 7.51025390625, 7.8902587890625, 8.270263671875, 8.6502685546875, 9.0302734375, 9.4102783203125, 9.790283203125, 10.1702880859375, 10.55029296875, 10.9302978515625, 11.310302734375, 11.6903076171875, 12.0703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 11.0, 12.0, 15.0, 19.0, 23.0, 39.0, 26.0, 39.0, 40.0, 44.0, 38.0, 55.0, 44.0, 50.0, 60.0, 49.0, 40.0, 53.0, 48.0, 34.0, 46.0, 36.0, 25.0, 33.0, 27.0, 15.0, 21.0, 10.0, 15.0, 8.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.390625, -8.0714111328125, -7.752197265625, -7.4329833984375, -7.11376953125, -6.7945556640625, -6.475341796875, -6.1561279296875, -5.8369140625, -5.5177001953125, -5.198486328125, -4.8792724609375, -4.56005859375, -4.2408447265625, -3.921630859375, -3.6024169921875, -3.283203125, -2.9639892578125, -2.644775390625, -2.3255615234375, -2.00634765625, -1.6871337890625, -1.367919921875, -1.0487060546875, -0.7294921875, -0.4102783203125, -0.091064453125, 0.2281494140625, 0.54736328125, 0.8665771484375, 1.185791015625, 1.5050048828125, 1.82421875, 2.1434326171875, 2.462646484375, 2.7818603515625, 3.10107421875, 3.4202880859375, 3.739501953125, 4.0587158203125, 4.3779296875, 4.6971435546875, 5.016357421875, 5.3355712890625, 5.65478515625, 5.9739990234375, 6.293212890625, 6.6124267578125, 6.931640625, 7.2508544921875, 7.570068359375, 7.8892822265625, 8.20849609375, 8.5277099609375, 8.846923828125, 9.1661376953125, 9.4853515625, 9.8045654296875, 10.123779296875, 10.4429931640625, 10.76220703125, 11.0814208984375, 11.400634765625, 11.7198486328125, 12.0390625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 9.0, 3.0, 5.0, 16.0, 13.0, 19.0, 27.0, 43.0, 55.0, 86.0, 160.0, 310.0, 682.0, 1611.0, 4617.0, 14834.0, 58425.0, 394976.0, 479008.0, 68387.0, 16743.0, 5250.0, 1777.0, 700.0, 329.0, 160.0, 68.0, 69.0, 41.0, 30.0, 29.0, 12.0, 12.0, 8.0, 10.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.7109375, -8.46240234375, -8.2138671875, -7.96533203125, -7.716796875, -7.46826171875, -7.2197265625, -6.97119140625, -6.72265625, -6.47412109375, -6.2255859375, -5.97705078125, -5.728515625, -5.47998046875, -5.2314453125, -4.98291015625, -4.734375, -4.48583984375, -4.2373046875, -3.98876953125, -3.740234375, -3.49169921875, -3.2431640625, -2.99462890625, -2.74609375, -2.49755859375, -2.2490234375, -2.00048828125, -1.751953125, -1.50341796875, -1.2548828125, -1.00634765625, -0.7578125, -0.50927734375, -0.2607421875, -0.01220703125, 0.236328125, 0.48486328125, 0.7333984375, 0.98193359375, 1.23046875, 1.47900390625, 1.7275390625, 1.97607421875, 2.224609375, 2.47314453125, 2.7216796875, 2.97021484375, 3.21875, 3.46728515625, 3.7158203125, 3.96435546875, 4.212890625, 4.46142578125, 4.7099609375, 4.95849609375, 5.20703125, 5.45556640625, 5.7041015625, 5.95263671875, 6.201171875, 6.44970703125, 6.6982421875, 6.94677734375, 7.1953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 1.0, 6.0, 4.0, 14.0, 9.0, 13.0, 11.0, 21.0, 16.0, 27.0, 35.0, 67.0, 115.0, 220.0, 189.0, 64.0, 39.0, 33.0, 21.0, 21.0, 6.0, 12.0, 12.0, 11.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0015316009521484375, -0.001493014395236969, -0.0014544278383255005, -0.001415841281414032, -0.0013772547245025635, -0.001338668167591095, -0.0013000816106796265, -0.001261495053768158, -0.0012229084968566895, -0.001184321939945221, -0.0011457353830337524, -0.001107148826122284, -0.0010685622692108154, -0.001029975712299347, -0.0009913891553878784, -0.0009528025984764099, -0.0009142160415649414, -0.0008756294846534729, -0.0008370429277420044, -0.0007984563708305359, -0.0007598698139190674, -0.0007212832570075989, -0.0006826967000961304, -0.0006441101431846619, -0.0006055235862731934, -0.0005669370293617249, -0.0005283504724502563, -0.0004897639155387878, -0.00045117735862731934, -0.00041259080171585083, -0.0003740042448043823, -0.0003354176878929138, -0.0002968311309814453, -0.0002582445740699768, -0.0002196580171585083, -0.0001810714602470398, -0.0001424849033355713, -0.00010389834642410278, -6.531178951263428e-05, -2.672523260116577e-05, 1.1861324310302734e-05, 5.044788122177124e-05, 8.903443813323975e-05, 0.00012762099504470825, 0.00016620755195617676, 0.00020479410886764526, 0.00024338066577911377, 0.0002819672226905823, 0.0003205537796020508, 0.0003591403365135193, 0.0003977268934249878, 0.0004363134503364563, 0.0004749000072479248, 0.0005134865641593933, 0.0005520731210708618, 0.0005906596779823303, 0.0006292462348937988, 0.0006678327918052673, 0.0007064193487167358, 0.0007450059056282043, 0.0007835924625396729, 0.0008221790194511414, 0.0008607655763626099, 0.0008993521332740784, 0.0009379386901855469]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 4.0, 5.0, 23.0, 27.0, 36.0, 62.0, 104.0, 181.0, 302.0, 667.0, 1513.0, 4067.0, 14047.0, 66311.0, 563851.0, 336773.0, 44759.0, 10198.0, 3193.0, 1160.0, 551.0, 266.0, 161.0, 111.0, 56.0, 33.0, 26.0, 20.0, 18.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-10.6171875, -10.329345703125, -10.04150390625, -9.753662109375, -9.4658203125, -9.177978515625, -8.89013671875, -8.602294921875, -8.314453125, -8.026611328125, -7.73876953125, -7.450927734375, -7.1630859375, -6.875244140625, -6.58740234375, -6.299560546875, -6.01171875, -5.723876953125, -5.43603515625, -5.148193359375, -4.8603515625, -4.572509765625, -4.28466796875, -3.996826171875, -3.708984375, -3.421142578125, -3.13330078125, -2.845458984375, -2.5576171875, -2.269775390625, -1.98193359375, -1.694091796875, -1.40625, -1.118408203125, -0.83056640625, -0.542724609375, -0.2548828125, 0.032958984375, 0.32080078125, 0.608642578125, 0.896484375, 1.184326171875, 1.47216796875, 1.760009765625, 2.0478515625, 2.335693359375, 2.62353515625, 2.911376953125, 3.19921875, 3.487060546875, 3.77490234375, 4.062744140625, 4.3505859375, 4.638427734375, 4.92626953125, 5.214111328125, 5.501953125, 5.789794921875, 6.07763671875, 6.365478515625, 6.6533203125, 6.941162109375, 7.22900390625, 7.516845703125, 7.8046875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 6.0, 0.0, 7.0, 3.0, 2.0, 10.0, 13.0, 17.0, 24.0, 22.0, 48.0, 57.0, 80.0, 130.0, 171.0, 132.0, 76.0, 56.0, 32.0, 33.0, 26.0, 20.0, 12.0, 14.0, 3.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-7.76953125, -7.591217041015625, -7.41290283203125, -7.234588623046875, -7.0562744140625, -6.877960205078125, -6.69964599609375, -6.521331787109375, -6.343017578125, -6.164703369140625, -5.98638916015625, -5.808074951171875, -5.6297607421875, -5.451446533203125, -5.27313232421875, -5.094818115234375, -4.91650390625, -4.738189697265625, -4.55987548828125, -4.381561279296875, -4.2032470703125, -4.024932861328125, -3.84661865234375, -3.668304443359375, -3.489990234375, -3.311676025390625, -3.13336181640625, -2.955047607421875, -2.7767333984375, -2.598419189453125, -2.42010498046875, -2.241790771484375, -2.0634765625, -1.885162353515625, -1.70684814453125, -1.528533935546875, -1.3502197265625, -1.171905517578125, -0.99359130859375, -0.815277099609375, -0.636962890625, -0.458648681640625, -0.28033447265625, -0.102020263671875, 0.0762939453125, 0.254608154296875, 0.43292236328125, 0.611236572265625, 0.78955078125, 0.967864990234375, 1.14617919921875, 1.324493408203125, 1.5028076171875, 1.681121826171875, 1.85943603515625, 2.037750244140625, 2.216064453125, 2.394378662109375, 2.57269287109375, 2.751007080078125, 2.9293212890625, 3.107635498046875, 3.28594970703125, 3.464263916015625, 3.642578125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 11.0, 18.0, 40.0, 98.0, 147.0, 208.0, 189.0, 132.0, 89.0, 41.0, 20.0, 9.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.54129028320312, -113.21691131591797, -108.89253234863281, -104.56814575195312, -100.24376678466797, -95.91938781738281, -91.59500122070312, -87.27062225341797, -82.94624328613281, -78.62186431884766, -74.2974853515625, -69.97309875488281, -65.64871978759766, -61.3243408203125, -56.99995803833008, -52.675575256347656, -48.3511962890625, -44.026817321777344, -39.70243453979492, -35.3780517578125, -31.053672790527344, -26.729291915893555, -22.404911041259766, -18.080530166625977, -13.756149291992188, -9.431768417358398, -5.107387542724609, -0.7830066680908203, 3.5413742065429688, 7.865755081176758, 12.190135955810547, 16.514516830444336, 20.838882446289062, 25.16326332092285, 29.48764419555664, 33.81202697753906, 38.13640594482422, 42.460784912109375, 46.7851676940918, 51.10955047607422, 55.433929443359375, 59.75830841064453, 64.08268737792969, 68.40707397460938, 72.73145294189453, 77.05583190917969, 81.38021850585938, 85.70459747314453, 90.02897644042969, 94.35335540771484, 98.677734375, 103.00212097167969, 107.32649993896484, 111.65087890625, 115.97526550292969, 120.29964447021484, 124.6240234375, 128.9484100341797, 133.2727813720703, 137.59716796875, 141.92153930664062, 146.2459259033203, 150.5703125, 154.89468383789062, 159.2190704345703]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 10.0, 12.0, 17.0, 21.0, 22.0, 19.0, 16.0, 17.0, 31.0, 36.0, 42.0, 42.0, 29.0, 35.0, 45.0, 39.0, 42.0, 39.0, 53.0, 40.0, 36.0, 38.0, 32.0, 32.0, 24.0, 27.0, 22.0, 23.0, 24.0, 17.0, 24.0, 12.0, 12.0, 11.0, 6.0, 8.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.39265441894531, -42.098670959472656, -40.8046875, -39.510704040527344, -38.21672058105469, -36.922733306884766, -35.62874984741211, -34.33476638793945, -33.0407829284668, -31.74679946899414, -30.452816009521484, -29.158830642700195, -27.86484718322754, -26.570863723754883, -25.276878356933594, -23.982894897460938, -22.68891143798828, -21.394927978515625, -20.10094451904297, -18.80695915222168, -17.512975692749023, -16.218992233276367, -14.925007820129395, -13.631023406982422, -12.337039947509766, -11.04305648803711, -9.749072074890137, -8.455087661743164, -7.161104202270508, -5.867120265960693, -4.573136329650879, -3.2791519165039062, -1.98516845703125, -0.6911845207214355, 0.6027994155883789, 1.8967833518981934, 3.190767288208008, 4.484751224517822, 5.778735160827637, 7.072719573974609, 8.366703033447266, 9.660686492919922, 10.954670906066895, 12.248655319213867, 13.542638778686523, 14.83662223815918, 16.13060760498047, 17.424591064453125, 18.71857452392578, 20.012557983398438, 21.306541442871094, 22.600526809692383, 23.89451026916504, 25.188493728637695, 26.482479095458984, 27.77646255493164, 29.070446014404297, 30.364429473876953, 31.65841293334961, 32.952396392822266, 34.24638366699219, 35.540367126464844, 36.8343505859375, 38.128334045410156, 39.42231750488281]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 12.0, 23.0, 30.0, 57.0, 111.0, 206.0, 438.0, 1015.0, 3434.0, 20672.0, 603760.0, 3525151.0, 32386.0, 4549.0, 1268.0, 527.0, 241.0, 124.0, 71.0, 63.0, 42.0, 25.0, 15.0, 14.0, 12.0, 7.0, 9.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.3125, -37.3564453125, -35.400390625, -33.4443359375, -31.48828125, -29.5322265625, -27.576171875, -25.6201171875, -23.6640625, -21.7080078125, -19.751953125, -17.7958984375, -15.83984375, -13.8837890625, -11.927734375, -9.9716796875, -8.015625, -6.0595703125, -4.103515625, -2.1474609375, -0.19140625, 1.7646484375, 3.720703125, 5.6767578125, 7.6328125, 9.5888671875, 11.544921875, 13.5009765625, 15.45703125, 17.4130859375, 19.369140625, 21.3251953125, 23.28125, 25.2373046875, 27.193359375, 29.1494140625, 31.10546875, 33.0615234375, 35.017578125, 36.9736328125, 38.9296875, 40.8857421875, 42.841796875, 44.7978515625, 46.75390625, 48.7099609375, 50.666015625, 52.6220703125, 54.578125, 56.5341796875, 58.490234375, 60.4462890625, 62.40234375, 64.3583984375, 66.314453125, 68.2705078125, 70.2265625, 72.1826171875, 74.138671875, 76.0947265625, 78.05078125, 80.0068359375, 81.962890625, 83.9189453125, 85.875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 15.0, 22.0, 23.0, 35.0, 47.0, 90.0, 86.0, 106.0, 111.0, 115.0, 94.0, 70.0, 55.0, 55.0, 24.0, 18.0, 9.0, 10.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.615631103515625, -3.44805908203125, -3.280487060546875, -3.1129150390625, -2.945343017578125, -2.77777099609375, -2.610198974609375, -2.442626953125, -2.275054931640625, -2.10748291015625, -1.939910888671875, -1.7723388671875, -1.604766845703125, -1.43719482421875, -1.269622802734375, -1.10205078125, -0.934478759765625, -0.76690673828125, -0.599334716796875, -0.4317626953125, -0.264190673828125, -0.09661865234375, 0.070953369140625, 0.238525390625, 0.406097412109375, 0.57366943359375, 0.741241455078125, 0.9088134765625, 1.076385498046875, 1.24395751953125, 1.411529541015625, 1.5791015625, 1.746673583984375, 1.91424560546875, 2.081817626953125, 2.2493896484375, 2.416961669921875, 2.58453369140625, 2.752105712890625, 2.919677734375, 3.087249755859375, 3.25482177734375, 3.422393798828125, 3.5899658203125, 3.757537841796875, 3.92510986328125, 4.092681884765625, 4.26025390625, 4.427825927734375, 4.59539794921875, 4.762969970703125, 4.9305419921875, 5.098114013671875, 5.26568603515625, 5.433258056640625, 5.600830078125, 5.768402099609375, 5.93597412109375, 6.103546142578125, 6.2711181640625, 6.438690185546875, 6.60626220703125, 6.773834228515625, 6.94140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 1.0, 6.0, 5.0, 6.0, 9.0, 20.0, 19.0, 20.0, 42.0, 61.0, 81.0, 118.0, 217.0, 407.0, 794.0, 1990.0, 5424.0, 17762.0, 71384.0, 479924.0, 3313200.0, 238441.0, 45280.0, 12128.0, 3925.0, 1572.0, 630.0, 322.0, 186.0, 104.0, 60.0, 34.0, 26.0, 22.0, 13.0, 11.0, 8.0, 9.0, 10.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.4150390625, -18.705078125, -17.9951171875, -17.28515625, -16.5751953125, -15.865234375, -15.1552734375, -14.4453125, -13.7353515625, -13.025390625, -12.3154296875, -11.60546875, -10.8955078125, -10.185546875, -9.4755859375, -8.765625, -8.0556640625, -7.345703125, -6.6357421875, -5.92578125, -5.2158203125, -4.505859375, -3.7958984375, -3.0859375, -2.3759765625, -1.666015625, -0.9560546875, -0.24609375, 0.4638671875, 1.173828125, 1.8837890625, 2.59375, 3.3037109375, 4.013671875, 4.7236328125, 5.43359375, 6.1435546875, 6.853515625, 7.5634765625, 8.2734375, 8.9833984375, 9.693359375, 10.4033203125, 11.11328125, 11.8232421875, 12.533203125, 13.2431640625, 13.953125, 14.6630859375, 15.373046875, 16.0830078125, 16.79296875, 17.5029296875, 18.212890625, 18.9228515625, 19.6328125, 20.3427734375, 21.052734375, 21.7626953125, 22.47265625, 23.1826171875, 23.892578125, 24.6025390625, 25.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 12.0, 18.0, 21.0, 40.0, 48.0, 76.0, 103.0, 188.0, 334.0, 1267.0, 1067.0, 401.0, 173.0, 110.0, 57.0, 48.0, 31.0, 18.0, 15.0, 11.0, 5.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.234375, -10.972900390625, -10.71142578125, -10.449951171875, -10.1884765625, -9.927001953125, -9.66552734375, -9.404052734375, -9.142578125, -8.881103515625, -8.61962890625, -8.358154296875, -8.0966796875, -7.835205078125, -7.57373046875, -7.312255859375, -7.05078125, -6.789306640625, -6.52783203125, -6.266357421875, -6.0048828125, -5.743408203125, -5.48193359375, -5.220458984375, -4.958984375, -4.697509765625, -4.43603515625, -4.174560546875, -3.9130859375, -3.651611328125, -3.39013671875, -3.128662109375, -2.8671875, -2.605712890625, -2.34423828125, -2.082763671875, -1.8212890625, -1.559814453125, -1.29833984375, -1.036865234375, -0.775390625, -0.513916015625, -0.25244140625, 0.009033203125, 0.2705078125, 0.531982421875, 0.79345703125, 1.054931640625, 1.31640625, 1.577880859375, 1.83935546875, 2.100830078125, 2.3623046875, 2.623779296875, 2.88525390625, 3.146728515625, 3.408203125, 3.669677734375, 3.93115234375, 4.192626953125, 4.4541015625, 4.715576171875, 4.97705078125, 5.238525390625, 5.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 12.0, 24.0, 28.0, 41.0, 44.0, 66.0, 78.0, 78.0, 91.0, 100.0, 101.0, 81.0, 64.0, 54.0, 40.0, 16.0, 23.0, 16.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.32663917541504, -29.106979370117188, -27.887319564819336, -26.667659759521484, -25.447999954223633, -24.22834014892578, -23.008678436279297, -21.789020538330078, -20.569358825683594, -19.349699020385742, -18.13003921508789, -16.91037940979004, -15.690719604492188, -14.471059799194336, -13.251399040222168, -12.031739234924316, -10.812080383300781, -9.59242057800293, -8.372760772705078, -7.153100490570068, -5.933440685272217, -4.713780879974365, -3.4941205978393555, -2.274460792541504, -1.0548009872436523, 0.16485893726348877, 1.3845188617706299, 2.6041789054870605, 3.823838710784912, 5.043498516082764, 6.263158798217773, 7.482818603515625, 8.702476501464844, 9.922136306762695, 11.141796112060547, 12.361455917358398, 13.58111572265625, 14.800775527954102, 16.020435333251953, 17.240097045898438, 18.459754943847656, 19.679414749145508, 20.89907455444336, 22.11873435974121, 23.338394165039062, 24.558053970336914, 25.777713775634766, 26.99737548828125, 28.2170352935791, 29.436695098876953, 30.656354904174805, 31.876014709472656, 33.09567642211914, 34.31533432006836, 35.534996032714844, 36.75465393066406, 37.97431564331055, 39.19397735595703, 40.41363525390625, 41.633296966552734, 42.85295486450195, 44.07261657714844, 45.292274475097656, 46.51193618774414, 47.73159408569336]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 15.0, 11.0, 7.0, 18.0, 13.0, 16.0, 19.0, 24.0, 27.0, 19.0, 33.0, 34.0, 38.0, 56.0, 34.0, 29.0, 41.0, 51.0, 54.0, 39.0, 29.0, 41.0, 47.0, 35.0, 28.0, 40.0, 29.0, 20.0, 23.0, 18.0, 16.0, 20.0, 16.0, 12.0, 8.0, 10.0, 11.0, 6.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.020980834960938, -21.336862564086914, -20.65274429321289, -19.9686279296875, -19.284509658813477, -18.600391387939453, -17.91627311706543, -17.232154846191406, -16.548038482666016, -15.863920211791992, -15.179802894592285, -14.495684623718262, -13.811567306518555, -13.127449035644531, -12.443330764770508, -11.759212493896484, -11.075094223022461, -10.390975952148438, -9.70685863494873, -9.022740364074707, -8.338623046875, -7.654504776000977, -6.970386505126953, -6.286268711090088, -5.602150917053223, -4.918033123016357, -4.233915328979492, -3.5497970581054688, -2.8656792640686035, -2.1815614700317383, -1.4974431991577148, -0.8133254051208496, -0.1292095184326172, 0.5549083948135376, 1.2390263080596924, 1.9231443405151367, 2.607262134552002, 3.291379928588867, 3.9754981994628906, 4.659615993499756, 5.343733787536621, 6.027851581573486, 6.711969375610352, 7.396087646484375, 8.080205917358398, 8.764323234558105, 9.448441505432129, 10.132558822631836, 10.81667709350586, 11.500795364379883, 12.18491268157959, 12.869030952453613, 13.55314826965332, 14.237266540527344, 14.921384811401367, 15.60550308227539, 16.28961944580078, 16.973737716674805, 17.657855987548828, 18.34197235107422, 19.026090621948242, 19.710208892822266, 20.39432716369629, 21.078445434570312, 21.762563705444336]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 9.0, 5.0, 10.0, 10.0, 18.0, 34.0, 60.0, 72.0, 179.0, 313.0, 844.0, 2841.0, 22822.0, 496092.0, 498119.0, 22621.0, 2875.0, 853.0, 353.0, 183.0, 90.0, 69.0, 29.0, 14.0, 17.0, 6.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.109375, -29.553955078125, -27.99853515625, -26.443115234375, -24.8876953125, -23.332275390625, -21.77685546875, -20.221435546875, -18.666015625, -17.110595703125, -15.55517578125, -13.999755859375, -12.4443359375, -10.888916015625, -9.33349609375, -7.778076171875, -6.22265625, -4.667236328125, -3.11181640625, -1.556396484375, -0.0009765625, 1.554443359375, 3.10986328125, 4.665283203125, 6.220703125, 7.776123046875, 9.33154296875, 10.886962890625, 12.4423828125, 13.997802734375, 15.55322265625, 17.108642578125, 18.6640625, 20.219482421875, 21.77490234375, 23.330322265625, 24.8857421875, 26.441162109375, 27.99658203125, 29.552001953125, 31.107421875, 32.662841796875, 34.21826171875, 35.773681640625, 37.3291015625, 38.884521484375, 40.43994140625, 41.995361328125, 43.55078125, 45.106201171875, 46.66162109375, 48.217041015625, 49.7724609375, 51.327880859375, 52.88330078125, 54.438720703125, 55.994140625, 57.549560546875, 59.10498046875, 60.660400390625, 62.2158203125, 63.771240234375, 65.32666015625, 66.882080078125, 68.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 17.0, 11.0, 16.0, 39.0, 41.0, 60.0, 89.0, 99.0, 96.0, 106.0, 95.0, 85.0, 80.0, 48.0, 43.0, 28.0, 13.0, 13.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.72265625, -3.5552978515625, -3.387939453125, -3.2205810546875, -3.05322265625, -2.8858642578125, -2.718505859375, -2.5511474609375, -2.3837890625, -2.2164306640625, -2.049072265625, -1.8817138671875, -1.71435546875, -1.5469970703125, -1.379638671875, -1.2122802734375, -1.044921875, -0.8775634765625, -0.710205078125, -0.5428466796875, -0.37548828125, -0.2081298828125, -0.040771484375, 0.1265869140625, 0.2939453125, 0.4613037109375, 0.628662109375, 0.7960205078125, 0.96337890625, 1.1307373046875, 1.298095703125, 1.4654541015625, 1.6328125, 1.8001708984375, 1.967529296875, 2.1348876953125, 2.30224609375, 2.4696044921875, 2.636962890625, 2.8043212890625, 2.9716796875, 3.1390380859375, 3.306396484375, 3.4737548828125, 3.64111328125, 3.8084716796875, 3.975830078125, 4.1431884765625, 4.310546875, 4.4779052734375, 4.645263671875, 4.8126220703125, 4.97998046875, 5.1473388671875, 5.314697265625, 5.4820556640625, 5.6494140625, 5.8167724609375, 5.984130859375, 6.1514892578125, 6.31884765625, 6.4862060546875, 6.653564453125, 6.8209228515625, 6.98828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 5.0, 6.0, 13.0, 18.0, 12.0, 28.0, 34.0, 56.0, 127.0, 154.0, 332.0, 616.0, 1188.0, 2623.0, 5893.0, 13638.0, 31727.0, 82487.0, 397323.0, 377168.0, 79776.0, 31209.0, 13196.0, 5762.0, 2638.0, 1151.0, 600.0, 311.0, 161.0, 113.0, 61.0, 35.0, 29.0, 18.0, 12.0, 10.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5703125, -11.1844482421875, -10.798583984375, -10.4127197265625, -10.02685546875, -9.6409912109375, -9.255126953125, -8.8692626953125, -8.4833984375, -8.0975341796875, -7.711669921875, -7.3258056640625, -6.93994140625, -6.5540771484375, -6.168212890625, -5.7823486328125, -5.396484375, -5.0106201171875, -4.624755859375, -4.2388916015625, -3.85302734375, -3.4671630859375, -3.081298828125, -2.6954345703125, -2.3095703125, -1.9237060546875, -1.537841796875, -1.1519775390625, -0.76611328125, -0.3802490234375, 0.005615234375, 0.3914794921875, 0.77734375, 1.1632080078125, 1.549072265625, 1.9349365234375, 2.32080078125, 2.7066650390625, 3.092529296875, 3.4783935546875, 3.8642578125, 4.2501220703125, 4.635986328125, 5.0218505859375, 5.40771484375, 5.7935791015625, 6.179443359375, 6.5653076171875, 6.951171875, 7.3370361328125, 7.722900390625, 8.1087646484375, 8.49462890625, 8.8804931640625, 9.266357421875, 9.6522216796875, 10.0380859375, 10.4239501953125, 10.809814453125, 11.1956787109375, 11.58154296875, 11.9674072265625, 12.353271484375, 12.7391357421875, 13.125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 12.0, 13.0, 15.0, 19.0, 32.0, 22.0, 38.0, 34.0, 42.0, 46.0, 54.0, 47.0, 56.0, 46.0, 42.0, 40.0, 57.0, 57.0, 37.0, 43.0, 40.0, 24.0, 30.0, 25.0, 22.0, 25.0, 12.0, 16.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.9296875, -10.5806884765625, -10.231689453125, -9.8826904296875, -9.53369140625, -9.1846923828125, -8.835693359375, -8.4866943359375, -8.1376953125, -7.7886962890625, -7.439697265625, -7.0906982421875, -6.74169921875, -6.3927001953125, -6.043701171875, -5.6947021484375, -5.345703125, -4.9967041015625, -4.647705078125, -4.2987060546875, -3.94970703125, -3.6007080078125, -3.251708984375, -2.9027099609375, -2.5537109375, -2.2047119140625, -1.855712890625, -1.5067138671875, -1.15771484375, -0.8087158203125, -0.459716796875, -0.1107177734375, 0.23828125, 0.5872802734375, 0.936279296875, 1.2852783203125, 1.63427734375, 1.9832763671875, 2.332275390625, 2.6812744140625, 3.0302734375, 3.3792724609375, 3.728271484375, 4.0772705078125, 4.42626953125, 4.7752685546875, 5.124267578125, 5.4732666015625, 5.822265625, 6.1712646484375, 6.520263671875, 6.8692626953125, 7.21826171875, 7.5672607421875, 7.916259765625, 8.2652587890625, 8.6142578125, 8.9632568359375, 9.312255859375, 9.6612548828125, 10.01025390625, 10.3592529296875, 10.708251953125, 11.0572509765625, 11.40625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 13.0, 9.0, 19.0, 26.0, 24.0, 56.0, 61.0, 116.0, 159.0, 294.0, 562.0, 1191.0, 2672.0, 6231.0, 16236.0, 45079.0, 173982.0, 581058.0, 153034.0, 41694.0, 15239.0, 5774.0, 2545.0, 1172.0, 558.0, 267.0, 159.0, 83.0, 73.0, 56.0, 35.0, 15.0, 15.0, 10.0, 5.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.2152099609375, -5.031982421875, -4.8487548828125, -4.66552734375, -4.4822998046875, -4.299072265625, -4.1158447265625, -3.9326171875, -3.7493896484375, -3.566162109375, -3.3829345703125, -3.19970703125, -3.0164794921875, -2.833251953125, -2.6500244140625, -2.466796875, -2.2835693359375, -2.100341796875, -1.9171142578125, -1.73388671875, -1.5506591796875, -1.367431640625, -1.1842041015625, -1.0009765625, -0.8177490234375, -0.634521484375, -0.4512939453125, -0.26806640625, -0.0848388671875, 0.098388671875, 0.2816162109375, 0.46484375, 0.6480712890625, 0.831298828125, 1.0145263671875, 1.19775390625, 1.3809814453125, 1.564208984375, 1.7474365234375, 1.9306640625, 2.1138916015625, 2.297119140625, 2.4803466796875, 2.66357421875, 2.8468017578125, 3.030029296875, 3.2132568359375, 3.396484375, 3.5797119140625, 3.762939453125, 3.9461669921875, 4.12939453125, 4.3126220703125, 4.495849609375, 4.6790771484375, 4.8623046875, 5.0455322265625, 5.228759765625, 5.4119873046875, 5.59521484375, 5.7784423828125, 5.961669921875, 6.1448974609375, 6.328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 7.0, 11.0, 12.0, 16.0, 9.0, 17.0, 22.0, 56.0, 133.0, 298.0, 194.0, 80.0, 29.0, 21.0, 12.0, 14.0, 17.0, 7.0, 7.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011692047119140625, -0.001123771071434021, -0.0010783374309539795, -0.001032903790473938, -0.0009874701499938965, -0.000942036509513855, -0.0008966028690338135, -0.000851169228553772, -0.0008057355880737305, -0.000760301947593689, -0.0007148683071136475, -0.000669434666633606, -0.0006240010261535645, -0.000578567385673523, -0.0005331337451934814, -0.00048770010471343994, -0.00044226646423339844, -0.00039683282375335693, -0.00035139918327331543, -0.0003059655427932739, -0.0002605319023132324, -0.00021509826183319092, -0.00016966462135314941, -0.0001242309808731079, -7.87973403930664e-05, -3.33636999130249e-05, 1.2069940567016602e-05, 5.7503581047058105e-05, 0.00010293722152709961, 0.0001483708620071411, 0.00019380450248718262, 0.00023923814296722412, 0.0002846717834472656, 0.00033010542392730713, 0.00037553906440734863, 0.00042097270488739014, 0.00046640634536743164, 0.0005118399858474731, 0.0005572736263275146, 0.0006027072668075562, 0.0006481409072875977, 0.0006935745477676392, 0.0007390081882476807, 0.0007844418287277222, 0.0008298754692077637, 0.0008753091096878052, 0.0009207427501678467, 0.0009661763906478882, 0.0010116100311279297, 0.0010570436716079712, 0.0011024773120880127, 0.0011479109525680542, 0.0011933445930480957, 0.0012387782335281372, 0.0012842118740081787, 0.0013296455144882202, 0.0013750791549682617, 0.0014205127954483032, 0.0014659464359283447, 0.0015113800764083862, 0.0015568137168884277, 0.0016022473573684692, 0.0016476809978485107, 0.0016931146383285522, 0.0017385482788085938]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 9.0, 22.0, 23.0, 56.0, 75.0, 130.0, 233.0, 394.0, 785.0, 1611.0, 4027.0, 11533.0, 38178.0, 152849.0, 617076.0, 162222.0, 39590.0, 12161.0, 4119.0, 1750.0, 772.0, 359.0, 217.0, 132.0, 70.0, 53.0, 28.0, 20.0, 17.0, 10.0, 8.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.39300537109375, -6.1688232421875, -5.94464111328125, -5.720458984375, -5.49627685546875, -5.2720947265625, -5.04791259765625, -4.82373046875, -4.59954833984375, -4.3753662109375, -4.15118408203125, -3.927001953125, -3.70281982421875, -3.4786376953125, -3.25445556640625, -3.0302734375, -2.80609130859375, -2.5819091796875, -2.35772705078125, -2.133544921875, -1.90936279296875, -1.6851806640625, -1.46099853515625, -1.23681640625, -1.01263427734375, -0.7884521484375, -0.56427001953125, -0.340087890625, -0.11590576171875, 0.1082763671875, 0.33245849609375, 0.556640625, 0.78082275390625, 1.0050048828125, 1.22918701171875, 1.453369140625, 1.67755126953125, 1.9017333984375, 2.12591552734375, 2.35009765625, 2.57427978515625, 2.7984619140625, 3.02264404296875, 3.246826171875, 3.47100830078125, 3.6951904296875, 3.91937255859375, 4.1435546875, 4.36773681640625, 4.5919189453125, 4.81610107421875, 5.040283203125, 5.26446533203125, 5.4886474609375, 5.71282958984375, 5.93701171875, 6.16119384765625, 6.3853759765625, 6.60955810546875, 6.833740234375, 7.05792236328125, 7.2821044921875, 7.50628662109375, 7.73046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 6.0, 5.0, 6.0, 7.0, 10.0, 12.0, 20.0, 18.0, 35.0, 38.0, 59.0, 90.0, 122.0, 139.0, 118.0, 96.0, 50.0, 40.0, 32.0, 27.0, 26.0, 10.0, 14.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9053955078125, -4.713134765625, -4.5208740234375, -4.32861328125, -4.1363525390625, -3.944091796875, -3.7518310546875, -3.5595703125, -3.3673095703125, -3.175048828125, -2.9827880859375, -2.79052734375, -2.5982666015625, -2.406005859375, -2.2137451171875, -2.021484375, -1.8292236328125, -1.636962890625, -1.4447021484375, -1.25244140625, -1.0601806640625, -0.867919921875, -0.6756591796875, -0.4833984375, -0.2911376953125, -0.098876953125, 0.0933837890625, 0.28564453125, 0.4779052734375, 0.670166015625, 0.8624267578125, 1.0546875, 1.2469482421875, 1.439208984375, 1.6314697265625, 1.82373046875, 2.0159912109375, 2.208251953125, 2.4005126953125, 2.5927734375, 2.7850341796875, 2.977294921875, 3.1695556640625, 3.36181640625, 3.5540771484375, 3.746337890625, 3.9385986328125, 4.130859375, 4.3231201171875, 4.515380859375, 4.7076416015625, 4.89990234375, 5.0921630859375, 5.284423828125, 5.4766845703125, 5.6689453125, 5.8612060546875, 6.053466796875, 6.2457275390625, 6.43798828125, 6.6302490234375, 6.822509765625, 7.0147705078125, 7.20703125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 3.0, 6.0, 8.0, 13.0, 19.0, 30.0, 31.0, 42.0, 58.0, 60.0, 56.0, 95.0, 75.0, 88.0, 90.0, 83.0, 47.0, 53.0, 40.0, 28.0, 24.0, 18.0, 10.0, 9.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-75.55586242675781, -73.69187927246094, -71.82788848876953, -69.96390533447266, -68.09991455078125, -66.23593139648438, -64.3719482421875, -62.507957458496094, -60.64397430419922, -58.77998733520508, -56.91600036621094, -55.05201721191406, -53.18803024291992, -51.32404327392578, -49.46005630493164, -47.5960693359375, -45.73208236694336, -43.86809539794922, -42.00410842895508, -40.14012145996094, -38.27613830566406, -36.41215133666992, -34.54816436767578, -32.68417739868164, -30.820192337036133, -28.956205368041992, -27.092220306396484, -25.228233337402344, -23.364246368408203, -21.500261306762695, -19.636274337768555, -17.772289276123047, -15.90829849243164, -14.044312477111816, -12.180326461791992, -10.316339492797852, -8.452353477478027, -6.588367462158203, -4.7243804931640625, -2.8603944778442383, -0.9964084625244141, 0.8675777912139893, 2.7315640449523926, 4.595550537109375, 6.459536552429199, 8.323522567749023, 10.187509536743164, 12.051495552062988, 13.915481567382812, 15.779467582702637, 17.64345359802246, 19.5074405670166, 21.37142562866211, 23.23541259765625, 25.09939956665039, 26.96338653564453, 28.82737159729004, 30.69135856628418, 32.55534362792969, 34.41933059692383, 36.28331756591797, 38.147300720214844, 40.01129150390625, 41.875274658203125, 43.739261627197266]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 9.0, 6.0, 6.0, 13.0, 14.0, 6.0, 23.0, 21.0, 26.0, 13.0, 28.0, 37.0, 25.0, 39.0, 28.0, 38.0, 36.0, 46.0, 27.0, 32.0, 32.0, 38.0, 36.0, 35.0, 40.0, 43.0, 37.0, 30.0, 35.0, 18.0, 24.0, 20.0, 19.0, 18.0, 20.0, 14.0, 13.0, 8.0, 11.0, 5.0, 3.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-40.06098937988281, -38.774513244628906, -37.488037109375, -36.201560974121094, -34.91508483886719, -33.62860870361328, -32.342132568359375, -31.0556583404541, -29.769182205200195, -28.48270606994629, -27.196229934692383, -25.909753799438477, -24.623279571533203, -23.336803436279297, -22.05032730102539, -20.763851165771484, -19.477375030517578, -18.190898895263672, -16.904422760009766, -15.617947578430176, -14.33147144317627, -13.044995307922363, -11.758520126342773, -10.472043991088867, -9.185567855834961, -7.899091720581055, -6.612616062164307, -5.326140403747559, -4.039664268493652, -2.753188133239746, -1.466712474822998, -0.18023681640625, 1.1062393188476562, 2.3927152156829834, 3.6791911125183105, 4.965666770935059, 6.252142906188965, 7.538619041442871, 8.825094223022461, 10.111570358276367, 11.398046493530273, 12.68452262878418, 13.970998764038086, 15.257473945617676, 16.543949127197266, 17.830425262451172, 19.116901397705078, 20.403377532958984, 21.68985366821289, 22.976329803466797, 24.262805938720703, 25.54928207397461, 26.835758209228516, 28.122234344482422, 29.408708572387695, 30.6951847076416, 31.981660842895508, 33.26813507080078, 34.55461120605469, 35.841087341308594, 37.1275634765625, 38.414039611816406, 39.70051574707031, 40.98699188232422, 42.273468017578125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 11.0, 19.0, 25.0, 34.0, 48.0, 85.0, 159.0, 280.0, 575.0, 1404.0, 4282.0, 18365.0, 163416.0, 3877149.0, 108302.0, 14212.0, 3529.0, 1183.0, 473.0, 233.0, 162.0, 90.0, 66.0, 41.0, 29.0, 24.0, 16.0, 9.0, 13.0, 11.0, 6.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.5, -47.81787109375, -46.1357421875, -44.45361328125, -42.771484375, -41.08935546875, -39.4072265625, -37.72509765625, -36.04296875, -34.36083984375, -32.6787109375, -30.99658203125, -29.314453125, -27.63232421875, -25.9501953125, -24.26806640625, -22.5859375, -20.90380859375, -19.2216796875, -17.53955078125, -15.857421875, -14.17529296875, -12.4931640625, -10.81103515625, -9.12890625, -7.44677734375, -5.7646484375, -4.08251953125, -2.400390625, -0.71826171875, 0.9638671875, 2.64599609375, 4.328125, 6.01025390625, 7.6923828125, 9.37451171875, 11.056640625, 12.73876953125, 14.4208984375, 16.10302734375, 17.78515625, 19.46728515625, 21.1494140625, 22.83154296875, 24.513671875, 26.19580078125, 27.8779296875, 29.56005859375, 31.2421875, 32.92431640625, 34.6064453125, 36.28857421875, 37.970703125, 39.65283203125, 41.3349609375, 43.01708984375, 44.69921875, 46.38134765625, 48.0634765625, 49.74560546875, 51.427734375, 53.10986328125, 54.7919921875, 56.47412109375, 58.15625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 16.0, 26.0, 26.0, 37.0, 64.0, 75.0, 101.0, 94.0, 103.0, 101.0, 80.0, 72.0, 68.0, 52.0, 28.0, 13.0, 14.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.544921875, -3.379730224609375, -3.21453857421875, -3.049346923828125, -2.8841552734375, -2.718963623046875, -2.55377197265625, -2.388580322265625, -2.223388671875, -2.058197021484375, -1.89300537109375, -1.727813720703125, -1.5626220703125, -1.397430419921875, -1.23223876953125, -1.067047119140625, -0.90185546875, -0.736663818359375, -0.57147216796875, -0.406280517578125, -0.2410888671875, -0.075897216796875, 0.08929443359375, 0.254486083984375, 0.419677734375, 0.584869384765625, 0.75006103515625, 0.915252685546875, 1.0804443359375, 1.245635986328125, 1.41082763671875, 1.576019287109375, 1.7412109375, 1.906402587890625, 2.07159423828125, 2.236785888671875, 2.4019775390625, 2.567169189453125, 2.73236083984375, 2.897552490234375, 3.062744140625, 3.227935791015625, 3.39312744140625, 3.558319091796875, 3.7235107421875, 3.888702392578125, 4.05389404296875, 4.219085693359375, 4.38427734375, 4.549468994140625, 4.71466064453125, 4.879852294921875, 5.0450439453125, 5.210235595703125, 5.37542724609375, 5.540618896484375, 5.705810546875, 5.871002197265625, 6.03619384765625, 6.201385498046875, 6.3665771484375, 6.531768798828125, 6.69696044921875, 6.862152099609375, 7.02734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 3.0, 9.0, 6.0, 11.0, 9.0, 12.0, 23.0, 35.0, 53.0, 73.0, 115.0, 161.0, 230.0, 302.0, 517.0, 739.0, 1130.0, 1781.0, 2714.0, 4397.0, 7429.0, 12962.0, 23705.0, 45350.0, 95566.0, 244408.0, 2143720.0, 1204827.0, 219820.0, 88275.0, 42509.0, 22425.0, 12329.0, 7050.0, 4198.0, 2611.0, 1676.0, 1066.0, 644.0, 427.0, 295.0, 202.0, 132.0, 102.0, 63.0, 56.0, 35.0, 26.0, 17.0, 10.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-10.71875, -10.3724365234375, -10.026123046875, -9.6798095703125, -9.33349609375, -8.9871826171875, -8.640869140625, -8.2945556640625, -7.9482421875, -7.6019287109375, -7.255615234375, -6.9093017578125, -6.56298828125, -6.2166748046875, -5.870361328125, -5.5240478515625, -5.177734375, -4.8314208984375, -4.485107421875, -4.1387939453125, -3.79248046875, -3.4461669921875, -3.099853515625, -2.7535400390625, -2.4072265625, -2.0609130859375, -1.714599609375, -1.3682861328125, -1.02197265625, -0.6756591796875, -0.329345703125, 0.0169677734375, 0.36328125, 0.7095947265625, 1.055908203125, 1.4022216796875, 1.74853515625, 2.0948486328125, 2.441162109375, 2.7874755859375, 3.1337890625, 3.4801025390625, 3.826416015625, 4.1727294921875, 4.51904296875, 4.8653564453125, 5.211669921875, 5.5579833984375, 5.904296875, 6.2506103515625, 6.596923828125, 6.9432373046875, 7.28955078125, 7.6358642578125, 7.982177734375, 8.3284912109375, 8.6748046875, 9.0211181640625, 9.367431640625, 9.7137451171875, 10.06005859375, 10.4063720703125, 10.752685546875, 11.0989990234375, 11.4453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 7.0, 13.0, 24.0, 33.0, 60.0, 70.0, 103.0, 133.0, 221.0, 497.0, 1690.0, 475.0, 240.0, 139.0, 91.0, 55.0, 48.0, 30.0, 21.0, 17.0, 22.0, 11.0, 10.0, 7.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.14990234375, -6.9365234375, -6.72314453125, -6.509765625, -6.29638671875, -6.0830078125, -5.86962890625, -5.65625, -5.44287109375, -5.2294921875, -5.01611328125, -4.802734375, -4.58935546875, -4.3759765625, -4.16259765625, -3.94921875, -3.73583984375, -3.5224609375, -3.30908203125, -3.095703125, -2.88232421875, -2.6689453125, -2.45556640625, -2.2421875, -2.02880859375, -1.8154296875, -1.60205078125, -1.388671875, -1.17529296875, -0.9619140625, -0.74853515625, -0.53515625, -0.32177734375, -0.1083984375, 0.10498046875, 0.318359375, 0.53173828125, 0.7451171875, 0.95849609375, 1.171875, 1.38525390625, 1.5986328125, 1.81201171875, 2.025390625, 2.23876953125, 2.4521484375, 2.66552734375, 2.87890625, 3.09228515625, 3.3056640625, 3.51904296875, 3.732421875, 3.94580078125, 4.1591796875, 4.37255859375, 4.5859375, 4.79931640625, 5.0126953125, 5.22607421875, 5.439453125, 5.65283203125, 5.8662109375, 6.07958984375, 6.29296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 15.0, 24.0, 47.0, 63.0, 89.0, 144.0, 124.0, 128.0, 114.0, 79.0, 63.0, 50.0, 24.0, 14.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-61.917701721191406, -60.19791793823242, -58.47813415527344, -56.75835418701172, -55.038570404052734, -53.31878662109375, -51.599002838134766, -49.87921905517578, -48.15943908691406, -46.43965530395508, -44.719871520996094, -43.000091552734375, -41.28030776977539, -39.560523986816406, -37.84074020385742, -36.12095642089844, -34.40117263793945, -32.68138885498047, -30.961606979370117, -29.241823196411133, -27.52204132080078, -25.802257537841797, -24.082473754882812, -22.362689971923828, -20.642908096313477, -18.923124313354492, -17.20334243774414, -15.483558654785156, -13.763775825500488, -12.04399299621582, -10.324209213256836, -8.604426383972168, -6.8846435546875, -5.164860725402832, -3.445077419281006, -1.7252941131591797, -0.005511283874511719, 1.7142715454101562, 3.4340553283691406, 5.153838157653809, 6.873620986938477, 8.593403816223145, 10.313186645507812, 12.032970428466797, 13.752753257751465, 15.472536087036133, 17.192319869995117, 18.91210174560547, 20.631885528564453, 22.351669311523438, 24.07145118713379, 25.791234970092773, 27.511016845703125, 29.23080062866211, 30.950584411621094, 32.67036819458008, 34.39015197753906, 36.10993576049805, 37.82971954345703, 39.54949951171875, 41.269283294677734, 42.98906707763672, 44.7088508605957, 46.42863464355469, 48.148414611816406]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 4.0, 9.0, 13.0, 12.0, 16.0, 13.0, 10.0, 26.0, 14.0, 46.0, 32.0, 34.0, 35.0, 29.0, 41.0, 52.0, 38.0, 45.0, 38.0, 51.0, 47.0, 39.0, 34.0, 31.0, 38.0, 25.0, 18.0, 26.0, 22.0, 12.0, 23.0, 23.0, 14.0, 12.0, 12.0, 10.0, 5.0, 6.0, 7.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.265933990478516, -19.642507553100586, -19.019081115722656, -18.39565658569336, -17.77223014831543, -17.1488037109375, -16.52537727355957, -15.90195083618164, -15.278525352478027, -14.655098915100098, -14.031673431396484, -13.408246994018555, -12.784820556640625, -12.161395072937012, -11.537968635559082, -10.914543151855469, -10.291116714477539, -9.66769027709961, -9.044264793395996, -8.420838356018066, -7.797412395477295, -7.173986434936523, -6.550559997558594, -5.927134037017822, -5.303708076477051, -4.680282115936279, -4.056856155395508, -3.433429718017578, -2.8100037574768066, -2.186577796936035, -1.5631515979766846, -0.939725399017334, -0.3162994384765625, 0.30712664127349854, 0.9305527210235596, 1.5539788007736206, 2.1774048805236816, 2.800830841064453, 3.4242570400238037, 4.047683238983154, 4.671109199523926, 5.294535160064697, 5.917961120605469, 6.541387557983398, 7.16481351852417, 7.788239479064941, 8.411665916442871, 9.035091400146484, 9.658517837524414, 10.281944274902344, 10.905369758605957, 11.528796195983887, 12.1522216796875, 12.77564811706543, 13.39907455444336, 14.022500991821289, 14.645926475524902, 15.269352912902832, 15.892778396606445, 16.516204833984375, 17.139631271362305, 17.763057708740234, 18.38648223876953, 19.00990867614746, 19.63333511352539]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 7.0, 6.0, 5.0, 17.0, 25.0, 42.0, 58.0, 119.0, 195.0, 357.0, 800.0, 2062.0, 8520.0, 57400.0, 445965.0, 460972.0, 59515.0, 8687.0, 2108.0, 802.0, 373.0, 189.0, 122.0, 75.0, 44.0, 23.0, 22.0, 17.0, 8.0, 6.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.21875, -44.142333984375, -43.06591796875, -41.989501953125, -40.9130859375, -39.836669921875, -38.76025390625, -37.683837890625, -36.607421875, -35.531005859375, -34.45458984375, -33.378173828125, -32.3017578125, -31.225341796875, -30.14892578125, -29.072509765625, -27.99609375, -26.919677734375, -25.84326171875, -24.766845703125, -23.6904296875, -22.614013671875, -21.53759765625, -20.461181640625, -19.384765625, -18.308349609375, -17.23193359375, -16.155517578125, -15.0791015625, -14.002685546875, -12.92626953125, -11.849853515625, -10.7734375, -9.697021484375, -8.62060546875, -7.544189453125, -6.4677734375, -5.391357421875, -4.31494140625, -3.238525390625, -2.162109375, -1.085693359375, -0.00927734375, 1.067138671875, 2.1435546875, 3.219970703125, 4.29638671875, 5.372802734375, 6.44921875, 7.525634765625, 8.60205078125, 9.678466796875, 10.7548828125, 11.831298828125, 12.90771484375, 13.984130859375, 15.060546875, 16.136962890625, 17.21337890625, 18.289794921875, 19.3662109375, 20.442626953125, 21.51904296875, 22.595458984375, 23.671875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 10.0, 15.0, 21.0, 26.0, 42.0, 51.0, 72.0, 82.0, 90.0, 94.0, 93.0, 92.0, 73.0, 62.0, 48.0, 39.0, 33.0, 20.0, 10.0, 7.0, 10.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.677734375, -3.510162353515625, -3.34259033203125, -3.175018310546875, -3.0074462890625, -2.839874267578125, -2.67230224609375, -2.504730224609375, -2.337158203125, -2.169586181640625, -2.00201416015625, -1.834442138671875, -1.6668701171875, -1.499298095703125, -1.33172607421875, -1.164154052734375, -0.99658203125, -0.829010009765625, -0.66143798828125, -0.493865966796875, -0.3262939453125, -0.158721923828125, 0.00885009765625, 0.176422119140625, 0.343994140625, 0.511566162109375, 0.67913818359375, 0.846710205078125, 1.0142822265625, 1.181854248046875, 1.34942626953125, 1.516998291015625, 1.6845703125, 1.852142333984375, 2.01971435546875, 2.187286376953125, 2.3548583984375, 2.522430419921875, 2.69000244140625, 2.857574462890625, 3.025146484375, 3.192718505859375, 3.36029052734375, 3.527862548828125, 3.6954345703125, 3.863006591796875, 4.03057861328125, 4.198150634765625, 4.36572265625, 4.533294677734375, 4.70086669921875, 4.868438720703125, 5.0360107421875, 5.203582763671875, 5.37115478515625, 5.538726806640625, 5.706298828125, 5.873870849609375, 6.04144287109375, 6.209014892578125, 6.3765869140625, 6.544158935546875, 6.71173095703125, 6.879302978515625, 7.046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 8.0, 6.0, 11.0, 12.0, 12.0, 15.0, 19.0, 36.0, 34.0, 47.0, 73.0, 95.0, 111.0, 158.0, 179.0, 240.0, 325.0, 526.0, 911.0, 2027.0, 4997.0, 14657.0, 46029.0, 147491.0, 472937.0, 247112.0, 73207.0, 23250.0, 7683.0, 2733.0, 1334.0, 675.0, 436.0, 289.0, 203.0, 139.0, 135.0, 119.0, 79.0, 48.0, 36.0, 40.0, 20.0, 18.0, 19.0, 11.0, 8.0, 7.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.8203125, -13.3843994140625, -12.948486328125, -12.5125732421875, -12.07666015625, -11.6407470703125, -11.204833984375, -10.7689208984375, -10.3330078125, -9.8970947265625, -9.461181640625, -9.0252685546875, -8.58935546875, -8.1534423828125, -7.717529296875, -7.2816162109375, -6.845703125, -6.4097900390625, -5.973876953125, -5.5379638671875, -5.10205078125, -4.6661376953125, -4.230224609375, -3.7943115234375, -3.3583984375, -2.9224853515625, -2.486572265625, -2.0506591796875, -1.61474609375, -1.1788330078125, -0.742919921875, -0.3070068359375, 0.12890625, 0.5648193359375, 1.000732421875, 1.4366455078125, 1.87255859375, 2.3084716796875, 2.744384765625, 3.1802978515625, 3.6162109375, 4.0521240234375, 4.488037109375, 4.9239501953125, 5.35986328125, 5.7957763671875, 6.231689453125, 6.6676025390625, 7.103515625, 7.5394287109375, 7.975341796875, 8.4112548828125, 8.84716796875, 9.2830810546875, 9.718994140625, 10.1549072265625, 10.5908203125, 11.0267333984375, 11.462646484375, 11.8985595703125, 12.33447265625, 12.7703857421875, 13.206298828125, 13.6422119140625, 14.078125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 10.0, 4.0, 6.0, 6.0, 8.0, 9.0, 22.0, 16.0, 19.0, 28.0, 31.0, 35.0, 39.0, 38.0, 45.0, 42.0, 39.0, 56.0, 35.0, 47.0, 41.0, 44.0, 39.0, 41.0, 39.0, 37.0, 24.0, 25.0, 18.0, 30.0, 21.0, 16.0, 16.0, 15.0, 14.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.625, -10.2867431640625, -9.948486328125, -9.6102294921875, -9.27197265625, -8.9337158203125, -8.595458984375, -8.2572021484375, -7.9189453125, -7.5806884765625, -7.242431640625, -6.9041748046875, -6.56591796875, -6.2276611328125, -5.889404296875, -5.5511474609375, -5.212890625, -4.8746337890625, -4.536376953125, -4.1981201171875, -3.85986328125, -3.5216064453125, -3.183349609375, -2.8450927734375, -2.5068359375, -2.1685791015625, -1.830322265625, -1.4920654296875, -1.15380859375, -0.8155517578125, -0.477294921875, -0.1390380859375, 0.19921875, 0.5374755859375, 0.875732421875, 1.2139892578125, 1.55224609375, 1.8905029296875, 2.228759765625, 2.5670166015625, 2.9052734375, 3.2435302734375, 3.581787109375, 3.9200439453125, 4.25830078125, 4.5965576171875, 4.934814453125, 5.2730712890625, 5.611328125, 5.9495849609375, 6.287841796875, 6.6260986328125, 6.96435546875, 7.3026123046875, 7.640869140625, 7.9791259765625, 8.3173828125, 8.6556396484375, 8.993896484375, 9.3321533203125, 9.67041015625, 10.0086669921875, 10.346923828125, 10.6851806640625, 11.0234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 12.0, 7.0, 9.0, 11.0, 31.0, 48.0, 70.0, 129.0, 229.0, 400.0, 834.0, 1822.0, 4290.0, 11481.0, 33740.0, 111732.0, 450250.0, 311371.0, 81622.0, 25122.0, 8852.0, 3396.0, 1532.0, 731.0, 371.0, 177.0, 98.0, 77.0, 39.0, 35.0, 17.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.3798828125, -9.150390625, -8.9208984375, -8.69140625, -8.4619140625, -8.232421875, -8.0029296875, -7.7734375, -7.5439453125, -7.314453125, -7.0849609375, -6.85546875, -6.6259765625, -6.396484375, -6.1669921875, -5.9375, -5.7080078125, -5.478515625, -5.2490234375, -5.01953125, -4.7900390625, -4.560546875, -4.3310546875, -4.1015625, -3.8720703125, -3.642578125, -3.4130859375, -3.18359375, -2.9541015625, -2.724609375, -2.4951171875, -2.265625, -2.0361328125, -1.806640625, -1.5771484375, -1.34765625, -1.1181640625, -0.888671875, -0.6591796875, -0.4296875, -0.2001953125, 0.029296875, 0.2587890625, 0.48828125, 0.7177734375, 0.947265625, 1.1767578125, 1.40625, 1.6357421875, 1.865234375, 2.0947265625, 2.32421875, 2.5537109375, 2.783203125, 3.0126953125, 3.2421875, 3.4716796875, 3.701171875, 3.9306640625, 4.16015625, 4.3896484375, 4.619140625, 4.8486328125, 5.078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 7.0, 9.0, 25.0, 33.0, 52.0, 59.0, 100.0, 303.0, 162.0, 75.0, 59.0, 47.0, 20.0, 16.0, 16.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002582550048828125, -0.0025057196617126465, -0.002428889274597168, -0.0023520588874816895, -0.002275228500366211, -0.0021983981132507324, -0.002121567726135254, -0.0020447373390197754, -0.001967906951904297, -0.0018910765647888184, -0.0018142461776733398, -0.0017374157905578613, -0.0016605854034423828, -0.0015837550163269043, -0.0015069246292114258, -0.0014300942420959473, -0.0013532638549804688, -0.0012764334678649902, -0.0011996030807495117, -0.0011227726936340332, -0.0010459423065185547, -0.0009691119194030762, -0.0008922815322875977, -0.0008154511451721191, -0.0007386207580566406, -0.0006617903709411621, -0.0005849599838256836, -0.0005081295967102051, -0.00043129920959472656, -0.00035446882247924805, -0.00027763843536376953, -0.00020080804824829102, -0.0001239776611328125, -4.7147274017333984e-05, 2.968311309814453e-05, 0.00010651350021362305, 0.00018334388732910156, 0.0002601742744445801, 0.0003370046615600586, 0.0004138350486755371, 0.0004906654357910156, 0.0005674958229064941, 0.0006443262100219727, 0.0007211565971374512, 0.0007979869842529297, 0.0008748173713684082, 0.0009516477584838867, 0.0010284781455993652, 0.0011053085327148438, 0.0011821389198303223, 0.0012589693069458008, 0.0013357996940612793, 0.0014126300811767578, 0.0014894604682922363, 0.0015662908554077148, 0.0016431212425231934, 0.0017199516296386719, 0.0017967820167541504, 0.001873612403869629, 0.0019504427909851074, 0.002027273178100586, 0.0021041035652160645, 0.002180933952331543, 0.0022577643394470215, 0.0023345947265625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 1.0, 8.0, 8.0, 11.0, 23.0, 26.0, 33.0, 46.0, 70.0, 120.0, 220.0, 422.0, 833.0, 1995.0, 6026.0, 21965.0, 118002.0, 623556.0, 224908.0, 36421.0, 8762.0, 2776.0, 1093.0, 528.0, 278.0, 156.0, 98.0, 57.0, 34.0, 26.0, 18.0, 9.0, 8.0, 3.0, 2.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.859375, -12.5179443359375, -12.176513671875, -11.8350830078125, -11.49365234375, -11.1522216796875, -10.810791015625, -10.4693603515625, -10.1279296875, -9.7864990234375, -9.445068359375, -9.1036376953125, -8.76220703125, -8.4207763671875, -8.079345703125, -7.7379150390625, -7.396484375, -7.0550537109375, -6.713623046875, -6.3721923828125, -6.03076171875, -5.6893310546875, -5.347900390625, -5.0064697265625, -4.6650390625, -4.3236083984375, -3.982177734375, -3.6407470703125, -3.29931640625, -2.9578857421875, -2.616455078125, -2.2750244140625, -1.93359375, -1.5921630859375, -1.250732421875, -0.9093017578125, -0.56787109375, -0.2264404296875, 0.114990234375, 0.4564208984375, 0.7978515625, 1.1392822265625, 1.480712890625, 1.8221435546875, 2.16357421875, 2.5050048828125, 2.846435546875, 3.1878662109375, 3.529296875, 3.8707275390625, 4.212158203125, 4.5535888671875, 4.89501953125, 5.2364501953125, 5.577880859375, 5.9193115234375, 6.2607421875, 6.6021728515625, 6.943603515625, 7.2850341796875, 7.62646484375, 7.9678955078125, 8.309326171875, 8.6507568359375, 8.9921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 6.0, 3.0, 4.0, 12.0, 15.0, 11.0, 21.0, 24.0, 27.0, 45.0, 48.0, 74.0, 96.0, 118.0, 108.0, 91.0, 67.0, 46.0, 35.0, 44.0, 28.0, 17.0, 13.0, 14.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.79248046875, -6.5654296875, -6.33837890625, -6.111328125, -5.88427734375, -5.6572265625, -5.43017578125, -5.203125, -4.97607421875, -4.7490234375, -4.52197265625, -4.294921875, -4.06787109375, -3.8408203125, -3.61376953125, -3.38671875, -3.15966796875, -2.9326171875, -2.70556640625, -2.478515625, -2.25146484375, -2.0244140625, -1.79736328125, -1.5703125, -1.34326171875, -1.1162109375, -0.88916015625, -0.662109375, -0.43505859375, -0.2080078125, 0.01904296875, 0.24609375, 0.47314453125, 0.7001953125, 0.92724609375, 1.154296875, 1.38134765625, 1.6083984375, 1.83544921875, 2.0625, 2.28955078125, 2.5166015625, 2.74365234375, 2.970703125, 3.19775390625, 3.4248046875, 3.65185546875, 3.87890625, 4.10595703125, 4.3330078125, 4.56005859375, 4.787109375, 5.01416015625, 5.2412109375, 5.46826171875, 5.6953125, 5.92236328125, 6.1494140625, 6.37646484375, 6.603515625, 6.83056640625, 7.0576171875, 7.28466796875, 7.51171875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 8.0, 22.0, 60.0, 195.0, 274.0, 272.0, 123.0, 37.0, 15.0, 6.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.87677001953125, -114.7883071899414, -105.69984436035156, -96.61138916015625, -87.5229263305664, -78.43446350097656, -69.34600830078125, -60.257545471191406, -51.16908264160156, -42.08061981201172, -32.99216079711914, -23.90369987487793, -14.815238952636719, -5.726776123046875, 3.361682891845703, 12.450141906738281, 21.538604736328125, 30.627065658569336, 39.71552658081055, 48.803985595703125, 57.89244842529297, 66.98091125488281, 76.06936645507812, 85.15782928466797, 94.24629211425781, 103.33475494384766, 112.4232177734375, 121.51167297363281, 130.60012817382812, 139.6885986328125, 148.7770538330078, 157.86550903320312, 166.95394897460938, 176.0424041748047, 185.13087463378906, 194.21932983398438, 203.30780029296875, 212.39625549316406, 221.48471069335938, 230.57318115234375, 239.66163635253906, 248.75009155273438, 257.83856201171875, 266.9270324707031, 276.0154724121094, 285.10394287109375, 294.1924133300781, 303.2808532714844, 312.36932373046875, 321.4577941894531, 330.5462341308594, 339.63470458984375, 348.7231750488281, 357.8116455078125, 366.90008544921875, 375.9885559082031, 385.0770263671875, 394.1654968261719, 403.2539367675781, 412.3424072265625, 421.4308776855469, 430.51934814453125, 439.6077880859375, 448.6962585449219, 457.7846984863281]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 12.0, 9.0, 12.0, 14.0, 20.0, 21.0, 21.0, 22.0, 27.0, 34.0, 29.0, 46.0, 31.0, 26.0, 42.0, 51.0, 53.0, 48.0, 35.0, 44.0, 53.0, 47.0, 27.0, 34.0, 31.0, 24.0, 14.0, 20.0, 27.0, 20.0, 19.0, 16.0, 14.0, 10.0, 8.0, 1.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-59.82958984375, -58.04922103881836, -56.268856048583984, -54.488487243652344, -52.7081184387207, -50.92774963378906, -49.14738464355469, -47.36701583862305, -45.586647033691406, -43.806278228759766, -42.02591323852539, -40.24554443359375, -38.46517562866211, -36.68480682373047, -34.904441833496094, -33.12407302856445, -31.343708038330078, -29.56334114074707, -27.78297233581543, -26.002605438232422, -24.22223663330078, -22.441869735717773, -20.661502838134766, -18.881134033203125, -17.100767135620117, -15.320399284362793, -13.540031433105469, -11.759664535522461, -9.979296684265137, -8.198928833007812, -6.418561935424805, -4.6381940841674805, -2.8578262329101562, -1.0774586200714111, 0.702908992767334, 2.4832763671875, 4.263644218444824, 6.044012069702148, 7.824378967285156, 9.60474681854248, 11.385114669799805, 13.165482521057129, 14.945850372314453, 16.72621726989746, 18.50658416748047, 20.28695297241211, 22.067319869995117, 23.847686767578125, 25.628055572509766, 27.408422470092773, 29.188791275024414, 30.969158172607422, 32.74952697753906, 34.52989196777344, 36.31026077270508, 38.09062957763672, 39.870994567871094, 41.651363372802734, 43.43172836303711, 45.21209716796875, 46.99246597290039, 48.77283477783203, 50.553199768066406, 52.33356857299805, 54.11393737792969]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 6.0, 8.0, 6.0, 18.0, 17.0, 32.0, 38.0, 60.0, 119.0, 196.0, 330.0, 572.0, 1057.0, 2466.0, 6733.0, 25503.0, 164980.0, 3620998.0, 317776.0, 38054.0, 9079.0, 3056.0, 1378.0, 652.0, 373.0, 267.0, 138.0, 106.0, 69.0, 51.0, 33.0, 15.0, 28.0, 15.0, 11.0, 12.0, 7.0, 3.0, 8.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.59375, -28.56005859375, -27.5263671875, -26.49267578125, -25.458984375, -24.42529296875, -23.3916015625, -22.35791015625, -21.32421875, -20.29052734375, -19.2568359375, -18.22314453125, -17.189453125, -16.15576171875, -15.1220703125, -14.08837890625, -13.0546875, -12.02099609375, -10.9873046875, -9.95361328125, -8.919921875, -7.88623046875, -6.8525390625, -5.81884765625, -4.78515625, -3.75146484375, -2.7177734375, -1.68408203125, -0.650390625, 0.38330078125, 1.4169921875, 2.45068359375, 3.484375, 4.51806640625, 5.5517578125, 6.58544921875, 7.619140625, 8.65283203125, 9.6865234375, 10.72021484375, 11.75390625, 12.78759765625, 13.8212890625, 14.85498046875, 15.888671875, 16.92236328125, 17.9560546875, 18.98974609375, 20.0234375, 21.05712890625, 22.0908203125, 23.12451171875, 24.158203125, 25.19189453125, 26.2255859375, 27.25927734375, 28.29296875, 29.32666015625, 30.3603515625, 31.39404296875, 32.427734375, 33.46142578125, 34.4951171875, 35.52880859375, 36.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 4.0, 10.0, 22.0, 21.0, 37.0, 56.0, 62.0, 77.0, 86.0, 95.0, 92.0, 91.0, 97.0, 64.0, 54.0, 40.0, 27.0, 19.0, 19.0, 12.0, 7.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.57818603515625, -3.4102783203125, -3.24237060546875, -3.074462890625, -2.90655517578125, -2.7386474609375, -2.57073974609375, -2.40283203125, -2.23492431640625, -2.0670166015625, -1.89910888671875, -1.731201171875, -1.56329345703125, -1.3953857421875, -1.22747802734375, -1.0595703125, -0.89166259765625, -0.7237548828125, -0.55584716796875, -0.387939453125, -0.22003173828125, -0.0521240234375, 0.11578369140625, 0.28369140625, 0.45159912109375, 0.6195068359375, 0.78741455078125, 0.955322265625, 1.12322998046875, 1.2911376953125, 1.45904541015625, 1.626953125, 1.79486083984375, 1.9627685546875, 2.13067626953125, 2.298583984375, 2.46649169921875, 2.6343994140625, 2.80230712890625, 2.97021484375, 3.13812255859375, 3.3060302734375, 3.47393798828125, 3.641845703125, 3.80975341796875, 3.9776611328125, 4.14556884765625, 4.3134765625, 4.48138427734375, 4.6492919921875, 4.81719970703125, 4.985107421875, 5.15301513671875, 5.3209228515625, 5.48883056640625, 5.65673828125, 5.82464599609375, 5.9925537109375, 6.16046142578125, 6.328369140625, 6.49627685546875, 6.6641845703125, 6.83209228515625, 7.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 8.0, 4.0, 5.0, 13.0, 23.0, 31.0, 38.0, 45.0, 58.0, 76.0, 104.0, 168.0, 193.0, 299.0, 457.0, 842.0, 1828.0, 4117.0, 11583.0, 38098.0, 160341.0, 1364056.0, 2359362.0, 186924.0, 43808.0, 12901.0, 4559.0, 1838.0, 918.0, 475.0, 313.0, 219.0, 147.0, 126.0, 75.0, 63.0, 50.0, 37.0, 26.0, 8.0, 13.0, 12.0, 12.0, 6.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.6220703125, -18.041015625, -17.4599609375, -16.87890625, -16.2978515625, -15.716796875, -15.1357421875, -14.5546875, -13.9736328125, -13.392578125, -12.8115234375, -12.23046875, -11.6494140625, -11.068359375, -10.4873046875, -9.90625, -9.3251953125, -8.744140625, -8.1630859375, -7.58203125, -7.0009765625, -6.419921875, -5.8388671875, -5.2578125, -4.6767578125, -4.095703125, -3.5146484375, -2.93359375, -2.3525390625, -1.771484375, -1.1904296875, -0.609375, -0.0283203125, 0.552734375, 1.1337890625, 1.71484375, 2.2958984375, 2.876953125, 3.4580078125, 4.0390625, 4.6201171875, 5.201171875, 5.7822265625, 6.36328125, 6.9443359375, 7.525390625, 8.1064453125, 8.6875, 9.2685546875, 9.849609375, 10.4306640625, 11.01171875, 11.5927734375, 12.173828125, 12.7548828125, 13.3359375, 13.9169921875, 14.498046875, 15.0791015625, 15.66015625, 16.2412109375, 16.822265625, 17.4033203125, 17.984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 6.0, 4.0, 4.0, 6.0, 8.0, 11.0, 19.0, 20.0, 28.0, 47.0, 68.0, 100.0, 142.0, 193.0, 331.0, 707.0, 1245.0, 399.0, 237.0, 168.0, 107.0, 68.0, 52.0, 29.0, 17.0, 15.0, 16.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -5.987060546875, -5.73974609375, -5.492431640625, -5.2451171875, -4.997802734375, -4.75048828125, -4.503173828125, -4.255859375, -4.008544921875, -3.76123046875, -3.513916015625, -3.2666015625, -3.019287109375, -2.77197265625, -2.524658203125, -2.27734375, -2.030029296875, -1.78271484375, -1.535400390625, -1.2880859375, -1.040771484375, -0.79345703125, -0.546142578125, -0.298828125, -0.051513671875, 0.19580078125, 0.443115234375, 0.6904296875, 0.937744140625, 1.18505859375, 1.432373046875, 1.6796875, 1.927001953125, 2.17431640625, 2.421630859375, 2.6689453125, 2.916259765625, 3.16357421875, 3.410888671875, 3.658203125, 3.905517578125, 4.15283203125, 4.400146484375, 4.6474609375, 4.894775390625, 5.14208984375, 5.389404296875, 5.63671875, 5.884033203125, 6.13134765625, 6.378662109375, 6.6259765625, 6.873291015625, 7.12060546875, 7.367919921875, 7.615234375, 7.862548828125, 8.10986328125, 8.357177734375, 8.6044921875, 8.851806640625, 9.09912109375, 9.346435546875, 9.59375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 12.0, 18.0, 34.0, 58.0, 85.0, 106.0, 138.0, 129.0, 126.0, 111.0, 69.0, 51.0, 24.0, 12.0, 10.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.6125602722168, -58.34540939331055, -56.07825469970703, -53.81110382080078, -51.543949127197266, -49.276798248291016, -47.0096435546875, -44.74249267578125, -42.475341796875, -40.20819091796875, -37.941036224365234, -35.673885345458984, -33.40673065185547, -31.13957977294922, -28.872426986694336, -26.605274200439453, -24.338119506835938, -22.070966720581055, -19.803813934326172, -17.536663055419922, -15.269509315490723, -13.00235652923584, -10.735204696655273, -8.46805191040039, -6.200899124145508, -3.933746576309204, -1.6665940284729004, 0.6005582809448242, 2.867711067199707, 5.13486385345459, 7.402015686035156, 9.669168472290039, 11.936317443847656, 14.203470230102539, 16.470623016357422, 18.737773895263672, 21.004928588867188, 23.272079467773438, 25.53923225402832, 27.806385040283203, 30.073537826538086, 32.34069061279297, 34.60784149169922, 36.874996185302734, 39.142147064208984, 41.4093017578125, 43.67645263671875, 45.943603515625, 48.210758209228516, 50.477909088134766, 52.74506378173828, 55.01221466064453, 57.27936935424805, 59.5465202331543, 61.81367492675781, 64.08082580566406, 66.34797668457031, 68.61512756347656, 70.88227844238281, 73.1494369506836, 75.41658782958984, 77.6837387084961, 79.95088958740234, 82.21804809570312, 84.48519897460938]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 13.0, 7.0, 9.0, 17.0, 25.0, 19.0, 24.0, 34.0, 30.0, 28.0, 34.0, 31.0, 46.0, 36.0, 42.0, 50.0, 37.0, 38.0, 39.0, 47.0, 51.0, 37.0, 43.0, 30.0, 35.0, 24.0, 32.0, 25.0, 18.0, 9.0, 10.0, 11.0, 7.0, 14.0, 13.0, 1.0, 5.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.631668090820312, -25.734140396118164, -24.836612701416016, -23.939083099365234, -23.041555404663086, -22.144027709960938, -21.24650001525879, -20.34897232055664, -19.45144271850586, -18.55391502380371, -17.656387329101562, -16.75885772705078, -15.861330032348633, -14.963802337646484, -14.066274642944336, -13.168746948242188, -12.271219253540039, -11.37369155883789, -10.476162910461426, -9.578635215759277, -8.681106567382812, -7.783578872680664, -6.886051177978516, -5.988523006439209, -5.090994834899902, -4.193466663360596, -3.295938730239868, -2.3984107971191406, -1.500882625579834, -0.6033544540405273, 0.2941732406616211, 1.1917014122009277, 2.0892295837402344, 2.986757755279541, 3.8842856884002686, 4.781813621520996, 5.679341793060303, 6.576869964599609, 7.474397659301758, 8.371925354003906, 9.269454002380371, 10.16698169708252, 11.064510345458984, 11.962038040161133, 12.859565734863281, 13.757094383239746, 14.654622077941895, 15.55215072631836, 16.449678421020508, 17.347206115722656, 18.244733810424805, 19.142261505126953, 20.039791107177734, 20.937318801879883, 21.83484649658203, 22.73237419128418, 23.629901885986328, 24.527429580688477, 25.424957275390625, 26.322486877441406, 27.220014572143555, 28.117542266845703, 29.01506996154785, 29.91259765625, 30.81012725830078]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 7.0, 8.0, 25.0, 24.0, 51.0, 112.0, 244.0, 533.0, 1711.0, 8902.0, 93079.0, 741358.0, 184277.0, 14511.0, 2447.0, 712.0, 278.0, 136.0, 73.0, 27.0, 16.0, 13.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.75, -34.5009765625, -33.251953125, -32.0029296875, -30.75390625, -29.5048828125, -28.255859375, -27.0068359375, -25.7578125, -24.5087890625, -23.259765625, -22.0107421875, -20.76171875, -19.5126953125, -18.263671875, -17.0146484375, -15.765625, -14.5166015625, -13.267578125, -12.0185546875, -10.76953125, -9.5205078125, -8.271484375, -7.0224609375, -5.7734375, -4.5244140625, -3.275390625, -2.0263671875, -0.77734375, 0.4716796875, 1.720703125, 2.9697265625, 4.21875, 5.4677734375, 6.716796875, 7.9658203125, 9.21484375, 10.4638671875, 11.712890625, 12.9619140625, 14.2109375, 15.4599609375, 16.708984375, 17.9580078125, 19.20703125, 20.4560546875, 21.705078125, 22.9541015625, 24.203125, 25.4521484375, 26.701171875, 27.9501953125, 29.19921875, 30.4482421875, 31.697265625, 32.9462890625, 34.1953125, 35.4443359375, 36.693359375, 37.9423828125, 39.19140625, 40.4404296875, 41.689453125, 42.9384765625, 44.1875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 5.0, 9.0, 12.0, 25.0, 28.0, 44.0, 45.0, 69.0, 80.0, 72.0, 82.0, 76.0, 85.0, 88.0, 67.0, 63.0, 34.0, 31.0, 39.0, 15.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.869140625, -3.696014404296875, -3.52288818359375, -3.349761962890625, -3.1766357421875, -3.003509521484375, -2.83038330078125, -2.657257080078125, -2.484130859375, -2.311004638671875, -2.13787841796875, -1.964752197265625, -1.7916259765625, -1.618499755859375, -1.44537353515625, -1.272247314453125, -1.09912109375, -0.925994873046875, -0.75286865234375, -0.579742431640625, -0.4066162109375, -0.233489990234375, -0.06036376953125, 0.112762451171875, 0.285888671875, 0.459014892578125, 0.63214111328125, 0.805267333984375, 0.9783935546875, 1.151519775390625, 1.32464599609375, 1.497772216796875, 1.6708984375, 1.844024658203125, 2.01715087890625, 2.190277099609375, 2.3634033203125, 2.536529541015625, 2.70965576171875, 2.882781982421875, 3.055908203125, 3.229034423828125, 3.40216064453125, 3.575286865234375, 3.7484130859375, 3.921539306640625, 4.09466552734375, 4.267791748046875, 4.44091796875, 4.614044189453125, 4.78717041015625, 4.960296630859375, 5.1334228515625, 5.306549072265625, 5.47967529296875, 5.652801513671875, 5.825927734375, 5.999053955078125, 6.17218017578125, 6.345306396484375, 6.5184326171875, 6.691558837890625, 6.86468505859375, 7.037811279296875, 7.2109375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 7.0, 7.0, 5.0, 15.0, 12.0, 27.0, 37.0, 53.0, 66.0, 105.0, 146.0, 174.0, 274.0, 369.0, 581.0, 927.0, 2007.0, 4952.0, 15885.0, 58169.0, 253198.0, 507997.0, 149640.0, 36077.0, 10459.0, 3540.0, 1474.0, 723.0, 488.0, 314.0, 228.0, 175.0, 129.0, 79.0, 61.0, 37.0, 35.0, 25.0, 17.0, 11.0, 7.0, 6.0, 4.0, 8.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.109375, -16.580078125, -16.05078125, -15.521484375, -14.9921875, -14.462890625, -13.93359375, -13.404296875, -12.875, -12.345703125, -11.81640625, -11.287109375, -10.7578125, -10.228515625, -9.69921875, -9.169921875, -8.640625, -8.111328125, -7.58203125, -7.052734375, -6.5234375, -5.994140625, -5.46484375, -4.935546875, -4.40625, -3.876953125, -3.34765625, -2.818359375, -2.2890625, -1.759765625, -1.23046875, -0.701171875, -0.171875, 0.357421875, 0.88671875, 1.416015625, 1.9453125, 2.474609375, 3.00390625, 3.533203125, 4.0625, 4.591796875, 5.12109375, 5.650390625, 6.1796875, 6.708984375, 7.23828125, 7.767578125, 8.296875, 8.826171875, 9.35546875, 9.884765625, 10.4140625, 10.943359375, 11.47265625, 12.001953125, 12.53125, 13.060546875, 13.58984375, 14.119140625, 14.6484375, 15.177734375, 15.70703125, 16.236328125, 16.765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 10.0, 10.0, 11.0, 14.0, 13.0, 10.0, 17.0, 21.0, 21.0, 23.0, 40.0, 31.0, 38.0, 38.0, 44.0, 53.0, 45.0, 43.0, 47.0, 51.0, 50.0, 45.0, 43.0, 45.0, 35.0, 30.0, 24.0, 26.0, 24.0, 16.0, 20.0, 10.0, 9.0, 11.0, 7.0, 10.0, 2.0, 3.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.5, -12.02392578125, -11.5478515625, -11.07177734375, -10.595703125, -10.11962890625, -9.6435546875, -9.16748046875, -8.69140625, -8.21533203125, -7.7392578125, -7.26318359375, -6.787109375, -6.31103515625, -5.8349609375, -5.35888671875, -4.8828125, -4.40673828125, -3.9306640625, -3.45458984375, -2.978515625, -2.50244140625, -2.0263671875, -1.55029296875, -1.07421875, -0.59814453125, -0.1220703125, 0.35400390625, 0.830078125, 1.30615234375, 1.7822265625, 2.25830078125, 2.734375, 3.21044921875, 3.6865234375, 4.16259765625, 4.638671875, 5.11474609375, 5.5908203125, 6.06689453125, 6.54296875, 7.01904296875, 7.4951171875, 7.97119140625, 8.447265625, 8.92333984375, 9.3994140625, 9.87548828125, 10.3515625, 10.82763671875, 11.3037109375, 11.77978515625, 12.255859375, 12.73193359375, 13.2080078125, 13.68408203125, 14.16015625, 14.63623046875, 15.1123046875, 15.58837890625, 16.064453125, 16.54052734375, 17.0166015625, 17.49267578125, 17.96875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 9.0, 10.0, 10.0, 20.0, 32.0, 32.0, 75.0, 91.0, 164.0, 262.0, 471.0, 716.0, 1480.0, 3219.0, 8442.0, 26174.0, 92159.0, 302682.0, 402587.0, 147520.0, 40919.0, 12703.0, 4541.0, 1887.0, 955.0, 533.0, 309.0, 187.0, 97.0, 90.0, 56.0, 34.0, 26.0, 16.0, 9.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.7265625, -6.52978515625, -6.3330078125, -6.13623046875, -5.939453125, -5.74267578125, -5.5458984375, -5.34912109375, -5.15234375, -4.95556640625, -4.7587890625, -4.56201171875, -4.365234375, -4.16845703125, -3.9716796875, -3.77490234375, -3.578125, -3.38134765625, -3.1845703125, -2.98779296875, -2.791015625, -2.59423828125, -2.3974609375, -2.20068359375, -2.00390625, -1.80712890625, -1.6103515625, -1.41357421875, -1.216796875, -1.02001953125, -0.8232421875, -0.62646484375, -0.4296875, -0.23291015625, -0.0361328125, 0.16064453125, 0.357421875, 0.55419921875, 0.7509765625, 0.94775390625, 1.14453125, 1.34130859375, 1.5380859375, 1.73486328125, 1.931640625, 2.12841796875, 2.3251953125, 2.52197265625, 2.71875, 2.91552734375, 3.1123046875, 3.30908203125, 3.505859375, 3.70263671875, 3.8994140625, 4.09619140625, 4.29296875, 4.48974609375, 4.6865234375, 4.88330078125, 5.080078125, 5.27685546875, 5.4736328125, 5.67041015625, 5.8671875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 2.0, 3.0, 6.0, 6.0, 5.0, 3.0, 15.0, 14.0, 24.0, 16.0, 30.0, 38.0, 49.0, 58.0, 57.0, 75.0, 76.0, 78.0, 80.0, 62.0, 59.0, 52.0, 34.0, 33.0, 24.0, 21.0, 15.0, 16.0, 9.0, 7.0, 3.0, 3.0, 6.0, 2.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010242462158203125, -0.000990167260169983, -0.0009560883045196533, -0.0009220093488693237, -0.0008879303932189941, -0.0008538514375686646, -0.000819772481918335, -0.0007856935262680054, -0.0007516145706176758, -0.0007175356149673462, -0.0006834566593170166, -0.000649377703666687, -0.0006152987480163574, -0.0005812197923660278, -0.0005471408367156982, -0.0005130618810653687, -0.00047898292541503906, -0.00044490396976470947, -0.0004108250141143799, -0.0003767460584640503, -0.0003426671028137207, -0.0003085881471633911, -0.0002745091915130615, -0.00024043023586273193, -0.00020635128021240234, -0.00017227232456207275, -0.00013819336891174316, -0.00010411441326141357, -7.003545761108398e-05, -3.5956501960754395e-05, -1.8775463104248047e-06, 3.2201409339904785e-05, 6.628036499023438e-05, 0.00010035932064056396, 0.00013443827629089355, 0.00016851723194122314, 0.00020259618759155273, 0.00023667514324188232, 0.0002707540988922119, 0.0003048330545425415, 0.0003389120101928711, 0.0003729909658432007, 0.0004070699214935303, 0.00044114887714385986, 0.00047522783279418945, 0.000509306788444519, 0.0005433857440948486, 0.0005774646997451782, 0.0006115436553955078, 0.0006456226110458374, 0.000679701566696167, 0.0007137805223464966, 0.0007478594779968262, 0.0007819384336471558, 0.0008160173892974854, 0.0008500963449478149, 0.0008841753005981445, 0.0009182542562484741, 0.0009523332118988037, 0.0009864121675491333, 0.0010204911231994629, 0.0010545700788497925, 0.001088649034500122, 0.0011227279901504517, 0.0011568069458007812]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 16.0, 14.0, 37.0, 36.0, 53.0, 84.0, 151.0, 261.0, 540.0, 1024.0, 2664.0, 8394.0, 46387.0, 356135.0, 530507.0, 83280.0, 12713.0, 3457.0, 1295.0, 649.0, 341.0, 181.0, 104.0, 75.0, 46.0, 26.0, 23.0, 9.0, 11.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.53125, -12.19384765625, -11.8564453125, -11.51904296875, -11.181640625, -10.84423828125, -10.5068359375, -10.16943359375, -9.83203125, -9.49462890625, -9.1572265625, -8.81982421875, -8.482421875, -8.14501953125, -7.8076171875, -7.47021484375, -7.1328125, -6.79541015625, -6.4580078125, -6.12060546875, -5.783203125, -5.44580078125, -5.1083984375, -4.77099609375, -4.43359375, -4.09619140625, -3.7587890625, -3.42138671875, -3.083984375, -2.74658203125, -2.4091796875, -2.07177734375, -1.734375, -1.39697265625, -1.0595703125, -0.72216796875, -0.384765625, -0.04736328125, 0.2900390625, 0.62744140625, 0.96484375, 1.30224609375, 1.6396484375, 1.97705078125, 2.314453125, 2.65185546875, 2.9892578125, 3.32666015625, 3.6640625, 4.00146484375, 4.3388671875, 4.67626953125, 5.013671875, 5.35107421875, 5.6884765625, 6.02587890625, 6.36328125, 6.70068359375, 7.0380859375, 7.37548828125, 7.712890625, 8.05029296875, 8.3876953125, 8.72509765625, 9.0625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 15.0, 13.0, 17.0, 25.0, 38.0, 42.0, 53.0, 66.0, 80.0, 95.0, 93.0, 89.0, 88.0, 59.0, 68.0, 32.0, 20.0, 32.0, 18.0, 15.0, 7.0, 8.0, 2.0, 5.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.98681640625, -7.7548828125, -7.52294921875, -7.291015625, -7.05908203125, -6.8271484375, -6.59521484375, -6.36328125, -6.13134765625, -5.8994140625, -5.66748046875, -5.435546875, -5.20361328125, -4.9716796875, -4.73974609375, -4.5078125, -4.27587890625, -4.0439453125, -3.81201171875, -3.580078125, -3.34814453125, -3.1162109375, -2.88427734375, -2.65234375, -2.42041015625, -2.1884765625, -1.95654296875, -1.724609375, -1.49267578125, -1.2607421875, -1.02880859375, -0.796875, -0.56494140625, -0.3330078125, -0.10107421875, 0.130859375, 0.36279296875, 0.5947265625, 0.82666015625, 1.05859375, 1.29052734375, 1.5224609375, 1.75439453125, 1.986328125, 2.21826171875, 2.4501953125, 2.68212890625, 2.9140625, 3.14599609375, 3.3779296875, 3.60986328125, 3.841796875, 4.07373046875, 4.3056640625, 4.53759765625, 4.76953125, 5.00146484375, 5.2333984375, 5.46533203125, 5.697265625, 5.92919921875, 6.1611328125, 6.39306640625, 6.625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 13.0, 22.0, 50.0, 94.0, 163.0, 178.0, 186.0, 139.0, 83.0, 40.0, 22.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-277.1130065917969, -271.21820068359375, -265.3233642578125, -259.4285583496094, -253.53372192382812, -247.638916015625, -241.7440948486328, -235.84927368164062, -229.95445251464844, -224.05963134765625, -218.16481018066406, -212.26998901367188, -206.37518310546875, -200.48036193847656, -194.58554077148438, -188.6907196044922, -182.7958984375, -176.9010772705078, -171.00625610351562, -165.11143493652344, -159.21661376953125, -153.32180786132812, -147.42698669433594, -141.53216552734375, -135.63734436035156, -129.74252319335938, -123.84770202636719, -117.95288848876953, -112.05806732177734, -106.16324615478516, -100.2684326171875, -94.37361145019531, -88.47879028320312, -82.58396911621094, -76.68914794921875, -70.7943344116211, -64.8995132446289, -59.00469207763672, -53.1098747253418, -47.215057373046875, -41.32023620605469, -35.4254150390625, -29.530597686767578, -23.635778427124023, -17.74095916748047, -11.846139907836914, -5.951320648193359, -0.0565032958984375, 5.83831787109375, 11.733137130737305, 17.62795639038086, 23.522775650024414, 29.41759490966797, 35.312416076660156, 41.20723342895508, 47.10205078125, 52.99687194824219, 58.891693115234375, 64.78651428222656, 70.68132781982422, 76.5761489868164, 82.4709701538086, 88.36578369140625, 94.26060485839844, 100.15542602539062]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 0.0, 6.0, 4.0, 3.0, 8.0, 15.0, 9.0, 19.0, 14.0, 17.0, 15.0, 30.0, 30.0, 42.0, 42.0, 43.0, 37.0, 47.0, 53.0, 55.0, 61.0, 61.0, 49.0, 41.0, 38.0, 45.0, 32.0, 28.0, 38.0, 25.0, 19.0, 23.0, 6.0, 13.0, 6.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-87.02273559570312, -84.3149185180664, -81.60710906982422, -78.8992919921875, -76.19147491455078, -73.48365783691406, -70.77584838867188, -68.06803131103516, -65.36021423339844, -62.652400970458984, -59.944583892822266, -57.23677062988281, -54.528953552246094, -51.82114028930664, -49.11332702636719, -46.40550994873047, -43.69770050048828, -40.98988723754883, -38.28207015991211, -35.574256896972656, -32.86643981933594, -30.158626556396484, -27.45081329345703, -24.742998123168945, -22.03518295288086, -19.327367782592773, -16.619552612304688, -13.911739349365234, -11.203924179077148, -8.496109008789062, -5.788295745849609, -3.0804805755615234, -0.3726654052734375, 2.3351492881774902, 5.042963981628418, 7.7507781982421875, 10.458593368530273, 13.16640853881836, 15.874221801757812, 18.5820369720459, 21.289852142333984, 23.99766731262207, 26.705482482910156, 29.41329574584961, 32.12110900878906, 34.82892608642578, 37.536739349365234, 40.24455261230469, 42.952369689941406, 45.66018295288086, 48.36800003051758, 51.07581329345703, 53.78363037109375, 56.4914436340332, 59.199256896972656, 61.907073974609375, 64.61488342285156, 67.32270050048828, 70.03050994873047, 72.73832702636719, 75.4461441040039, 78.15396118164062, 80.86177062988281, 83.56958770751953, 86.27740478515625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 12.0, 16.0, 16.0, 37.0, 81.0, 129.0, 275.0, 667.0, 1962.0, 8350.0, 133038.0, 4029866.0, 15189.0, 3018.0, 907.0, 361.0, 147.0, 76.0, 40.0, 34.0, 19.0, 11.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.4609375, -61.546875, -59.6328125, -57.71875, -55.8046875, -53.890625, -51.9765625, -50.0625, -48.1484375, -46.234375, -44.3203125, -42.40625, -40.4921875, -38.578125, -36.6640625, -34.75, -32.8359375, -30.921875, -29.0078125, -27.09375, -25.1796875, -23.265625, -21.3515625, -19.4375, -17.5234375, -15.609375, -13.6953125, -11.78125, -9.8671875, -7.953125, -6.0390625, -4.125, -2.2109375, -0.296875, 1.6171875, 3.53125, 5.4453125, 7.359375, 9.2734375, 11.1875, 13.1015625, 15.015625, 16.9296875, 18.84375, 20.7578125, 22.671875, 24.5859375, 26.5, 28.4140625, 30.328125, 32.2421875, 34.15625, 36.0703125, 37.984375, 39.8984375, 41.8125, 43.7265625, 45.640625, 47.5546875, 49.46875, 51.3828125, 53.296875, 55.2109375, 57.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 9.0, 20.0, 22.0, 31.0, 34.0, 52.0, 63.0, 55.0, 59.0, 68.0, 69.0, 78.0, 71.0, 66.0, 62.0, 53.0, 41.0, 40.0, 25.0, 18.0, 20.0, 13.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96484375, -3.791015625, -3.6171875, -3.443359375, -3.26953125, -3.095703125, -2.921875, -2.748046875, -2.57421875, -2.400390625, -2.2265625, -2.052734375, -1.87890625, -1.705078125, -1.53125, -1.357421875, -1.18359375, -1.009765625, -0.8359375, -0.662109375, -0.48828125, -0.314453125, -0.140625, 0.033203125, 0.20703125, 0.380859375, 0.5546875, 0.728515625, 0.90234375, 1.076171875, 1.25, 1.423828125, 1.59765625, 1.771484375, 1.9453125, 2.119140625, 2.29296875, 2.466796875, 2.640625, 2.814453125, 2.98828125, 3.162109375, 3.3359375, 3.509765625, 3.68359375, 3.857421875, 4.03125, 4.205078125, 4.37890625, 4.552734375, 4.7265625, 4.900390625, 5.07421875, 5.248046875, 5.421875, 5.595703125, 5.76953125, 5.943359375, 6.1171875, 6.291015625, 6.46484375, 6.638671875, 6.8125, 6.986328125, 7.16015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 20.0, 25.0, 33.0, 63.0, 132.0, 197.0, 384.0, 670.0, 1308.0, 2635.0, 6319.0, 21173.0, 144911.0, 3936707.0, 58273.0, 12800.0, 4502.0, 1951.0, 986.0, 502.0, 275.0, 176.0, 89.0, 56.0, 40.0, 22.0, 9.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -33.004150390625, -32.16455078125, -31.324951171875, -30.4853515625, -29.645751953125, -28.80615234375, -27.966552734375, -27.126953125, -26.287353515625, -25.44775390625, -24.608154296875, -23.7685546875, -22.928955078125, -22.08935546875, -21.249755859375, -20.41015625, -19.570556640625, -18.73095703125, -17.891357421875, -17.0517578125, -16.212158203125, -15.37255859375, -14.532958984375, -13.693359375, -12.853759765625, -12.01416015625, -11.174560546875, -10.3349609375, -9.495361328125, -8.65576171875, -7.816162109375, -6.9765625, -6.136962890625, -5.29736328125, -4.457763671875, -3.6181640625, -2.778564453125, -1.93896484375, -1.099365234375, -0.259765625, 0.579833984375, 1.41943359375, 2.259033203125, 3.0986328125, 3.938232421875, 4.77783203125, 5.617431640625, 6.45703125, 7.296630859375, 8.13623046875, 8.975830078125, 9.8154296875, 10.655029296875, 11.49462890625, 12.334228515625, 13.173828125, 14.013427734375, 14.85302734375, 15.692626953125, 16.5322265625, 17.371826171875, 18.21142578125, 19.051025390625, 19.890625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 14.0, 7.0, 22.0, 33.0, 34.0, 79.0, 167.0, 3099.0, 320.0, 110.0, 52.0, 36.0, 21.0, 20.0, 12.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.074310302734375, -3.95330810546875, -3.832305908203125, -3.7113037109375, -3.590301513671875, -3.46929931640625, -3.348297119140625, -3.227294921875, -3.106292724609375, -2.98529052734375, -2.864288330078125, -2.7432861328125, -2.622283935546875, -2.50128173828125, -2.380279541015625, -2.25927734375, -2.138275146484375, -2.01727294921875, -1.896270751953125, -1.7752685546875, -1.654266357421875, -1.53326416015625, -1.412261962890625, -1.291259765625, -1.170257568359375, -1.04925537109375, -0.928253173828125, -0.8072509765625, -0.686248779296875, -0.56524658203125, -0.444244384765625, -0.3232421875, -0.202239990234375, -0.08123779296875, 0.039764404296875, 0.1607666015625, 0.281768798828125, 0.40277099609375, 0.523773193359375, 0.644775390625, 0.765777587890625, 0.88677978515625, 1.007781982421875, 1.1287841796875, 1.249786376953125, 1.37078857421875, 1.491790771484375, 1.61279296875, 1.733795166015625, 1.85479736328125, 1.975799560546875, 2.0968017578125, 2.217803955078125, 2.33880615234375, 2.459808349609375, 2.580810546875, 2.701812744140625, 2.82281494140625, 2.943817138671875, 3.0648193359375, 3.185821533203125, 3.30682373046875, 3.427825927734375, 3.548828125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 10.0, 8.0, 12.0, 17.0, 33.0, 41.0, 62.0, 60.0, 76.0, 99.0, 91.0, 89.0, 96.0, 80.0, 67.0, 43.0, 37.0, 23.0, 11.0, 15.0, 9.0, 6.0, 6.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.29732894897461, -18.775888442993164, -18.25444793701172, -17.733007431030273, -17.211566925048828, -16.690128326416016, -16.16868782043457, -15.647247314453125, -15.12580680847168, -14.604366302490234, -14.082925796508789, -13.56148624420166, -13.040045738220215, -12.51860523223877, -11.99716567993164, -11.475725173950195, -10.95428466796875, -10.432844161987305, -9.91140365600586, -9.38996410369873, -8.868523597717285, -8.34708309173584, -7.825643062591553, -7.304203033447266, -6.78276252746582, -6.261322021484375, -5.739881992340088, -5.218441963195801, -4.6970014572143555, -4.17556095123291, -3.654120922088623, -3.132680654525757, -2.6112422943115234, -2.0898020267486572, -1.568361759185791, -1.0469214916229248, -0.5254812240600586, -0.004040956497192383, 0.5173993110656738, 1.03883957862854, 1.5602798461914062, 2.0817201137542725, 2.6031603813171387, 3.124600648880005, 3.646040916442871, 4.167481422424316, 4.6889214515686035, 5.210361480712891, 5.731801986694336, 6.253242492675781, 6.774682521820068, 7.2961225509643555, 7.817563056945801, 8.339003562927246, 8.860443115234375, 9.38188362121582, 9.903324127197266, 10.424764633178711, 10.946205139160156, 11.467644691467285, 11.98908519744873, 12.510525703430176, 13.031965255737305, 13.55340576171875, 14.074846267700195]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 4.0, 5.0, 12.0, 12.0, 13.0, 16.0, 16.0, 17.0, 27.0, 18.0, 32.0, 31.0, 44.0, 35.0, 41.0, 44.0, 45.0, 35.0, 44.0, 33.0, 48.0, 29.0, 36.0, 42.0, 29.0, 30.0, 35.0, 30.0, 24.0, 27.0, 25.0, 22.0, 14.0, 9.0, 14.0, 9.0, 11.0, 5.0, 6.0, 7.0, 3.0, 7.0, 1.0, 3.0, 7.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.998217582702637, -7.764782428741455, -7.531347274780273, -7.297912120819092, -7.06447696685791, -6.8310418128967285, -6.597606658935547, -6.364171504974365, -6.130736351013184, -5.897301197052002, -5.66386604309082, -5.430430889129639, -5.196995735168457, -4.963560581207275, -4.730125427246094, -4.496690273284912, -4.2632551193237305, -4.029819965362549, -3.796384811401367, -3.5629496574401855, -3.329514503479004, -3.0960793495178223, -2.8626441955566406, -2.629209041595459, -2.3957738876342773, -2.1623387336730957, -1.928903579711914, -1.6954684257507324, -1.4620332717895508, -1.2285981178283691, -0.9951629638671875, -0.7617278099060059, -0.5282926559448242, -0.2948575019836426, -0.06142234802246094, 0.1720128059387207, 0.40544795989990234, 0.638883113861084, 0.8723182678222656, 1.1057534217834473, 1.339188575744629, 1.5726237297058105, 1.8060588836669922, 2.039494037628174, 2.2729291915893555, 2.506364345550537, 2.7397994995117188, 2.9732346534729004, 3.206669807434082, 3.4401049613952637, 3.6735401153564453, 3.906975269317627, 4.140410423278809, 4.37384557723999, 4.607280731201172, 4.8407158851623535, 5.074151039123535, 5.307586193084717, 5.541021347045898, 5.77445650100708, 6.007891654968262, 6.241326808929443, 6.474761962890625, 6.708197116851807, 6.941632270812988]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 13.0, 33.0, 36.0, 68.0, 120.0, 245.0, 540.0, 1358.0, 4731.0, 22283.0, 121462.0, 574537.0, 265471.0, 45099.0, 8768.0, 2299.0, 779.0, 319.0, 159.0, 92.0, 39.0, 33.0, 26.0, 15.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.078125, -25.347900390625, -24.61767578125, -23.887451171875, -23.1572265625, -22.427001953125, -21.69677734375, -20.966552734375, -20.236328125, -19.506103515625, -18.77587890625, -18.045654296875, -17.3154296875, -16.585205078125, -15.85498046875, -15.124755859375, -14.39453125, -13.664306640625, -12.93408203125, -12.203857421875, -11.4736328125, -10.743408203125, -10.01318359375, -9.282958984375, -8.552734375, -7.822509765625, -7.09228515625, -6.362060546875, -5.6318359375, -4.901611328125, -4.17138671875, -3.441162109375, -2.7109375, -1.980712890625, -1.25048828125, -0.520263671875, 0.2099609375, 0.940185546875, 1.67041015625, 2.400634765625, 3.130859375, 3.861083984375, 4.59130859375, 5.321533203125, 6.0517578125, 6.781982421875, 7.51220703125, 8.242431640625, 8.97265625, 9.702880859375, 10.43310546875, 11.163330078125, 11.8935546875, 12.623779296875, 13.35400390625, 14.084228515625, 14.814453125, 15.544677734375, 16.27490234375, 17.005126953125, 17.7353515625, 18.465576171875, 19.19580078125, 19.926025390625, 20.65625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 3.0, 1.0, 4.0, 8.0, 16.0, 15.0, 20.0, 20.0, 28.0, 35.0, 48.0, 49.0, 47.0, 69.0, 52.0, 74.0, 75.0, 78.0, 55.0, 48.0, 53.0, 42.0, 45.0, 26.0, 23.0, 24.0, 18.0, 6.0, 6.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.8719482421875, -3.697021484375, -3.5220947265625, -3.34716796875, -3.1722412109375, -2.997314453125, -2.8223876953125, -2.6474609375, -2.4725341796875, -2.297607421875, -2.1226806640625, -1.94775390625, -1.7728271484375, -1.597900390625, -1.4229736328125, -1.248046875, -1.0731201171875, -0.898193359375, -0.7232666015625, -0.54833984375, -0.3734130859375, -0.198486328125, -0.0235595703125, 0.1513671875, 0.3262939453125, 0.501220703125, 0.6761474609375, 0.85107421875, 1.0260009765625, 1.200927734375, 1.3758544921875, 1.55078125, 1.7257080078125, 1.900634765625, 2.0755615234375, 2.25048828125, 2.4254150390625, 2.600341796875, 2.7752685546875, 2.9501953125, 3.1251220703125, 3.300048828125, 3.4749755859375, 3.64990234375, 3.8248291015625, 3.999755859375, 4.1746826171875, 4.349609375, 4.5245361328125, 4.699462890625, 4.8743896484375, 5.04931640625, 5.2242431640625, 5.399169921875, 5.5740966796875, 5.7490234375, 5.9239501953125, 6.098876953125, 6.2738037109375, 6.44873046875, 6.6236572265625, 6.798583984375, 6.9735107421875, 7.1484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 15.0, 12.0, 16.0, 27.0, 38.0, 40.0, 67.0, 77.0, 126.0, 131.0, 199.0, 268.0, 433.0, 517.0, 883.0, 1542.0, 3660.0, 12252.0, 50825.0, 278105.0, 557140.0, 106926.0, 23340.0, 6212.0, 2208.0, 1081.0, 679.0, 486.0, 349.0, 233.0, 181.0, 138.0, 92.0, 66.0, 55.0, 41.0, 28.0, 16.0, 8.0, 13.0, 6.0, 7.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.546875, -16.01708984375, -15.4873046875, -14.95751953125, -14.427734375, -13.89794921875, -13.3681640625, -12.83837890625, -12.30859375, -11.77880859375, -11.2490234375, -10.71923828125, -10.189453125, -9.65966796875, -9.1298828125, -8.60009765625, -8.0703125, -7.54052734375, -7.0107421875, -6.48095703125, -5.951171875, -5.42138671875, -4.8916015625, -4.36181640625, -3.83203125, -3.30224609375, -2.7724609375, -2.24267578125, -1.712890625, -1.18310546875, -0.6533203125, -0.12353515625, 0.40625, 0.93603515625, 1.4658203125, 1.99560546875, 2.525390625, 3.05517578125, 3.5849609375, 4.11474609375, 4.64453125, 5.17431640625, 5.7041015625, 6.23388671875, 6.763671875, 7.29345703125, 7.8232421875, 8.35302734375, 8.8828125, 9.41259765625, 9.9423828125, 10.47216796875, 11.001953125, 11.53173828125, 12.0615234375, 12.59130859375, 13.12109375, 13.65087890625, 14.1806640625, 14.71044921875, 15.240234375, 15.77001953125, 16.2998046875, 16.82958984375, 17.359375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 5.0, 9.0, 4.0, 8.0, 18.0, 17.0, 21.0, 30.0, 27.0, 34.0, 38.0, 36.0, 44.0, 55.0, 44.0, 51.0, 56.0, 50.0, 58.0, 47.0, 50.0, 59.0, 39.0, 32.0, 33.0, 24.0, 20.0, 26.0, 16.0, 9.0, 11.0, 8.0, 5.0, 3.0, 3.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.171875, -20.55078125, -19.9296875, -19.30859375, -18.6875, -18.06640625, -17.4453125, -16.82421875, -16.203125, -15.58203125, -14.9609375, -14.33984375, -13.71875, -13.09765625, -12.4765625, -11.85546875, -11.234375, -10.61328125, -9.9921875, -9.37109375, -8.75, -8.12890625, -7.5078125, -6.88671875, -6.265625, -5.64453125, -5.0234375, -4.40234375, -3.78125, -3.16015625, -2.5390625, -1.91796875, -1.296875, -0.67578125, -0.0546875, 0.56640625, 1.1875, 1.80859375, 2.4296875, 3.05078125, 3.671875, 4.29296875, 4.9140625, 5.53515625, 6.15625, 6.77734375, 7.3984375, 8.01953125, 8.640625, 9.26171875, 9.8828125, 10.50390625, 11.125, 11.74609375, 12.3671875, 12.98828125, 13.609375, 14.23046875, 14.8515625, 15.47265625, 16.09375, 16.71484375, 17.3359375, 17.95703125, 18.578125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 3.0, 3.0, 6.0, 12.0, 16.0, 34.0, 40.0, 74.0, 107.0, 152.0, 228.0, 459.0, 854.0, 1898.0, 4350.0, 12983.0, 49121.0, 253997.0, 560317.0, 123151.0, 26998.0, 7969.0, 2928.0, 1268.0, 677.0, 339.0, 218.0, 123.0, 87.0, 45.0, 36.0, 20.0, 11.0, 7.0, 12.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.41015625, -7.15716552734375, -6.9041748046875, -6.65118408203125, -6.398193359375, -6.14520263671875, -5.8922119140625, -5.63922119140625, -5.38623046875, -5.13323974609375, -4.8802490234375, -4.62725830078125, -4.374267578125, -4.12127685546875, -3.8682861328125, -3.61529541015625, -3.3623046875, -3.10931396484375, -2.8563232421875, -2.60333251953125, -2.350341796875, -2.09735107421875, -1.8443603515625, -1.59136962890625, -1.33837890625, -1.08538818359375, -0.8323974609375, -0.57940673828125, -0.326416015625, -0.07342529296875, 0.1795654296875, 0.43255615234375, 0.685546875, 0.93853759765625, 1.1915283203125, 1.44451904296875, 1.697509765625, 1.95050048828125, 2.2034912109375, 2.45648193359375, 2.70947265625, 2.96246337890625, 3.2154541015625, 3.46844482421875, 3.721435546875, 3.97442626953125, 4.2274169921875, 4.48040771484375, 4.7333984375, 4.98638916015625, 5.2393798828125, 5.49237060546875, 5.745361328125, 5.99835205078125, 6.2513427734375, 6.50433349609375, 6.75732421875, 7.01031494140625, 7.2633056640625, 7.51629638671875, 7.769287109375, 8.02227783203125, 8.2752685546875, 8.52825927734375, 8.78125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 2.0, 8.0, 5.0, 12.0, 14.0, 21.0, 13.0, 37.0, 34.0, 42.0, 58.0, 65.0, 73.0, 83.0, 81.0, 75.0, 82.0, 80.0, 48.0, 34.0, 27.0, 20.0, 17.0, 13.0, 7.0, 12.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0013275146484375, -0.0012937411665916443, -0.0012599676847457886, -0.0012261942028999329, -0.0011924207210540771, -0.0011586472392082214, -0.0011248737573623657, -0.00109110027551651, -0.0010573267936706543, -0.0010235533118247986, -0.0009897798299789429, -0.0009560063481330872, -0.0009222328662872314, -0.0008884593844413757, -0.00085468590259552, -0.0008209124207496643, -0.0007871389389038086, -0.0007533654570579529, -0.0007195919752120972, -0.0006858184933662415, -0.0006520450115203857, -0.00061827152967453, -0.0005844980478286743, -0.0005507245659828186, -0.0005169510841369629, -0.0004831776022911072, -0.00044940412044525146, -0.00041563063859939575, -0.00038185715675354004, -0.0003480836749076843, -0.0003143101930618286, -0.0002805367112159729, -0.0002467632293701172, -0.00021298974752426147, -0.00017921626567840576, -0.00014544278383255005, -0.00011166930198669434, -7.789582014083862e-05, -4.412233829498291e-05, -1.0348856449127197e-05, 2.3424625396728516e-05, 5.719810724258423e-05, 9.097158908843994e-05, 0.00012474507093429565, 0.00015851855278015137, 0.00019229203462600708, 0.0002260655164718628, 0.0002598389983177185, 0.0002936124801635742, 0.00032738596200942993, 0.00036115944385528564, 0.00039493292570114136, 0.00042870640754699707, 0.0004624798893928528, 0.0004962533712387085, 0.0005300268530845642, 0.0005638003349304199, 0.0005975738167762756, 0.0006313472986221313, 0.0006651207804679871, 0.0006988942623138428, 0.0007326677441596985, 0.0007664412260055542, 0.0008002147078514099, 0.0008339881896972656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 8.0, 13.0, 6.0, 17.0, 34.0, 54.0, 96.0, 142.0, 338.0, 696.0, 1820.0, 6689.0, 41693.0, 575256.0, 384428.0, 29143.0, 5301.0, 1583.0, 634.0, 271.0, 151.0, 67.0, 43.0, 28.0, 12.0, 10.0, 5.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8828125, -11.4571533203125, -11.031494140625, -10.6058349609375, -10.18017578125, -9.7545166015625, -9.328857421875, -8.9031982421875, -8.4775390625, -8.0518798828125, -7.626220703125, -7.2005615234375, -6.77490234375, -6.3492431640625, -5.923583984375, -5.4979248046875, -5.072265625, -4.6466064453125, -4.220947265625, -3.7952880859375, -3.36962890625, -2.9439697265625, -2.518310546875, -2.0926513671875, -1.6669921875, -1.2413330078125, -0.815673828125, -0.3900146484375, 0.03564453125, 0.4613037109375, 0.886962890625, 1.3126220703125, 1.73828125, 2.1639404296875, 2.589599609375, 3.0152587890625, 3.44091796875, 3.8665771484375, 4.292236328125, 4.7178955078125, 5.1435546875, 5.5692138671875, 5.994873046875, 6.4205322265625, 6.84619140625, 7.2718505859375, 7.697509765625, 8.1231689453125, 8.548828125, 8.9744873046875, 9.400146484375, 9.8258056640625, 10.25146484375, 10.6771240234375, 11.102783203125, 11.5284423828125, 11.9541015625, 12.3797607421875, 12.805419921875, 13.2310791015625, 13.65673828125, 14.0823974609375, 14.508056640625, 14.9337158203125, 15.359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 13.0, 18.0, 25.0, 27.0, 39.0, 64.0, 92.0, 109.0, 114.0, 129.0, 95.0, 71.0, 61.0, 43.0, 28.0, 12.0, 18.0, 10.0, 6.0, 3.0, 7.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.15435791015625, -5.8438720703125, -5.53338623046875, -5.222900390625, -4.91241455078125, -4.6019287109375, -4.29144287109375, -3.98095703125, -3.67047119140625, -3.3599853515625, -3.04949951171875, -2.739013671875, -2.42852783203125, -2.1180419921875, -1.80755615234375, -1.4970703125, -1.18658447265625, -0.8760986328125, -0.56561279296875, -0.255126953125, 0.05535888671875, 0.3658447265625, 0.67633056640625, 0.98681640625, 1.29730224609375, 1.6077880859375, 1.91827392578125, 2.228759765625, 2.53924560546875, 2.8497314453125, 3.16021728515625, 3.470703125, 3.78118896484375, 4.0916748046875, 4.40216064453125, 4.712646484375, 5.02313232421875, 5.3336181640625, 5.64410400390625, 5.95458984375, 6.26507568359375, 6.5755615234375, 6.88604736328125, 7.196533203125, 7.50701904296875, 7.8175048828125, 8.12799072265625, 8.4384765625, 8.74896240234375, 9.0594482421875, 9.36993408203125, 9.680419921875, 9.99090576171875, 10.3013916015625, 10.61187744140625, 10.92236328125, 11.23284912109375, 11.5433349609375, 11.85382080078125, 12.164306640625, 12.47479248046875, 12.7852783203125, 13.09576416015625, 13.40625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 12.0, 21.0, 43.0, 64.0, 121.0, 144.0, 165.0, 170.0, 109.0, 66.0, 44.0, 19.0, 15.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-171.34573364257812, -166.12405395507812, -160.90235900878906, -155.68067932128906, -150.45899963378906, -145.2373046875, -140.015625, -134.7939453125, -129.57225036621094, -124.3505630493164, -119.1288833618164, -113.90719604492188, -108.68550872802734, -103.46382141113281, -98.24214172363281, -93.02045440673828, -87.79877471923828, -82.57708740234375, -77.35540771484375, -72.13372039794922, -66.91203308105469, -61.69034957885742, -56.468666076660156, -51.246978759765625, -46.02529525756836, -40.803611755371094, -35.58192443847656, -30.360240936279297, -25.1385555267334, -19.9168701171875, -14.695186614990234, -9.473499298095703, -4.2518157958984375, 0.9698691368103027, 6.191554069519043, 11.413238525390625, 16.634923934936523, 21.856609344482422, 27.078292846679688, 32.29998016357422, 37.521663665771484, 42.74334716796875, 47.96503448486328, 53.18671798706055, 58.40840148925781, 63.630088806152344, 68.85177612304688, 74.07345581054688, 79.2951431274414, 84.51683044433594, 89.73851013183594, 94.96019744873047, 100.181884765625, 105.403564453125, 110.62525177001953, 115.84693908691406, 121.06861877441406, 126.2903060913086, 131.51199340820312, 136.73367309570312, 141.95535278320312, 147.1770477294922, 152.3987274169922, 157.62042236328125, 162.84210205078125]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 5.0, 9.0, 9.0, 11.0, 9.0, 9.0, 15.0, 17.0, 16.0, 21.0, 26.0, 33.0, 36.0, 33.0, 38.0, 42.0, 34.0, 40.0, 50.0, 52.0, 49.0, 64.0, 42.0, 41.0, 43.0, 28.0, 46.0, 21.0, 25.0, 19.0, 16.0, 19.0, 12.0, 13.0, 10.0, 6.0, 5.0, 11.0, 3.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.07047271728516, -75.499755859375, -72.92903137207031, -70.35831451416016, -67.78759765625, -65.21687316894531, -62.646156311035156, -60.075435638427734, -57.50471496582031, -54.93399429321289, -52.36327362060547, -49.79255676269531, -47.22183609008789, -44.65111541748047, -42.08039855957031, -39.50967788696289, -36.93895721435547, -34.36823654174805, -31.797517776489258, -29.22679901123047, -26.656078338623047, -24.085357666015625, -21.514638900756836, -18.943920135498047, -16.373199462890625, -13.80247974395752, -11.231760025024414, -8.661040306091309, -6.090320587158203, -3.5196008682250977, -0.9488811492919922, 1.6218376159667969, 4.1925506591796875, 6.763270378112793, 9.333990097045898, 11.904709815979004, 14.47542953491211, 17.04615020751953, 19.61686897277832, 22.18758773803711, 24.75830841064453, 27.329029083251953, 29.899747848510742, 32.47046661376953, 35.04118728637695, 37.611907958984375, 40.18262481689453, 42.75334548950195, 45.324066162109375, 47.8947868347168, 50.46550750732422, 53.036224365234375, 55.6069450378418, 58.17766571044922, 60.748382568359375, 63.3191032409668, 65.88982391357422, 68.46054077148438, 71.03126525878906, 73.60198211669922, 76.17269897460938, 78.74342346191406, 81.31414031982422, 83.88485717773438, 86.45558166503906]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 8.0, 5.0, 9.0, 10.0, 20.0, 25.0, 54.0, 73.0, 153.0, 293.0, 679.0, 1806.0, 5839.0, 31804.0, 4001709.0, 133753.0, 12762.0, 3138.0, 1168.0, 471.0, 217.0, 112.0, 67.0, 30.0, 23.0, 14.0, 13.0, 9.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -32.77685546875, -31.3974609375, -30.01806640625, -28.638671875, -27.25927734375, -25.8798828125, -24.50048828125, -23.12109375, -21.74169921875, -20.3623046875, -18.98291015625, -17.603515625, -16.22412109375, -14.8447265625, -13.46533203125, -12.0859375, -10.70654296875, -9.3271484375, -7.94775390625, -6.568359375, -5.18896484375, -3.8095703125, -2.43017578125, -1.05078125, 0.32861328125, 1.7080078125, 3.08740234375, 4.466796875, 5.84619140625, 7.2255859375, 8.60498046875, 9.984375, 11.36376953125, 12.7431640625, 14.12255859375, 15.501953125, 16.88134765625, 18.2607421875, 19.64013671875, 21.01953125, 22.39892578125, 23.7783203125, 25.15771484375, 26.537109375, 27.91650390625, 29.2958984375, 30.67529296875, 32.0546875, 33.43408203125, 34.8134765625, 36.19287109375, 37.572265625, 38.95166015625, 40.3310546875, 41.71044921875, 43.08984375, 44.46923828125, 45.8486328125, 47.22802734375, 48.607421875, 49.98681640625, 51.3662109375, 52.74560546875, 54.125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 14.0, 18.0, 21.0, 26.0, 25.0, 50.0, 51.0, 41.0, 61.0, 54.0, 74.0, 90.0, 64.0, 65.0, 68.0, 40.0, 55.0, 42.0, 28.0, 29.0, 20.0, 18.0, 12.0, 12.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.807342529296875, -3.63226318359375, -3.457183837890625, -3.2821044921875, -3.107025146484375, -2.93194580078125, -2.756866455078125, -2.581787109375, -2.406707763671875, -2.23162841796875, -2.056549072265625, -1.8814697265625, -1.706390380859375, -1.53131103515625, -1.356231689453125, -1.18115234375, -1.006072998046875, -0.83099365234375, -0.655914306640625, -0.4808349609375, -0.305755615234375, -0.13067626953125, 0.044403076171875, 0.219482421875, 0.394561767578125, 0.56964111328125, 0.744720458984375, 0.9197998046875, 1.094879150390625, 1.26995849609375, 1.445037841796875, 1.6201171875, 1.795196533203125, 1.97027587890625, 2.145355224609375, 2.3204345703125, 2.495513916015625, 2.67059326171875, 2.845672607421875, 3.020751953125, 3.195831298828125, 3.37091064453125, 3.545989990234375, 3.7210693359375, 3.896148681640625, 4.07122802734375, 4.246307373046875, 4.42138671875, 4.596466064453125, 4.77154541015625, 4.946624755859375, 5.1217041015625, 5.296783447265625, 5.47186279296875, 5.646942138671875, 5.822021484375, 5.997100830078125, 6.17218017578125, 6.347259521484375, 6.5223388671875, 6.697418212890625, 6.87249755859375, 7.047576904296875, 7.22265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 10.0, 17.0, 16.0, 35.0, 47.0, 88.0, 99.0, 177.0, 248.0, 376.0, 615.0, 921.0, 1478.0, 2427.0, 4201.0, 7355.0, 14419.0, 31117.0, 84851.0, 2928091.0, 972600.0, 82682.0, 30531.0, 14092.0, 7220.0, 4162.0, 2380.0, 1423.0, 888.0, 577.0, 390.0, 252.0, 166.0, 109.0, 71.0, 46.0, 39.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.578125, -11.1920166015625, -10.805908203125, -10.4197998046875, -10.03369140625, -9.6475830078125, -9.261474609375, -8.8753662109375, -8.4892578125, -8.1031494140625, -7.717041015625, -7.3309326171875, -6.94482421875, -6.5587158203125, -6.172607421875, -5.7864990234375, -5.400390625, -5.0142822265625, -4.628173828125, -4.2420654296875, -3.85595703125, -3.4698486328125, -3.083740234375, -2.6976318359375, -2.3115234375, -1.9254150390625, -1.539306640625, -1.1531982421875, -0.76708984375, -0.3809814453125, 0.005126953125, 0.3912353515625, 0.77734375, 1.1634521484375, 1.549560546875, 1.9356689453125, 2.32177734375, 2.7078857421875, 3.093994140625, 3.4801025390625, 3.8662109375, 4.2523193359375, 4.638427734375, 5.0245361328125, 5.41064453125, 5.7967529296875, 6.182861328125, 6.5689697265625, 6.955078125, 7.3411865234375, 7.727294921875, 8.1134033203125, 8.49951171875, 8.8856201171875, 9.271728515625, 9.6578369140625, 10.0439453125, 10.4300537109375, 10.816162109375, 11.2022705078125, 11.58837890625, 11.9744873046875, 12.360595703125, 12.7467041015625, 13.1328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 9.0, 7.0, 11.0, 7.0, 20.0, 19.0, 30.0, 56.0, 49.0, 85.0, 184.0, 2544.0, 622.0, 162.0, 69.0, 45.0, 29.0, 21.0, 24.0, 11.0, 16.0, 12.0, 10.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78125, -3.672943115234375, -3.56463623046875, -3.456329345703125, -3.3480224609375, -3.239715576171875, -3.13140869140625, -3.023101806640625, -2.914794921875, -2.806488037109375, -2.69818115234375, -2.589874267578125, -2.4815673828125, -2.373260498046875, -2.26495361328125, -2.156646728515625, -2.04833984375, -1.940032958984375, -1.83172607421875, -1.723419189453125, -1.6151123046875, -1.506805419921875, -1.39849853515625, -1.290191650390625, -1.181884765625, -1.073577880859375, -0.96527099609375, -0.856964111328125, -0.7486572265625, -0.640350341796875, -0.53204345703125, -0.423736572265625, -0.3154296875, -0.207122802734375, -0.09881591796875, 0.009490966796875, 0.1177978515625, 0.226104736328125, 0.33441162109375, 0.442718505859375, 0.551025390625, 0.659332275390625, 0.76763916015625, 0.875946044921875, 0.9842529296875, 1.092559814453125, 1.20086669921875, 1.309173583984375, 1.41748046875, 1.525787353515625, 1.63409423828125, 1.742401123046875, 1.8507080078125, 1.959014892578125, 2.06732177734375, 2.175628662109375, 2.283935546875, 2.392242431640625, 2.50054931640625, 2.608856201171875, 2.7171630859375, 2.825469970703125, 2.93377685546875, 3.042083740234375, 3.150390625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 14.0, 9.0, 22.0, 37.0, 42.0, 52.0, 64.0, 80.0, 92.0, 81.0, 96.0, 83.0, 74.0, 64.0, 63.0, 41.0, 28.0, 24.0, 14.0, 12.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78056526184082, -21.241167068481445, -20.701766967773438, -20.162368774414062, -19.622970581054688, -19.08357048034668, -18.544172286987305, -18.004772186279297, -17.465373992919922, -16.925975799560547, -16.38657569885254, -15.847177505493164, -15.307778358459473, -14.768379211425781, -14.228981018066406, -13.689581871032715, -13.150182723999023, -12.610783576965332, -12.07138442993164, -11.531986236572266, -10.992587089538574, -10.453187942504883, -9.913789749145508, -9.374390602111816, -8.834991455078125, -8.295592308044434, -7.7561936378479, -7.216794967651367, -6.677395820617676, -6.137996673583984, -5.598598003387451, -5.059199333190918, -4.519800186157227, -3.9804012775421143, -3.441002368927002, -2.9016034603118896, -2.3622045516967773, -1.822805643081665, -1.2834067344665527, -0.7440078258514404, -0.20460891723632812, 0.3347899913787842, 0.8741888999938965, 1.4135878086090088, 1.952986717224121, 2.4923856258392334, 3.0317845344543457, 3.571183443069458, 4.11058235168457, 4.649981498718262, 5.189380168914795, 5.728778839111328, 6.2681779861450195, 6.807577133178711, 7.346975803375244, 7.886374473571777, 8.425773620605469, 8.96517276763916, 9.504571914672852, 10.043970108032227, 10.583369255065918, 11.12276840209961, 11.662166595458984, 12.201565742492676, 12.740964889526367]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 6.0, 7.0, 9.0, 19.0, 23.0, 13.0, 14.0, 21.0, 19.0, 22.0, 32.0, 37.0, 29.0, 32.0, 41.0, 36.0, 46.0, 47.0, 45.0, 28.0, 47.0, 39.0, 35.0, 30.0, 33.0, 32.0, 23.0, 24.0, 27.0, 27.0, 26.0, 16.0, 12.0, 16.0, 8.0, 8.0, 10.0, 13.0, 4.0, 5.0, 5.0, 7.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.702902793884277, -8.4434814453125, -8.184060096740723, -7.924638748168945, -7.665217399597168, -7.405796051025391, -7.146374702453613, -6.886953353881836, -6.627532005310059, -6.368110656738281, -6.108689308166504, -5.849267959594727, -5.589846611022949, -5.330425262451172, -5.0710039138793945, -4.811582565307617, -4.552161693572998, -4.292740345001221, -4.033318996429443, -3.773897647857666, -3.5144762992858887, -3.2550549507141113, -2.995633840560913, -2.7362124919891357, -2.4767911434173584, -2.217369794845581, -1.9579484462738037, -1.698527216911316, -1.4391058683395386, -1.1796845197677612, -0.9202632904052734, -0.6608419418334961, -0.40142059326171875, -0.1419992744922638, 0.11742204427719116, 0.37684333324432373, 0.6362646818161011, 0.8956860303878784, 1.1551072597503662, 1.4145286083221436, 1.673949956893921, 1.9333713054656982, 2.1927926540374756, 2.452213764190674, 2.711635112762451, 2.9710564613342285, 3.230477809906006, 3.489899158477783, 3.7493205070495605, 4.008741855621338, 4.268163204193115, 4.527584552764893, 4.78700590133667, 5.046427249908447, 5.305848121643066, 5.565269470214844, 5.824690818786621, 6.084112167358398, 6.343533515930176, 6.602954864501953, 6.8623762130737305, 7.121797561645508, 7.381218910217285, 7.6406402587890625, 7.90006160736084]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 20.0, 25.0, 48.0, 70.0, 144.0, 271.0, 638.0, 1778.0, 5685.0, 23299.0, 128421.0, 511452.0, 304329.0, 55752.0, 11521.0, 3083.0, 1077.0, 437.0, 209.0, 141.0, 57.0, 29.0, 22.0, 18.0, 5.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.984375, -20.4429931640625, -19.901611328125, -19.3602294921875, -18.81884765625, -18.2774658203125, -17.736083984375, -17.1947021484375, -16.6533203125, -16.1119384765625, -15.570556640625, -15.0291748046875, -14.48779296875, -13.9464111328125, -13.405029296875, -12.8636474609375, -12.322265625, -11.7808837890625, -11.239501953125, -10.6981201171875, -10.15673828125, -9.6153564453125, -9.073974609375, -8.5325927734375, -7.9912109375, -7.4498291015625, -6.908447265625, -6.3670654296875, -5.82568359375, -5.2843017578125, -4.742919921875, -4.2015380859375, -3.66015625, -3.1187744140625, -2.577392578125, -2.0360107421875, -1.49462890625, -0.9532470703125, -0.411865234375, 0.1295166015625, 0.6708984375, 1.2122802734375, 1.753662109375, 2.2950439453125, 2.83642578125, 3.3778076171875, 3.919189453125, 4.4605712890625, 5.001953125, 5.5433349609375, 6.084716796875, 6.6260986328125, 7.16748046875, 7.7088623046875, 8.250244140625, 8.7916259765625, 9.3330078125, 9.8743896484375, 10.415771484375, 10.9571533203125, 11.49853515625, 12.0399169921875, 12.581298828125, 13.1226806640625, 13.6640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 18.0, 21.0, 23.0, 39.0, 39.0, 43.0, 47.0, 52.0, 57.0, 70.0, 74.0, 72.0, 57.0, 66.0, 50.0, 51.0, 38.0, 29.0, 25.0, 31.0, 14.0, 15.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.84356689453125, -3.6676025390625, -3.49163818359375, -3.315673828125, -3.13970947265625, -2.9637451171875, -2.78778076171875, -2.61181640625, -2.43585205078125, -2.2598876953125, -2.08392333984375, -1.907958984375, -1.73199462890625, -1.5560302734375, -1.38006591796875, -1.2041015625, -1.02813720703125, -0.8521728515625, -0.67620849609375, -0.500244140625, -0.32427978515625, -0.1483154296875, 0.02764892578125, 0.20361328125, 0.37957763671875, 0.5555419921875, 0.73150634765625, 0.907470703125, 1.08343505859375, 1.2593994140625, 1.43536376953125, 1.611328125, 1.78729248046875, 1.9632568359375, 2.13922119140625, 2.315185546875, 2.49114990234375, 2.6671142578125, 2.84307861328125, 3.01904296875, 3.19500732421875, 3.3709716796875, 3.54693603515625, 3.722900390625, 3.89886474609375, 4.0748291015625, 4.25079345703125, 4.4267578125, 4.60272216796875, 4.7786865234375, 4.95465087890625, 5.130615234375, 5.30657958984375, 5.4825439453125, 5.65850830078125, 5.83447265625, 6.01043701171875, 6.1864013671875, 6.36236572265625, 6.538330078125, 6.71429443359375, 6.8902587890625, 7.06622314453125, 7.2421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 10.0, 10.0, 19.0, 42.0, 59.0, 129.0, 223.0, 364.0, 650.0, 1356.0, 4078.0, 38437.0, 773800.0, 214567.0, 10527.0, 2160.0, 948.0, 516.0, 290.0, 163.0, 84.0, 53.0, 34.0, 19.0, 7.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.77099609375, -20.8544921875, -19.93798828125, -19.021484375, -18.10498046875, -17.1884765625, -16.27197265625, -15.35546875, -14.43896484375, -13.5224609375, -12.60595703125, -11.689453125, -10.77294921875, -9.8564453125, -8.93994140625, -8.0234375, -7.10693359375, -6.1904296875, -5.27392578125, -4.357421875, -3.44091796875, -2.5244140625, -1.60791015625, -0.69140625, 0.22509765625, 1.1416015625, 2.05810546875, 2.974609375, 3.89111328125, 4.8076171875, 5.72412109375, 6.640625, 7.55712890625, 8.4736328125, 9.39013671875, 10.306640625, 11.22314453125, 12.1396484375, 13.05615234375, 13.97265625, 14.88916015625, 15.8056640625, 16.72216796875, 17.638671875, 18.55517578125, 19.4716796875, 20.38818359375, 21.3046875, 22.22119140625, 23.1376953125, 24.05419921875, 24.970703125, 25.88720703125, 26.8037109375, 27.72021484375, 28.63671875, 29.55322265625, 30.4697265625, 31.38623046875, 32.302734375, 33.21923828125, 34.1357421875, 35.05224609375, 35.96875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 3.0, 7.0, 4.0, 7.0, 8.0, 17.0, 11.0, 15.0, 22.0, 22.0, 22.0, 37.0, 31.0, 32.0, 56.0, 29.0, 42.0, 43.0, 35.0, 45.0, 45.0, 30.0, 46.0, 56.0, 40.0, 40.0, 33.0, 31.0, 30.0, 27.0, 28.0, 16.0, 17.0, 14.0, 9.0, 11.0, 5.0, 8.0, 9.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.234375, -16.7138671875, -16.193359375, -15.6728515625, -15.15234375, -14.6318359375, -14.111328125, -13.5908203125, -13.0703125, -12.5498046875, -12.029296875, -11.5087890625, -10.98828125, -10.4677734375, -9.947265625, -9.4267578125, -8.90625, -8.3857421875, -7.865234375, -7.3447265625, -6.82421875, -6.3037109375, -5.783203125, -5.2626953125, -4.7421875, -4.2216796875, -3.701171875, -3.1806640625, -2.66015625, -2.1396484375, -1.619140625, -1.0986328125, -0.578125, -0.0576171875, 0.462890625, 0.9833984375, 1.50390625, 2.0244140625, 2.544921875, 3.0654296875, 3.5859375, 4.1064453125, 4.626953125, 5.1474609375, 5.66796875, 6.1884765625, 6.708984375, 7.2294921875, 7.75, 8.2705078125, 8.791015625, 9.3115234375, 9.83203125, 10.3525390625, 10.873046875, 11.3935546875, 11.9140625, 12.4345703125, 12.955078125, 13.4755859375, 13.99609375, 14.5166015625, 15.037109375, 15.5576171875, 16.078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 11.0, 12.0, 17.0, 16.0, 21.0, 27.0, 33.0, 58.0, 85.0, 144.0, 235.0, 423.0, 870.0, 2120.0, 6913.0, 31118.0, 261956.0, 650603.0, 74148.0, 13251.0, 3680.0, 1295.0, 605.0, 313.0, 174.0, 114.0, 83.0, 57.0, 41.0, 24.0, 20.0, 16.0, 14.0, 9.0, 8.0, 7.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.4921875, -9.20654296875, -8.9208984375, -8.63525390625, -8.349609375, -8.06396484375, -7.7783203125, -7.49267578125, -7.20703125, -6.92138671875, -6.6357421875, -6.35009765625, -6.064453125, -5.77880859375, -5.4931640625, -5.20751953125, -4.921875, -4.63623046875, -4.3505859375, -4.06494140625, -3.779296875, -3.49365234375, -3.2080078125, -2.92236328125, -2.63671875, -2.35107421875, -2.0654296875, -1.77978515625, -1.494140625, -1.20849609375, -0.9228515625, -0.63720703125, -0.3515625, -0.06591796875, 0.2197265625, 0.50537109375, 0.791015625, 1.07666015625, 1.3623046875, 1.64794921875, 1.93359375, 2.21923828125, 2.5048828125, 2.79052734375, 3.076171875, 3.36181640625, 3.6474609375, 3.93310546875, 4.21875, 4.50439453125, 4.7900390625, 5.07568359375, 5.361328125, 5.64697265625, 5.9326171875, 6.21826171875, 6.50390625, 6.78955078125, 7.0751953125, 7.36083984375, 7.646484375, 7.93212890625, 8.2177734375, 8.50341796875, 8.7890625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 9.0, 12.0, 19.0, 30.0, 51.0, 83.0, 117.0, 168.0, 172.0, 127.0, 76.0, 39.0, 26.0, 16.0, 8.0, 11.0, 9.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001140594482421875, -0.001079946756362915, -0.001019299030303955, -0.0009586513042449951, -0.0008980035781860352, -0.0008373558521270752, -0.0007767081260681152, -0.0007160604000091553, -0.0006554126739501953, -0.0005947649478912354, -0.0005341172218322754, -0.00047346949577331543, -0.00041282176971435547, -0.0003521740436553955, -0.00029152631759643555, -0.00023087859153747559, -0.00017023086547851562, -0.00010958313941955566, -4.89354133605957e-05, 1.1712312698364258e-05, 7.236003875732422e-05, 0.00013300776481628418, 0.00019365549087524414, 0.0002543032169342041, 0.00031495094299316406, 0.000375598669052124, 0.000436246395111084, 0.0004968941211700439, 0.0005575418472290039, 0.0006181895732879639, 0.0006788372993469238, 0.0007394850254058838, 0.0008001327514648438, 0.0008607804775238037, 0.0009214282035827637, 0.0009820759296417236, 0.0010427236557006836, 0.0011033713817596436, 0.0011640191078186035, 0.0012246668338775635, 0.0012853145599365234, 0.0013459622859954834, 0.0014066100120544434, 0.0014672577381134033, 0.0015279054641723633, 0.0015885531902313232, 0.0016492009162902832, 0.0017098486423492432, 0.0017704963684082031, 0.001831144094467163, 0.001891791820526123, 0.001952439546585083, 0.002013087272644043, 0.002073734998703003, 0.002134382724761963, 0.002195030450820923, 0.002255678176879883, 0.0023163259029388428, 0.0023769736289978027, 0.0024376213550567627, 0.0024982690811157227, 0.0025589168071746826, 0.0026195645332336426, 0.0026802122592926025, 0.0027408599853515625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 7.0, 12.0, 21.0, 24.0, 36.0, 59.0, 94.0, 185.0, 305.0, 668.0, 2143.0, 10363.0, 150358.0, 823110.0, 52897.0, 5756.0, 1364.0, 546.0, 282.0, 146.0, 62.0, 34.0, 32.0, 20.0, 10.0, 10.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.328125, -15.8660888671875, -15.404052734375, -14.9420166015625, -14.47998046875, -14.0179443359375, -13.555908203125, -13.0938720703125, -12.6318359375, -12.1697998046875, -11.707763671875, -11.2457275390625, -10.78369140625, -10.3216552734375, -9.859619140625, -9.3975830078125, -8.935546875, -8.4735107421875, -8.011474609375, -7.5494384765625, -7.08740234375, -6.6253662109375, -6.163330078125, -5.7012939453125, -5.2392578125, -4.7772216796875, -4.315185546875, -3.8531494140625, -3.39111328125, -2.9290771484375, -2.467041015625, -2.0050048828125, -1.54296875, -1.0809326171875, -0.618896484375, -0.1568603515625, 0.30517578125, 0.7672119140625, 1.229248046875, 1.6912841796875, 2.1533203125, 2.6153564453125, 3.077392578125, 3.5394287109375, 4.00146484375, 4.4635009765625, 4.925537109375, 5.3875732421875, 5.849609375, 6.3116455078125, 6.773681640625, 7.2357177734375, 7.69775390625, 8.1597900390625, 8.621826171875, 9.0838623046875, 9.5458984375, 10.0079345703125, 10.469970703125, 10.9320068359375, 11.39404296875, 11.8560791015625, 12.318115234375, 12.7801513671875, 13.2421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 12.0, 12.0, 20.0, 28.0, 64.0, 93.0, 121.0, 142.0, 150.0, 101.0, 89.0, 53.0, 40.0, 22.0, 12.0, 4.0, 6.0, 9.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-15.8359375, -15.4912109375, -15.146484375, -14.8017578125, -14.45703125, -14.1123046875, -13.767578125, -13.4228515625, -13.078125, -12.7333984375, -12.388671875, -12.0439453125, -11.69921875, -11.3544921875, -11.009765625, -10.6650390625, -10.3203125, -9.9755859375, -9.630859375, -9.2861328125, -8.94140625, -8.5966796875, -8.251953125, -7.9072265625, -7.5625, -7.2177734375, -6.873046875, -6.5283203125, -6.18359375, -5.8388671875, -5.494140625, -5.1494140625, -4.8046875, -4.4599609375, -4.115234375, -3.7705078125, -3.42578125, -3.0810546875, -2.736328125, -2.3916015625, -2.046875, -1.7021484375, -1.357421875, -1.0126953125, -0.66796875, -0.3232421875, 0.021484375, 0.3662109375, 0.7109375, 1.0556640625, 1.400390625, 1.7451171875, 2.08984375, 2.4345703125, 2.779296875, 3.1240234375, 3.46875, 3.8134765625, 4.158203125, 4.5029296875, 4.84765625, 5.1923828125, 5.537109375, 5.8818359375, 6.2265625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 4.0, 9.0, 12.0, 27.0, 76.0, 104.0, 149.0, 171.0, 165.0, 133.0, 68.0, 40.0, 14.0, 18.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.68679809570312, -84.5965805053711, -79.50636291503906, -74.41615295410156, -69.32593536376953, -64.2357177734375, -59.145503997802734, -54.05529022216797, -48.96507263183594, -43.874855041503906, -38.78464126586914, -33.694427490234375, -28.604209899902344, -23.513994216918945, -18.423778533935547, -13.333564758300781, -8.24334716796875, -3.1531314849853516, 1.9370841979980469, 7.027299880981445, 12.117515563964844, 17.207731246948242, 22.29794692993164, 27.388160705566406, 32.47837829589844, 37.56859588623047, 42.658809661865234, 47.7490234375, 52.83924102783203, 57.92945861816406, 63.01967239379883, 68.1098861694336, 73.20008850097656, 78.2903060913086, 83.38052368164062, 88.47073364257812, 93.56095123291016, 98.65116882324219, 103.74137878417969, 108.83159637451172, 113.92181396484375, 119.01203155517578, 124.10224914550781, 129.1924591064453, 134.28268432617188, 139.37289428710938, 144.46310424804688, 149.55331420898438, 154.64353942871094, 159.73374938964844, 164.823974609375, 169.9141845703125, 175.00439453125, 180.09461975097656, 185.18482971191406, 190.27505493164062, 195.36526489257812, 200.45547485351562, 205.5457000732422, 210.6359100341797, 215.72613525390625, 220.81634521484375, 225.90655517578125, 230.99676513671875, 236.0869903564453]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 8.0, 9.0, 18.0, 23.0, 27.0, 22.0, 25.0, 32.0, 31.0, 54.0, 39.0, 50.0, 45.0, 46.0, 62.0, 48.0, 49.0, 47.0, 38.0, 49.0, 36.0, 31.0, 25.0, 29.0, 28.0, 15.0, 17.0, 15.0, 14.0, 6.0, 16.0, 8.0, 5.0, 3.0, 0.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.55218505859375, -72.94676971435547, -70.34136199951172, -67.73594665527344, -65.13053894042969, -62.525123596191406, -59.919708251953125, -57.31429672241211, -54.708885192871094, -52.10347366333008, -49.49806213378906, -46.89264678955078, -44.287235260009766, -41.68182373046875, -39.07640838623047, -36.47099685668945, -33.86558532714844, -31.260173797607422, -28.654760360717773, -26.049346923828125, -23.44393539428711, -20.838523864746094, -18.233110427856445, -15.627696990966797, -13.022285461425781, -10.41687297821045, -7.811460494995117, -5.206048011779785, -2.600635528564453, 0.004776954650878906, 2.610189437866211, 5.215602874755859, 7.821014404296875, 10.426426887512207, 13.031839370727539, 15.637251853942871, 18.242664337158203, 20.84807586669922, 23.453489303588867, 26.058902740478516, 28.66431427001953, 31.269725799560547, 33.87513732910156, 36.480552673339844, 39.08596420288086, 41.691375732421875, 44.296791076660156, 46.90220260620117, 49.50761413574219, 52.1130256652832, 54.71843719482422, 57.3238525390625, 59.929264068603516, 62.53467559814453, 65.14009094238281, 67.74549865722656, 70.35091400146484, 72.95632934570312, 75.56173706054688, 78.16715240478516, 80.77256774902344, 83.37797546386719, 85.98339080810547, 88.58880615234375, 91.1942138671875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 8.0, 13.0, 21.0, 41.0, 58.0, 78.0, 127.0, 253.0, 521.0, 1080.0, 2553.0, 6606.0, 24020.0, 4024467.0, 111675.0, 14509.0, 4673.0, 1831.0, 839.0, 406.0, 200.0, 112.0, 70.0, 32.0, 16.0, 19.0, 7.0, 12.0, 8.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-33.8125, -32.841552734375, -31.87060546875, -30.899658203125, -29.9287109375, -28.957763671875, -27.98681640625, -27.015869140625, -26.044921875, -25.073974609375, -24.10302734375, -23.132080078125, -22.1611328125, -21.190185546875, -20.21923828125, -19.248291015625, -18.27734375, -17.306396484375, -16.33544921875, -15.364501953125, -14.3935546875, -13.422607421875, -12.45166015625, -11.480712890625, -10.509765625, -9.538818359375, -8.56787109375, -7.596923828125, -6.6259765625, -5.655029296875, -4.68408203125, -3.713134765625, -2.7421875, -1.771240234375, -0.80029296875, 0.170654296875, 1.1416015625, 2.112548828125, 3.08349609375, 4.054443359375, 5.025390625, 5.996337890625, 6.96728515625, 7.938232421875, 8.9091796875, 9.880126953125, 10.85107421875, 11.822021484375, 12.79296875, 13.763916015625, 14.73486328125, 15.705810546875, 16.6767578125, 17.647705078125, 18.61865234375, 19.589599609375, 20.560546875, 21.531494140625, 22.50244140625, 23.473388671875, 24.4443359375, 25.415283203125, 26.38623046875, 27.357177734375, 28.328125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 14.0, 19.0, 16.0, 17.0, 27.0, 24.0, 38.0, 48.0, 44.0, 53.0, 53.0, 73.0, 76.0, 58.0, 50.0, 53.0, 71.0, 46.0, 33.0, 36.0, 37.0, 15.0, 24.0, 14.0, 9.0, 5.0, 13.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.998046875, -3.824127197265625, -3.65020751953125, -3.476287841796875, -3.3023681640625, -3.128448486328125, -2.95452880859375, -2.780609130859375, -2.606689453125, -2.432769775390625, -2.25885009765625, -2.084930419921875, -1.9110107421875, -1.737091064453125, -1.56317138671875, -1.389251708984375, -1.21533203125, -1.041412353515625, -0.86749267578125, -0.693572998046875, -0.5196533203125, -0.345733642578125, -0.17181396484375, 0.002105712890625, 0.176025390625, 0.349945068359375, 0.52386474609375, 0.697784423828125, 0.8717041015625, 1.045623779296875, 1.21954345703125, 1.393463134765625, 1.5673828125, 1.741302490234375, 1.91522216796875, 2.089141845703125, 2.2630615234375, 2.436981201171875, 2.61090087890625, 2.784820556640625, 2.958740234375, 3.132659912109375, 3.30657958984375, 3.480499267578125, 3.6544189453125, 3.828338623046875, 4.00225830078125, 4.176177978515625, 4.35009765625, 4.524017333984375, 4.69793701171875, 4.871856689453125, 5.0457763671875, 5.219696044921875, 5.39361572265625, 5.567535400390625, 5.741455078125, 5.915374755859375, 6.08929443359375, 6.263214111328125, 6.4371337890625, 6.611053466796875, 6.78497314453125, 6.958892822265625, 7.1328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 9.0, 16.0, 21.0, 32.0, 43.0, 98.0, 107.0, 204.0, 362.0, 608.0, 1099.0, 2037.0, 4160.0, 9508.0, 29304.0, 3782421.0, 321699.0, 25664.0, 8701.0, 3837.0, 1900.0, 1010.0, 579.0, 347.0, 191.0, 107.0, 74.0, 54.0, 40.0, 18.0, 12.0, 6.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.88525390625, -26.1767578125, -25.46826171875, -24.759765625, -24.05126953125, -23.3427734375, -22.63427734375, -21.92578125, -21.21728515625, -20.5087890625, -19.80029296875, -19.091796875, -18.38330078125, -17.6748046875, -16.96630859375, -16.2578125, -15.54931640625, -14.8408203125, -14.13232421875, -13.423828125, -12.71533203125, -12.0068359375, -11.29833984375, -10.58984375, -9.88134765625, -9.1728515625, -8.46435546875, -7.755859375, -7.04736328125, -6.3388671875, -5.63037109375, -4.921875, -4.21337890625, -3.5048828125, -2.79638671875, -2.087890625, -1.37939453125, -0.6708984375, 0.03759765625, 0.74609375, 1.45458984375, 2.1630859375, 2.87158203125, 3.580078125, 4.28857421875, 4.9970703125, 5.70556640625, 6.4140625, 7.12255859375, 7.8310546875, 8.53955078125, 9.248046875, 9.95654296875, 10.6650390625, 11.37353515625, 12.08203125, 12.79052734375, 13.4990234375, 14.20751953125, 14.916015625, 15.62451171875, 16.3330078125, 17.04150390625, 17.75]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 3.0, 12.0, 20.0, 17.0, 26.0, 79.0, 645.0, 3027.0, 82.0, 40.0, 21.0, 23.0, 14.0, 13.0, 4.0, 4.0, 7.0, 5.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.0562744140625, -3.921142578125, -3.7860107421875, -3.65087890625, -3.5157470703125, -3.380615234375, -3.2454833984375, -3.1103515625, -2.9752197265625, -2.840087890625, -2.7049560546875, -2.56982421875, -2.4346923828125, -2.299560546875, -2.1644287109375, -2.029296875, -1.8941650390625, -1.759033203125, -1.6239013671875, -1.48876953125, -1.3536376953125, -1.218505859375, -1.0833740234375, -0.9482421875, -0.8131103515625, -0.677978515625, -0.5428466796875, -0.40771484375, -0.2725830078125, -0.137451171875, -0.0023193359375, 0.1328125, 0.2679443359375, 0.403076171875, 0.5382080078125, 0.67333984375, 0.8084716796875, 0.943603515625, 1.0787353515625, 1.2138671875, 1.3489990234375, 1.484130859375, 1.6192626953125, 1.75439453125, 1.8895263671875, 2.024658203125, 2.1597900390625, 2.294921875, 2.4300537109375, 2.565185546875, 2.7003173828125, 2.83544921875, 2.9705810546875, 3.105712890625, 3.2408447265625, 3.3759765625, 3.5111083984375, 3.646240234375, 3.7813720703125, 3.91650390625, 4.0516357421875, 4.186767578125, 4.3218994140625, 4.45703125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 14.0, 15.0, 33.0, 37.0, 61.0, 52.0, 85.0, 92.0, 111.0, 124.0, 91.0, 74.0, 55.0, 40.0, 34.0, 31.0, 14.0, 7.0, 9.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.199918746948242, -17.660322189331055, -17.1207275390625, -16.581130981445312, -16.041534423828125, -15.50193977355957, -14.962343215942383, -14.422747611999512, -13.88315200805664, -13.34355640411377, -12.803960800170898, -12.264364242553711, -11.72476863861084, -11.185173034667969, -10.645576477050781, -10.10598087310791, -9.566385269165039, -9.026789665222168, -8.487194061279297, -7.947597503662109, -7.408001899719238, -6.868406295776367, -6.328810214996338, -5.789214134216309, -5.2496185302734375, -4.710022926330566, -4.170426845550537, -3.630831003189087, -3.0912351608276367, -2.5516393184661865, -2.0120434761047363, -1.4724476337432861, -0.9328498840332031, -0.39325404167175293, 0.14634180068969727, 0.6859376430511475, 1.2255334854125977, 1.7651293277740479, 2.304725170135498, 2.8443210124969482, 3.3839168548583984, 3.9235126972198486, 4.463108539581299, 5.002704620361328, 5.542300224304199, 6.08189582824707, 6.6214919090271, 7.161087989807129, 7.70068359375, 8.240279197692871, 8.779874801635742, 9.31947135925293, 9.8590669631958, 10.398662567138672, 10.93825912475586, 11.47785472869873, 12.017450332641602, 12.557045936584473, 13.096641540527344, 13.636238098144531, 14.175833702087402, 14.715429306030273, 15.255025863647461, 15.794621467590332, 16.334217071533203]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 9.0, 8.0, 9.0, 9.0, 7.0, 16.0, 21.0, 21.0, 24.0, 22.0, 24.0, 25.0, 30.0, 44.0, 34.0, 40.0, 40.0, 41.0, 32.0, 37.0, 45.0, 37.0, 29.0, 40.0, 32.0, 37.0, 28.0, 34.0, 32.0, 28.0, 25.0, 23.0, 12.0, 16.0, 13.0, 8.0, 5.0, 10.0, 6.0, 6.0, 10.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.987802505493164, -7.732031345367432, -7.476259708404541, -7.220488548278809, -6.964717388153076, -6.708946228027344, -6.453174591064453, -6.197403430938721, -5.941632270812988, -5.685861110687256, -5.430089473724365, -5.174318313598633, -4.9185471534729, -4.662775993347168, -4.407004356384277, -4.151233196258545, -3.8954615592956543, -3.6396901607513428, -3.3839190006256104, -3.128147602081299, -2.8723764419555664, -2.616605043411255, -2.3608336448669434, -2.105062484741211, -1.8492910861968994, -1.5935198068618774, -1.3377485275268555, -1.081977128982544, -0.826205849647522, -0.5704345703125, -0.3146631717681885, -0.058891892433166504, 0.19687938690185547, 0.45265069603919983, 0.7084220051765442, 0.9641933441162109, 1.219964623451233, 1.4757359027862549, 1.7315073013305664, 1.9872785806655884, 2.2430498600006104, 2.498821258544922, 2.7545924186706543, 3.010363817214966, 3.2661352157592773, 3.5219063758850098, 3.7776777744293213, 4.033449172973633, 4.289220333099365, 4.544991493225098, 4.800763130187988, 5.056534290313721, 5.312305450439453, 5.568077087402344, 5.823848247528076, 6.079619407653809, 6.335391044616699, 6.591162204742432, 6.846933841705322, 7.102705001831055, 7.358476161956787, 7.6142473220825195, 7.87001895904541, 8.1257905960083, 8.381561279296875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 21.0, 35.0, 55.0, 95.0, 139.0, 260.0, 477.0, 1126.0, 2731.0, 7795.0, 25658.0, 93392.0, 314884.0, 404607.0, 140615.0, 38772.0, 11315.0, 3691.0, 1432.0, 643.0, 367.0, 154.0, 102.0, 59.0, 49.0, 18.0, 15.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.8792724609375, -10.492919921875, -10.1065673828125, -9.72021484375, -9.3338623046875, -8.947509765625, -8.5611572265625, -8.1748046875, -7.7884521484375, -7.402099609375, -7.0157470703125, -6.62939453125, -6.2430419921875, -5.856689453125, -5.4703369140625, -5.083984375, -4.6976318359375, -4.311279296875, -3.9249267578125, -3.53857421875, -3.1522216796875, -2.765869140625, -2.3795166015625, -1.9931640625, -1.6068115234375, -1.220458984375, -0.8341064453125, -0.44775390625, -0.0614013671875, 0.324951171875, 0.7113037109375, 1.09765625, 1.4840087890625, 1.870361328125, 2.2567138671875, 2.64306640625, 3.0294189453125, 3.415771484375, 3.8021240234375, 4.1884765625, 4.5748291015625, 4.961181640625, 5.3475341796875, 5.73388671875, 6.1202392578125, 6.506591796875, 6.8929443359375, 7.279296875, 7.6656494140625, 8.052001953125, 8.4383544921875, 8.82470703125, 9.2110595703125, 9.597412109375, 9.9837646484375, 10.3701171875, 10.7564697265625, 11.142822265625, 11.5291748046875, 11.91552734375, 12.3018798828125, 12.688232421875, 13.0745849609375, 13.4609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 16.0, 19.0, 14.0, 21.0, 27.0, 30.0, 41.0, 39.0, 44.0, 51.0, 57.0, 67.0, 62.0, 62.0, 57.0, 58.0, 42.0, 60.0, 40.0, 24.0, 29.0, 21.0, 30.0, 15.0, 11.0, 8.0, 6.0, 7.0, 8.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0347900390625, -3.858642578125, -3.6824951171875, -3.50634765625, -3.3302001953125, -3.154052734375, -2.9779052734375, -2.8017578125, -2.6256103515625, -2.449462890625, -2.2733154296875, -2.09716796875, -1.9210205078125, -1.744873046875, -1.5687255859375, -1.392578125, -1.2164306640625, -1.040283203125, -0.8641357421875, -0.68798828125, -0.5118408203125, -0.335693359375, -0.1595458984375, 0.0166015625, 0.1927490234375, 0.368896484375, 0.5450439453125, 0.72119140625, 0.8973388671875, 1.073486328125, 1.2496337890625, 1.42578125, 1.6019287109375, 1.778076171875, 1.9542236328125, 2.13037109375, 2.3065185546875, 2.482666015625, 2.6588134765625, 2.8349609375, 3.0111083984375, 3.187255859375, 3.3634033203125, 3.53955078125, 3.7156982421875, 3.891845703125, 4.0679931640625, 4.244140625, 4.4202880859375, 4.596435546875, 4.7725830078125, 4.94873046875, 5.1248779296875, 5.301025390625, 5.4771728515625, 5.6533203125, 5.8294677734375, 6.005615234375, 6.1817626953125, 6.35791015625, 6.5340576171875, 6.710205078125, 6.8863525390625, 7.0625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 9.0, 6.0, 8.0, 20.0, 16.0, 24.0, 29.0, 56.0, 63.0, 108.0, 162.0, 209.0, 295.0, 423.0, 733.0, 1113.0, 2581.0, 10957.0, 101474.0, 746283.0, 161853.0, 15421.0, 3157.0, 1297.0, 675.0, 482.0, 339.0, 206.0, 163.0, 124.0, 76.0, 60.0, 33.0, 34.0, 19.0, 18.0, 9.0, 8.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.296875, -17.69873046875, -17.1005859375, -16.50244140625, -15.904296875, -15.30615234375, -14.7080078125, -14.10986328125, -13.51171875, -12.91357421875, -12.3154296875, -11.71728515625, -11.119140625, -10.52099609375, -9.9228515625, -9.32470703125, -8.7265625, -8.12841796875, -7.5302734375, -6.93212890625, -6.333984375, -5.73583984375, -5.1376953125, -4.53955078125, -3.94140625, -3.34326171875, -2.7451171875, -2.14697265625, -1.548828125, -0.95068359375, -0.3525390625, 0.24560546875, 0.84375, 1.44189453125, 2.0400390625, 2.63818359375, 3.236328125, 3.83447265625, 4.4326171875, 5.03076171875, 5.62890625, 6.22705078125, 6.8251953125, 7.42333984375, 8.021484375, 8.61962890625, 9.2177734375, 9.81591796875, 10.4140625, 11.01220703125, 11.6103515625, 12.20849609375, 12.806640625, 13.40478515625, 14.0029296875, 14.60107421875, 15.19921875, 15.79736328125, 16.3955078125, 16.99365234375, 17.591796875, 18.18994140625, 18.7880859375, 19.38623046875, 19.984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 7.0, 5.0, 10.0, 14.0, 16.0, 26.0, 23.0, 18.0, 29.0, 37.0, 43.0, 53.0, 40.0, 43.0, 54.0, 59.0, 50.0, 48.0, 55.0, 43.0, 46.0, 42.0, 30.0, 25.0, 29.0, 28.0, 25.0, 11.0, 17.0, 21.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.59375, -21.927490234375, -21.26123046875, -20.594970703125, -19.9287109375, -19.262451171875, -18.59619140625, -17.929931640625, -17.263671875, -16.597412109375, -15.93115234375, -15.264892578125, -14.5986328125, -13.932373046875, -13.26611328125, -12.599853515625, -11.93359375, -11.267333984375, -10.60107421875, -9.934814453125, -9.2685546875, -8.602294921875, -7.93603515625, -7.269775390625, -6.603515625, -5.937255859375, -5.27099609375, -4.604736328125, -3.9384765625, -3.272216796875, -2.60595703125, -1.939697265625, -1.2734375, -0.607177734375, 0.05908203125, 0.725341796875, 1.3916015625, 2.057861328125, 2.72412109375, 3.390380859375, 4.056640625, 4.722900390625, 5.38916015625, 6.055419921875, 6.7216796875, 7.387939453125, 8.05419921875, 8.720458984375, 9.38671875, 10.052978515625, 10.71923828125, 11.385498046875, 12.0517578125, 12.718017578125, 13.38427734375, 14.050537109375, 14.716796875, 15.383056640625, 16.04931640625, 16.715576171875, 17.3818359375, 18.048095703125, 18.71435546875, 19.380615234375, 20.046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 12.0, 7.0, 14.0, 15.0, 24.0, 46.0, 59.0, 106.0, 160.0, 247.0, 516.0, 1272.0, 4753.0, 34527.0, 590646.0, 385539.0, 24693.0, 3766.0, 1076.0, 434.0, 232.0, 125.0, 95.0, 61.0, 41.0, 19.0, 17.0, 13.0, 10.0, 3.0, 10.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.1015625, -9.7640380859375, -9.426513671875, -9.0889892578125, -8.75146484375, -8.4139404296875, -8.076416015625, -7.7388916015625, -7.4013671875, -7.0638427734375, -6.726318359375, -6.3887939453125, -6.05126953125, -5.7137451171875, -5.376220703125, -5.0386962890625, -4.701171875, -4.3636474609375, -4.026123046875, -3.6885986328125, -3.35107421875, -3.0135498046875, -2.676025390625, -2.3385009765625, -2.0009765625, -1.6634521484375, -1.325927734375, -0.9884033203125, -0.65087890625, -0.3133544921875, 0.024169921875, 0.3616943359375, 0.69921875, 1.0367431640625, 1.374267578125, 1.7117919921875, 2.04931640625, 2.3868408203125, 2.724365234375, 3.0618896484375, 3.3994140625, 3.7369384765625, 4.074462890625, 4.4119873046875, 4.74951171875, 5.0870361328125, 5.424560546875, 5.7620849609375, 6.099609375, 6.4371337890625, 6.774658203125, 7.1121826171875, 7.44970703125, 7.7872314453125, 8.124755859375, 8.4622802734375, 8.7998046875, 9.1373291015625, 9.474853515625, 9.8123779296875, 10.14990234375, 10.4874267578125, 10.824951171875, 11.1624755859375, 11.5]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 11.0, 14.0, 13.0, 15.0, 29.0, 41.0, 57.0, 56.0, 100.0, 131.0, 117.0, 91.0, 74.0, 60.0, 41.0, 35.0, 23.0, 17.0, 16.0, 12.0, 7.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010776519775390625, -0.0010431110858917236, -0.0010085701942443848, -0.0009740293025970459, -0.000939488410949707, -0.0009049475193023682, -0.0008704066276550293, -0.0008358657360076904, -0.0008013248443603516, -0.0007667839527130127, -0.0007322430610656738, -0.000697702169418335, -0.0006631612777709961, -0.0006286203861236572, -0.0005940794944763184, -0.0005595386028289795, -0.0005249977111816406, -0.0004904568195343018, -0.0004559159278869629, -0.000421375036239624, -0.00038683414459228516, -0.0003522932529449463, -0.0003177523612976074, -0.00028321146965026855, -0.0002486705780029297, -0.00021412968635559082, -0.00017958879470825195, -0.00014504790306091309, -0.00011050701141357422, -7.596611976623535e-05, -4.1425228118896484e-05, -6.884336471557617e-06, 2.765655517578125e-05, 6.219744682312012e-05, 9.673833847045898e-05, 0.00013127923011779785, 0.00016582012176513672, 0.00020036101341247559, 0.00023490190505981445, 0.0002694427967071533, 0.0003039836883544922, 0.00033852458000183105, 0.0003730654716491699, 0.0004076063632965088, 0.00044214725494384766, 0.0004766881465911865, 0.0005112290382385254, 0.0005457699298858643, 0.0005803108215332031, 0.000614851713180542, 0.0006493926048278809, 0.0006839334964752197, 0.0007184743881225586, 0.0007530152797698975, 0.0007875561714172363, 0.0008220970630645752, 0.0008566379547119141, 0.0008911788463592529, 0.0009257197380065918, 0.0009602606296539307, 0.0009948015213012695, 0.0010293424129486084, 0.0010638833045959473, 0.0010984241962432861, 0.001132965087890625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 9.0, 13.0, 15.0, 36.0, 55.0, 101.0, 155.0, 338.0, 718.0, 2007.0, 8034.0, 89338.0, 827586.0, 107431.0, 9055.0, 2100.0, 765.0, 345.0, 176.0, 102.0, 61.0, 42.0, 29.0, 11.0, 8.0, 8.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.375, -7.967041015625, -7.55908203125, -7.151123046875, -6.7431640625, -6.335205078125, -5.92724609375, -5.519287109375, -5.111328125, -4.703369140625, -4.29541015625, -3.887451171875, -3.4794921875, -3.071533203125, -2.66357421875, -2.255615234375, -1.84765625, -1.439697265625, -1.03173828125, -0.623779296875, -0.2158203125, 0.192138671875, 0.60009765625, 1.008056640625, 1.416015625, 1.823974609375, 2.23193359375, 2.639892578125, 3.0478515625, 3.455810546875, 3.86376953125, 4.271728515625, 4.6796875, 5.087646484375, 5.49560546875, 5.903564453125, 6.3115234375, 6.719482421875, 7.12744140625, 7.535400390625, 7.943359375, 8.351318359375, 8.75927734375, 9.167236328125, 9.5751953125, 9.983154296875, 10.39111328125, 10.799072265625, 11.20703125, 11.614990234375, 12.02294921875, 12.430908203125, 12.8388671875, 13.246826171875, 13.65478515625, 14.062744140625, 14.470703125, 14.878662109375, 15.28662109375, 15.694580078125, 16.1025390625, 16.510498046875, 16.91845703125, 17.326416015625, 17.734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 9.0, 13.0, 21.0, 15.0, 29.0, 33.0, 48.0, 60.0, 70.0, 98.0, 95.0, 84.0, 92.0, 69.0, 54.0, 38.0, 42.0, 32.0, 23.0, 19.0, 10.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.23858642578125, -4.9888916015625, -4.73919677734375, -4.489501953125, -4.23980712890625, -3.9901123046875, -3.74041748046875, -3.49072265625, -3.24102783203125, -2.9913330078125, -2.74163818359375, -2.491943359375, -2.24224853515625, -1.9925537109375, -1.74285888671875, -1.4931640625, -1.24346923828125, -0.9937744140625, -0.74407958984375, -0.494384765625, -0.24468994140625, 0.0050048828125, 0.25469970703125, 0.50439453125, 0.75408935546875, 1.0037841796875, 1.25347900390625, 1.503173828125, 1.75286865234375, 2.0025634765625, 2.25225830078125, 2.501953125, 2.75164794921875, 3.0013427734375, 3.25103759765625, 3.500732421875, 3.75042724609375, 4.0001220703125, 4.24981689453125, 4.49951171875, 4.74920654296875, 4.9989013671875, 5.24859619140625, 5.498291015625, 5.74798583984375, 5.9976806640625, 6.24737548828125, 6.4970703125, 6.74676513671875, 6.9964599609375, 7.24615478515625, 7.495849609375, 7.74554443359375, 7.9952392578125, 8.24493408203125, 8.49462890625, 8.74432373046875, 8.9940185546875, 9.24371337890625, 9.493408203125, 9.74310302734375, 9.9927978515625, 10.24249267578125, 10.4921875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 58.0, 378.0, 467.0, 81.0, 20.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-569.9039916992188, -554.0897216796875, -538.2754516601562, -522.461181640625, -506.6469421386719, -490.83270263671875, -475.0184326171875, -459.20416259765625, -443.389892578125, -427.57562255859375, -411.7613830566406, -395.9471130371094, -380.1328430175781, -364.318603515625, -348.50433349609375, -332.6900634765625, -316.87579345703125, -301.0615234375, -285.2472839355469, -269.4330139160156, -253.61874389648438, -237.8044891357422, -221.990234375, -206.17596435546875, -190.36172485351562, -174.54747009277344, -158.7332000732422, -142.9189453125, -127.10467529296875, -111.29042053222656, -95.47615814208984, -79.66189575195312, -63.847625732421875, -48.033363342285156, -32.21910095214844, -16.404842376708984, -0.5905799865722656, 15.223678588867188, 31.037940979003906, 46.852203369140625, 62.666465759277344, 78.48072814941406, 94.29499053955078, 110.1092529296875, 125.92350769042969, 141.73776245117188, 157.55203247070312, 173.36630249023438, 189.18055725097656, 204.99481201171875, 220.80908203125, 236.6233367919922, 252.43760681152344, 268.2518615722656, 284.0661315917969, 299.88037109375, 315.69464111328125, 331.5089111328125, 347.3231506347656, 363.1374206542969, 378.9516906738281, 394.76593017578125, 410.5802001953125, 426.39447021484375, 442.208740234375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 6.0, 5.0, 5.0, 10.0, 20.0, 21.0, 20.0, 22.0, 22.0, 23.0, 33.0, 29.0, 27.0, 41.0, 44.0, 55.0, 40.0, 50.0, 49.0, 34.0, 48.0, 34.0, 48.0, 41.0, 39.0, 30.0, 33.0, 27.0, 15.0, 22.0, 20.0, 20.0, 15.0, 10.0, 10.0, 9.0, 5.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-81.88735961914062, -79.22712707519531, -76.56689453125, -73.90666198730469, -71.2464370727539, -68.5862045288086, -65.92597198486328, -63.26573944091797, -60.605506896972656, -57.945274353027344, -55.2850456237793, -52.624813079833984, -49.96458053588867, -47.304351806640625, -44.64411926269531, -41.98388671875, -39.32365798950195, -36.66342544555664, -34.003196716308594, -31.34296417236328, -28.68273162841797, -26.02250099182129, -23.36227035522461, -20.702037811279297, -18.041807174682617, -15.381575584411621, -12.721343994140625, -10.061113357543945, -7.400881767272949, -4.740650177001953, -2.0804195404052734, 0.5798130035400391, 3.2400436401367188, 5.900275230407715, 8.560506820678711, 11.22073745727539, 13.880969047546387, 16.541200637817383, 19.201431274414062, 21.861663818359375, 24.521894454956055, 27.182125091552734, 29.842357635498047, 32.502586364746094, 35.162818908691406, 37.82305145263672, 40.48328399658203, 43.143516540527344, 45.80374526977539, 48.4639778137207, 51.12420654296875, 53.78443908691406, 56.444671630859375, 59.10490417480469, 61.765132904052734, 64.42536926269531, 67.0855941772461, 69.7458267211914, 72.40605926513672, 75.0662841796875, 77.72651672363281, 80.38674926757812, 83.04698181152344, 85.70721435546875, 88.36744689941406]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 1.0, 5.0, 12.0, 10.0, 24.0, 49.0, 91.0, 141.0, 287.0, 628.0, 1324.0, 4011.0, 14591.0, 135207.0, 3992015.0, 34687.0, 7312.0, 2214.0, 836.0, 396.0, 192.0, 116.0, 42.0, 36.0, 15.0, 16.0, 8.0, 8.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.75, -21.88330078125, -21.0166015625, -20.14990234375, -19.283203125, -18.41650390625, -17.5498046875, -16.68310546875, -15.81640625, -14.94970703125, -14.0830078125, -13.21630859375, -12.349609375, -11.48291015625, -10.6162109375, -9.74951171875, -8.8828125, -8.01611328125, -7.1494140625, -6.28271484375, -5.416015625, -4.54931640625, -3.6826171875, -2.81591796875, -1.94921875, -1.08251953125, -0.2158203125, 0.65087890625, 1.517578125, 2.38427734375, 3.2509765625, 4.11767578125, 4.984375, 5.85107421875, 6.7177734375, 7.58447265625, 8.451171875, 9.31787109375, 10.1845703125, 11.05126953125, 11.91796875, 12.78466796875, 13.6513671875, 14.51806640625, 15.384765625, 16.25146484375, 17.1181640625, 17.98486328125, 18.8515625, 19.71826171875, 20.5849609375, 21.45166015625, 22.318359375, 23.18505859375, 24.0517578125, 24.91845703125, 25.78515625, 26.65185546875, 27.5185546875, 28.38525390625, 29.251953125, 30.11865234375, 30.9853515625, 31.85205078125, 32.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 8.0, 9.0, 14.0, 16.0, 18.0, 22.0, 25.0, 40.0, 48.0, 47.0, 65.0, 56.0, 64.0, 73.0, 63.0, 74.0, 55.0, 51.0, 37.0, 44.0, 35.0, 26.0, 26.0, 13.0, 14.0, 5.0, 15.0, 5.0, 13.0, 2.0, 5.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.3380126953125, -4.156494140625, -3.9749755859375, -3.79345703125, -3.6119384765625, -3.430419921875, -3.2489013671875, -3.0673828125, -2.8858642578125, -2.704345703125, -2.5228271484375, -2.34130859375, -2.1597900390625, -1.978271484375, -1.7967529296875, -1.615234375, -1.4337158203125, -1.252197265625, -1.0706787109375, -0.88916015625, -0.7076416015625, -0.526123046875, -0.3446044921875, -0.1630859375, 0.0184326171875, 0.199951171875, 0.3814697265625, 0.56298828125, 0.7445068359375, 0.926025390625, 1.1075439453125, 1.2890625, 1.4705810546875, 1.652099609375, 1.8336181640625, 2.01513671875, 2.1966552734375, 2.378173828125, 2.5596923828125, 2.7412109375, 2.9227294921875, 3.104248046875, 3.2857666015625, 3.46728515625, 3.6488037109375, 3.830322265625, 4.0118408203125, 4.193359375, 4.3748779296875, 4.556396484375, 4.7379150390625, 4.91943359375, 5.1009521484375, 5.282470703125, 5.4639892578125, 5.6455078125, 5.8270263671875, 6.008544921875, 6.1900634765625, 6.37158203125, 6.5531005859375, 6.734619140625, 6.9161376953125, 7.09765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 16.0, 21.0, 22.0, 41.0, 51.0, 83.0, 135.0, 228.0, 445.0, 873.0, 1727.0, 4537.0, 13553.0, 78514.0, 3971090.0, 98426.0, 15538.0, 4905.0, 2017.0, 924.0, 487.0, 239.0, 134.0, 88.0, 46.0, 31.0, 30.0, 15.0, 25.0, 12.0, 3.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0], "bins": [-27.765625, -27.0972900390625, -26.428955078125, -25.7606201171875, -25.09228515625, -24.4239501953125, -23.755615234375, -23.0872802734375, -22.4189453125, -21.7506103515625, -21.082275390625, -20.4139404296875, -19.74560546875, -19.0772705078125, -18.408935546875, -17.7406005859375, -17.072265625, -16.4039306640625, -15.735595703125, -15.0672607421875, -14.39892578125, -13.7305908203125, -13.062255859375, -12.3939208984375, -11.7255859375, -11.0572509765625, -10.388916015625, -9.7205810546875, -9.05224609375, -8.3839111328125, -7.715576171875, -7.0472412109375, -6.37890625, -5.7105712890625, -5.042236328125, -4.3739013671875, -3.70556640625, -3.0372314453125, -2.368896484375, -1.7005615234375, -1.0322265625, -0.3638916015625, 0.304443359375, 0.9727783203125, 1.64111328125, 2.3094482421875, 2.977783203125, 3.6461181640625, 4.314453125, 4.9827880859375, 5.651123046875, 6.3194580078125, 6.98779296875, 7.6561279296875, 8.324462890625, 8.9927978515625, 9.6611328125, 10.3294677734375, 10.997802734375, 11.6661376953125, 12.33447265625, 13.0028076171875, 13.671142578125, 14.3394775390625, 15.0078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 4.0, 14.0, 14.0, 22.0, 25.0, 56.0, 117.0, 328.0, 3038.0, 233.0, 88.0, 44.0, 22.0, 15.0, 12.0, 14.0, 2.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9140625, -7.68414306640625, -7.4542236328125, -7.22430419921875, -6.994384765625, -6.76446533203125, -6.5345458984375, -6.30462646484375, -6.07470703125, -5.84478759765625, -5.6148681640625, -5.38494873046875, -5.155029296875, -4.92510986328125, -4.6951904296875, -4.46527099609375, -4.2353515625, -4.00543212890625, -3.7755126953125, -3.54559326171875, -3.315673828125, -3.08575439453125, -2.8558349609375, -2.62591552734375, -2.39599609375, -2.16607666015625, -1.9361572265625, -1.70623779296875, -1.476318359375, -1.24639892578125, -1.0164794921875, -0.78656005859375, -0.556640625, -0.32672119140625, -0.0968017578125, 0.13311767578125, 0.363037109375, 0.59295654296875, 0.8228759765625, 1.05279541015625, 1.28271484375, 1.51263427734375, 1.7425537109375, 1.97247314453125, 2.202392578125, 2.43231201171875, 2.6622314453125, 2.89215087890625, 3.1220703125, 3.35198974609375, 3.5819091796875, 3.81182861328125, 4.041748046875, 4.27166748046875, 4.5015869140625, 4.73150634765625, 4.96142578125, 5.19134521484375, 5.4212646484375, 5.65118408203125, 5.881103515625, 6.11102294921875, 6.3409423828125, 6.57086181640625, 6.80078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 15.0, 17.0, 31.0, 61.0, 108.0, 148.0, 141.0, 164.0, 127.0, 74.0, 55.0, 28.0, 17.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-61.56011962890625, -60.20906448364258, -58.85800552368164, -57.50695037841797, -56.1558952331543, -54.80483627319336, -53.45378112792969, -52.10272216796875, -50.75166702270508, -49.400611877441406, -48.04955291748047, -46.6984977722168, -45.347442626953125, -43.99638366699219, -42.645328521728516, -41.294273376464844, -39.943214416503906, -38.592159271240234, -37.2411003112793, -35.890045166015625, -34.53899002075195, -33.187931060791016, -31.836875915527344, -30.48581886291504, -29.134765625, -27.783708572387695, -26.432653427124023, -25.08159637451172, -23.730539321899414, -22.37948226928711, -21.028427124023438, -19.677370071411133, -18.326311111450195, -16.97525405883789, -15.624197959899902, -14.273141860961914, -12.92208480834961, -11.571028709411621, -10.219972610473633, -8.868915557861328, -7.51785945892334, -6.166802883148193, -4.815746307373047, -3.4646902084350586, -2.113633632659912, -0.7625770568847656, 0.5884790420532227, 1.9395360946655273, 3.2905921936035156, 4.641648769378662, 5.992705345153809, 7.343761444091797, 8.694818496704102, 10.04587459564209, 11.396930694580078, 12.747987747192383, 14.099043846130371, 15.45009994506836, 16.801156997680664, 18.15221405029297, 19.50326919555664, 20.854326248168945, 22.20538330078125, 23.556438446044922, 24.907495498657227]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 14.0, 16.0, 20.0, 22.0, 24.0, 21.0, 26.0, 29.0, 43.0, 36.0, 34.0, 45.0, 39.0, 57.0, 43.0, 44.0, 41.0, 56.0, 39.0, 41.0, 49.0, 32.0, 37.0, 31.0, 27.0, 19.0, 20.0, 21.0, 16.0, 6.0, 11.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.312578201293945, -15.806832313537598, -15.301087379455566, -14.795341491699219, -14.289596557617188, -13.78385066986084, -13.278104782104492, -12.772359848022461, -12.266613960266113, -11.760868072509766, -11.255123138427734, -10.749377250671387, -10.243631362915039, -9.737886428833008, -9.23214054107666, -8.726394653320312, -8.220649719238281, -7.714904308319092, -7.209158897399902, -6.703413009643555, -6.197667598724365, -5.691922187805176, -5.186176300048828, -4.680430889129639, -4.174685478210449, -3.6689400672912598, -3.163194417953491, -2.6574487686157227, -2.151703357696533, -1.6459579467773438, -1.1402122974395752, -0.6344666481018066, -0.12871932983398438, 0.37702620029449463, 0.8827717304229736, 1.3885172605514526, 1.8942627906799316, 2.400008201599121, 2.9057538509368896, 3.411499500274658, 3.9172449111938477, 4.422990322113037, 4.928735733032227, 5.434481620788574, 5.940227031707764, 6.445972442626953, 6.951718330383301, 7.45746374130249, 7.96320915222168, 8.468955039978027, 8.974699974060059, 9.480445861816406, 9.986190795898438, 10.491936683654785, 10.997682571411133, 11.503427505493164, 12.009173393249512, 12.51491928100586, 13.02066421508789, 13.526410102844238, 14.032155990600586, 14.537900924682617, 15.043646812438965, 15.549392700195312, 16.055137634277344]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 16.0, 24.0, 47.0, 78.0, 142.0, 249.0, 489.0, 1050.0, 2452.0, 7092.0, 23054.0, 88408.0, 341679.0, 425838.0, 114107.0, 29894.0, 8500.0, 3019.0, 1151.0, 575.0, 290.0, 140.0, 89.0, 58.0, 36.0, 16.0, 9.0, 5.0, 7.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-24.921875, -24.30029296875, -23.6787109375, -23.05712890625, -22.435546875, -21.81396484375, -21.1923828125, -20.57080078125, -19.94921875, -19.32763671875, -18.7060546875, -18.08447265625, -17.462890625, -16.84130859375, -16.2197265625, -15.59814453125, -14.9765625, -14.35498046875, -13.7333984375, -13.11181640625, -12.490234375, -11.86865234375, -11.2470703125, -10.62548828125, -10.00390625, -9.38232421875, -8.7607421875, -8.13916015625, -7.517578125, -6.89599609375, -6.2744140625, -5.65283203125, -5.03125, -4.40966796875, -3.7880859375, -3.16650390625, -2.544921875, -1.92333984375, -1.3017578125, -0.68017578125, -0.05859375, 0.56298828125, 1.1845703125, 1.80615234375, 2.427734375, 3.04931640625, 3.6708984375, 4.29248046875, 4.9140625, 5.53564453125, 6.1572265625, 6.77880859375, 7.400390625, 8.02197265625, 8.6435546875, 9.26513671875, 9.88671875, 10.50830078125, 11.1298828125, 11.75146484375, 12.373046875, 12.99462890625, 13.6162109375, 14.23779296875, 14.859375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 6.0, 10.0, 6.0, 11.0, 15.0, 15.0, 18.0, 27.0, 26.0, 42.0, 41.0, 39.0, 65.0, 73.0, 52.0, 79.0, 71.0, 55.0, 65.0, 48.0, 42.0, 28.0, 37.0, 24.0, 26.0, 14.0, 13.0, 14.0, 14.0, 10.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.92645263671875, -4.7357177734375, -4.54498291015625, -4.354248046875, -4.16351318359375, -3.9727783203125, -3.78204345703125, -3.59130859375, -3.40057373046875, -3.2098388671875, -3.01910400390625, -2.828369140625, -2.63763427734375, -2.4468994140625, -2.25616455078125, -2.0654296875, -1.87469482421875, -1.6839599609375, -1.49322509765625, -1.302490234375, -1.11175537109375, -0.9210205078125, -0.73028564453125, -0.53955078125, -0.34881591796875, -0.1580810546875, 0.03265380859375, 0.223388671875, 0.41412353515625, 0.6048583984375, 0.79559326171875, 0.986328125, 1.17706298828125, 1.3677978515625, 1.55853271484375, 1.749267578125, 1.94000244140625, 2.1307373046875, 2.32147216796875, 2.51220703125, 2.70294189453125, 2.8936767578125, 3.08441162109375, 3.275146484375, 3.46588134765625, 3.6566162109375, 3.84735107421875, 4.0380859375, 4.22882080078125, 4.4195556640625, 4.61029052734375, 4.801025390625, 4.99176025390625, 5.1824951171875, 5.37322998046875, 5.56396484375, 5.75469970703125, 5.9454345703125, 6.13616943359375, 6.326904296875, 6.51763916015625, 6.7083740234375, 6.89910888671875, 7.08984375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 6.0, 5.0, 9.0, 9.0, 21.0, 40.0, 61.0, 106.0, 179.0, 309.0, 584.0, 1327.0, 4097.0, 39276.0, 790051.0, 197810.0, 10656.0, 2162.0, 825.0, 428.0, 248.0, 116.0, 89.0, 55.0, 32.0, 21.0, 11.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.5, -36.388671875, -35.27734375, -34.166015625, -33.0546875, -31.943359375, -30.83203125, -29.720703125, -28.609375, -27.498046875, -26.38671875, -25.275390625, -24.1640625, -23.052734375, -21.94140625, -20.830078125, -19.71875, -18.607421875, -17.49609375, -16.384765625, -15.2734375, -14.162109375, -13.05078125, -11.939453125, -10.828125, -9.716796875, -8.60546875, -7.494140625, -6.3828125, -5.271484375, -4.16015625, -3.048828125, -1.9375, -0.826171875, 0.28515625, 1.396484375, 2.5078125, 3.619140625, 4.73046875, 5.841796875, 6.953125, 8.064453125, 9.17578125, 10.287109375, 11.3984375, 12.509765625, 13.62109375, 14.732421875, 15.84375, 16.955078125, 18.06640625, 19.177734375, 20.2890625, 21.400390625, 22.51171875, 23.623046875, 24.734375, 25.845703125, 26.95703125, 28.068359375, 29.1796875, 30.291015625, 31.40234375, 32.513671875, 33.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 10.0, 8.0, 11.0, 10.0, 15.0, 12.0, 22.0, 23.0, 29.0, 25.0, 28.0, 35.0, 32.0, 44.0, 37.0, 42.0, 38.0, 40.0, 45.0, 38.0, 39.0, 42.0, 24.0, 33.0, 37.0, 36.0, 29.0, 25.0, 28.0, 22.0, 18.0, 23.0, 14.0, 12.0, 12.0, 10.0, 6.0, 5.0, 3.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.9296875, -14.4205322265625, -13.911376953125, -13.4022216796875, -12.89306640625, -12.3839111328125, -11.874755859375, -11.3656005859375, -10.8564453125, -10.3472900390625, -9.838134765625, -9.3289794921875, -8.81982421875, -8.3106689453125, -7.801513671875, -7.2923583984375, -6.783203125, -6.2740478515625, -5.764892578125, -5.2557373046875, -4.74658203125, -4.2374267578125, -3.728271484375, -3.2191162109375, -2.7099609375, -2.2008056640625, -1.691650390625, -1.1824951171875, -0.67333984375, -0.1641845703125, 0.344970703125, 0.8541259765625, 1.36328125, 1.8724365234375, 2.381591796875, 2.8907470703125, 3.39990234375, 3.9090576171875, 4.418212890625, 4.9273681640625, 5.4365234375, 5.9456787109375, 6.454833984375, 6.9639892578125, 7.47314453125, 7.9822998046875, 8.491455078125, 9.0006103515625, 9.509765625, 10.0189208984375, 10.528076171875, 11.0372314453125, 11.54638671875, 12.0555419921875, 12.564697265625, 13.0738525390625, 13.5830078125, 14.0921630859375, 14.601318359375, 15.1104736328125, 15.61962890625, 16.1287841796875, 16.637939453125, 17.1470947265625, 17.65625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 10.0, 14.0, 25.0, 31.0, 48.0, 62.0, 101.0, 197.0, 366.0, 687.0, 1518.0, 3737.0, 11686.0, 55358.0, 404600.0, 486311.0, 63347.0, 13206.0, 4095.0, 1555.0, 714.0, 387.0, 186.0, 121.0, 64.0, 45.0, 22.0, 10.0, 15.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6953125, -7.45513916015625, -7.2149658203125, -6.97479248046875, -6.734619140625, -6.49444580078125, -6.2542724609375, -6.01409912109375, -5.77392578125, -5.53375244140625, -5.2935791015625, -5.05340576171875, -4.813232421875, -4.57305908203125, -4.3328857421875, -4.09271240234375, -3.8525390625, -3.61236572265625, -3.3721923828125, -3.13201904296875, -2.891845703125, -2.65167236328125, -2.4114990234375, -2.17132568359375, -1.93115234375, -1.69097900390625, -1.4508056640625, -1.21063232421875, -0.970458984375, -0.73028564453125, -0.4901123046875, -0.24993896484375, -0.009765625, 0.23040771484375, 0.4705810546875, 0.71075439453125, 0.950927734375, 1.19110107421875, 1.4312744140625, 1.67144775390625, 1.91162109375, 2.15179443359375, 2.3919677734375, 2.63214111328125, 2.872314453125, 3.11248779296875, 3.3526611328125, 3.59283447265625, 3.8330078125, 4.07318115234375, 4.3133544921875, 4.55352783203125, 4.793701171875, 5.03387451171875, 5.2740478515625, 5.51422119140625, 5.75439453125, 5.99456787109375, 6.2347412109375, 6.47491455078125, 6.715087890625, 6.95526123046875, 7.1954345703125, 7.43560791015625, 7.67578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 8.0, 13.0, 14.0, 10.0, 10.0, 15.0, 24.0, 26.0, 18.0, 37.0, 40.0, 41.0, 70.0, 83.0, 103.0, 110.0, 81.0, 54.0, 44.0, 34.0, 34.0, 27.0, 25.0, 11.0, 19.0, 8.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.001495361328125, -0.0014546513557434082, -0.0014139413833618164, -0.0013732314109802246, -0.0013325214385986328, -0.001291811466217041, -0.0012511014938354492, -0.0012103915214538574, -0.0011696815490722656, -0.0011289715766906738, -0.001088261604309082, -0.0010475516319274902, -0.0010068416595458984, -0.0009661316871643066, -0.0009254217147827148, -0.000884711742401123, -0.0008440017700195312, -0.0008032917976379395, -0.0007625818252563477, -0.0007218718528747559, -0.0006811618804931641, -0.0006404519081115723, -0.0005997419357299805, -0.0005590319633483887, -0.0005183219909667969, -0.0004776120185852051, -0.0004369020462036133, -0.0003961920738220215, -0.0003554821014404297, -0.0003147721290588379, -0.0002740621566772461, -0.0002333521842956543, -0.0001926422119140625, -0.0001519322395324707, -0.0001112222671508789, -7.051229476928711e-05, -2.9802322387695312e-05, 1.0907649993896484e-05, 5.161762237548828e-05, 9.232759475708008e-05, 0.00013303756713867188, 0.00017374753952026367, 0.00021445751190185547, 0.00025516748428344727, 0.00029587745666503906, 0.00033658742904663086, 0.00037729740142822266, 0.00041800737380981445, 0.00045871734619140625, 0.000499427318572998, 0.0005401372909545898, 0.0005808472633361816, 0.0006215572357177734, 0.0006622672080993652, 0.000702977180480957, 0.0007436871528625488, 0.0007843971252441406, 0.0008251070976257324, 0.0008658170700073242, 0.000906527042388916, 0.0009472370147705078, 0.0009879469871520996, 0.0010286569595336914, 0.0010693669319152832, 0.001110076904296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 8.0, 7.0, 6.0, 20.0, 12.0, 23.0, 36.0, 38.0, 47.0, 72.0, 114.0, 189.0, 330.0, 563.0, 1121.0, 2534.0, 7517.0, 34216.0, 283265.0, 618654.0, 78887.0, 13560.0, 4000.0, 1531.0, 747.0, 374.0, 230.0, 123.0, 89.0, 59.0, 42.0, 35.0, 30.0, 24.0, 16.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.9765625, -8.706298828125, -8.43603515625, -8.165771484375, -7.8955078125, -7.625244140625, -7.35498046875, -7.084716796875, -6.814453125, -6.544189453125, -6.27392578125, -6.003662109375, -5.7333984375, -5.463134765625, -5.19287109375, -4.922607421875, -4.65234375, -4.382080078125, -4.11181640625, -3.841552734375, -3.5712890625, -3.301025390625, -3.03076171875, -2.760498046875, -2.490234375, -2.219970703125, -1.94970703125, -1.679443359375, -1.4091796875, -1.138916015625, -0.86865234375, -0.598388671875, -0.328125, -0.057861328125, 0.21240234375, 0.482666015625, 0.7529296875, 1.023193359375, 1.29345703125, 1.563720703125, 1.833984375, 2.104248046875, 2.37451171875, 2.644775390625, 2.9150390625, 3.185302734375, 3.45556640625, 3.725830078125, 3.99609375, 4.266357421875, 4.53662109375, 4.806884765625, 5.0771484375, 5.347412109375, 5.61767578125, 5.887939453125, 6.158203125, 6.428466796875, 6.69873046875, 6.968994140625, 7.2392578125, 7.509521484375, 7.77978515625, 8.050048828125, 8.3203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 7.0, 13.0, 12.0, 12.0, 12.0, 23.0, 30.0, 34.0, 32.0, 50.0, 48.0, 72.0, 67.0, 61.0, 64.0, 56.0, 75.0, 69.0, 48.0, 38.0, 28.0, 25.0, 16.0, 18.0, 14.0, 8.0, 18.0, 8.0, 7.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.71875, -4.55126953125, -4.3837890625, -4.21630859375, -4.048828125, -3.88134765625, -3.7138671875, -3.54638671875, -3.37890625, -3.21142578125, -3.0439453125, -2.87646484375, -2.708984375, -2.54150390625, -2.3740234375, -2.20654296875, -2.0390625, -1.87158203125, -1.7041015625, -1.53662109375, -1.369140625, -1.20166015625, -1.0341796875, -0.86669921875, -0.69921875, -0.53173828125, -0.3642578125, -0.19677734375, -0.029296875, 0.13818359375, 0.3056640625, 0.47314453125, 0.640625, 0.80810546875, 0.9755859375, 1.14306640625, 1.310546875, 1.47802734375, 1.6455078125, 1.81298828125, 1.98046875, 2.14794921875, 2.3154296875, 2.48291015625, 2.650390625, 2.81787109375, 2.9853515625, 3.15283203125, 3.3203125, 3.48779296875, 3.6552734375, 3.82275390625, 3.990234375, 4.15771484375, 4.3251953125, 4.49267578125, 4.66015625, 4.82763671875, 4.9951171875, 5.16259765625, 5.330078125, 5.49755859375, 5.6650390625, 5.83251953125, 6.0]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 14.0, 28.0, 67.0, 117.0, 202.0, 208.0, 163.0, 114.0, 38.0, 25.0, 10.0, 7.0, 8.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-350.2626953125, -342.99365234375, -335.724609375, -328.45556640625, -321.1864929199219, -313.9174499511719, -306.6484069824219, -299.3793640136719, -292.1103210449219, -284.8412780761719, -277.5722351074219, -270.30316162109375, -263.03411865234375, -255.76507568359375, -248.49603271484375, -241.22698974609375, -233.9579315185547, -226.6888885498047, -219.41983032226562, -212.15078735351562, -204.88174438476562, -197.61270141601562, -190.34364318847656, -183.07460021972656, -175.8055419921875, -168.5364990234375, -161.26744079589844, -153.99839782714844, -146.72935485839844, -139.46029663085938, -132.19125366210938, -124.92221069335938, -117.65316009521484, -110.38410949707031, -103.11506652832031, -95.84601593017578, -88.57696533203125, -81.30792236328125, -74.03887176513672, -66.76982116699219, -59.50077819824219, -52.23173141479492, -44.962684631347656, -37.693634033203125, -30.42458724975586, -23.155540466308594, -15.886489868164062, -8.617443084716797, -1.3483963012695312, 5.920651435852051, 13.189699172973633, 20.45874786376953, 27.727794647216797, 34.99684143066406, 42.265892028808594, 49.53493881225586, 56.803985595703125, 64.07303619384766, 71.34207916259766, 78.61112976074219, 85.88017272949219, 93.14922332763672, 100.41827392578125, 107.68731689453125, 114.95636749267578]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 6.0, 10.0, 17.0, 8.0, 16.0, 17.0, 18.0, 15.0, 24.0, 34.0, 35.0, 41.0, 44.0, 53.0, 44.0, 52.0, 58.0, 48.0, 59.0, 53.0, 46.0, 36.0, 30.0, 38.0, 28.0, 28.0, 34.0, 23.0, 15.0, 17.0, 16.0, 7.0, 5.0, 4.0, 4.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-83.4207763671875, -80.5611801147461, -77.70158386230469, -74.84198760986328, -71.98239135742188, -69.12278747558594, -66.26319885253906, -63.403594970703125, -60.54399871826172, -57.68440246582031, -54.824806213378906, -51.9652099609375, -49.10560989379883, -46.24601364135742, -43.386417388916016, -40.526817321777344, -37.6672248840332, -34.8076286315918, -31.948030471801758, -29.08843421936035, -26.228836059570312, -23.369239807128906, -20.5096435546875, -17.65004539489746, -14.790449142456055, -11.930851936340332, -9.07125473022461, -6.211658477783203, -3.3520612716674805, -0.4924640655517578, 2.3671321868896484, 5.2267303466796875, 8.086326599121094, 10.945923805236816, 13.805521011352539, 16.665117263793945, 19.524715423583984, 22.38431167602539, 25.243907928466797, 28.103506088256836, 30.963102340698242, 33.82270050048828, 36.68229675292969, 39.541893005371094, 42.4014892578125, 45.261085510253906, 48.12068176269531, 50.980281829833984, 53.83987808227539, 56.6994743347168, 59.5590705871582, 62.418670654296875, 65.27826690673828, 68.13786315917969, 70.9974594116211, 73.8570556640625, 76.7166519165039, 79.57624816894531, 82.43584442138672, 85.29544067382812, 88.15503692626953, 91.01463317871094, 93.87423706054688, 96.73383331298828, 99.59342956542969]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 5.0, 6.0, 10.0, 15.0, 21.0, 19.0, 40.0, 62.0, 94.0, 158.0, 218.0, 413.0, 669.0, 1240.0, 2376.0, 4768.0, 10230.0, 23543.0, 64721.0, 259439.0, 2578862.0, 1032371.0, 141509.0, 42068.0, 16479.0, 7227.0, 3536.0, 1791.0, 883.0, 568.0, 300.0, 205.0, 132.0, 81.0, 52.0, 54.0, 32.0, 21.0, 13.0, 15.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.92401123046875, -6.6331787109375, -6.34234619140625, -6.051513671875, -5.76068115234375, -5.4698486328125, -5.17901611328125, -4.88818359375, -4.59735107421875, -4.3065185546875, -4.01568603515625, -3.724853515625, -3.43402099609375, -3.1431884765625, -2.85235595703125, -2.5615234375, -2.27069091796875, -1.9798583984375, -1.68902587890625, -1.398193359375, -1.10736083984375, -0.8165283203125, -0.52569580078125, -0.23486328125, 0.05596923828125, 0.3468017578125, 0.63763427734375, 0.928466796875, 1.21929931640625, 1.5101318359375, 1.80096435546875, 2.091796875, 2.38262939453125, 2.6734619140625, 2.96429443359375, 3.255126953125, 3.54595947265625, 3.8367919921875, 4.12762451171875, 4.41845703125, 4.70928955078125, 5.0001220703125, 5.29095458984375, 5.581787109375, 5.87261962890625, 6.1634521484375, 6.45428466796875, 6.7451171875, 7.03594970703125, 7.3267822265625, 7.61761474609375, 7.908447265625, 8.19927978515625, 8.4901123046875, 8.78094482421875, 9.07177734375, 9.36260986328125, 9.6534423828125, 9.94427490234375, 10.235107421875, 10.52593994140625, 10.8167724609375, 11.10760498046875, 11.3984375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 7.0, 8.0, 5.0, 13.0, 18.0, 24.0, 26.0, 34.0, 32.0, 41.0, 53.0, 46.0, 46.0, 77.0, 57.0, 68.0, 56.0, 61.0, 41.0, 50.0, 49.0, 31.0, 30.0, 27.0, 20.0, 26.0, 13.0, 15.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34375, -4.16455078125, -3.9853515625, -3.80615234375, -3.626953125, -3.44775390625, -3.2685546875, -3.08935546875, -2.91015625, -2.73095703125, -2.5517578125, -2.37255859375, -2.193359375, -2.01416015625, -1.8349609375, -1.65576171875, -1.4765625, -1.29736328125, -1.1181640625, -0.93896484375, -0.759765625, -0.58056640625, -0.4013671875, -0.22216796875, -0.04296875, 0.13623046875, 0.3154296875, 0.49462890625, 0.673828125, 0.85302734375, 1.0322265625, 1.21142578125, 1.390625, 1.56982421875, 1.7490234375, 1.92822265625, 2.107421875, 2.28662109375, 2.4658203125, 2.64501953125, 2.82421875, 3.00341796875, 3.1826171875, 3.36181640625, 3.541015625, 3.72021484375, 3.8994140625, 4.07861328125, 4.2578125, 4.43701171875, 4.6162109375, 4.79541015625, 4.974609375, 5.15380859375, 5.3330078125, 5.51220703125, 5.69140625, 5.87060546875, 6.0498046875, 6.22900390625, 6.408203125, 6.58740234375, 6.7666015625, 6.94580078125, 7.125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 24.0, 28.0, 47.0, 95.0, 200.0, 375.0, 1060.0, 3148.0, 11401.0, 54108.0, 597135.0, 3340933.0, 151927.0, 24324.0, 6180.0, 1964.0, 697.0, 266.0, 128.0, 77.0, 46.0, 20.0, 16.0, 13.0, 10.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.5848388671875, -19.044677734375, -18.5045166015625, -17.96435546875, -17.4241943359375, -16.884033203125, -16.3438720703125, -15.8037109375, -15.2635498046875, -14.723388671875, -14.1832275390625, -13.64306640625, -13.1029052734375, -12.562744140625, -12.0225830078125, -11.482421875, -10.9422607421875, -10.402099609375, -9.8619384765625, -9.32177734375, -8.7816162109375, -8.241455078125, -7.7012939453125, -7.1611328125, -6.6209716796875, -6.080810546875, -5.5406494140625, -5.00048828125, -4.4603271484375, -3.920166015625, -3.3800048828125, -2.83984375, -2.2996826171875, -1.759521484375, -1.2193603515625, -0.67919921875, -0.1390380859375, 0.401123046875, 0.9412841796875, 1.4814453125, 2.0216064453125, 2.561767578125, 3.1019287109375, 3.64208984375, 4.1822509765625, 4.722412109375, 5.2625732421875, 5.802734375, 6.3428955078125, 6.883056640625, 7.4232177734375, 7.96337890625, 8.5035400390625, 9.043701171875, 9.5838623046875, 10.1240234375, 10.6641845703125, 11.204345703125, 11.7445068359375, 12.28466796875, 12.8248291015625, 13.364990234375, 13.9051513671875, 14.4453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 5.0, 8.0, 10.0, 17.0, 20.0, 30.0, 31.0, 51.0, 82.0, 117.0, 190.0, 267.0, 567.0, 947.0, 679.0, 358.0, 213.0, 144.0, 82.0, 56.0, 44.0, 28.0, 24.0, 13.0, 13.0, 13.0, 13.0, 10.0, 4.0, 10.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.2421875, -11.8553466796875, -11.468505859375, -11.0816650390625, -10.69482421875, -10.3079833984375, -9.921142578125, -9.5343017578125, -9.1474609375, -8.7606201171875, -8.373779296875, -7.9869384765625, -7.60009765625, -7.2132568359375, -6.826416015625, -6.4395751953125, -6.052734375, -5.6658935546875, -5.279052734375, -4.8922119140625, -4.50537109375, -4.1185302734375, -3.731689453125, -3.3448486328125, -2.9580078125, -2.5711669921875, -2.184326171875, -1.7974853515625, -1.41064453125, -1.0238037109375, -0.636962890625, -0.2501220703125, 0.13671875, 0.5235595703125, 0.910400390625, 1.2972412109375, 1.68408203125, 2.0709228515625, 2.457763671875, 2.8446044921875, 3.2314453125, 3.6182861328125, 4.005126953125, 4.3919677734375, 4.77880859375, 5.1656494140625, 5.552490234375, 5.9393310546875, 6.326171875, 6.7130126953125, 7.099853515625, 7.4866943359375, 7.87353515625, 8.2603759765625, 8.647216796875, 9.0340576171875, 9.4208984375, 9.8077392578125, 10.194580078125, 10.5814208984375, 10.96826171875, 11.3551025390625, 11.741943359375, 12.1287841796875, 12.515625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 12.0, 24.0, 37.0, 95.0, 216.0, 271.0, 193.0, 72.0, 34.0, 19.0, 5.0, 11.0, 8.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.68299865722656, -107.0890121459961, -100.49502563476562, -93.90104675292969, -87.30706024169922, -80.71307373046875, -74.11909484863281, -67.52510833740234, -60.931121826171875, -54.337135314941406, -47.7431526184082, -41.149169921875, -34.55518341064453, -27.961196899414062, -21.36721420288086, -14.773231506347656, -8.179244995117188, -1.5852603912353516, 5.008724212646484, 11.60270881652832, 18.196693420410156, 24.790679931640625, 31.384662628173828, 37.97864532470703, 44.5726318359375, 51.16661834716797, 57.76060104370117, 64.35458374023438, 70.94857025146484, 77.54255676269531, 84.13653564453125, 90.73052215576172, 97.32452392578125, 103.91851043701172, 110.51249694824219, 117.10647583007812, 123.7004623413086, 130.29444885253906, 136.888427734375, 143.482421875, 150.07640075683594, 156.67037963867188, 163.26437377929688, 169.8583526611328, 176.45233154296875, 183.04632568359375, 189.6403045654297, 196.23428344726562, 202.82827758789062, 209.42225646972656, 216.01625061035156, 222.6102294921875, 229.2042236328125, 235.79820251464844, 242.39218139648438, 248.98617553710938, 255.5801544189453, 262.17413330078125, 268.76812744140625, 275.36212158203125, 281.9560852050781, 288.5500793457031, 295.1440734863281, 301.738037109375, 308.33203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 13.0, 5.0, 8.0, 14.0, 10.0, 18.0, 22.0, 25.0, 22.0, 25.0, 32.0, 34.0, 37.0, 37.0, 41.0, 36.0, 43.0, 52.0, 50.0, 43.0, 45.0, 46.0, 42.0, 30.0, 31.0, 53.0, 28.0, 18.0, 16.0, 27.0, 16.0, 11.0, 20.0, 11.0, 5.0, 7.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-70.31375122070312, -68.34270477294922, -66.37165832519531, -64.4006118774414, -62.429569244384766, -60.45852279663086, -58.48748016357422, -56.51643371582031, -54.545387268066406, -52.5743408203125, -50.603294372558594, -48.63225173950195, -46.66120529174805, -44.69015884399414, -42.7191162109375, -40.748069763183594, -38.77702331542969, -36.80597686767578, -34.834930419921875, -32.863887786865234, -30.892841339111328, -28.921794891357422, -26.95075035095215, -24.979705810546875, -23.00865936279297, -21.037612915039062, -19.06656837463379, -17.095523834228516, -15.12447738647461, -13.15343189239502, -11.18238639831543, -9.21134090423584, -7.24029541015625, -5.26924991607666, -3.2982044219970703, -1.3271589279174805, 0.6438865661621094, 2.614932060241699, 4.585977554321289, 6.557023048400879, 8.528068542480469, 10.499114036560059, 12.470159530639648, 14.441205024719238, 16.412250518798828, 18.383296966552734, 20.354341506958008, 22.32538604736328, 24.296432495117188, 26.267478942871094, 28.238523483276367, 30.20956802368164, 32.18061447143555, 34.15166091918945, 36.122703552246094, 38.09375, 40.064796447753906, 42.03584289550781, 44.00688934326172, 45.97793197631836, 47.948978424072266, 49.92002487182617, 51.89106750488281, 53.86211395263672, 55.833160400390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 10.0, 15.0, 17.0, 26.0, 38.0, 81.0, 150.0, 213.0, 401.0, 770.0, 1499.0, 3062.0, 7076.0, 17537.0, 49133.0, 147556.0, 454754.0, 247304.0, 74369.0, 25992.0, 10026.0, 4299.0, 2026.0, 998.0, 504.0, 271.0, 163.0, 104.0, 57.0, 30.0, 21.0, 10.0, 11.0, 5.0, 3.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.664794921875, -11.24365234375, -10.822509765625, -10.4013671875, -9.980224609375, -9.55908203125, -9.137939453125, -8.716796875, -8.295654296875, -7.87451171875, -7.453369140625, -7.0322265625, -6.611083984375, -6.18994140625, -5.768798828125, -5.34765625, -4.926513671875, -4.50537109375, -4.084228515625, -3.6630859375, -3.241943359375, -2.82080078125, -2.399658203125, -1.978515625, -1.557373046875, -1.13623046875, -0.715087890625, -0.2939453125, 0.127197265625, 0.54833984375, 0.969482421875, 1.390625, 1.811767578125, 2.23291015625, 2.654052734375, 3.0751953125, 3.496337890625, 3.91748046875, 4.338623046875, 4.759765625, 5.180908203125, 5.60205078125, 6.023193359375, 6.4443359375, 6.865478515625, 7.28662109375, 7.707763671875, 8.12890625, 8.550048828125, 8.97119140625, 9.392333984375, 9.8134765625, 10.234619140625, 10.65576171875, 11.076904296875, 11.498046875, 11.919189453125, 12.34033203125, 12.761474609375, 13.1826171875, 13.603759765625, 14.02490234375, 14.446044921875, 14.8671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 7.0, 9.0, 5.0, 8.0, 21.0, 22.0, 24.0, 29.0, 42.0, 33.0, 39.0, 55.0, 50.0, 53.0, 57.0, 66.0, 72.0, 54.0, 52.0, 53.0, 41.0, 53.0, 35.0, 20.0, 17.0, 25.0, 21.0, 12.0, 14.0, 5.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.27947998046875, -4.0980224609375, -3.91656494140625, -3.735107421875, -3.55364990234375, -3.3721923828125, -3.19073486328125, -3.00927734375, -2.82781982421875, -2.6463623046875, -2.46490478515625, -2.283447265625, -2.10198974609375, -1.9205322265625, -1.73907470703125, -1.5576171875, -1.37615966796875, -1.1947021484375, -1.01324462890625, -0.831787109375, -0.65032958984375, -0.4688720703125, -0.28741455078125, -0.10595703125, 0.07550048828125, 0.2569580078125, 0.43841552734375, 0.619873046875, 0.80133056640625, 0.9827880859375, 1.16424560546875, 1.345703125, 1.52716064453125, 1.7086181640625, 1.89007568359375, 2.071533203125, 2.25299072265625, 2.4344482421875, 2.61590576171875, 2.79736328125, 2.97882080078125, 3.1602783203125, 3.34173583984375, 3.523193359375, 3.70465087890625, 3.8861083984375, 4.06756591796875, 4.2490234375, 4.43048095703125, 4.6119384765625, 4.79339599609375, 4.974853515625, 5.15631103515625, 5.3377685546875, 5.51922607421875, 5.70068359375, 5.88214111328125, 6.0635986328125, 6.24505615234375, 6.426513671875, 6.60797119140625, 6.7894287109375, 6.97088623046875, 7.15234375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 7.0, 11.0, 18.0, 23.0, 30.0, 57.0, 67.0, 99.0, 127.0, 248.0, 375.0, 737.0, 1498.0, 3860.0, 19586.0, 253895.0, 715485.0, 42105.0, 6228.0, 1935.0, 895.0, 427.0, 290.0, 195.0, 108.0, 65.0, 49.0, 36.0, 32.0, 23.0, 12.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.078125, -21.234619140625, -20.39111328125, -19.547607421875, -18.7041015625, -17.860595703125, -17.01708984375, -16.173583984375, -15.330078125, -14.486572265625, -13.64306640625, -12.799560546875, -11.9560546875, -11.112548828125, -10.26904296875, -9.425537109375, -8.58203125, -7.738525390625, -6.89501953125, -6.051513671875, -5.2080078125, -4.364501953125, -3.52099609375, -2.677490234375, -1.833984375, -0.990478515625, -0.14697265625, 0.696533203125, 1.5400390625, 2.383544921875, 3.22705078125, 4.070556640625, 4.9140625, 5.757568359375, 6.60107421875, 7.444580078125, 8.2880859375, 9.131591796875, 9.97509765625, 10.818603515625, 11.662109375, 12.505615234375, 13.34912109375, 14.192626953125, 15.0361328125, 15.879638671875, 16.72314453125, 17.566650390625, 18.41015625, 19.253662109375, 20.09716796875, 20.940673828125, 21.7841796875, 22.627685546875, 23.47119140625, 24.314697265625, 25.158203125, 26.001708984375, 26.84521484375, 27.688720703125, 28.5322265625, 29.375732421875, 30.21923828125, 31.062744140625, 31.90625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 4.0, 9.0, 7.0, 9.0, 12.0, 16.0, 27.0, 20.0, 28.0, 38.0, 34.0, 41.0, 66.0, 40.0, 65.0, 49.0, 56.0, 53.0, 56.0, 58.0, 49.0, 41.0, 37.0, 41.0, 32.0, 21.0, 18.0, 17.0, 9.0, 9.0, 9.0, 8.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-29.78125, -29.025146484375, -28.26904296875, -27.512939453125, -26.7568359375, -26.000732421875, -25.24462890625, -24.488525390625, -23.732421875, -22.976318359375, -22.22021484375, -21.464111328125, -20.7080078125, -19.951904296875, -19.19580078125, -18.439697265625, -17.68359375, -16.927490234375, -16.17138671875, -15.415283203125, -14.6591796875, -13.903076171875, -13.14697265625, -12.390869140625, -11.634765625, -10.878662109375, -10.12255859375, -9.366455078125, -8.6103515625, -7.854248046875, -7.09814453125, -6.342041015625, -5.5859375, -4.829833984375, -4.07373046875, -3.317626953125, -2.5615234375, -1.805419921875, -1.04931640625, -0.293212890625, 0.462890625, 1.218994140625, 1.97509765625, 2.731201171875, 3.4873046875, 4.243408203125, 4.99951171875, 5.755615234375, 6.51171875, 7.267822265625, 8.02392578125, 8.780029296875, 9.5361328125, 10.292236328125, 11.04833984375, 11.804443359375, 12.560546875, 13.316650390625, 14.07275390625, 14.828857421875, 15.5849609375, 16.341064453125, 17.09716796875, 17.853271484375, 18.609375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 15.0, 14.0, 23.0, 30.0, 50.0, 105.0, 166.0, 413.0, 1158.0, 4823.0, 40159.0, 811002.0, 174596.0, 12510.0, 2237.0, 639.0, 294.0, 136.0, 66.0, 27.0, 29.0, 20.0, 7.0, 7.0, 6.0, 4.0, 8.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.0, -14.6026611328125, -14.205322265625, -13.8079833984375, -13.41064453125, -13.0133056640625, -12.615966796875, -12.2186279296875, -11.8212890625, -11.4239501953125, -11.026611328125, -10.6292724609375, -10.23193359375, -9.8345947265625, -9.437255859375, -9.0399169921875, -8.642578125, -8.2452392578125, -7.847900390625, -7.4505615234375, -7.05322265625, -6.6558837890625, -6.258544921875, -5.8612060546875, -5.4638671875, -5.0665283203125, -4.669189453125, -4.2718505859375, -3.87451171875, -3.4771728515625, -3.079833984375, -2.6824951171875, -2.28515625, -1.8878173828125, -1.490478515625, -1.0931396484375, -0.69580078125, -0.2984619140625, 0.098876953125, 0.4962158203125, 0.8935546875, 1.2908935546875, 1.688232421875, 2.0855712890625, 2.48291015625, 2.8802490234375, 3.277587890625, 3.6749267578125, 4.072265625, 4.4696044921875, 4.866943359375, 5.2642822265625, 5.66162109375, 6.0589599609375, 6.456298828125, 6.8536376953125, 7.2509765625, 7.6483154296875, 8.045654296875, 8.4429931640625, 8.84033203125, 9.2376708984375, 9.635009765625, 10.0323486328125, 10.4296875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 8.0, 14.0, 11.0, 19.0, 14.0, 12.0, 18.0, 31.0, 37.0, 74.0, 106.0, 173.0, 150.0, 84.0, 49.0, 39.0, 28.0, 24.0, 18.0, 14.0, 15.0, 9.0, 7.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013780593872070312, -0.0013283789157867432, -0.001278698444366455, -0.001229017972946167, -0.001179337501525879, -0.0011296570301055908, -0.0010799765586853027, -0.0010302960872650146, -0.0009806156158447266, -0.0009309351444244385, -0.0008812546730041504, -0.0008315742015838623, -0.0007818937301635742, -0.0007322132587432861, -0.000682532787322998, -0.00063285231590271, -0.0005831718444824219, -0.0005334913730621338, -0.0004838109016418457, -0.0004341304302215576, -0.00038444995880126953, -0.00033476948738098145, -0.00028508901596069336, -0.00023540854454040527, -0.0001857280731201172, -0.0001360476016998291, -8.636713027954102e-05, -3.668665885925293e-05, 1.2993812561035156e-05, 6.267428398132324e-05, 0.00011235475540161133, 0.00016203522682189941, 0.0002117156982421875, 0.0002613961696624756, 0.00031107664108276367, 0.00036075711250305176, 0.00041043758392333984, 0.00046011805534362793, 0.000509798526763916, 0.0005594789981842041, 0.0006091594696044922, 0.0006588399410247803, 0.0007085204124450684, 0.0007582008838653564, 0.0008078813552856445, 0.0008575618267059326, 0.0009072422981262207, 0.0009569227695465088, 0.0010066032409667969, 0.001056283712387085, 0.001105964183807373, 0.0011556446552276611, 0.0012053251266479492, 0.0012550055980682373, 0.0013046860694885254, 0.0013543665409088135, 0.0014040470123291016, 0.0014537274837493896, 0.0015034079551696777, 0.0015530884265899658, 0.001602768898010254, 0.001652449369430542, 0.00170212984085083, 0.0017518103122711182, 0.0018014907836914062]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 15.0, 22.0, 26.0, 34.0, 54.0, 105.0, 115.0, 164.0, 299.0, 585.0, 1031.0, 2349.0, 7500.0, 40156.0, 487434.0, 457646.0, 38768.0, 7431.0, 2373.0, 1014.0, 519.0, 330.0, 190.0, 120.0, 71.0, 54.0, 32.0, 28.0, 17.0, 10.0, 10.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.5859375, -8.2996826171875, -8.013427734375, -7.7271728515625, -7.44091796875, -7.1546630859375, -6.868408203125, -6.5821533203125, -6.2958984375, -6.0096435546875, -5.723388671875, -5.4371337890625, -5.15087890625, -4.8646240234375, -4.578369140625, -4.2921142578125, -4.005859375, -3.7196044921875, -3.433349609375, -3.1470947265625, -2.86083984375, -2.5745849609375, -2.288330078125, -2.0020751953125, -1.7158203125, -1.4295654296875, -1.143310546875, -0.8570556640625, -0.57080078125, -0.2845458984375, 0.001708984375, 0.2879638671875, 0.57421875, 0.8604736328125, 1.146728515625, 1.4329833984375, 1.71923828125, 2.0054931640625, 2.291748046875, 2.5780029296875, 2.8642578125, 3.1505126953125, 3.436767578125, 3.7230224609375, 4.00927734375, 4.2955322265625, 4.581787109375, 4.8680419921875, 5.154296875, 5.4405517578125, 5.726806640625, 6.0130615234375, 6.29931640625, 6.5855712890625, 6.871826171875, 7.1580810546875, 7.4443359375, 7.7305908203125, 8.016845703125, 8.3031005859375, 8.58935546875, 8.8756103515625, 9.161865234375, 9.4481201171875, 9.734375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 5.0, 3.0, 9.0, 5.0, 8.0, 22.0, 12.0, 12.0, 18.0, 17.0, 22.0, 30.0, 33.0, 48.0, 56.0, 57.0, 55.0, 56.0, 83.0, 70.0, 70.0, 53.0, 35.0, 38.0, 37.0, 25.0, 21.0, 13.0, 11.0, 8.0, 16.0, 9.0, 7.0, 5.0, 2.0, 5.0, 4.0, 6.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4715576171875, -4.310302734375, -4.1490478515625, -3.98779296875, -3.8265380859375, -3.665283203125, -3.5040283203125, -3.3427734375, -3.1815185546875, -3.020263671875, -2.8590087890625, -2.69775390625, -2.5364990234375, -2.375244140625, -2.2139892578125, -2.052734375, -1.8914794921875, -1.730224609375, -1.5689697265625, -1.40771484375, -1.2464599609375, -1.085205078125, -0.9239501953125, -0.7626953125, -0.6014404296875, -0.440185546875, -0.2789306640625, -0.11767578125, 0.0435791015625, 0.204833984375, 0.3660888671875, 0.52734375, 0.6885986328125, 0.849853515625, 1.0111083984375, 1.17236328125, 1.3336181640625, 1.494873046875, 1.6561279296875, 1.8173828125, 1.9786376953125, 2.139892578125, 2.3011474609375, 2.46240234375, 2.6236572265625, 2.784912109375, 2.9461669921875, 3.107421875, 3.2686767578125, 3.429931640625, 3.5911865234375, 3.75244140625, 3.9136962890625, 4.074951171875, 4.2362060546875, 4.3974609375, 4.5587158203125, 4.719970703125, 4.8812255859375, 5.04248046875, 5.2037353515625, 5.364990234375, 5.5262451171875, 5.6875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 31.0, 64.0, 118.0, 228.0, 228.0, 147.0, 95.0, 38.0, 17.0, 13.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.19520568847656, -146.1154327392578, -140.03565979003906, -133.95590209960938, -127.87612915039062, -121.79635620117188, -115.71658325195312, -109.63681030273438, -103.55704498291016, -97.4772720336914, -91.39750671386719, -85.31773376464844, -79.23796081542969, -73.15819549560547, -67.07842254638672, -60.998653411865234, -54.91888427734375, -48.839115142822266, -42.75934600830078, -36.67957305908203, -30.599803924560547, -24.520034790039062, -18.440261840820312, -12.360492706298828, -6.280723571777344, -0.20095348358154297, 5.878816604614258, 11.958587646484375, 18.03835678100586, 24.118125915527344, 30.197898864746094, 36.27766799926758, 42.35743713378906, 48.43720626831055, 54.51697540283203, 60.59674835205078, 66.676513671875, 72.75628662109375, 78.8360595703125, 84.91583251953125, 90.99559783935547, 97.07537078857422, 103.15513610839844, 109.23490905761719, 115.31468200683594, 121.39444732666016, 127.4742202758789, 133.55398559570312, 139.63375854492188, 145.71353149414062, 151.79330444335938, 157.87307739257812, 163.9528350830078, 170.03260803222656, 176.1123809814453, 182.19215393066406, 188.27191162109375, 194.3516845703125, 200.43145751953125, 206.51123046875, 212.5909881591797, 218.67076110839844, 224.7505340576172, 230.83030700683594, 236.9100799560547]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 15.0, 16.0, 11.0, 23.0, 20.0, 13.0, 21.0, 28.0, 29.0, 40.0, 29.0, 48.0, 42.0, 48.0, 63.0, 55.0, 65.0, 47.0, 47.0, 45.0, 36.0, 31.0, 30.0, 32.0, 26.0, 13.0, 27.0, 21.0, 15.0, 14.0, 13.0, 9.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.97138977050781, -68.39381408691406, -65.81623840332031, -63.2386589050293, -60.66108322143555, -58.0835075378418, -55.50592803955078, -52.92835235595703, -50.35077667236328, -47.77320098876953, -45.19562530517578, -42.618045806884766, -40.040470123291016, -37.462894439697266, -34.88531494140625, -32.3077392578125, -29.73016357421875, -27.152587890625, -24.575010299682617, -21.997432708740234, -19.419857025146484, -16.842281341552734, -14.264703750610352, -11.687126159667969, -9.109550476074219, -6.531973838806152, -3.954397201538086, -1.3768205642700195, 1.2007560729980469, 3.7783327102661133, 6.35590934753418, 8.933486938476562, 11.511062622070312, 14.088639259338379, 16.666215896606445, 19.243793487548828, 21.821369171142578, 24.398944854736328, 26.97652244567871, 29.554100036621094, 32.131675720214844, 34.709251403808594, 37.286827087402344, 39.86440658569336, 42.44198226928711, 45.01955795288086, 47.597137451171875, 50.174713134765625, 52.752288818359375, 55.329864501953125, 57.907440185546875, 60.48501968383789, 63.06259536743164, 65.64017486572266, 68.2177505493164, 70.79532623291016, 73.3729019165039, 75.95047760009766, 78.5280532836914, 81.10562896728516, 83.68321228027344, 86.26078796386719, 88.83836364746094, 91.41593933105469, 93.99351501464844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 9.0, 9.0, 12.0, 17.0, 32.0, 30.0, 32.0, 54.0, 72.0, 85.0, 135.0, 162.0, 329.0, 1231.0, 11079.0, 2270857.0, 1897233.0, 10674.0, 1200.0, 335.0, 173.0, 135.0, 93.0, 60.0, 67.0, 43.0, 29.0, 14.0, 26.0, 12.0, 10.0, 6.0, 5.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-42.25, -41.137939453125, -40.02587890625, -38.913818359375, -37.8017578125, -36.689697265625, -35.57763671875, -34.465576171875, -33.353515625, -32.241455078125, -31.12939453125, -30.017333984375, -28.9052734375, -27.793212890625, -26.68115234375, -25.569091796875, -24.45703125, -23.344970703125, -22.23291015625, -21.120849609375, -20.0087890625, -18.896728515625, -17.78466796875, -16.672607421875, -15.560546875, -14.448486328125, -13.33642578125, -12.224365234375, -11.1123046875, -10.000244140625, -8.88818359375, -7.776123046875, -6.6640625, -5.552001953125, -4.43994140625, -3.327880859375, -2.2158203125, -1.103759765625, 0.00830078125, 1.120361328125, 2.232421875, 3.344482421875, 4.45654296875, 5.568603515625, 6.6806640625, 7.792724609375, 8.90478515625, 10.016845703125, 11.12890625, 12.240966796875, 13.35302734375, 14.465087890625, 15.5771484375, 16.689208984375, 17.80126953125, 18.913330078125, 20.025390625, 21.137451171875, 22.24951171875, 23.361572265625, 24.4736328125, 25.585693359375, 26.69775390625, 27.809814453125, 28.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 22.0, 33.0, 55.0, 57.0, 87.0, 113.0, 137.0, 137.0, 107.0, 88.0, 63.0, 42.0, 21.0, 14.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9405517578125, -11.576416015625, -11.2122802734375, -10.84814453125, -10.4840087890625, -10.119873046875, -9.7557373046875, -9.3916015625, -9.0274658203125, -8.663330078125, -8.2991943359375, -7.93505859375, -7.5709228515625, -7.206787109375, -6.8426513671875, -6.478515625, -6.1143798828125, -5.750244140625, -5.3861083984375, -5.02197265625, -4.6578369140625, -4.293701171875, -3.9295654296875, -3.5654296875, -3.2012939453125, -2.837158203125, -2.4730224609375, -2.10888671875, -1.7447509765625, -1.380615234375, -1.0164794921875, -0.65234375, -0.2882080078125, 0.075927734375, 0.4400634765625, 0.80419921875, 1.1683349609375, 1.532470703125, 1.8966064453125, 2.2607421875, 2.6248779296875, 2.989013671875, 3.3531494140625, 3.71728515625, 4.0814208984375, 4.445556640625, 4.8096923828125, 5.173828125, 5.5379638671875, 5.902099609375, 6.2662353515625, 6.63037109375, 6.9945068359375, 7.358642578125, 7.7227783203125, 8.0869140625, 8.4510498046875, 8.815185546875, 9.1793212890625, 9.54345703125, 9.9075927734375, 10.271728515625, 10.6358642578125, 11.0]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 20.0, 17.0, 30.0, 49.0, 95.0, 138.0, 261.0, 590.0, 1285.0, 3463.0, 11894.0, 56687.0, 924001.0, 3068882.0, 102290.0, 17233.0, 4519.0, 1510.0, 623.0, 264.0, 168.0, 103.0, 67.0, 35.0, 14.0, 18.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.439208984375, -14.90966796875, -14.380126953125, -13.8505859375, -13.321044921875, -12.79150390625, -12.261962890625, -11.732421875, -11.202880859375, -10.67333984375, -10.143798828125, -9.6142578125, -9.084716796875, -8.55517578125, -8.025634765625, -7.49609375, -6.966552734375, -6.43701171875, -5.907470703125, -5.3779296875, -4.848388671875, -4.31884765625, -3.789306640625, -3.259765625, -2.730224609375, -2.20068359375, -1.671142578125, -1.1416015625, -0.612060546875, -0.08251953125, 0.447021484375, 0.9765625, 1.506103515625, 2.03564453125, 2.565185546875, 3.0947265625, 3.624267578125, 4.15380859375, 4.683349609375, 5.212890625, 5.742431640625, 6.27197265625, 6.801513671875, 7.3310546875, 7.860595703125, 8.39013671875, 8.919677734375, 9.44921875, 9.978759765625, 10.50830078125, 11.037841796875, 11.5673828125, 12.096923828125, 12.62646484375, 13.156005859375, 13.685546875, 14.215087890625, 14.74462890625, 15.274169921875, 15.8037109375, 16.333251953125, 16.86279296875, 17.392333984375, 17.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 27.0, 32.0, 28.0, 52.0, 77.0, 114.0, 189.0, 337.0, 588.0, 952.0, 703.0, 382.0, 194.0, 123.0, 57.0, 50.0, 24.0, 27.0, 18.0, 12.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-13.4609375, -13.0926513671875, -12.724365234375, -12.3560791015625, -11.98779296875, -11.6195068359375, -11.251220703125, -10.8829345703125, -10.5146484375, -10.1463623046875, -9.778076171875, -9.4097900390625, -9.04150390625, -8.6732177734375, -8.304931640625, -7.9366455078125, -7.568359375, -7.2000732421875, -6.831787109375, -6.4635009765625, -6.09521484375, -5.7269287109375, -5.358642578125, -4.9903564453125, -4.6220703125, -4.2537841796875, -3.885498046875, -3.5172119140625, -3.14892578125, -2.7806396484375, -2.412353515625, -2.0440673828125, -1.67578125, -1.3074951171875, -0.939208984375, -0.5709228515625, -0.20263671875, 0.1656494140625, 0.533935546875, 0.9022216796875, 1.2705078125, 1.6387939453125, 2.007080078125, 2.3753662109375, 2.74365234375, 3.1119384765625, 3.480224609375, 3.8485107421875, 4.216796875, 4.5850830078125, 4.953369140625, 5.3216552734375, 5.68994140625, 6.0582275390625, 6.426513671875, 6.7947998046875, 7.1630859375, 7.5313720703125, 7.899658203125, 8.2679443359375, 8.63623046875, 9.0045166015625, 9.372802734375, 9.7410888671875, 10.109375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 6.0, 11.0, 11.0, 19.0, 33.0, 43.0, 76.0, 137.0, 165.0, 168.0, 123.0, 105.0, 53.0, 22.0, 14.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-115.77225494384766, -112.29562377929688, -108.81898498535156, -105.34235382080078, -101.86572265625, -98.38908386230469, -94.9124526977539, -91.43582153320312, -87.95918273925781, -84.48255157470703, -81.00591278076172, -77.52928161621094, -74.05265045166016, -70.57601928710938, -67.09938049316406, -63.62274932861328, -60.1461181640625, -56.66948318481445, -53.19285202026367, -49.716217041015625, -46.239585876464844, -42.7629508972168, -39.28631591796875, -35.80968475341797, -32.33304977416992, -28.856416702270508, -25.379783630371094, -21.903148651123047, -18.426515579223633, -14.949882507324219, -11.473247528076172, -7.996614456176758, -4.519989013671875, -1.0433554649353027, 2.4332780838012695, 5.909912109375, 9.386545181274414, 12.863178253173828, 16.339813232421875, 19.81644630432129, 23.293079376220703, 26.769712448120117, 30.24634552001953, 33.72298049926758, 37.199615478515625, 40.676246643066406, 44.15288162231445, 47.6295166015625, 51.10614776611328, 54.58278274536133, 58.05941390991211, 61.536048889160156, 65.01268005371094, 68.48931884765625, 71.96595001220703, 75.44258117675781, 78.91921997070312, 82.3958511352539, 85.87248992919922, 89.34912109375, 92.82575225830078, 96.30238342285156, 99.77902221679688, 103.25565338134766, 106.73228454589844]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 7.0, 4.0, 7.0, 12.0, 16.0, 19.0, 14.0, 15.0, 31.0, 26.0, 34.0, 43.0, 55.0, 36.0, 38.0, 46.0, 53.0, 52.0, 54.0, 51.0, 57.0, 49.0, 45.0, 30.0, 29.0, 36.0, 26.0, 25.0, 21.0, 22.0, 14.0, 1.0, 12.0, 4.0, 7.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.971282958984375, -41.211490631103516, -39.45170211791992, -37.69190979003906, -35.93212127685547, -34.17232894897461, -32.412540435791016, -30.652748107910156, -28.892959594726562, -27.133169174194336, -25.37337875366211, -23.613588333129883, -21.853797912597656, -20.094005584716797, -18.334217071533203, -16.574424743652344, -14.814634323120117, -13.05484390258789, -11.295053482055664, -9.535263061523438, -7.775472164154053, -6.015681266784668, -4.255890846252441, -2.496100425720215, -0.7363100051879883, 1.0234805345535278, 2.783271074295044, 4.54306173324585, 6.302852153778076, 8.062643051147461, 9.822433471679688, 11.582223892211914, 13.34201431274414, 15.101804733276367, 16.861595153808594, 18.62138557434082, 20.381175994873047, 22.140968322753906, 23.9007568359375, 25.66054916381836, 27.420337677001953, 29.18012809753418, 30.939918518066406, 32.699710845947266, 34.45949935913086, 36.21929168701172, 37.97908020019531, 39.73887252807617, 41.49866485595703, 43.25845718383789, 45.018245697021484, 46.778038024902344, 48.53782653808594, 50.2976188659668, 52.05740737915039, 53.81719970703125, 55.576988220214844, 57.3367805480957, 59.0965690612793, 60.856361389160156, 62.61614990234375, 64.37593841552734, 66.13573455810547, 67.89552307128906, 69.65531158447266]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 6.0, 7.0, 22.0, 16.0, 20.0, 38.0, 70.0, 87.0, 152.0, 251.0, 501.0, 909.0, 1790.0, 3482.0, 7497.0, 16720.0, 40533.0, 112881.0, 354989.0, 334298.0, 106091.0, 38324.0, 15772.0, 7121.0, 3334.0, 1666.0, 843.0, 456.0, 271.0, 152.0, 85.0, 61.0, 22.0, 31.0, 6.0, 14.0, 9.0, 9.0, 9.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-11.640625, -11.3077392578125, -10.974853515625, -10.6419677734375, -10.30908203125, -9.9761962890625, -9.643310546875, -9.3104248046875, -8.9775390625, -8.6446533203125, -8.311767578125, -7.9788818359375, -7.64599609375, -7.3131103515625, -6.980224609375, -6.6473388671875, -6.314453125, -5.9815673828125, -5.648681640625, -5.3157958984375, -4.98291015625, -4.6500244140625, -4.317138671875, -3.9842529296875, -3.6513671875, -3.3184814453125, -2.985595703125, -2.6527099609375, -2.31982421875, -1.9869384765625, -1.654052734375, -1.3211669921875, -0.98828125, -0.6553955078125, -0.322509765625, 0.0103759765625, 0.34326171875, 0.6761474609375, 1.009033203125, 1.3419189453125, 1.6748046875, 2.0076904296875, 2.340576171875, 2.6734619140625, 3.00634765625, 3.3392333984375, 3.672119140625, 4.0050048828125, 4.337890625, 4.6707763671875, 5.003662109375, 5.3365478515625, 5.66943359375, 6.0023193359375, 6.335205078125, 6.6680908203125, 7.0009765625, 7.3338623046875, 7.666748046875, 7.9996337890625, 8.33251953125, 8.6654052734375, 8.998291015625, 9.3311767578125, 9.6640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 4.0, 6.0, 8.0, 16.0, 15.0, 17.0, 25.0, 33.0, 33.0, 31.0, 48.0, 56.0, 56.0, 65.0, 56.0, 67.0, 65.0, 52.0, 62.0, 60.0, 39.0, 33.0, 24.0, 38.0, 24.0, 17.0, 12.0, 11.0, 11.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.67578125, -4.49151611328125, -4.3072509765625, -4.12298583984375, -3.938720703125, -3.75445556640625, -3.5701904296875, -3.38592529296875, -3.20166015625, -3.01739501953125, -2.8331298828125, -2.64886474609375, -2.464599609375, -2.28033447265625, -2.0960693359375, -1.91180419921875, -1.7275390625, -1.54327392578125, -1.3590087890625, -1.17474365234375, -0.990478515625, -0.80621337890625, -0.6219482421875, -0.43768310546875, -0.25341796875, -0.06915283203125, 0.1151123046875, 0.29937744140625, 0.483642578125, 0.66790771484375, 0.8521728515625, 1.03643798828125, 1.220703125, 1.40496826171875, 1.5892333984375, 1.77349853515625, 1.957763671875, 2.14202880859375, 2.3262939453125, 2.51055908203125, 2.69482421875, 2.87908935546875, 3.0633544921875, 3.24761962890625, 3.431884765625, 3.61614990234375, 3.8004150390625, 3.98468017578125, 4.1689453125, 4.35321044921875, 4.5374755859375, 4.72174072265625, 4.906005859375, 5.09027099609375, 5.2745361328125, 5.45880126953125, 5.64306640625, 5.82733154296875, 6.0115966796875, 6.19586181640625, 6.380126953125, 6.56439208984375, 6.7486572265625, 6.93292236328125, 7.1171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 10.0, 11.0, 12.0, 15.0, 28.0, 49.0, 66.0, 84.0, 165.0, 256.0, 376.0, 829.0, 1993.0, 6077.0, 28055.0, 215884.0, 697328.0, 77747.0, 13213.0, 3561.0, 1280.0, 642.0, 305.0, 190.0, 114.0, 85.0, 51.0, 36.0, 27.0, 20.0, 15.0, 9.0, 5.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.84375, -17.212646484375, -16.58154296875, -15.950439453125, -15.3193359375, -14.688232421875, -14.05712890625, -13.426025390625, -12.794921875, -12.163818359375, -11.53271484375, -10.901611328125, -10.2705078125, -9.639404296875, -9.00830078125, -8.377197265625, -7.74609375, -7.114990234375, -6.48388671875, -5.852783203125, -5.2216796875, -4.590576171875, -3.95947265625, -3.328369140625, -2.697265625, -2.066162109375, -1.43505859375, -0.803955078125, -0.1728515625, 0.458251953125, 1.08935546875, 1.720458984375, 2.3515625, 2.982666015625, 3.61376953125, 4.244873046875, 4.8759765625, 5.507080078125, 6.13818359375, 6.769287109375, 7.400390625, 8.031494140625, 8.66259765625, 9.293701171875, 9.9248046875, 10.555908203125, 11.18701171875, 11.818115234375, 12.44921875, 13.080322265625, 13.71142578125, 14.342529296875, 14.9736328125, 15.604736328125, 16.23583984375, 16.866943359375, 17.498046875, 18.129150390625, 18.76025390625, 19.391357421875, 20.0224609375, 20.653564453125, 21.28466796875, 21.915771484375, 22.546875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 6.0, 6.0, 11.0, 12.0, 11.0, 9.0, 22.0, 20.0, 25.0, 27.0, 26.0, 33.0, 41.0, 38.0, 43.0, 31.0, 61.0, 44.0, 46.0, 55.0, 52.0, 35.0, 57.0, 46.0, 40.0, 30.0, 33.0, 27.0, 19.0, 18.0, 18.0, 10.0, 9.0, 9.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.421875, -16.849609375, -16.27734375, -15.705078125, -15.1328125, -14.560546875, -13.98828125, -13.416015625, -12.84375, -12.271484375, -11.69921875, -11.126953125, -10.5546875, -9.982421875, -9.41015625, -8.837890625, -8.265625, -7.693359375, -7.12109375, -6.548828125, -5.9765625, -5.404296875, -4.83203125, -4.259765625, -3.6875, -3.115234375, -2.54296875, -1.970703125, -1.3984375, -0.826171875, -0.25390625, 0.318359375, 0.890625, 1.462890625, 2.03515625, 2.607421875, 3.1796875, 3.751953125, 4.32421875, 4.896484375, 5.46875, 6.041015625, 6.61328125, 7.185546875, 7.7578125, 8.330078125, 8.90234375, 9.474609375, 10.046875, 10.619140625, 11.19140625, 11.763671875, 12.3359375, 12.908203125, 13.48046875, 14.052734375, 14.625, 15.197265625, 15.76953125, 16.341796875, 16.9140625, 17.486328125, 18.05859375, 18.630859375, 19.203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 18.0, 25.0, 32.0, 67.0, 140.0, 293.0, 685.0, 3259.0, 26242.0, 719726.0, 281572.0, 13345.0, 2070.0, 541.0, 233.0, 104.0, 54.0, 32.0, 21.0, 15.0, 11.0, 8.0, 7.0, 1.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.8985595703125, -9.515869140625, -9.1331787109375, -8.75048828125, -8.3677978515625, -7.985107421875, -7.6024169921875, -7.2197265625, -6.8370361328125, -6.454345703125, -6.0716552734375, -5.68896484375, -5.3062744140625, -4.923583984375, -4.5408935546875, -4.158203125, -3.7755126953125, -3.392822265625, -3.0101318359375, -2.62744140625, -2.2447509765625, -1.862060546875, -1.4793701171875, -1.0966796875, -0.7139892578125, -0.331298828125, 0.0513916015625, 0.43408203125, 0.8167724609375, 1.199462890625, 1.5821533203125, 1.96484375, 2.3475341796875, 2.730224609375, 3.1129150390625, 3.49560546875, 3.8782958984375, 4.260986328125, 4.6436767578125, 5.0263671875, 5.4090576171875, 5.791748046875, 6.1744384765625, 6.55712890625, 6.9398193359375, 7.322509765625, 7.7052001953125, 8.087890625, 8.4705810546875, 8.853271484375, 9.2359619140625, 9.61865234375, 10.0013427734375, 10.384033203125, 10.7667236328125, 11.1494140625, 11.5321044921875, 11.914794921875, 12.2974853515625, 12.68017578125, 13.0628662109375, 13.445556640625, 13.8282470703125, 14.2109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 13.0, 12.0, 20.0, 48.0, 114.0, 262.0, 291.0, 114.0, 54.0, 30.0, 18.0, 6.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003963470458984375, -0.0038565993309020996, -0.0037497282028198242, -0.003642857074737549, -0.0035359859466552734, -0.003429114818572998, -0.0033222436904907227, -0.0032153725624084473, -0.003108501434326172, -0.0030016303062438965, -0.002894759178161621, -0.0027878880500793457, -0.0026810169219970703, -0.002574145793914795, -0.0024672746658325195, -0.002360403537750244, -0.0022535324096679688, -0.0021466612815856934, -0.002039790153503418, -0.0019329190254211426, -0.0018260478973388672, -0.0017191767692565918, -0.0016123056411743164, -0.001505434513092041, -0.0013985633850097656, -0.0012916922569274902, -0.0011848211288452148, -0.0010779500007629395, -0.0009710788726806641, -0.0008642077445983887, -0.0007573366165161133, -0.0006504654884338379, -0.0005435943603515625, -0.0004367232322692871, -0.0003298521041870117, -0.00022298097610473633, -0.00011610984802246094, -9.238719940185547e-06, 9.763240814208984e-05, 0.00020450353622436523, 0.0003113746643066406, 0.000418245792388916, 0.0005251169204711914, 0.0006319880485534668, 0.0007388591766357422, 0.0008457303047180176, 0.000952601432800293, 0.0010594725608825684, 0.0011663436889648438, 0.0012732148170471191, 0.0013800859451293945, 0.00148695707321167, 0.0015938282012939453, 0.0017006993293762207, 0.001807570457458496, 0.0019144415855407715, 0.002021312713623047, 0.0021281838417053223, 0.0022350549697875977, 0.002341926097869873, 0.0024487972259521484, 0.002555668354034424, 0.0026625394821166992, 0.0027694106101989746, 0.00287628173828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 18.0, 29.0, 50.0, 82.0, 164.0, 268.0, 651.0, 1603.0, 5396.0, 33723.0, 617344.0, 359321.0, 23113.0, 4306.0, 1334.0, 531.0, 282.0, 125.0, 67.0, 48.0, 25.0, 13.0, 13.0, 12.0, 5.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1749267578125, -8.857666015625, -8.5404052734375, -8.22314453125, -7.9058837890625, -7.588623046875, -7.2713623046875, -6.9541015625, -6.6368408203125, -6.319580078125, -6.0023193359375, -5.68505859375, -5.3677978515625, -5.050537109375, -4.7332763671875, -4.416015625, -4.0987548828125, -3.781494140625, -3.4642333984375, -3.14697265625, -2.8297119140625, -2.512451171875, -2.1951904296875, -1.8779296875, -1.5606689453125, -1.243408203125, -0.9261474609375, -0.60888671875, -0.2916259765625, 0.025634765625, 0.3428955078125, 0.66015625, 0.9774169921875, 1.294677734375, 1.6119384765625, 1.92919921875, 2.2464599609375, 2.563720703125, 2.8809814453125, 3.1982421875, 3.5155029296875, 3.832763671875, 4.1500244140625, 4.46728515625, 4.7845458984375, 5.101806640625, 5.4190673828125, 5.736328125, 6.0535888671875, 6.370849609375, 6.6881103515625, 7.00537109375, 7.3226318359375, 7.639892578125, 7.9571533203125, 8.2744140625, 8.5916748046875, 8.908935546875, 9.2261962890625, 9.54345703125, 9.8607177734375, 10.177978515625, 10.4952392578125, 10.8125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 5.0, 3.0, 4.0, 9.0, 12.0, 17.0, 19.0, 21.0, 29.0, 45.0, 68.0, 69.0, 85.0, 97.0, 87.0, 88.0, 85.0, 66.0, 55.0, 34.0, 30.0, 24.0, 14.0, 8.0, 5.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.9454345703125, -5.750244140625, -5.5550537109375, -5.35986328125, -5.1646728515625, -4.969482421875, -4.7742919921875, -4.5791015625, -4.3839111328125, -4.188720703125, -3.9935302734375, -3.79833984375, -3.6031494140625, -3.407958984375, -3.2127685546875, -3.017578125, -2.8223876953125, -2.627197265625, -2.4320068359375, -2.23681640625, -2.0416259765625, -1.846435546875, -1.6512451171875, -1.4560546875, -1.2608642578125, -1.065673828125, -0.8704833984375, -0.67529296875, -0.4801025390625, -0.284912109375, -0.0897216796875, 0.10546875, 0.3006591796875, 0.495849609375, 0.6910400390625, 0.88623046875, 1.0814208984375, 1.276611328125, 1.4718017578125, 1.6669921875, 1.8621826171875, 2.057373046875, 2.2525634765625, 2.44775390625, 2.6429443359375, 2.838134765625, 3.0333251953125, 3.228515625, 3.4237060546875, 3.618896484375, 3.8140869140625, 4.00927734375, 4.2044677734375, 4.399658203125, 4.5948486328125, 4.7900390625, 4.9852294921875, 5.180419921875, 5.3756103515625, 5.57080078125, 5.7659912109375, 5.961181640625, 6.1563720703125, 6.3515625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 8.0, 4.0, 7.0, 20.0, 37.0, 61.0, 95.0, 124.0, 175.0, 169.0, 114.0, 66.0, 39.0, 38.0, 12.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-131.46990966796875, -127.91560363769531, -124.3613052368164, -120.80699920654297, -117.25269317626953, -113.69839477539062, -110.14408874511719, -106.58978271484375, -103.03548431396484, -99.4811782836914, -95.9268798828125, -92.37257385253906, -88.81826782226562, -85.26396942138672, -81.70966339111328, -78.15536499023438, -74.60105895996094, -71.0467529296875, -67.4924545288086, -63.938148498535156, -60.383846282958984, -56.82954406738281, -53.275238037109375, -49.7209358215332, -46.1666259765625, -42.61232376098633, -39.05801773071289, -35.50371551513672, -31.949413299560547, -28.395109176635742, -24.840805053710938, -21.286502838134766, -17.732200622558594, -14.177897453308105, -10.623594284057617, -7.0692901611328125, -3.514986991882324, 0.03931617736816406, 3.5936203002929688, 7.147922515869141, 10.702226638793945, 14.256529808044434, 17.810832977294922, 21.365137100219727, 24.91944122314453, 28.473743438720703, 32.028045654296875, 35.58235168457031, 39.136653900146484, 42.690956115722656, 46.245262145996094, 49.799564361572266, 53.35386657714844, 56.908172607421875, 60.46247482299805, 64.01677703857422, 67.57108306884766, 71.1253890991211, 74.6796875, 78.23399353027344, 81.78829956054688, 85.34259796142578, 88.89690399169922, 92.45120239257812, 96.00550842285156]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 1.0, 5.0, 9.0, 6.0, 13.0, 12.0, 16.0, 13.0, 19.0, 24.0, 25.0, 31.0, 32.0, 35.0, 35.0, 49.0, 48.0, 30.0, 57.0, 63.0, 55.0, 50.0, 52.0, 43.0, 37.0, 36.0, 28.0, 17.0, 30.0, 16.0, 23.0, 16.0, 11.0, 11.0, 10.0, 12.0, 6.0, 4.0, 3.0, 4.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-77.99589538574219, -75.7314224243164, -73.46694946289062, -71.20246887207031, -68.93799591064453, -66.67352294921875, -64.40904235839844, -62.144569396972656, -59.880096435546875, -57.615623474121094, -55.35114669799805, -53.086669921875, -50.82219696044922, -48.55772399902344, -46.29324722290039, -44.028770446777344, -41.76429748535156, -39.49982452392578, -37.235347747802734, -34.97087097167969, -32.706398010253906, -30.441923141479492, -28.177448272705078, -25.912973403930664, -23.64849853515625, -21.384023666381836, -19.119548797607422, -16.855073928833008, -14.590599060058594, -12.32612419128418, -10.061649322509766, -7.797174453735352, -5.5326995849609375, -3.2682247161865234, -1.0037498474121094, 1.2607250213623047, 3.5251998901367188, 5.789674758911133, 8.054149627685547, 10.318624496459961, 12.583099365234375, 14.847574234008789, 17.112049102783203, 19.376523971557617, 21.64099884033203, 23.905473709106445, 26.16994857788086, 28.434423446655273, 30.698898315429688, 32.96337127685547, 35.227848052978516, 37.49232482910156, 39.756797790527344, 42.021270751953125, 44.28574752807617, 46.55022430419922, 48.814697265625, 51.07917022705078, 53.34364700317383, 55.608123779296875, 57.872596740722656, 60.13706970214844, 62.401546478271484, 64.66602325439453, 66.93049621582031]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 18.0, 14.0, 20.0, 34.0, 64.0, 92.0, 167.0, 352.0, 658.0, 1399.0, 3503.0, 9308.0, 30035.0, 134144.0, 1286222.0, 2404793.0, 255695.0, 46486.0, 13141.0, 4636.0, 1785.0, 829.0, 383.0, 180.0, 117.0, 67.0, 46.0, 31.0, 20.0, 9.0, 18.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.109375, -9.829833984375, -9.55029296875, -9.270751953125, -8.9912109375, -8.711669921875, -8.43212890625, -8.152587890625, -7.873046875, -7.593505859375, -7.31396484375, -7.034423828125, -6.7548828125, -6.475341796875, -6.19580078125, -5.916259765625, -5.63671875, -5.357177734375, -5.07763671875, -4.798095703125, -4.5185546875, -4.239013671875, -3.95947265625, -3.679931640625, -3.400390625, -3.120849609375, -2.84130859375, -2.561767578125, -2.2822265625, -2.002685546875, -1.72314453125, -1.443603515625, -1.1640625, -0.884521484375, -0.60498046875, -0.325439453125, -0.0458984375, 0.233642578125, 0.51318359375, 0.792724609375, 1.072265625, 1.351806640625, 1.63134765625, 1.910888671875, 2.1904296875, 2.469970703125, 2.74951171875, 3.029052734375, 3.30859375, 3.588134765625, 3.86767578125, 4.147216796875, 4.4267578125, 4.706298828125, 4.98583984375, 5.265380859375, 5.544921875, 5.824462890625, 6.10400390625, 6.383544921875, 6.6630859375, 6.942626953125, 7.22216796875, 7.501708984375, 7.78125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 6.0, 4.0, 7.0, 11.0, 8.0, 18.0, 27.0, 24.0, 28.0, 39.0, 54.0, 59.0, 57.0, 75.0, 74.0, 63.0, 77.0, 55.0, 64.0, 52.0, 40.0, 29.0, 29.0, 28.0, 21.0, 11.0, 11.0, 12.0, 9.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.561767578125, -4.37353515625, -4.185302734375, -3.9970703125, -3.808837890625, -3.62060546875, -3.432373046875, -3.244140625, -3.055908203125, -2.86767578125, -2.679443359375, -2.4912109375, -2.302978515625, -2.11474609375, -1.926513671875, -1.73828125, -1.550048828125, -1.36181640625, -1.173583984375, -0.9853515625, -0.797119140625, -0.60888671875, -0.420654296875, -0.232421875, -0.044189453125, 0.14404296875, 0.332275390625, 0.5205078125, 0.708740234375, 0.89697265625, 1.085205078125, 1.2734375, 1.461669921875, 1.64990234375, 1.838134765625, 2.0263671875, 2.214599609375, 2.40283203125, 2.591064453125, 2.779296875, 2.967529296875, 3.15576171875, 3.343994140625, 3.5322265625, 3.720458984375, 3.90869140625, 4.096923828125, 4.28515625, 4.473388671875, 4.66162109375, 4.849853515625, 5.0380859375, 5.226318359375, 5.41455078125, 5.602783203125, 5.791015625, 5.979248046875, 6.16748046875, 6.355712890625, 6.5439453125, 6.732177734375, 6.92041015625, 7.108642578125, 7.296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 6.0, 26.0, 26.0, 48.0, 62.0, 91.0, 150.0, 336.0, 656.0, 1671.0, 5573.0, 25266.0, 177935.0, 3167089.0, 741605.0, 58363.0, 10596.0, 2745.0, 950.0, 453.0, 228.0, 132.0, 79.0, 46.0, 37.0, 21.0, 18.0, 15.0, 12.0, 11.0, 13.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.75, -17.2918701171875, -16.833740234375, -16.3756103515625, -15.91748046875, -15.4593505859375, -15.001220703125, -14.5430908203125, -14.0849609375, -13.6268310546875, -13.168701171875, -12.7105712890625, -12.25244140625, -11.7943115234375, -11.336181640625, -10.8780517578125, -10.419921875, -9.9617919921875, -9.503662109375, -9.0455322265625, -8.58740234375, -8.1292724609375, -7.671142578125, -7.2130126953125, -6.7548828125, -6.2967529296875, -5.838623046875, -5.3804931640625, -4.92236328125, -4.4642333984375, -4.006103515625, -3.5479736328125, -3.08984375, -2.6317138671875, -2.173583984375, -1.7154541015625, -1.25732421875, -0.7991943359375, -0.341064453125, 0.1170654296875, 0.5751953125, 1.0333251953125, 1.491455078125, 1.9495849609375, 2.40771484375, 2.8658447265625, 3.323974609375, 3.7821044921875, 4.240234375, 4.6983642578125, 5.156494140625, 5.6146240234375, 6.07275390625, 6.5308837890625, 6.989013671875, 7.4471435546875, 7.9052734375, 8.3634033203125, 8.821533203125, 9.2796630859375, 9.73779296875, 10.1959228515625, 10.654052734375, 11.1121826171875, 11.5703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 17.0, 16.0, 32.0, 37.0, 68.0, 80.0, 143.0, 238.0, 393.0, 697.0, 800.0, 623.0, 328.0, 206.0, 111.0, 80.0, 48.0, 45.0, 25.0, 16.0, 16.0, 5.0, 8.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.9241943359375, -13.465576171875, -13.0069580078125, -12.54833984375, -12.0897216796875, -11.631103515625, -11.1724853515625, -10.7138671875, -10.2552490234375, -9.796630859375, -9.3380126953125, -8.87939453125, -8.4207763671875, -7.962158203125, -7.5035400390625, -7.044921875, -6.5863037109375, -6.127685546875, -5.6690673828125, -5.21044921875, -4.7518310546875, -4.293212890625, -3.8345947265625, -3.3759765625, -2.9173583984375, -2.458740234375, -2.0001220703125, -1.54150390625, -1.0828857421875, -0.624267578125, -0.1656494140625, 0.29296875, 0.7515869140625, 1.210205078125, 1.6688232421875, 2.12744140625, 2.5860595703125, 3.044677734375, 3.5032958984375, 3.9619140625, 4.4205322265625, 4.879150390625, 5.3377685546875, 5.79638671875, 6.2550048828125, 6.713623046875, 7.1722412109375, 7.630859375, 8.0894775390625, 8.548095703125, 9.0067138671875, 9.46533203125, 9.9239501953125, 10.382568359375, 10.8411865234375, 11.2998046875, 11.7584228515625, 12.217041015625, 12.6756591796875, 13.13427734375, 13.5928955078125, 14.051513671875, 14.5101318359375, 14.96875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 0.0, 4.0, 4.0, 12.0, 8.0, 17.0, 54.0, 97.0, 181.0, 196.0, 204.0, 121.0, 50.0, 25.0, 16.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.23287963867188, -143.41714477539062, -138.60140991210938, -133.7856903076172, -128.96995544433594, -124.15422058105469, -119.33848571777344, -114.52275848388672, -109.70703125, -104.89129638671875, -100.07556915283203, -95.25983428955078, -90.44410705566406, -85.62837219238281, -80.81263732910156, -75.99691009521484, -71.1811752319336, -66.36544036865234, -61.549713134765625, -56.733978271484375, -51.918251037597656, -47.102516174316406, -42.28678512573242, -37.47105407714844, -32.65532302856445, -27.83959197998047, -23.023860931396484, -18.208127975463867, -13.392396926879883, -8.576665878295898, -3.7609329223632812, 1.0547981262207031, 5.8705291748046875, 10.686260223388672, 15.501992225646973, 20.317724227905273, 25.133455276489258, 29.949186325073242, 34.76491928100586, 39.580650329589844, 44.39638137817383, 49.21211242675781, 54.0278434753418, 58.84357452392578, 63.65930938720703, 68.47503662109375, 73.290771484375, 78.10650634765625, 82.92223358154297, 87.73796844482422, 92.55369567871094, 97.36943054199219, 102.1851577758789, 107.00089263916016, 111.81661987304688, 116.63235473632812, 121.44808959960938, 126.26382446289062, 131.07955932617188, 135.89527893066406, 140.7110137939453, 145.52674865722656, 150.3424835205078, 155.158203125, 159.97393798828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 17.0, 8.0, 11.0, 16.0, 16.0, 21.0, 15.0, 20.0, 32.0, 32.0, 29.0, 45.0, 30.0, 37.0, 38.0, 49.0, 53.0, 47.0, 56.0, 42.0, 34.0, 46.0, 32.0, 35.0, 39.0, 28.0, 37.0, 20.0, 12.0, 22.0, 16.0, 15.0, 12.0, 8.0, 2.0, 4.0, 3.0, 8.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-58.22266387939453, -56.405364990234375, -54.588069915771484, -52.77077102661133, -50.95347213745117, -49.13617706298828, -47.318878173828125, -45.50157928466797, -43.68428039550781, -41.866981506347656, -40.049686431884766, -38.23238754272461, -36.41508865356445, -34.59779357910156, -32.780494689941406, -30.96319580078125, -29.14590072631836, -27.328603744506836, -25.51130485534668, -23.694007873535156, -21.876708984375, -20.059412002563477, -18.242115020751953, -16.424816131591797, -14.607519149780273, -12.790221214294434, -10.972923278808594, -9.15562629699707, -7.3383283615112305, -5.521030426025391, -3.703733444213867, -1.8864355087280273, -0.06914138793945312, 1.7481563091278076, 3.5654540061950684, 5.38275146484375, 7.20004940032959, 9.01734733581543, 10.834644317626953, 12.651942253112793, 14.469240188598633, 16.286537170410156, 18.103836059570312, 19.921133041381836, 21.73843002319336, 23.555728912353516, 25.37302589416504, 27.190322875976562, 29.00762176513672, 30.824918746948242, 32.642215728759766, 34.45951461791992, 36.27681350708008, 38.09410858154297, 39.911407470703125, 41.72870635986328, 43.54600524902344, 45.363304138183594, 47.180599212646484, 48.99789810180664, 50.8151969909668, 52.63249206542969, 54.449790954589844, 56.26708984375, 58.08438491821289]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 11.0, 9.0, 20.0, 24.0, 54.0, 82.0, 170.0, 290.0, 610.0, 1227.0, 2749.0, 7017.0, 19361.0, 56583.0, 170553.0, 420677.0, 244526.0, 80988.0, 27186.0, 9573.0, 3744.0, 1550.0, 722.0, 381.0, 185.0, 109.0, 65.0, 28.0, 33.0, 10.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6640625, -11.295654296875, -10.92724609375, -10.558837890625, -10.1904296875, -9.822021484375, -9.45361328125, -9.085205078125, -8.716796875, -8.348388671875, -7.97998046875, -7.611572265625, -7.2431640625, -6.874755859375, -6.50634765625, -6.137939453125, -5.76953125, -5.401123046875, -5.03271484375, -4.664306640625, -4.2958984375, -3.927490234375, -3.55908203125, -3.190673828125, -2.822265625, -2.453857421875, -2.08544921875, -1.717041015625, -1.3486328125, -0.980224609375, -0.61181640625, -0.243408203125, 0.125, 0.493408203125, 0.86181640625, 1.230224609375, 1.5986328125, 1.967041015625, 2.33544921875, 2.703857421875, 3.072265625, 3.440673828125, 3.80908203125, 4.177490234375, 4.5458984375, 4.914306640625, 5.28271484375, 5.651123046875, 6.01953125, 6.387939453125, 6.75634765625, 7.124755859375, 7.4931640625, 7.861572265625, 8.22998046875, 8.598388671875, 8.966796875, 9.335205078125, 9.70361328125, 10.072021484375, 10.4404296875, 10.808837890625, 11.17724609375, 11.545654296875, 11.9140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 10.0, 20.0, 21.0, 32.0, 27.0, 33.0, 46.0, 65.0, 64.0, 78.0, 65.0, 82.0, 62.0, 66.0, 60.0, 47.0, 58.0, 28.0, 27.0, 20.0, 15.0, 13.0, 13.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.125, -4.92987060546875, -4.7347412109375, -4.53961181640625, -4.344482421875, -4.14935302734375, -3.9542236328125, -3.75909423828125, -3.56396484375, -3.36883544921875, -3.1737060546875, -2.97857666015625, -2.783447265625, -2.58831787109375, -2.3931884765625, -2.19805908203125, -2.0029296875, -1.80780029296875, -1.6126708984375, -1.41754150390625, -1.222412109375, -1.02728271484375, -0.8321533203125, -0.63702392578125, -0.44189453125, -0.24676513671875, -0.0516357421875, 0.14349365234375, 0.338623046875, 0.53375244140625, 0.7288818359375, 0.92401123046875, 1.119140625, 1.31427001953125, 1.5093994140625, 1.70452880859375, 1.899658203125, 2.09478759765625, 2.2899169921875, 2.48504638671875, 2.68017578125, 2.87530517578125, 3.0704345703125, 3.26556396484375, 3.460693359375, 3.65582275390625, 3.8509521484375, 4.04608154296875, 4.2412109375, 4.43634033203125, 4.6314697265625, 4.82659912109375, 5.021728515625, 5.21685791015625, 5.4119873046875, 5.60711669921875, 5.80224609375, 5.99737548828125, 6.1925048828125, 6.38763427734375, 6.582763671875, 6.77789306640625, 6.9730224609375, 7.16815185546875, 7.36328125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 8.0, 9.0, 10.0, 18.0, 22.0, 21.0, 54.0, 64.0, 75.0, 117.0, 135.0, 223.0, 320.0, 470.0, 756.0, 1179.0, 2176.0, 5019.0, 20113.0, 142659.0, 725063.0, 121917.0, 17944.0, 4689.0, 2055.0, 1135.0, 726.0, 454.0, 329.0, 234.0, 151.0, 123.0, 88.0, 57.0, 36.0, 25.0, 24.0, 15.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.359375, -19.7509765625, -19.142578125, -18.5341796875, -17.92578125, -17.3173828125, -16.708984375, -16.1005859375, -15.4921875, -14.8837890625, -14.275390625, -13.6669921875, -13.05859375, -12.4501953125, -11.841796875, -11.2333984375, -10.625, -10.0166015625, -9.408203125, -8.7998046875, -8.19140625, -7.5830078125, -6.974609375, -6.3662109375, -5.7578125, -5.1494140625, -4.541015625, -3.9326171875, -3.32421875, -2.7158203125, -2.107421875, -1.4990234375, -0.890625, -0.2822265625, 0.326171875, 0.9345703125, 1.54296875, 2.1513671875, 2.759765625, 3.3681640625, 3.9765625, 4.5849609375, 5.193359375, 5.8017578125, 6.41015625, 7.0185546875, 7.626953125, 8.2353515625, 8.84375, 9.4521484375, 10.060546875, 10.6689453125, 11.27734375, 11.8857421875, 12.494140625, 13.1025390625, 13.7109375, 14.3193359375, 14.927734375, 15.5361328125, 16.14453125, 16.7529296875, 17.361328125, 17.9697265625, 18.578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 9.0, 6.0, 13.0, 17.0, 6.0, 29.0, 29.0, 25.0, 32.0, 25.0, 43.0, 40.0, 36.0, 53.0, 55.0, 45.0, 55.0, 51.0, 32.0, 47.0, 40.0, 37.0, 36.0, 25.0, 33.0, 24.0, 22.0, 14.0, 21.0, 14.0, 13.0, 11.0, 3.0, 5.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.585205078125, -16.98291015625, -16.380615234375, -15.7783203125, -15.176025390625, -14.57373046875, -13.971435546875, -13.369140625, -12.766845703125, -12.16455078125, -11.562255859375, -10.9599609375, -10.357666015625, -9.75537109375, -9.153076171875, -8.55078125, -7.948486328125, -7.34619140625, -6.743896484375, -6.1416015625, -5.539306640625, -4.93701171875, -4.334716796875, -3.732421875, -3.130126953125, -2.52783203125, -1.925537109375, -1.3232421875, -0.720947265625, -0.11865234375, 0.483642578125, 1.0859375, 1.688232421875, 2.29052734375, 2.892822265625, 3.4951171875, 4.097412109375, 4.69970703125, 5.302001953125, 5.904296875, 6.506591796875, 7.10888671875, 7.711181640625, 8.3134765625, 8.915771484375, 9.51806640625, 10.120361328125, 10.72265625, 11.324951171875, 11.92724609375, 12.529541015625, 13.1318359375, 13.734130859375, 14.33642578125, 14.938720703125, 15.541015625, 16.143310546875, 16.74560546875, 17.347900390625, 17.9501953125, 18.552490234375, 19.15478515625, 19.757080078125, 20.359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 12.0, 7.0, 5.0, 8.0, 11.0, 16.0, 21.0, 27.0, 30.0, 62.0, 101.0, 135.0, 298.0, 573.0, 1263.0, 3628.0, 13664.0, 76666.0, 673072.0, 234165.0, 33572.0, 7319.0, 2073.0, 847.0, 399.0, 188.0, 136.0, 78.0, 53.0, 36.0, 26.0, 16.0, 19.0, 8.0, 6.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.8717041015625, -5.680908203125, -5.4901123046875, -5.29931640625, -5.1085205078125, -4.917724609375, -4.7269287109375, -4.5361328125, -4.3453369140625, -4.154541015625, -3.9637451171875, -3.77294921875, -3.5821533203125, -3.391357421875, -3.2005615234375, -3.009765625, -2.8189697265625, -2.628173828125, -2.4373779296875, -2.24658203125, -2.0557861328125, -1.864990234375, -1.6741943359375, -1.4833984375, -1.2926025390625, -1.101806640625, -0.9110107421875, -0.72021484375, -0.5294189453125, -0.338623046875, -0.1478271484375, 0.04296875, 0.2337646484375, 0.424560546875, 0.6153564453125, 0.80615234375, 0.9969482421875, 1.187744140625, 1.3785400390625, 1.5693359375, 1.7601318359375, 1.950927734375, 2.1417236328125, 2.33251953125, 2.5233154296875, 2.714111328125, 2.9049072265625, 3.095703125, 3.2864990234375, 3.477294921875, 3.6680908203125, 3.85888671875, 4.0496826171875, 4.240478515625, 4.4312744140625, 4.6220703125, 4.8128662109375, 5.003662109375, 5.1944580078125, 5.38525390625, 5.5760498046875, 5.766845703125, 5.9576416015625, 6.1484375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 12.0, 15.0, 16.0, 28.0, 27.0, 37.0, 39.0, 65.0, 84.0, 125.0, 154.0, 98.0, 47.0, 55.0, 38.0, 32.0, 24.0, 19.0, 19.0, 10.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012280046939849854, -0.001182854175567627, -0.0011377036571502686, -0.0010925531387329102, -0.0010474026203155518, -0.0010022521018981934, -0.000957101583480835, -0.0009119510650634766, -0.0008668005466461182, -0.0008216500282287598, -0.0007764995098114014, -0.000731348991394043, -0.0006861984729766846, -0.0006410479545593262, -0.0005958974361419678, -0.0005507469177246094, -0.000505596399307251, -0.0004604458808898926, -0.0004152953624725342, -0.0003701448440551758, -0.0003249943256378174, -0.000279843807220459, -0.00023469328880310059, -0.0001895427703857422, -0.0001443922519683838, -9.924173355102539e-05, -5.409121513366699e-05, -8.940696716308594e-06, 3.6209821701049805e-05, 8.13603401184082e-05, 0.0001265108585357666, 0.000171661376953125, 0.0002168118953704834, 0.0002619624137878418, 0.0003071129322052002, 0.0003522634506225586, 0.000397413969039917, 0.0004425644874572754, 0.0004877150058746338, 0.0005328655242919922, 0.0005780160427093506, 0.000623166561126709, 0.0006683170795440674, 0.0007134675979614258, 0.0007586181163787842, 0.0008037686347961426, 0.000848919153213501, 0.0008940696716308594, 0.0009392201900482178, 0.0009843707084655762, 0.0010295212268829346, 0.001074671745300293, 0.0011198222637176514, 0.0011649727821350098, 0.0012101233005523682, 0.0012552738189697266, 0.001300424337387085, 0.0013455748558044434, 0.0013907253742218018, 0.0014358758926391602, 0.0014810264110565186, 0.001526176929473877, 0.0015713274478912354, 0.0016164779663085938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 11.0, 14.0, 22.0, 18.0, 26.0, 45.0, 86.0, 105.0, 186.0, 328.0, 530.0, 949.0, 2197.0, 5619.0, 21237.0, 155382.0, 734398.0, 102818.0, 16091.0, 4462.0, 1758.0, 900.0, 517.0, 299.0, 179.0, 127.0, 67.0, 64.0, 35.0, 30.0, 18.0, 12.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.48828125, -5.30780029296875, -5.1273193359375, -4.94683837890625, -4.766357421875, -4.58587646484375, -4.4053955078125, -4.22491455078125, -4.04443359375, -3.86395263671875, -3.6834716796875, -3.50299072265625, -3.322509765625, -3.14202880859375, -2.9615478515625, -2.78106689453125, -2.6005859375, -2.42010498046875, -2.2396240234375, -2.05914306640625, -1.878662109375, -1.69818115234375, -1.5177001953125, -1.33721923828125, -1.15673828125, -0.97625732421875, -0.7957763671875, -0.61529541015625, -0.434814453125, -0.25433349609375, -0.0738525390625, 0.10662841796875, 0.287109375, 0.46759033203125, 0.6480712890625, 0.82855224609375, 1.009033203125, 1.18951416015625, 1.3699951171875, 1.55047607421875, 1.73095703125, 1.91143798828125, 2.0919189453125, 2.27239990234375, 2.452880859375, 2.63336181640625, 2.8138427734375, 2.99432373046875, 3.1748046875, 3.35528564453125, 3.5357666015625, 3.71624755859375, 3.896728515625, 4.07720947265625, 4.2576904296875, 4.43817138671875, 4.61865234375, 4.79913330078125, 4.9796142578125, 5.16009521484375, 5.340576171875, 5.52105712890625, 5.7015380859375, 5.88201904296875, 6.0625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 1.0, 5.0, 3.0, 9.0, 8.0, 6.0, 2.0, 13.0, 14.0, 20.0, 21.0, 28.0, 34.0, 38.0, 41.0, 44.0, 63.0, 49.0, 62.0, 53.0, 52.0, 63.0, 52.0, 47.0, 42.0, 34.0, 24.0, 27.0, 32.0, 19.0, 24.0, 14.0, 5.0, 6.0, 5.0, 7.0, 3.0, 4.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.634765625, -3.519287109375, -3.40380859375, -3.288330078125, -3.1728515625, -3.057373046875, -2.94189453125, -2.826416015625, -2.7109375, -2.595458984375, -2.47998046875, -2.364501953125, -2.2490234375, -2.133544921875, -2.01806640625, -1.902587890625, -1.787109375, -1.671630859375, -1.55615234375, -1.440673828125, -1.3251953125, -1.209716796875, -1.09423828125, -0.978759765625, -0.86328125, -0.747802734375, -0.63232421875, -0.516845703125, -0.4013671875, -0.285888671875, -0.17041015625, -0.054931640625, 0.060546875, 0.176025390625, 0.29150390625, 0.406982421875, 0.5224609375, 0.637939453125, 0.75341796875, 0.868896484375, 0.984375, 1.099853515625, 1.21533203125, 1.330810546875, 1.4462890625, 1.561767578125, 1.67724609375, 1.792724609375, 1.908203125, 2.023681640625, 2.13916015625, 2.254638671875, 2.3701171875, 2.485595703125, 2.60107421875, 2.716552734375, 2.83203125, 2.947509765625, 3.06298828125, 3.178466796875, 3.2939453125, 3.409423828125, 3.52490234375, 3.640380859375, 3.755859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 9.0, 25.0, 51.0, 134.0, 243.0, 330.0, 123.0, 42.0, 21.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.59625244140625, -271.1712341308594, -264.7462158203125, -258.3211975097656, -251.89617919921875, -245.47116088867188, -239.046142578125, -232.62112426757812, -226.19610595703125, -219.77108764648438, -213.3460693359375, -206.92105102539062, -200.49603271484375, -194.07101440429688, -187.64599609375, -181.22097778320312, -174.79595947265625, -168.37094116210938, -161.9459228515625, -155.52090454101562, -149.09588623046875, -142.67086791992188, -136.245849609375, -129.82083129882812, -123.39579772949219, -116.97077941894531, -110.54576110839844, -104.12074279785156, -97.69572448730469, -91.27070617675781, -84.84568786621094, -78.42066955566406, -71.99565124511719, -65.57063293457031, -59.14561462402344, -52.72059631347656, -46.29557800292969, -39.87055587768555, -33.44553756713867, -27.020519256591797, -20.595500946044922, -14.170482635498047, -7.7454633712768555, -1.320444107055664, 5.104574203491211, 11.529594421386719, 17.954612731933594, 24.37963104248047, 30.804649353027344, 37.22966766357422, 43.654685974121094, 50.07970428466797, 56.504722595214844, 62.929744720458984, 69.35476684570312, 75.77978515625, 82.20480346679688, 88.62982177734375, 95.05484008789062, 101.4798583984375, 107.90487670898438, 114.32989501953125, 120.75491333007812, 127.179931640625, 133.60494995117188]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 8.0, 10.0, 12.0, 13.0, 18.0, 23.0, 18.0, 26.0, 28.0, 27.0, 41.0, 41.0, 46.0, 54.0, 69.0, 88.0, 87.0, 53.0, 49.0, 40.0, 32.0, 34.0, 40.0, 32.0, 22.0, 22.0, 17.0, 9.0, 6.0, 11.0, 6.0, 11.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.84745025634766, -80.99778747558594, -78.14812469482422, -75.2984619140625, -72.44879913330078, -69.59913635253906, -66.74946594238281, -63.89980697631836, -61.05014419555664, -58.20048141479492, -55.3508186340332, -52.50115203857422, -49.6514892578125, -46.80182647705078, -43.95216369628906, -41.102500915527344, -38.252838134765625, -35.403175354003906, -32.55351257324219, -29.703847885131836, -26.854185104370117, -24.0045223236084, -21.154857635498047, -18.305194854736328, -15.45553207397461, -12.60586929321289, -9.756205558776855, -6.90654182434082, -4.056879043579102, -1.2072162628173828, 1.6424484252929688, 4.4921112060546875, 7.341773986816406, 10.191436767578125, 13.04110050201416, 15.890764236450195, 18.740427017211914, 21.590089797973633, 24.439754486083984, 27.289417266845703, 30.139080047607422, 32.98874282836914, 35.83840560913086, 38.688072204589844, 41.53773498535156, 44.38739776611328, 47.237060546875, 50.08672332763672, 52.93638610839844, 55.786048889160156, 58.635711669921875, 61.485374450683594, 64.33503723144531, 67.18470001220703, 70.03436279296875, 72.884033203125, 75.73368835449219, 78.5833511352539, 81.43301391601562, 84.28267669677734, 87.13233947753906, 89.98200225830078, 92.8316650390625, 95.68133544921875, 98.53099822998047]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 7.0, 12.0, 26.0, 40.0, 83.0, 149.0, 323.0, 742.0, 1787.0, 4393.0, 12485.0, 40840.0, 222417.0, 2410718.0, 1336251.0, 123819.0, 26695.0, 8242.0, 3046.0, 1151.0, 520.0, 205.0, 129.0, 68.0, 41.0, 21.0, 18.0, 16.0, 16.0, 6.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.69140625, -5.43096923828125, -5.1705322265625, -4.91009521484375, -4.649658203125, -4.38922119140625, -4.1287841796875, -3.86834716796875, -3.60791015625, -3.34747314453125, -3.0870361328125, -2.82659912109375, -2.566162109375, -2.30572509765625, -2.0452880859375, -1.78485107421875, -1.5244140625, -1.26397705078125, -1.0035400390625, -0.74310302734375, -0.482666015625, -0.22222900390625, 0.0382080078125, 0.29864501953125, 0.55908203125, 0.81951904296875, 1.0799560546875, 1.34039306640625, 1.600830078125, 1.86126708984375, 2.1217041015625, 2.38214111328125, 2.642578125, 2.90301513671875, 3.1634521484375, 3.42388916015625, 3.684326171875, 3.94476318359375, 4.2052001953125, 4.46563720703125, 4.72607421875, 4.98651123046875, 5.2469482421875, 5.50738525390625, 5.767822265625, 6.02825927734375, 6.2886962890625, 6.54913330078125, 6.8095703125, 7.07000732421875, 7.3304443359375, 7.59088134765625, 7.851318359375, 8.11175537109375, 8.3721923828125, 8.63262939453125, 8.89306640625, 9.15350341796875, 9.4139404296875, 9.67437744140625, 9.934814453125, 10.19525146484375, 10.4556884765625, 10.71612548828125, 10.9765625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 4.0, 7.0, 4.0, 20.0, 26.0, 38.0, 39.0, 89.0, 81.0, 86.0, 113.0, 85.0, 107.0, 67.0, 92.0, 44.0, 36.0, 23.0, 16.0, 15.0, 3.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.29296875, -4.00933837890625, -3.7257080078125, -3.44207763671875, -3.158447265625, -2.87481689453125, -2.5911865234375, -2.30755615234375, -2.02392578125, -1.74029541015625, -1.4566650390625, -1.17303466796875, -0.889404296875, -0.60577392578125, -0.3221435546875, -0.03851318359375, 0.2451171875, 0.52874755859375, 0.8123779296875, 1.09600830078125, 1.379638671875, 1.66326904296875, 1.9468994140625, 2.23052978515625, 2.51416015625, 2.79779052734375, 3.0814208984375, 3.36505126953125, 3.648681640625, 3.93231201171875, 4.2159423828125, 4.49957275390625, 4.783203125, 5.06683349609375, 5.3504638671875, 5.63409423828125, 5.917724609375, 6.20135498046875, 6.4849853515625, 6.76861572265625, 7.05224609375, 7.33587646484375, 7.6195068359375, 7.90313720703125, 8.186767578125, 8.47039794921875, 8.7540283203125, 9.03765869140625, 9.3212890625, 9.60491943359375, 9.8885498046875, 10.17218017578125, 10.455810546875, 10.73944091796875, 11.0230712890625, 11.30670166015625, 11.59033203125, 11.87396240234375, 12.1575927734375, 12.44122314453125, 12.724853515625, 13.00848388671875, 13.2921142578125, 13.57574462890625, 13.859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 2.0, 8.0, 8.0, 17.0, 12.0, 22.0, 37.0, 43.0, 66.0, 99.0, 152.0, 263.0, 380.0, 676.0, 1296.0, 2921.0, 7210.0, 22074.0, 88521.0, 820008.0, 2937293.0, 247634.0, 44517.0, 12480.0, 4422.0, 1795.0, 899.0, 482.0, 303.0, 187.0, 124.0, 79.0, 53.0, 54.0, 38.0, 18.0, 23.0, 12.0, 11.0, 7.0, 8.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.6640625, -10.343505859375, -10.02294921875, -9.702392578125, -9.3818359375, -9.061279296875, -8.74072265625, -8.420166015625, -8.099609375, -7.779052734375, -7.45849609375, -7.137939453125, -6.8173828125, -6.496826171875, -6.17626953125, -5.855712890625, -5.53515625, -5.214599609375, -4.89404296875, -4.573486328125, -4.2529296875, -3.932373046875, -3.61181640625, -3.291259765625, -2.970703125, -2.650146484375, -2.32958984375, -2.009033203125, -1.6884765625, -1.367919921875, -1.04736328125, -0.726806640625, -0.40625, -0.085693359375, 0.23486328125, 0.555419921875, 0.8759765625, 1.196533203125, 1.51708984375, 1.837646484375, 2.158203125, 2.478759765625, 2.79931640625, 3.119873046875, 3.4404296875, 3.760986328125, 4.08154296875, 4.402099609375, 4.72265625, 5.043212890625, 5.36376953125, 5.684326171875, 6.0048828125, 6.325439453125, 6.64599609375, 6.966552734375, 7.287109375, 7.607666015625, 7.92822265625, 8.248779296875, 8.5693359375, 8.889892578125, 9.21044921875, 9.531005859375, 9.8515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 4.0, 9.0, 11.0, 10.0, 22.0, 36.0, 39.0, 59.0, 81.0, 134.0, 203.0, 327.0, 561.0, 784.0, 631.0, 415.0, 230.0, 157.0, 105.0, 67.0, 50.0, 32.0, 29.0, 12.0, 15.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.9473876953125, -10.590087890625, -10.2327880859375, -9.87548828125, -9.5181884765625, -9.160888671875, -8.8035888671875, -8.4462890625, -8.0889892578125, -7.731689453125, -7.3743896484375, -7.01708984375, -6.6597900390625, -6.302490234375, -5.9451904296875, -5.587890625, -5.2305908203125, -4.873291015625, -4.5159912109375, -4.15869140625, -3.8013916015625, -3.444091796875, -3.0867919921875, -2.7294921875, -2.3721923828125, -2.014892578125, -1.6575927734375, -1.30029296875, -0.9429931640625, -0.585693359375, -0.2283935546875, 0.12890625, 0.4862060546875, 0.843505859375, 1.2008056640625, 1.55810546875, 1.9154052734375, 2.272705078125, 2.6300048828125, 2.9873046875, 3.3446044921875, 3.701904296875, 4.0592041015625, 4.41650390625, 4.7738037109375, 5.131103515625, 5.4884033203125, 5.845703125, 6.2030029296875, 6.560302734375, 6.9176025390625, 7.27490234375, 7.6322021484375, 7.989501953125, 8.3468017578125, 8.7041015625, 9.0614013671875, 9.418701171875, 9.7760009765625, 10.13330078125, 10.4906005859375, 10.847900390625, 11.2052001953125, 11.5625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 7.0, 7.0, 33.0, 95.0, 242.0, 296.0, 195.0, 83.0, 24.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.0605163574219, -269.6875305175781, -263.3145751953125, -256.94158935546875, -250.56863403320312, -244.19564819335938, -237.8226776123047, -231.44970703125, -225.0767364501953, -218.70376586914062, -212.33079528808594, -205.95782470703125, -199.5848388671875, -193.2118682861328, -186.83889770507812, -180.46592712402344, -174.09295654296875, -167.71998596191406, -161.34701538085938, -154.9740447998047, -148.60107421875, -142.22808837890625, -135.85511779785156, -129.48214721679688, -123.10917663574219, -116.7362060546875, -110.36323547363281, -103.9902572631836, -97.6172866821289, -91.24431610107422, -84.871337890625, -78.49836730957031, -72.12541198730469, -65.75244140625, -59.37946701049805, -53.006492614746094, -46.633522033691406, -40.26055145263672, -33.887577056884766, -27.514602661132812, -21.141632080078125, -14.768659591674805, -8.395687103271484, -2.022714614868164, 4.350257873535156, 10.723230361938477, 17.096202850341797, 23.46917724609375, 29.842147827148438, 36.215118408203125, 42.58809280395508, 48.96106719970703, 55.33403778076172, 61.707008361816406, 68.07998657226562, 74.45295715332031, 80.825927734375, 87.19889831542969, 93.57186889648438, 99.9448471069336, 106.31781768798828, 112.69078826904297, 119.06376647949219, 125.43673706054688, 131.80970764160156]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 8.0, 1.0, 8.0, 7.0, 17.0, 25.0, 26.0, 37.0, 49.0, 50.0, 70.0, 74.0, 74.0, 83.0, 85.0, 72.0, 68.0, 58.0, 41.0, 49.0, 27.0, 25.0, 13.0, 8.0, 13.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.61972045898438, -89.03205871582031, -86.44438934326172, -83.85671997070312, -81.26905822753906, -78.681396484375, -76.0937271118164, -73.50605773925781, -70.91839599609375, -68.33073425292969, -65.7430648803711, -63.155399322509766, -60.56773376464844, -57.98006820678711, -55.39240264892578, -52.80473709106445, -50.217071533203125, -47.6294059753418, -45.04174041748047, -42.45407485961914, -39.86640930175781, -37.278743743896484, -34.691078186035156, -32.10341262817383, -29.5157470703125, -26.928081512451172, -24.340415954589844, -21.752750396728516, -19.165084838867188, -16.57741928100586, -13.989753723144531, -11.402088165283203, -8.814422607421875, -6.226757049560547, -3.6390914916992188, -1.0514259338378906, 1.5362396240234375, 4.123905181884766, 6.711570739746094, 9.299236297607422, 11.88690185546875, 14.474567413330078, 17.062232971191406, 19.649898529052734, 22.237564086914062, 24.82522964477539, 27.41289520263672, 30.000560760498047, 32.588226318359375, 35.1758918762207, 37.76355743408203, 40.35122299194336, 42.93888854980469, 45.526554107666016, 48.114219665527344, 50.70188522338867, 53.28955078125, 55.87721633911133, 58.464881896972656, 61.052547454833984, 63.64021301269531, 66.22787475585938, 68.81554412841797, 71.40321350097656, 73.99087524414062]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 6.0, 9.0, 13.0, 20.0, 23.0, 69.0, 74.0, 125.0, 180.0, 300.0, 501.0, 844.0, 1512.0, 2784.0, 5326.0, 10355.0, 22368.0, 50700.0, 125306.0, 320853.0, 301747.0, 116251.0, 47261.0, 20911.0, 9945.0, 5023.0, 2588.0, 1472.0, 799.0, 465.0, 267.0, 159.0, 99.0, 77.0, 47.0, 26.0, 18.0, 11.0, 8.0, 2.0, 3.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.8983154296875, -6.632568359375, -6.3668212890625, -6.10107421875, -5.8353271484375, -5.569580078125, -5.3038330078125, -5.0380859375, -4.7723388671875, -4.506591796875, -4.2408447265625, -3.97509765625, -3.7093505859375, -3.443603515625, -3.1778564453125, -2.912109375, -2.6463623046875, -2.380615234375, -2.1148681640625, -1.84912109375, -1.5833740234375, -1.317626953125, -1.0518798828125, -0.7861328125, -0.5203857421875, -0.254638671875, 0.0111083984375, 0.27685546875, 0.5426025390625, 0.808349609375, 1.0740966796875, 1.33984375, 1.6055908203125, 1.871337890625, 2.1370849609375, 2.40283203125, 2.6685791015625, 2.934326171875, 3.2000732421875, 3.4658203125, 3.7315673828125, 3.997314453125, 4.2630615234375, 4.52880859375, 4.7945556640625, 5.060302734375, 5.3260498046875, 5.591796875, 5.8575439453125, 6.123291015625, 6.3890380859375, 6.65478515625, 6.9205322265625, 7.186279296875, 7.4520263671875, 7.7177734375, 7.9835205078125, 8.249267578125, 8.5150146484375, 8.78076171875, 9.0465087890625, 9.312255859375, 9.5780029296875, 9.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 6.0, 9.0, 10.0, 16.0, 18.0, 22.0, 26.0, 25.0, 47.0, 53.0, 48.0, 48.0, 64.0, 74.0, 57.0, 61.0, 49.0, 53.0, 63.0, 49.0, 44.0, 36.0, 30.0, 15.0, 14.0, 17.0, 12.0, 10.0, 6.0, 4.0, 7.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.57421875, -4.3885498046875, -4.202880859375, -4.0172119140625, -3.83154296875, -3.6458740234375, -3.460205078125, -3.2745361328125, -3.0888671875, -2.9031982421875, -2.717529296875, -2.5318603515625, -2.34619140625, -2.1605224609375, -1.974853515625, -1.7891845703125, -1.603515625, -1.4178466796875, -1.232177734375, -1.0465087890625, -0.86083984375, -0.6751708984375, -0.489501953125, -0.3038330078125, -0.1181640625, 0.0675048828125, 0.253173828125, 0.4388427734375, 0.62451171875, 0.8101806640625, 0.995849609375, 1.1815185546875, 1.3671875, 1.5528564453125, 1.738525390625, 1.9241943359375, 2.10986328125, 2.2955322265625, 2.481201171875, 2.6668701171875, 2.8525390625, 3.0382080078125, 3.223876953125, 3.4095458984375, 3.59521484375, 3.7808837890625, 3.966552734375, 4.1522216796875, 4.337890625, 4.5235595703125, 4.709228515625, 4.8948974609375, 5.08056640625, 5.2662353515625, 5.451904296875, 5.6375732421875, 5.8232421875, 6.0089111328125, 6.194580078125, 6.3802490234375, 6.56591796875, 6.7515869140625, 6.937255859375, 7.1229248046875, 7.30859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 7.0, 2.0, 4.0, 5.0, 9.0, 16.0, 18.0, 22.0, 33.0, 48.0, 74.0, 91.0, 127.0, 170.0, 278.0, 402.0, 675.0, 1159.0, 2251.0, 5855.0, 23728.0, 181519.0, 730467.0, 79795.0, 13390.0, 3951.0, 1757.0, 946.0, 576.0, 354.0, 255.0, 168.0, 123.0, 79.0, 66.0, 37.0, 22.0, 24.0, 20.0, 12.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.328125, -19.718017578125, -19.10791015625, -18.497802734375, -17.8876953125, -17.277587890625, -16.66748046875, -16.057373046875, -15.447265625, -14.837158203125, -14.22705078125, -13.616943359375, -13.0068359375, -12.396728515625, -11.78662109375, -11.176513671875, -10.56640625, -9.956298828125, -9.34619140625, -8.736083984375, -8.1259765625, -7.515869140625, -6.90576171875, -6.295654296875, -5.685546875, -5.075439453125, -4.46533203125, -3.855224609375, -3.2451171875, -2.635009765625, -2.02490234375, -1.414794921875, -0.8046875, -0.194580078125, 0.41552734375, 1.025634765625, 1.6357421875, 2.245849609375, 2.85595703125, 3.466064453125, 4.076171875, 4.686279296875, 5.29638671875, 5.906494140625, 6.5166015625, 7.126708984375, 7.73681640625, 8.346923828125, 8.95703125, 9.567138671875, 10.17724609375, 10.787353515625, 11.3974609375, 12.007568359375, 12.61767578125, 13.227783203125, 13.837890625, 14.447998046875, 15.05810546875, 15.668212890625, 16.2783203125, 16.888427734375, 17.49853515625, 18.108642578125, 18.71875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 6.0, 10.0, 13.0, 9.0, 14.0, 23.0, 18.0, 17.0, 28.0, 34.0, 37.0, 45.0, 38.0, 49.0, 42.0, 52.0, 50.0, 77.0, 53.0, 54.0, 40.0, 51.0, 33.0, 37.0, 30.0, 25.0, 20.0, 21.0, 13.0, 14.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.390625, -16.782470703125, -16.17431640625, -15.566162109375, -14.9580078125, -14.349853515625, -13.74169921875, -13.133544921875, -12.525390625, -11.917236328125, -11.30908203125, -10.700927734375, -10.0927734375, -9.484619140625, -8.87646484375, -8.268310546875, -7.66015625, -7.052001953125, -6.44384765625, -5.835693359375, -5.2275390625, -4.619384765625, -4.01123046875, -3.403076171875, -2.794921875, -2.186767578125, -1.57861328125, -0.970458984375, -0.3623046875, 0.245849609375, 0.85400390625, 1.462158203125, 2.0703125, 2.678466796875, 3.28662109375, 3.894775390625, 4.5029296875, 5.111083984375, 5.71923828125, 6.327392578125, 6.935546875, 7.543701171875, 8.15185546875, 8.760009765625, 9.3681640625, 9.976318359375, 10.58447265625, 11.192626953125, 11.80078125, 12.408935546875, 13.01708984375, 13.625244140625, 14.2333984375, 14.841552734375, 15.44970703125, 16.057861328125, 16.666015625, 17.274169921875, 17.88232421875, 18.490478515625, 19.0986328125, 19.706787109375, 20.31494140625, 20.923095703125, 21.53125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 4.0, 10.0, 14.0, 25.0, 29.0, 49.0, 68.0, 106.0, 181.0, 264.0, 415.0, 742.0, 1317.0, 2693.0, 6693.0, 29652.0, 335434.0, 618651.0, 37633.0, 8033.0, 3023.0, 1451.0, 775.0, 475.0, 296.0, 163.0, 122.0, 70.0, 40.0, 32.0, 19.0, 17.0, 15.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.49432373046875, -5.2659912109375, -5.03765869140625, -4.809326171875, -4.58099365234375, -4.3526611328125, -4.12432861328125, -3.89599609375, -3.66766357421875, -3.4393310546875, -3.21099853515625, -2.982666015625, -2.75433349609375, -2.5260009765625, -2.29766845703125, -2.0693359375, -1.84100341796875, -1.6126708984375, -1.38433837890625, -1.156005859375, -0.92767333984375, -0.6993408203125, -0.47100830078125, -0.24267578125, -0.01434326171875, 0.2139892578125, 0.44232177734375, 0.670654296875, 0.89898681640625, 1.1273193359375, 1.35565185546875, 1.583984375, 1.81231689453125, 2.0406494140625, 2.26898193359375, 2.497314453125, 2.72564697265625, 2.9539794921875, 3.18231201171875, 3.41064453125, 3.63897705078125, 3.8673095703125, 4.09564208984375, 4.323974609375, 4.55230712890625, 4.7806396484375, 5.00897216796875, 5.2373046875, 5.46563720703125, 5.6939697265625, 5.92230224609375, 6.150634765625, 6.37896728515625, 6.6072998046875, 6.83563232421875, 7.06396484375, 7.29229736328125, 7.5206298828125, 7.74896240234375, 7.977294921875, 8.20562744140625, 8.4339599609375, 8.66229248046875, 8.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 14.0, 35.0, 63.0, 198.0, 456.0, 125.0, 44.0, 26.0, 16.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005268096923828125, -0.005105435848236084, -0.004942774772644043, -0.004780113697052002, -0.004617452621459961, -0.00445479154586792, -0.004292130470275879, -0.004129469394683838, -0.003966808319091797, -0.003804147243499756, -0.003641486167907715, -0.003478825092315674, -0.003316164016723633, -0.003153502941131592, -0.0029908418655395508, -0.0028281807899475098, -0.0026655197143554688, -0.0025028586387634277, -0.0023401975631713867, -0.0021775364875793457, -0.0020148754119873047, -0.0018522143363952637, -0.0016895532608032227, -0.0015268921852111816, -0.0013642311096191406, -0.0012015700340270996, -0.0010389089584350586, -0.0008762478828430176, -0.0007135868072509766, -0.0005509257316589355, -0.00038826465606689453, -0.00022560358047485352, -6.29425048828125e-05, 9.971857070922852e-05, 0.00026237964630126953, 0.00042504072189331055, 0.0005877017974853516, 0.0007503628730773926, 0.0009130239486694336, 0.0010756850242614746, 0.0012383460998535156, 0.0014010071754455566, 0.0015636682510375977, 0.0017263293266296387, 0.0018889904022216797, 0.0020516514778137207, 0.0022143125534057617, 0.0023769736289978027, 0.0025396347045898438, 0.0027022957801818848, 0.0028649568557739258, 0.003027617931365967, 0.003190279006958008, 0.003352940082550049, 0.00351560115814209, 0.003678262233734131, 0.003840923309326172, 0.004003584384918213, 0.004166245460510254, 0.004328906536102295, 0.004491567611694336, 0.004654228687286377, 0.004816889762878418, 0.004979550838470459, 0.0051422119140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 11.0, 29.0, 47.0, 76.0, 137.0, 306.0, 787.0, 2554.0, 16868.0, 936504.0, 83914.0, 5144.0, 1257.0, 467.0, 179.0, 93.0, 53.0, 36.0, 23.0, 19.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.4375, -17.94873046875, -17.4599609375, -16.97119140625, -16.482421875, -15.99365234375, -15.5048828125, -15.01611328125, -14.52734375, -14.03857421875, -13.5498046875, -13.06103515625, -12.572265625, -12.08349609375, -11.5947265625, -11.10595703125, -10.6171875, -10.12841796875, -9.6396484375, -9.15087890625, -8.662109375, -8.17333984375, -7.6845703125, -7.19580078125, -6.70703125, -6.21826171875, -5.7294921875, -5.24072265625, -4.751953125, -4.26318359375, -3.7744140625, -3.28564453125, -2.796875, -2.30810546875, -1.8193359375, -1.33056640625, -0.841796875, -0.35302734375, 0.1357421875, 0.62451171875, 1.11328125, 1.60205078125, 2.0908203125, 2.57958984375, 3.068359375, 3.55712890625, 4.0458984375, 4.53466796875, 5.0234375, 5.51220703125, 6.0009765625, 6.48974609375, 6.978515625, 7.46728515625, 7.9560546875, 8.44482421875, 8.93359375, 9.42236328125, 9.9111328125, 10.39990234375, 10.888671875, 11.37744140625, 11.8662109375, 12.35498046875, 12.84375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 6.0, 14.0, 20.0, 31.0, 78.0, 138.0, 194.0, 210.0, 139.0, 64.0, 37.0, 23.0, 9.0, 12.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3359375, -11.0296630859375, -10.723388671875, -10.4171142578125, -10.11083984375, -9.8045654296875, -9.498291015625, -9.1920166015625, -8.8857421875, -8.5794677734375, -8.273193359375, -7.9669189453125, -7.66064453125, -7.3543701171875, -7.048095703125, -6.7418212890625, -6.435546875, -6.1292724609375, -5.822998046875, -5.5167236328125, -5.21044921875, -4.9041748046875, -4.597900390625, -4.2916259765625, -3.9853515625, -3.6790771484375, -3.372802734375, -3.0665283203125, -2.76025390625, -2.4539794921875, -2.147705078125, -1.8414306640625, -1.53515625, -1.2288818359375, -0.922607421875, -0.6163330078125, -0.31005859375, -0.0037841796875, 0.302490234375, 0.6087646484375, 0.9150390625, 1.2213134765625, 1.527587890625, 1.8338623046875, 2.14013671875, 2.4464111328125, 2.752685546875, 3.0589599609375, 3.365234375, 3.6715087890625, 3.977783203125, 4.2840576171875, 4.59033203125, 4.8966064453125, 5.202880859375, 5.5091552734375, 5.8154296875, 6.1217041015625, 6.427978515625, 6.7342529296875, 7.04052734375, 7.3468017578125, 7.653076171875, 7.9593505859375, 8.265625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 15.0, 37.0, 72.0, 157.0, 264.0, 204.0, 117.0, 56.0, 31.0, 17.0, 8.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.45606994628906, -123.65691375732422, -118.8577651977539, -114.05860900878906, -109.25946044921875, -104.4603042602539, -99.66114807128906, -94.86199951171875, -90.0628433227539, -85.26368713378906, -80.46453857421875, -75.6653823852539, -70.86622619628906, -66.06707763671875, -61.267921447753906, -56.46876907348633, -51.66961669921875, -46.87046432495117, -42.071311950683594, -37.27215576171875, -32.47300338745117, -27.673851013183594, -22.874696731567383, -18.075542449951172, -13.276390075683594, -8.4772367477417, -3.6780834197998047, 1.1210699081420898, 5.920223236083984, 10.719375610351562, 15.518529891967773, 20.317684173583984, 25.1168212890625, 29.915973663330078, 34.715126037597656, 39.5142822265625, 44.31343460083008, 49.112586975097656, 53.9117431640625, 58.71089553833008, 63.510047912597656, 68.3092041015625, 73.10835266113281, 77.90750885009766, 82.7066650390625, 87.50581359863281, 92.30496978759766, 97.1041259765625, 101.90327453613281, 106.70243072509766, 111.50157928466797, 116.30073547363281, 121.09988403320312, 125.89904022216797, 130.6981964111328, 135.49734497070312, 140.2965087890625, 145.0956573486328, 149.8948211669922, 154.6939697265625, 159.4931182861328, 164.29226684570312, 169.0914306640625, 173.8905792236328, 178.68972778320312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 13.0, 5.0, 11.0, 9.0, 11.0, 12.0, 11.0, 19.0, 21.0, 14.0, 25.0, 19.0, 20.0, 24.0, 32.0, 42.0, 55.0, 59.0, 65.0, 66.0, 58.0, 51.0, 41.0, 26.0, 28.0, 37.0, 21.0, 19.0, 24.0, 21.0, 14.0, 15.0, 21.0, 15.0, 13.0, 6.0, 5.0, 7.0, 13.0, 10.0, 0.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-62.65190887451172, -60.691123962402344, -58.730342864990234, -56.76955795288086, -54.80877685546875, -52.847991943359375, -50.88720703125, -48.926422119140625, -46.965641021728516, -45.00485610961914, -43.04407501220703, -41.083290100097656, -39.12250518798828, -37.16172409057617, -35.2009391784668, -33.24015808105469, -31.279373168945312, -29.31859016418457, -27.357807159423828, -25.397022247314453, -23.43623924255371, -21.47545623779297, -19.514671325683594, -17.55388832092285, -15.59310531616211, -13.632322311401367, -11.671538352966309, -9.71075439453125, -7.749971389770508, -5.789188385009766, -3.828404426574707, -1.8676204681396484, 0.09316253662109375, 2.053946018218994, 4.0147294998168945, 5.975512981414795, 7.936296463012695, 9.897079467773438, 11.857863426208496, 13.818647384643555, 15.779430389404297, 17.74021339416504, 19.70099639892578, 21.661781311035156, 23.6225643157959, 25.58334732055664, 27.544132232666016, 29.504915237426758, 31.4656982421875, 33.426483154296875, 35.387264251708984, 37.34804916381836, 39.30883026123047, 41.269615173339844, 43.23040008544922, 45.191184997558594, 47.1519660949707, 49.11275100708008, 51.07353210449219, 53.03431701660156, 54.99510192871094, 56.95588302612305, 58.91666793823242, 60.87744903564453, 62.838233947753906]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 4.0, 5.0, 12.0, 33.0, 38.0, 59.0, 98.0, 154.0, 242.0, 396.0, 598.0, 1149.0, 2162.0, 4373.0, 10423.0, 31826.0, 173013.0, 1872332.0, 1873943.0, 173458.0, 30872.0, 10036.0, 4199.0, 2023.0, 1079.0, 671.0, 416.0, 234.0, 141.0, 85.0, 61.0, 37.0, 26.0, 21.0, 16.0, 15.0, 8.0, 3.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.65338134765625, -6.4239501953125, -6.19451904296875, -5.965087890625, -5.73565673828125, -5.5062255859375, -5.27679443359375, -5.04736328125, -4.81793212890625, -4.5885009765625, -4.35906982421875, -4.129638671875, -3.90020751953125, -3.6707763671875, -3.44134521484375, -3.2119140625, -2.98248291015625, -2.7530517578125, -2.52362060546875, -2.294189453125, -2.06475830078125, -1.8353271484375, -1.60589599609375, -1.37646484375, -1.14703369140625, -0.9176025390625, -0.68817138671875, -0.458740234375, -0.22930908203125, 0.0001220703125, 0.22955322265625, 0.458984375, 0.68841552734375, 0.9178466796875, 1.14727783203125, 1.376708984375, 1.60614013671875, 1.8355712890625, 2.06500244140625, 2.29443359375, 2.52386474609375, 2.7532958984375, 2.98272705078125, 3.212158203125, 3.44158935546875, 3.6710205078125, 3.90045166015625, 4.1298828125, 4.35931396484375, 4.5887451171875, 4.81817626953125, 5.047607421875, 5.27703857421875, 5.5064697265625, 5.73590087890625, 5.96533203125, 6.19476318359375, 6.4241943359375, 6.65362548828125, 6.883056640625, 7.11248779296875, 7.3419189453125, 7.57135009765625, 7.80078125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 4.0, 9.0, 12.0, 15.0, 14.0, 20.0, 28.0, 33.0, 30.0, 39.0, 37.0, 50.0, 69.0, 72.0, 62.0, 59.0, 52.0, 57.0, 55.0, 61.0, 34.0, 41.0, 42.0, 23.0, 20.0, 13.0, 10.0, 14.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.626953125, -3.456695556640625, -3.28643798828125, -3.116180419921875, -2.9459228515625, -2.775665283203125, -2.60540771484375, -2.435150146484375, -2.264892578125, -2.094635009765625, -1.92437744140625, -1.754119873046875, -1.5838623046875, -1.413604736328125, -1.24334716796875, -1.073089599609375, -0.90283203125, -0.732574462890625, -0.56231689453125, -0.392059326171875, -0.2218017578125, -0.051544189453125, 0.11871337890625, 0.288970947265625, 0.459228515625, 0.629486083984375, 0.79974365234375, 0.970001220703125, 1.1402587890625, 1.310516357421875, 1.48077392578125, 1.651031494140625, 1.8212890625, 1.991546630859375, 2.16180419921875, 2.332061767578125, 2.5023193359375, 2.672576904296875, 2.84283447265625, 3.013092041015625, 3.183349609375, 3.353607177734375, 3.52386474609375, 3.694122314453125, 3.8643798828125, 4.034637451171875, 4.20489501953125, 4.375152587890625, 4.54541015625, 4.715667724609375, 4.88592529296875, 5.056182861328125, 5.2264404296875, 5.396697998046875, 5.56695556640625, 5.737213134765625, 5.907470703125, 6.077728271484375, 6.24798583984375, 6.418243408203125, 6.5885009765625, 6.758758544921875, 6.92901611328125, 7.099273681640625, 7.26953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 2.0, 6.0, 9.0, 17.0, 20.0, 27.0, 49.0, 57.0, 91.0, 97.0, 152.0, 265.0, 419.0, 744.0, 1509.0, 3921.0, 14466.0, 97647.0, 3298375.0, 720601.0, 42021.0, 8362.0, 2613.0, 1165.0, 579.0, 339.0, 216.0, 159.0, 92.0, 75.0, 48.0, 38.0, 27.0, 23.0, 12.0, 7.0, 7.0, 3.0, 6.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.9296875, -13.477294921875, -13.02490234375, -12.572509765625, -12.1201171875, -11.667724609375, -11.21533203125, -10.762939453125, -10.310546875, -9.858154296875, -9.40576171875, -8.953369140625, -8.5009765625, -8.048583984375, -7.59619140625, -7.143798828125, -6.69140625, -6.239013671875, -5.78662109375, -5.334228515625, -4.8818359375, -4.429443359375, -3.97705078125, -3.524658203125, -3.072265625, -2.619873046875, -2.16748046875, -1.715087890625, -1.2626953125, -0.810302734375, -0.35791015625, 0.094482421875, 0.546875, 0.999267578125, 1.45166015625, 1.904052734375, 2.3564453125, 2.808837890625, 3.26123046875, 3.713623046875, 4.166015625, 4.618408203125, 5.07080078125, 5.523193359375, 5.9755859375, 6.427978515625, 6.88037109375, 7.332763671875, 7.78515625, 8.237548828125, 8.68994140625, 9.142333984375, 9.5947265625, 10.047119140625, 10.49951171875, 10.951904296875, 11.404296875, 11.856689453125, 12.30908203125, 12.761474609375, 13.2138671875, 13.666259765625, 14.11865234375, 14.571044921875, 15.0234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 7.0, 10.0, 12.0, 22.0, 26.0, 56.0, 93.0, 216.0, 454.0, 1086.0, 1052.0, 503.0, 213.0, 108.0, 71.0, 47.0, 32.0, 22.0, 16.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.96875, -16.469970703125, -15.97119140625, -15.472412109375, -14.9736328125, -14.474853515625, -13.97607421875, -13.477294921875, -12.978515625, -12.479736328125, -11.98095703125, -11.482177734375, -10.9833984375, -10.484619140625, -9.98583984375, -9.487060546875, -8.98828125, -8.489501953125, -7.99072265625, -7.491943359375, -6.9931640625, -6.494384765625, -5.99560546875, -5.496826171875, -4.998046875, -4.499267578125, -4.00048828125, -3.501708984375, -3.0029296875, -2.504150390625, -2.00537109375, -1.506591796875, -1.0078125, -0.509033203125, -0.01025390625, 0.488525390625, 0.9873046875, 1.486083984375, 1.98486328125, 2.483642578125, 2.982421875, 3.481201171875, 3.97998046875, 4.478759765625, 4.9775390625, 5.476318359375, 5.97509765625, 6.473876953125, 6.97265625, 7.471435546875, 7.97021484375, 8.468994140625, 8.9677734375, 9.466552734375, 9.96533203125, 10.464111328125, 10.962890625, 11.461669921875, 11.96044921875, 12.459228515625, 12.9580078125, 13.456787109375, 13.95556640625, 14.454345703125, 14.953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 7.0, 14.0, 53.0, 133.0, 290.0, 295.0, 129.0, 35.0, 28.0, 6.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-260.38079833984375, -253.84283447265625, -247.30487060546875, -240.76690673828125, -234.2289581298828, -227.6909942626953, -221.1530303955078, -214.6150665283203, -208.07711791992188, -201.53915405273438, -195.00119018554688, -188.46322631835938, -181.92527770996094, -175.38731384277344, -168.84934997558594, -162.31138610839844, -155.77342224121094, -149.23545837402344, -142.69749450683594, -136.1595458984375, -129.62158203125, -123.0836181640625, -116.545654296875, -110.0076904296875, -103.46973419189453, -96.93177032470703, -90.39381408691406, -83.85585021972656, -77.31788635253906, -70.7799301147461, -64.2419662475586, -57.70400619506836, -51.166046142578125, -44.62808609008789, -38.090126037597656, -31.552162170410156, -25.014202117919922, -18.476242065429688, -11.938278198242188, -5.400318145751953, 1.1376419067382812, 7.675602912902832, 14.213563919067383, 20.75152587890625, 27.289485931396484, 33.82744598388672, 40.36540985107422, 46.90336990356445, 53.44132995605469, 59.97929000854492, 66.51725006103516, 73.05521392822266, 79.59317016601562, 86.13113403320312, 92.66909790039062, 99.20706176757812, 105.7450180053711, 112.2829818725586, 118.82093811035156, 125.35890197753906, 131.89686584472656, 138.434814453125, 144.9727783203125, 151.5107421875, 158.0487060546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 9.0, 9.0, 8.0, 13.0, 16.0, 28.0, 21.0, 43.0, 39.0, 37.0, 53.0, 56.0, 43.0, 58.0, 65.0, 74.0, 55.0, 59.0, 47.0, 54.0, 41.0, 37.0, 25.0, 25.0, 17.0, 11.0, 24.0, 8.0, 7.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.72247314453125, -62.74386978149414, -60.7652702331543, -58.78666687011719, -56.808067321777344, -54.829463958740234, -52.85086441040039, -50.87226104736328, -48.89366149902344, -46.91505813598633, -44.936458587646484, -42.957855224609375, -40.97925567626953, -39.00065231323242, -37.02205276489258, -35.04344940185547, -33.064849853515625, -31.08624839782715, -29.107646942138672, -27.129045486450195, -25.15044403076172, -23.17184066772461, -21.193241119384766, -19.214637756347656, -17.236034393310547, -15.25743293762207, -13.278831481933594, -11.300230026245117, -9.32162857055664, -7.343026161193848, -5.364424705505371, -3.3858232498168945, -1.4072227478027344, 0.5713788270950317, 2.549980401992798, 4.5285820960998535, 6.50718355178833, 8.485785484313965, 10.464386940002441, 12.442988395690918, 14.421589851379395, 16.400192260742188, 18.378793716430664, 20.35739517211914, 22.335996627807617, 24.314598083496094, 26.29319953918457, 28.271800994873047, 30.250402450561523, 32.22900390625, 34.20760726928711, 36.18620681762695, 38.16481018066406, 40.143409729003906, 42.122013092041016, 44.10061264038086, 46.07921600341797, 48.05781936645508, 50.03641891479492, 52.01502227783203, 53.993621826171875, 55.972225189208984, 57.95082473754883, 59.92942810058594, 61.90802764892578]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 9.0, 12.0, 14.0, 17.0, 25.0, 40.0, 84.0, 105.0, 153.0, 275.0, 475.0, 816.0, 1438.0, 2690.0, 5161.0, 11184.0, 25426.0, 63562.0, 159644.0, 308289.0, 265548.0, 118995.0, 46819.0, 19615.0, 8846.0, 4266.0, 2147.0, 1209.0, 679.0, 377.0, 259.0, 142.0, 89.0, 67.0, 31.0, 20.0, 9.0, 10.0, 5.0, 3.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.49554443359375, -6.3035888671875, -6.11163330078125, -5.919677734375, -5.72772216796875, -5.5357666015625, -5.34381103515625, -5.15185546875, -4.95989990234375, -4.7679443359375, -4.57598876953125, -4.384033203125, -4.19207763671875, -4.0001220703125, -3.80816650390625, -3.6162109375, -3.42425537109375, -3.2322998046875, -3.04034423828125, -2.848388671875, -2.65643310546875, -2.4644775390625, -2.27252197265625, -2.08056640625, -1.88861083984375, -1.6966552734375, -1.50469970703125, -1.312744140625, -1.12078857421875, -0.9288330078125, -0.73687744140625, -0.544921875, -0.35296630859375, -0.1610107421875, 0.03094482421875, 0.222900390625, 0.41485595703125, 0.6068115234375, 0.79876708984375, 0.99072265625, 1.18267822265625, 1.3746337890625, 1.56658935546875, 1.758544921875, 1.95050048828125, 2.1424560546875, 2.33441162109375, 2.5263671875, 2.71832275390625, 2.9102783203125, 3.10223388671875, 3.294189453125, 3.48614501953125, 3.6781005859375, 3.87005615234375, 4.06201171875, 4.25396728515625, 4.4459228515625, 4.63787841796875, 4.829833984375, 5.02178955078125, 5.2137451171875, 5.40570068359375, 5.59765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 12.0, 11.0, 10.0, 20.0, 25.0, 22.0, 37.0, 43.0, 49.0, 41.0, 55.0, 68.0, 61.0, 53.0, 61.0, 50.0, 64.0, 46.0, 44.0, 46.0, 26.0, 31.0, 30.0, 25.0, 17.0, 14.0, 8.0, 7.0, 3.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.87664794921875, -3.6986083984375, -3.52056884765625, -3.342529296875, -3.16448974609375, -2.9864501953125, -2.80841064453125, -2.63037109375, -2.45233154296875, -2.2742919921875, -2.09625244140625, -1.918212890625, -1.74017333984375, -1.5621337890625, -1.38409423828125, -1.2060546875, -1.02801513671875, -0.8499755859375, -0.67193603515625, -0.493896484375, -0.31585693359375, -0.1378173828125, 0.04022216796875, 0.21826171875, 0.39630126953125, 0.5743408203125, 0.75238037109375, 0.930419921875, 1.10845947265625, 1.2864990234375, 1.46453857421875, 1.642578125, 1.82061767578125, 1.9986572265625, 2.17669677734375, 2.354736328125, 2.53277587890625, 2.7108154296875, 2.88885498046875, 3.06689453125, 3.24493408203125, 3.4229736328125, 3.60101318359375, 3.779052734375, 3.95709228515625, 4.1351318359375, 4.31317138671875, 4.4912109375, 4.66925048828125, 4.8472900390625, 5.02532958984375, 5.203369140625, 5.38140869140625, 5.5594482421875, 5.73748779296875, 5.91552734375, 6.09356689453125, 6.2716064453125, 6.44964599609375, 6.627685546875, 6.80572509765625, 6.9837646484375, 7.16180419921875, 7.33984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 4.0, 4.0, 6.0, 11.0, 16.0, 16.0, 36.0, 38.0, 56.0, 81.0, 133.0, 183.0, 282.0, 511.0, 950.0, 2030.0, 4527.0, 13564.0, 58104.0, 343150.0, 531231.0, 68851.0, 15140.0, 5099.0, 2013.0, 1046.0, 581.0, 324.0, 167.0, 126.0, 69.0, 63.0, 43.0, 25.0, 19.0, 9.0, 10.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.59375, -11.2203369140625, -10.846923828125, -10.4735107421875, -10.10009765625, -9.7266845703125, -9.353271484375, -8.9798583984375, -8.6064453125, -8.2330322265625, -7.859619140625, -7.4862060546875, -7.11279296875, -6.7393798828125, -6.365966796875, -5.9925537109375, -5.619140625, -5.2457275390625, -4.872314453125, -4.4989013671875, -4.12548828125, -3.7520751953125, -3.378662109375, -3.0052490234375, -2.6318359375, -2.2584228515625, -1.885009765625, -1.5115966796875, -1.13818359375, -0.7647705078125, -0.391357421875, -0.0179443359375, 0.35546875, 0.7288818359375, 1.102294921875, 1.4757080078125, 1.84912109375, 2.2225341796875, 2.595947265625, 2.9693603515625, 3.3427734375, 3.7161865234375, 4.089599609375, 4.4630126953125, 4.83642578125, 5.2098388671875, 5.583251953125, 5.9566650390625, 6.330078125, 6.7034912109375, 7.076904296875, 7.4503173828125, 7.82373046875, 8.1971435546875, 8.570556640625, 8.9439697265625, 9.3173828125, 9.6907958984375, 10.064208984375, 10.4376220703125, 10.81103515625, 11.1844482421875, 11.557861328125, 11.9312744140625, 12.3046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 6.0, 14.0, 9.0, 18.0, 25.0, 32.0, 17.0, 37.0, 51.0, 48.0, 46.0, 47.0, 55.0, 44.0, 65.0, 39.0, 54.0, 56.0, 45.0, 41.0, 37.0, 33.0, 27.0, 23.0, 27.0, 20.0, 18.0, 8.0, 15.0, 10.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.810791015625, -14.26220703125, -13.713623046875, -13.1650390625, -12.616455078125, -12.06787109375, -11.519287109375, -10.970703125, -10.422119140625, -9.87353515625, -9.324951171875, -8.7763671875, -8.227783203125, -7.67919921875, -7.130615234375, -6.58203125, -6.033447265625, -5.48486328125, -4.936279296875, -4.3876953125, -3.839111328125, -3.29052734375, -2.741943359375, -2.193359375, -1.644775390625, -1.09619140625, -0.547607421875, 0.0009765625, 0.549560546875, 1.09814453125, 1.646728515625, 2.1953125, 2.743896484375, 3.29248046875, 3.841064453125, 4.3896484375, 4.938232421875, 5.48681640625, 6.035400390625, 6.583984375, 7.132568359375, 7.68115234375, 8.229736328125, 8.7783203125, 9.326904296875, 9.87548828125, 10.424072265625, 10.97265625, 11.521240234375, 12.06982421875, 12.618408203125, 13.1669921875, 13.715576171875, 14.26416015625, 14.812744140625, 15.361328125, 15.909912109375, 16.45849609375, 17.007080078125, 17.5556640625, 18.104248046875, 18.65283203125, 19.201416015625, 19.75]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 8.0, 9.0, 16.0, 27.0, 33.0, 26.0, 49.0, 74.0, 123.0, 215.0, 372.0, 600.0, 940.0, 1687.0, 3246.0, 6638.0, 15152.0, 40602.0, 146984.0, 600957.0, 157592.0, 43136.0, 15715.0, 6759.0, 3314.0, 1720.0, 997.0, 550.0, 369.0, 212.0, 162.0, 83.0, 62.0, 41.0, 28.0, 13.0, 10.0, 3.0, 8.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.841796875, -2.75164794921875, -2.6614990234375, -2.57135009765625, -2.481201171875, -2.39105224609375, -2.3009033203125, -2.21075439453125, -2.12060546875, -2.03045654296875, -1.9403076171875, -1.85015869140625, -1.760009765625, -1.66986083984375, -1.5797119140625, -1.48956298828125, -1.3994140625, -1.30926513671875, -1.2191162109375, -1.12896728515625, -1.038818359375, -0.94866943359375, -0.8585205078125, -0.76837158203125, -0.67822265625, -0.58807373046875, -0.4979248046875, -0.40777587890625, -0.317626953125, -0.22747802734375, -0.1373291015625, -0.04718017578125, 0.04296875, 0.13311767578125, 0.2232666015625, 0.31341552734375, 0.403564453125, 0.49371337890625, 0.5838623046875, 0.67401123046875, 0.76416015625, 0.85430908203125, 0.9444580078125, 1.03460693359375, 1.124755859375, 1.21490478515625, 1.3050537109375, 1.39520263671875, 1.4853515625, 1.57550048828125, 1.6656494140625, 1.75579833984375, 1.845947265625, 1.93609619140625, 2.0262451171875, 2.11639404296875, 2.20654296875, 2.29669189453125, 2.3868408203125, 2.47698974609375, 2.567138671875, 2.65728759765625, 2.7474365234375, 2.83758544921875, 2.927734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 10.0, 11.0, 22.0, 36.0, 66.0, 209.0, 252.0, 175.0, 78.0, 40.0, 25.0, 10.0, 16.0, 9.0, 4.0, 4.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001651763916015625, -0.00159551203250885, -0.0015392601490020752, -0.0014830082654953003, -0.0014267563819885254, -0.0013705044984817505, -0.0013142526149749756, -0.0012580007314682007, -0.0012017488479614258, -0.0011454969644546509, -0.001089245080947876, -0.001032993197441101, -0.0009767413139343262, -0.0009204894304275513, -0.0008642375469207764, -0.0008079856634140015, -0.0007517337799072266, -0.0006954818964004517, -0.0006392300128936768, -0.0005829781293869019, -0.000526726245880127, -0.00047047436237335205, -0.00041422247886657715, -0.00035797059535980225, -0.00030171871185302734, -0.00024546682834625244, -0.00018921494483947754, -0.00013296306133270264, -7.671117782592773e-05, -2.0459294319152832e-05, 3.579258918762207e-05, 9.204447269439697e-05, 0.00014829635620117188, 0.00020454823970794678, 0.0002608001232147217, 0.0003170520067214966, 0.0003733038902282715, 0.0004295557737350464, 0.0004858076572418213, 0.0005420595407485962, 0.0005983114242553711, 0.000654563307762146, 0.0007108151912689209, 0.0007670670747756958, 0.0008233189582824707, 0.0008795708417892456, 0.0009358227252960205, 0.0009920746088027954, 0.0010483264923095703, 0.0011045783758163452, 0.0011608302593231201, 0.001217082142829895, 0.00127333402633667, 0.0013295859098434448, 0.0013858377933502197, 0.0014420896768569946, 0.0014983415603637695, 0.0015545934438705444, 0.0016108453273773193, 0.0016670972108840942, 0.0017233490943908691, 0.001779600977897644, 0.001835852861404419, 0.0018921047449111938, 0.0019483566284179688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 4.0, 10.0, 12.0, 15.0, 25.0, 28.0, 40.0, 87.0, 158.0, 275.0, 555.0, 1343.0, 3403.0, 10394.0, 38977.0, 228327.0, 653311.0, 83414.0, 18674.0, 5652.0, 2098.0, 831.0, 437.0, 204.0, 90.0, 64.0, 47.0, 26.0, 12.0, 11.0, 12.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.96484375, -4.831512451171875, -4.69818115234375, -4.564849853515625, -4.4315185546875, -4.298187255859375, -4.16485595703125, -4.031524658203125, -3.898193359375, -3.764862060546875, -3.63153076171875, -3.498199462890625, -3.3648681640625, -3.231536865234375, -3.09820556640625, -2.964874267578125, -2.83154296875, -2.698211669921875, -2.56488037109375, -2.431549072265625, -2.2982177734375, -2.164886474609375, -2.03155517578125, -1.898223876953125, -1.764892578125, -1.631561279296875, -1.49822998046875, -1.364898681640625, -1.2315673828125, -1.098236083984375, -0.96490478515625, -0.831573486328125, -0.6982421875, -0.564910888671875, -0.43157958984375, -0.298248291015625, -0.1649169921875, -0.031585693359375, 0.10174560546875, 0.235076904296875, 0.368408203125, 0.501739501953125, 0.63507080078125, 0.768402099609375, 0.9017333984375, 1.035064697265625, 1.16839599609375, 1.301727294921875, 1.43505859375, 1.568389892578125, 1.70172119140625, 1.835052490234375, 1.9683837890625, 2.101715087890625, 2.23504638671875, 2.368377685546875, 2.501708984375, 2.635040283203125, 2.76837158203125, 2.901702880859375, 3.0350341796875, 3.168365478515625, 3.30169677734375, 3.435028076171875, 3.568359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 14.0, 19.0, 17.0, 23.0, 31.0, 46.0, 51.0, 72.0, 79.0, 83.0, 86.0, 95.0, 63.0, 76.0, 43.0, 37.0, 33.0, 26.0, 12.0, 20.0, 6.0, 5.0, 4.0, 2.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.619140625, -3.516143798828125, -3.41314697265625, -3.310150146484375, -3.2071533203125, -3.104156494140625, -3.00115966796875, -2.898162841796875, -2.795166015625, -2.692169189453125, -2.58917236328125, -2.486175537109375, -2.3831787109375, -2.280181884765625, -2.17718505859375, -2.074188232421875, -1.97119140625, -1.868194580078125, -1.76519775390625, -1.662200927734375, -1.5592041015625, -1.456207275390625, -1.35321044921875, -1.250213623046875, -1.147216796875, -1.044219970703125, -0.94122314453125, -0.838226318359375, -0.7352294921875, -0.632232666015625, -0.52923583984375, -0.426239013671875, -0.3232421875, -0.220245361328125, -0.11724853515625, -0.014251708984375, 0.0887451171875, 0.191741943359375, 0.29473876953125, 0.397735595703125, 0.500732421875, 0.603729248046875, 0.70672607421875, 0.809722900390625, 0.9127197265625, 1.015716552734375, 1.11871337890625, 1.221710205078125, 1.32470703125, 1.427703857421875, 1.53070068359375, 1.633697509765625, 1.7366943359375, 1.839691162109375, 1.94268798828125, 2.045684814453125, 2.148681640625, 2.251678466796875, 2.35467529296875, 2.457672119140625, 2.5606689453125, 2.663665771484375, 2.76666259765625, 2.869659423828125, 2.97265625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 20.0, 41.0, 71.0, 142.0, 258.0, 238.0, 112.0, 58.0, 24.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.380126953125, -96.49137115478516, -92.60261535644531, -88.71385192871094, -84.8250961303711, -80.93634033203125, -77.0475845336914, -73.15882873535156, -69.27006530761719, -65.38130950927734, -61.492549896240234, -57.60379409790039, -53.71503448486328, -49.82627868652344, -45.937522888183594, -42.048763275146484, -38.16000747680664, -34.2712516784668, -30.382492065429688, -26.493736267089844, -22.604976654052734, -18.71622085571289, -14.827463150024414, -10.938705444335938, -7.049947738647461, -3.1611902713775635, 0.727567195892334, 4.616324424743652, 8.505082130432129, 12.393838882446289, 16.282596588134766, 20.171354293823242, 24.06011199951172, 27.948869705200195, 31.837627410888672, 35.726383209228516, 39.615142822265625, 43.50389862060547, 47.39265441894531, 51.28141403198242, 55.17017364501953, 59.058929443359375, 62.947689056396484, 66.8364486694336, 70.72520446777344, 74.61396026611328, 78.50271606445312, 82.3914794921875, 86.28022766113281, 90.16898345947266, 94.0577392578125, 97.94650268554688, 101.83525848388672, 105.72401428222656, 109.6127700805664, 113.50152587890625, 117.39028930664062, 121.27904510498047, 125.16780090332031, 129.0565643310547, 132.9453125, 136.83407592773438, 140.72283935546875, 144.61158752441406, 148.50035095214844]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 6.0, 6.0, 5.0, 10.0, 10.0, 10.0, 9.0, 18.0, 19.0, 21.0, 26.0, 25.0, 21.0, 37.0, 27.0, 38.0, 33.0, 53.0, 60.0, 76.0, 64.0, 50.0, 39.0, 42.0, 33.0, 26.0, 37.0, 34.0, 23.0, 14.0, 15.0, 19.0, 19.0, 15.0, 9.0, 13.0, 5.0, 5.0, 5.0, 1.0, 7.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.46983337402344, -52.68632888793945, -50.90282440185547, -49.11932373046875, -47.335819244384766, -45.55231475830078, -43.7688102722168, -41.98530578613281, -40.20180130004883, -38.418296813964844, -36.63479232788086, -34.851287841796875, -33.067787170410156, -31.284282684326172, -29.500778198242188, -27.717273712158203, -25.93377113342285, -24.150266647338867, -22.366764068603516, -20.58325958251953, -18.799755096435547, -17.016250610351562, -15.232748031616211, -13.449243545532227, -11.665740013122559, -9.88223648071289, -8.098731994628906, -6.315228462219238, -4.531724452972412, -2.748220443725586, -0.964716911315918, 0.8187875747680664, 2.6022911071777344, 4.3857951164245605, 6.169299125671387, 7.952802658081055, 9.736307144165039, 11.519810676574707, 13.303314208984375, 15.08681869506836, 16.870323181152344, 18.653827667236328, 20.43733024597168, 22.220834732055664, 24.00433921813965, 25.787841796875, 27.571346282958984, 29.35485076904297, 31.13835334777832, 32.92185592651367, 34.705360412597656, 36.48886489868164, 38.272369384765625, 40.05587387084961, 41.839378356933594, 43.62287902832031, 45.4063835144043, 47.18988800048828, 48.973392486572266, 50.75689697265625, 52.54039764404297, 54.32390213012695, 56.10740661621094, 57.89091110229492, 59.674415588378906]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 13.0, 8.0, 21.0, 14.0, 41.0, 63.0, 112.0, 145.0, 258.0, 432.0, 832.0, 1538.0, 2990.0, 6275.0, 15362.0, 51537.0, 295141.0, 1901606.0, 1616351.0, 234322.0, 42923.0, 12991.0, 5324.0, 2586.0, 1357.0, 795.0, 465.0, 285.0, 183.0, 97.0, 65.0, 47.0, 30.0, 21.0, 20.0, 6.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.703125, -5.518798828125, -5.33447265625, -5.150146484375, -4.9658203125, -4.781494140625, -4.59716796875, -4.412841796875, -4.228515625, -4.044189453125, -3.85986328125, -3.675537109375, -3.4912109375, -3.306884765625, -3.12255859375, -2.938232421875, -2.75390625, -2.569580078125, -2.38525390625, -2.200927734375, -2.0166015625, -1.832275390625, -1.64794921875, -1.463623046875, -1.279296875, -1.094970703125, -0.91064453125, -0.726318359375, -0.5419921875, -0.357666015625, -0.17333984375, 0.010986328125, 0.1953125, 0.379638671875, 0.56396484375, 0.748291015625, 0.9326171875, 1.116943359375, 1.30126953125, 1.485595703125, 1.669921875, 1.854248046875, 2.03857421875, 2.222900390625, 2.4072265625, 2.591552734375, 2.77587890625, 2.960205078125, 3.14453125, 3.328857421875, 3.51318359375, 3.697509765625, 3.8818359375, 4.066162109375, 4.25048828125, 4.434814453125, 4.619140625, 4.803466796875, 4.98779296875, 5.172119140625, 5.3564453125, 5.540771484375, 5.72509765625, 5.909423828125, 6.09375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 2.0, 9.0, 9.0, 8.0, 12.0, 22.0, 23.0, 29.0, 43.0, 42.0, 37.0, 39.0, 66.0, 70.0, 75.0, 59.0, 64.0, 49.0, 55.0, 52.0, 45.0, 50.0, 34.0, 30.0, 17.0, 19.0, 8.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.98046875, -3.803466796875, -3.62646484375, -3.449462890625, -3.2724609375, -3.095458984375, -2.91845703125, -2.741455078125, -2.564453125, -2.387451171875, -2.21044921875, -2.033447265625, -1.8564453125, -1.679443359375, -1.50244140625, -1.325439453125, -1.1484375, -0.971435546875, -0.79443359375, -0.617431640625, -0.4404296875, -0.263427734375, -0.08642578125, 0.090576171875, 0.267578125, 0.444580078125, 0.62158203125, 0.798583984375, 0.9755859375, 1.152587890625, 1.32958984375, 1.506591796875, 1.68359375, 1.860595703125, 2.03759765625, 2.214599609375, 2.3916015625, 2.568603515625, 2.74560546875, 2.922607421875, 3.099609375, 3.276611328125, 3.45361328125, 3.630615234375, 3.8076171875, 3.984619140625, 4.16162109375, 4.338623046875, 4.515625, 4.692626953125, 4.86962890625, 5.046630859375, 5.2236328125, 5.400634765625, 5.57763671875, 5.754638671875, 5.931640625, 6.108642578125, 6.28564453125, 6.462646484375, 6.6396484375, 6.816650390625, 6.99365234375, 7.170654296875, 7.34765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 6.0, 17.0, 42.0, 52.0, 101.0, 160.0, 253.0, 596.0, 3684.0, 1480916.0, 2703056.0, 4164.0, 621.0, 265.0, 133.0, 85.0, 55.0, 30.0, 21.0, 10.0, 3.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.58935546875, -34.2724609375, -32.95556640625, -31.638671875, -30.32177734375, -29.0048828125, -27.68798828125, -26.37109375, -25.05419921875, -23.7373046875, -22.42041015625, -21.103515625, -19.78662109375, -18.4697265625, -17.15283203125, -15.8359375, -14.51904296875, -13.2021484375, -11.88525390625, -10.568359375, -9.25146484375, -7.9345703125, -6.61767578125, -5.30078125, -3.98388671875, -2.6669921875, -1.35009765625, -0.033203125, 1.28369140625, 2.6005859375, 3.91748046875, 5.234375, 6.55126953125, 7.8681640625, 9.18505859375, 10.501953125, 11.81884765625, 13.1357421875, 14.45263671875, 15.76953125, 17.08642578125, 18.4033203125, 19.72021484375, 21.037109375, 22.35400390625, 23.6708984375, 24.98779296875, 26.3046875, 27.62158203125, 28.9384765625, 30.25537109375, 31.572265625, 32.88916015625, 34.2060546875, 35.52294921875, 36.83984375, 38.15673828125, 39.4736328125, 40.79052734375, 42.107421875, 43.42431640625, 44.7412109375, 46.05810546875, 47.375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 6.0, 15.0, 34.0, 80.0, 196.0, 685.0, 1820.0, 860.0, 223.0, 85.0, 43.0, 14.0, 9.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.119140625, -19.30078125, -18.482421875, -17.6640625, -16.845703125, -16.02734375, -15.208984375, -14.390625, -13.572265625, -12.75390625, -11.935546875, -11.1171875, -10.298828125, -9.48046875, -8.662109375, -7.84375, -7.025390625, -6.20703125, -5.388671875, -4.5703125, -3.751953125, -2.93359375, -2.115234375, -1.296875, -0.478515625, 0.33984375, 1.158203125, 1.9765625, 2.794921875, 3.61328125, 4.431640625, 5.25, 6.068359375, 6.88671875, 7.705078125, 8.5234375, 9.341796875, 10.16015625, 10.978515625, 11.796875, 12.615234375, 13.43359375, 14.251953125, 15.0703125, 15.888671875, 16.70703125, 17.525390625, 18.34375, 19.162109375, 19.98046875, 20.798828125, 21.6171875, 22.435546875, 23.25390625, 24.072265625, 24.890625, 25.708984375, 26.52734375, 27.345703125, 28.1640625, 28.982421875, 29.80078125, 30.619140625, 31.4375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 21.0, 34.0, 115.0, 236.0, 320.0, 157.0, 61.0, 29.0, 11.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-276.21636962890625, -270.2434387207031, -264.2705078125, -258.2975769042969, -252.32464599609375, -246.3517303466797, -240.37879943847656, -234.40586853027344, -228.4329376220703, -222.4600067138672, -216.48707580566406, -210.51414489746094, -204.54122924804688, -198.56829833984375, -192.59536743164062, -186.6224365234375, -180.64950561523438, -174.67657470703125, -168.70364379882812, -162.730712890625, -156.75778198242188, -150.7848663330078, -144.8119354248047, -138.83900451660156, -132.86607360839844, -126.89314270019531, -120.92021179199219, -114.9472885131836, -108.97435760498047, -103.00142669677734, -97.02850341796875, -91.05557250976562, -85.08262634277344, -79.10969543457031, -73.13676452636719, -67.1638412475586, -61.19091033935547, -55.217979431152344, -49.245052337646484, -43.272125244140625, -37.2991943359375, -31.326265335083008, -25.353336334228516, -19.380407333374023, -13.407478332519531, -7.434549331665039, -1.4616203308105469, 4.5113067626953125, 10.484237670898438, 16.45716667175293, 22.430095672607422, 28.403024673461914, 34.375953674316406, 40.34888458251953, 46.32181167602539, 52.29473876953125, 58.267669677734375, 64.2406005859375, 70.21353149414062, 76.18645477294922, 82.15938568115234, 88.13231658935547, 94.10523986816406, 100.07817077636719, 106.05110168457031]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 15.0, 17.0, 23.0, 23.0, 25.0, 29.0, 40.0, 35.0, 40.0, 38.0, 39.0, 39.0, 35.0, 48.0, 54.0, 44.0, 39.0, 43.0, 38.0, 39.0, 44.0, 38.0, 14.0, 22.0, 20.0, 30.0, 12.0, 12.0, 21.0, 8.0, 7.0, 3.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-43.81529998779297, -42.46793746948242, -41.120574951171875, -39.773216247558594, -38.42585372924805, -37.0784912109375, -35.73113250732422, -34.38376998901367, -33.036407470703125, -31.689044952392578, -30.341684341430664, -28.99432373046875, -27.646961212158203, -26.299598693847656, -24.952238082885742, -23.604877471923828, -22.25751495361328, -20.910152435302734, -19.56279182434082, -18.215431213378906, -16.86806869506836, -15.520707130432129, -14.173345565795898, -12.825984001159668, -11.478622436523438, -10.131260871887207, -8.783899307250977, -7.436537742614746, -6.089176177978516, -4.741814613342285, -3.3944530487060547, -2.047091484069824, -0.6997337341308594, 0.6476278305053711, 1.9949893951416016, 3.342350959777832, 4.6897125244140625, 6.037074089050293, 7.384435653686523, 8.731797218322754, 10.079158782958984, 11.426520347595215, 12.773881912231445, 14.121243476867676, 15.468605041503906, 16.815967559814453, 18.163328170776367, 19.51068878173828, 20.858051300048828, 22.205413818359375, 23.55277442932129, 24.900135040283203, 26.24749755859375, 27.594860076904297, 28.94222068786621, 30.289581298828125, 31.636943817138672, 32.98430633544922, 34.3316650390625, 35.67902755737305, 37.026390075683594, 38.37375259399414, 39.72111511230469, 41.06847381591797, 42.415836334228516]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 18.0, 17.0, 35.0, 45.0, 67.0, 121.0, 208.0, 386.0, 786.0, 1522.0, 3080.0, 6667.0, 15850.0, 41400.0, 119087.0, 320268.0, 334486.0, 129602.0, 44218.0, 16983.0, 7057.0, 3272.0, 1545.0, 842.0, 409.0, 235.0, 140.0, 77.0, 38.0, 38.0, 14.0, 11.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.28125, -8.07440185546875, -7.8675537109375, -7.66070556640625, -7.453857421875, -7.24700927734375, -7.0401611328125, -6.83331298828125, -6.62646484375, -6.41961669921875, -6.2127685546875, -6.00592041015625, -5.799072265625, -5.59222412109375, -5.3853759765625, -5.17852783203125, -4.9716796875, -4.76483154296875, -4.5579833984375, -4.35113525390625, -4.144287109375, -3.93743896484375, -3.7305908203125, -3.52374267578125, -3.31689453125, -3.11004638671875, -2.9031982421875, -2.69635009765625, -2.489501953125, -2.28265380859375, -2.0758056640625, -1.86895751953125, -1.662109375, -1.45526123046875, -1.2484130859375, -1.04156494140625, -0.834716796875, -0.62786865234375, -0.4210205078125, -0.21417236328125, -0.00732421875, 0.19952392578125, 0.4063720703125, 0.61322021484375, 0.820068359375, 1.02691650390625, 1.2337646484375, 1.44061279296875, 1.6474609375, 1.85430908203125, 2.0611572265625, 2.26800537109375, 2.474853515625, 2.68170166015625, 2.8885498046875, 3.09539794921875, 3.30224609375, 3.50909423828125, 3.7159423828125, 3.92279052734375, 4.129638671875, 4.33648681640625, 4.5433349609375, 4.75018310546875, 4.95703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 1.0, 5.0, 12.0, 13.0, 16.0, 20.0, 22.0, 36.0, 33.0, 34.0, 48.0, 52.0, 50.0, 53.0, 66.0, 54.0, 56.0, 61.0, 55.0, 49.0, 51.0, 44.0, 35.0, 26.0, 21.0, 24.0, 18.0, 10.0, 7.0, 6.0, 10.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.13818359375, -3.9560546875, -3.77392578125, -3.591796875, -3.40966796875, -3.2275390625, -3.04541015625, -2.86328125, -2.68115234375, -2.4990234375, -2.31689453125, -2.134765625, -1.95263671875, -1.7705078125, -1.58837890625, -1.40625, -1.22412109375, -1.0419921875, -0.85986328125, -0.677734375, -0.49560546875, -0.3134765625, -0.13134765625, 0.05078125, 0.23291015625, 0.4150390625, 0.59716796875, 0.779296875, 0.96142578125, 1.1435546875, 1.32568359375, 1.5078125, 1.68994140625, 1.8720703125, 2.05419921875, 2.236328125, 2.41845703125, 2.6005859375, 2.78271484375, 2.96484375, 3.14697265625, 3.3291015625, 3.51123046875, 3.693359375, 3.87548828125, 4.0576171875, 4.23974609375, 4.421875, 4.60400390625, 4.7861328125, 4.96826171875, 5.150390625, 5.33251953125, 5.5146484375, 5.69677734375, 5.87890625, 6.06103515625, 6.2431640625, 6.42529296875, 6.607421875, 6.78955078125, 6.9716796875, 7.15380859375, 7.3359375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 3.0, 4.0, 4.0, 9.0, 14.0, 17.0, 33.0, 33.0, 37.0, 58.0, 56.0, 83.0, 123.0, 180.0, 254.0, 301.0, 537.0, 878.0, 1737.0, 3837.0, 11355.0, 42307.0, 222247.0, 636035.0, 94963.0, 21430.0, 6411.0, 2436.0, 1160.0, 617.0, 404.0, 257.0, 179.0, 126.0, 103.0, 68.0, 65.0, 43.0, 37.0, 26.0, 19.0, 14.0, 15.0, 10.0, 11.0, 4.0, 3.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3125, -8.994140625, -8.67578125, -8.357421875, -8.0390625, -7.720703125, -7.40234375, -7.083984375, -6.765625, -6.447265625, -6.12890625, -5.810546875, -5.4921875, -5.173828125, -4.85546875, -4.537109375, -4.21875, -3.900390625, -3.58203125, -3.263671875, -2.9453125, -2.626953125, -2.30859375, -1.990234375, -1.671875, -1.353515625, -1.03515625, -0.716796875, -0.3984375, -0.080078125, 0.23828125, 0.556640625, 0.875, 1.193359375, 1.51171875, 1.830078125, 2.1484375, 2.466796875, 2.78515625, 3.103515625, 3.421875, 3.740234375, 4.05859375, 4.376953125, 4.6953125, 5.013671875, 5.33203125, 5.650390625, 5.96875, 6.287109375, 6.60546875, 6.923828125, 7.2421875, 7.560546875, 7.87890625, 8.197265625, 8.515625, 8.833984375, 9.15234375, 9.470703125, 9.7890625, 10.107421875, 10.42578125, 10.744140625, 11.0625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 6.0, 6.0, 12.0, 10.0, 12.0, 11.0, 23.0, 14.0, 8.0, 32.0, 33.0, 29.0, 37.0, 37.0, 44.0, 44.0, 42.0, 49.0, 49.0, 51.0, 52.0, 50.0, 46.0, 39.0, 37.0, 32.0, 18.0, 20.0, 29.0, 18.0, 10.0, 22.0, 8.0, 11.0, 8.0, 9.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.8515625, -14.3704833984375, -13.889404296875, -13.4083251953125, -12.92724609375, -12.4461669921875, -11.965087890625, -11.4840087890625, -11.0029296875, -10.5218505859375, -10.040771484375, -9.5596923828125, -9.07861328125, -8.5975341796875, -8.116455078125, -7.6353759765625, -7.154296875, -6.6732177734375, -6.192138671875, -5.7110595703125, -5.22998046875, -4.7489013671875, -4.267822265625, -3.7867431640625, -3.3056640625, -2.8245849609375, -2.343505859375, -1.8624267578125, -1.38134765625, -0.9002685546875, -0.419189453125, 0.0618896484375, 0.54296875, 1.0240478515625, 1.505126953125, 1.9862060546875, 2.46728515625, 2.9483642578125, 3.429443359375, 3.9105224609375, 4.3916015625, 4.8726806640625, 5.353759765625, 5.8348388671875, 6.31591796875, 6.7969970703125, 7.278076171875, 7.7591552734375, 8.240234375, 8.7213134765625, 9.202392578125, 9.6834716796875, 10.16455078125, 10.6456298828125, 11.126708984375, 11.6077880859375, 12.0888671875, 12.5699462890625, 13.051025390625, 13.5321044921875, 14.01318359375, 14.4942626953125, 14.975341796875, 15.4564208984375, 15.9375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 9.0, 16.0, 15.0, 32.0, 35.0, 46.0, 85.0, 134.0, 192.0, 387.0, 612.0, 1039.0, 2112.0, 4225.0, 9238.0, 22809.0, 65131.0, 279464.0, 540697.0, 76211.0, 25850.0, 10519.0, 4665.0, 2164.0, 1135.0, 680.0, 357.0, 228.0, 144.0, 84.0, 69.0, 47.0, 23.0, 14.0, 16.0, 10.0, 16.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.8603515625, -1.7963409423828125, -1.732330322265625, -1.6683197021484375, -1.60430908203125, -1.5402984619140625, -1.476287841796875, -1.4122772216796875, -1.3482666015625, -1.2842559814453125, -1.220245361328125, -1.1562347412109375, -1.09222412109375, -1.0282135009765625, -0.964202880859375, -0.9001922607421875, -0.836181640625, -0.7721710205078125, -0.708160400390625, -0.6441497802734375, -0.58013916015625, -0.5161285400390625, -0.452117919921875, -0.3881072998046875, -0.3240966796875, -0.2600860595703125, -0.196075439453125, -0.1320648193359375, -0.06805419921875, -0.0040435791015625, 0.059967041015625, 0.1239776611328125, 0.18798828125, 0.2519989013671875, 0.316009521484375, 0.3800201416015625, 0.44403076171875, 0.5080413818359375, 0.572052001953125, 0.6360626220703125, 0.7000732421875, 0.7640838623046875, 0.828094482421875, 0.8921051025390625, 0.95611572265625, 1.0201263427734375, 1.084136962890625, 1.1481475830078125, 1.212158203125, 1.2761688232421875, 1.340179443359375, 1.4041900634765625, 1.46820068359375, 1.5322113037109375, 1.596221923828125, 1.6602325439453125, 1.7242431640625, 1.7882537841796875, 1.852264404296875, 1.9162750244140625, 1.98028564453125, 2.0442962646484375, 2.108306884765625, 2.1723175048828125, 2.236328125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 6.0, 8.0, 5.0, 13.0, 6.0, 17.0, 35.0, 36.0, 56.0, 105.0, 184.0, 195.0, 111.0, 71.0, 35.0, 30.0, 16.0, 7.0, 11.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0012502670288085938, -0.001214638352394104, -0.0011790096759796143, -0.0011433809995651245, -0.0011077523231506348, -0.001072123646736145, -0.0010364949703216553, -0.0010008662939071655, -0.0009652376174926758, -0.000929608941078186, -0.0008939802646636963, -0.0008583515882492065, -0.0008227229118347168, -0.000787094235420227, -0.0007514655590057373, -0.0007158368825912476, -0.0006802082061767578, -0.0006445795297622681, -0.0006089508533477783, -0.0005733221769332886, -0.0005376935005187988, -0.0005020648241043091, -0.00046643614768981934, -0.0004308074712753296, -0.00039517879486083984, -0.0003595501184463501, -0.00032392144203186035, -0.0002882927656173706, -0.00025266408920288086, -0.0002170354127883911, -0.00018140673637390137, -0.00014577805995941162, -0.00011014938354492188, -7.452070713043213e-05, -3.889203071594238e-05, -3.2633543014526367e-06, 3.236532211303711e-05, 6.799399852752686e-05, 0.0001036226749420166, 0.00013925135135650635, 0.0001748800277709961, 0.00021050870418548584, 0.0002461373805999756, 0.00028176605701446533, 0.0003173947334289551, 0.0003530234098434448, 0.00038865208625793457, 0.0004242807626724243, 0.00045990943908691406, 0.0004955381155014038, 0.0005311667919158936, 0.0005667954683303833, 0.000602424144744873, 0.0006380528211593628, 0.0006736814975738525, 0.0007093101739883423, 0.000744938850402832, 0.0007805675268173218, 0.0008161962032318115, 0.0008518248796463013, 0.000887453556060791, 0.0009230822324752808, 0.0009587109088897705, 0.0009943395853042603, 0.00102996826171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 7.0, 4.0, 10.0, 10.0, 7.0, 15.0, 16.0, 23.0, 20.0, 37.0, 54.0, 110.0, 171.0, 244.0, 349.0, 581.0, 967.0, 1657.0, 3076.0, 6850.0, 16421.0, 48015.0, 173606.0, 626858.0, 111462.0, 34195.0, 12355.0, 5183.0, 2646.0, 1332.0, 811.0, 493.0, 322.0, 200.0, 139.0, 104.0, 61.0, 46.0, 30.0, 16.0, 12.0, 9.0, 6.0, 4.0, 2.0, 16.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.580078125, -2.507080078125, -2.43408203125, -2.361083984375, -2.2880859375, -2.215087890625, -2.14208984375, -2.069091796875, -1.99609375, -1.923095703125, -1.85009765625, -1.777099609375, -1.7041015625, -1.631103515625, -1.55810546875, -1.485107421875, -1.412109375, -1.339111328125, -1.26611328125, -1.193115234375, -1.1201171875, -1.047119140625, -0.97412109375, -0.901123046875, -0.828125, -0.755126953125, -0.68212890625, -0.609130859375, -0.5361328125, -0.463134765625, -0.39013671875, -0.317138671875, -0.244140625, -0.171142578125, -0.09814453125, -0.025146484375, 0.0478515625, 0.120849609375, 0.19384765625, 0.266845703125, 0.33984375, 0.412841796875, 0.48583984375, 0.558837890625, 0.6318359375, 0.704833984375, 0.77783203125, 0.850830078125, 0.923828125, 0.996826171875, 1.06982421875, 1.142822265625, 1.2158203125, 1.288818359375, 1.36181640625, 1.434814453125, 1.5078125, 1.580810546875, 1.65380859375, 1.726806640625, 1.7998046875, 1.872802734375, 1.94580078125, 2.018798828125, 2.091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 5.0, 3.0, 9.0, 11.0, 13.0, 11.0, 12.0, 14.0, 22.0, 22.0, 20.0, 32.0, 28.0, 37.0, 57.0, 61.0, 60.0, 87.0, 88.0, 76.0, 61.0, 47.0, 39.0, 34.0, 26.0, 20.0, 15.0, 16.0, 10.0, 6.0, 9.0, 6.0, 9.0, 10.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.380859375, -2.30780029296875, -2.2347412109375, -2.16168212890625, -2.088623046875, -2.01556396484375, -1.9425048828125, -1.86944580078125, -1.79638671875, -1.72332763671875, -1.6502685546875, -1.57720947265625, -1.504150390625, -1.43109130859375, -1.3580322265625, -1.28497314453125, -1.2119140625, -1.13885498046875, -1.0657958984375, -0.99273681640625, -0.919677734375, -0.84661865234375, -0.7735595703125, -0.70050048828125, -0.62744140625, -0.55438232421875, -0.4813232421875, -0.40826416015625, -0.335205078125, -0.26214599609375, -0.1890869140625, -0.11602783203125, -0.04296875, 0.03009033203125, 0.1031494140625, 0.17620849609375, 0.249267578125, 0.32232666015625, 0.3953857421875, 0.46844482421875, 0.54150390625, 0.61456298828125, 0.6876220703125, 0.76068115234375, 0.833740234375, 0.90679931640625, 0.9798583984375, 1.05291748046875, 1.1259765625, 1.19903564453125, 1.2720947265625, 1.34515380859375, 1.418212890625, 1.49127197265625, 1.5643310546875, 1.63739013671875, 1.71044921875, 1.78350830078125, 1.8565673828125, 1.92962646484375, 2.002685546875, 2.07574462890625, 2.1488037109375, 2.22186279296875, 2.294921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 8.0, 16.0, 38.0, 51.0, 93.0, 130.0, 234.0, 163.0, 93.0, 45.0, 39.0, 27.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.77720260620117, -56.64575958251953, -54.514320373535156, -52.382877349853516, -50.25143814086914, -48.1199951171875, -45.988555908203125, -43.857112884521484, -41.725669860839844, -39.5942268371582, -37.46278762817383, -35.33134460449219, -33.19990539550781, -31.068462371826172, -28.937021255493164, -26.805580139160156, -24.67414093017578, -22.542699813842773, -20.411258697509766, -18.279815673828125, -16.14837646484375, -14.016934394836426, -11.885492324829102, -9.754051208496094, -7.622610092163086, -5.491168975830078, -3.359727382659912, -1.228285789489746, 0.9031553268432617, 3.0345964431762695, 5.166038513183594, 7.297479629516602, 9.428916931152344, 11.560358047485352, 13.69179916381836, 15.823241233825684, 17.954681396484375, 20.086124420166016, 22.217565536499023, 24.34900665283203, 26.48044776916504, 28.611888885498047, 30.743330001831055, 32.87477111816406, 35.0062141418457, 37.13765335083008, 39.26909637451172, 41.400535583496094, 43.531978607177734, 45.663421630859375, 47.79486083984375, 49.92630386352539, 52.057743072509766, 54.189186096191406, 56.32062530517578, 58.45206832885742, 60.58351135253906, 62.7149543762207, 64.84639739990234, 66.97783660888672, 69.1092758178711, 71.24071502685547, 73.37216186523438, 75.50360107421875, 77.63504028320312]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 9.0, 7.0, 11.0, 10.0, 17.0, 26.0, 30.0, 24.0, 34.0, 38.0, 45.0, 63.0, 99.0, 130.0, 100.0, 70.0, 59.0, 40.0, 41.0, 32.0, 23.0, 23.0, 9.0, 13.0, 9.0, 12.0, 9.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-107.55998229980469, -104.90193939208984, -102.243896484375, -99.58584594726562, -96.92780303955078, -94.26976013183594, -91.61170959472656, -88.95366668701172, -86.29562377929688, -83.63758087158203, -80.97953796386719, -78.32148742675781, -75.66344451904297, -73.00540161132812, -70.34735107421875, -67.6893081665039, -65.03126525878906, -62.37322235107422, -59.71517562866211, -57.05712890625, -54.399085998535156, -51.74104309082031, -49.0829963684082, -46.424949645996094, -43.76690673828125, -41.108863830566406, -38.4508171081543, -35.79277038574219, -33.134727478027344, -30.476682662963867, -27.81863784790039, -25.160593032836914, -22.502540588378906, -19.84449577331543, -17.186450958251953, -14.528406143188477, -11.870361328125, -9.212316513061523, -6.554271697998047, -3.8962268829345703, -1.2381820678710938, 1.4198627471923828, 4.077907562255859, 6.735952377319336, 9.393997192382812, 12.052042007446289, 14.710086822509766, 17.368131637573242, 20.02617645263672, 22.684221267700195, 25.342266082763672, 28.00031089782715, 30.658355712890625, 33.31639862060547, 35.97444534301758, 38.63249206542969, 41.29053497314453, 43.948577880859375, 46.606624603271484, 49.264671325683594, 51.92271423339844, 54.58075714111328, 57.23880386352539, 59.8968505859375, 62.554893493652344]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 5.0, 3.0, 11.0, 13.0, 16.0, 30.0, 32.0, 53.0, 72.0, 104.0, 172.0, 238.0, 456.0, 779.0, 1331.0, 2688.0, 5988.0, 16412.0, 63984.0, 385464.0, 2173948.0, 1301532.0, 186890.0, 34750.0, 10406.0, 4158.0, 2027.0, 1087.0, 556.0, 380.0, 230.0, 154.0, 86.0, 63.0, 38.0, 30.0, 29.0, 22.0, 17.0, 7.0, 6.0, 8.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.47076416015625, -6.2735595703125, -6.07635498046875, -5.879150390625, -5.68194580078125, -5.4847412109375, -5.28753662109375, -5.09033203125, -4.89312744140625, -4.6959228515625, -4.49871826171875, -4.301513671875, -4.10430908203125, -3.9071044921875, -3.70989990234375, -3.5126953125, -3.31549072265625, -3.1182861328125, -2.92108154296875, -2.723876953125, -2.52667236328125, -2.3294677734375, -2.13226318359375, -1.93505859375, -1.73785400390625, -1.5406494140625, -1.34344482421875, -1.146240234375, -0.94903564453125, -0.7518310546875, -0.55462646484375, -0.357421875, -0.16021728515625, 0.0369873046875, 0.23419189453125, 0.431396484375, 0.62860107421875, 0.8258056640625, 1.02301025390625, 1.22021484375, 1.41741943359375, 1.6146240234375, 1.81182861328125, 2.009033203125, 2.20623779296875, 2.4034423828125, 2.60064697265625, 2.7978515625, 2.99505615234375, 3.1922607421875, 3.38946533203125, 3.586669921875, 3.78387451171875, 3.9810791015625, 4.17828369140625, 4.37548828125, 4.57269287109375, 4.7698974609375, 4.96710205078125, 5.164306640625, 5.36151123046875, 5.5587158203125, 5.75592041015625, 5.953125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 8.0, 8.0, 22.0, 20.0, 20.0, 31.0, 30.0, 40.0, 46.0, 60.0, 51.0, 67.0, 62.0, 63.0, 58.0, 65.0, 62.0, 56.0, 31.0, 37.0, 22.0, 32.0, 24.0, 23.0, 17.0, 11.0, 10.0, 6.0, 4.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.0697021484375, -3.889404296875, -3.7091064453125, -3.52880859375, -3.3485107421875, -3.168212890625, -2.9879150390625, -2.8076171875, -2.6273193359375, -2.447021484375, -2.2667236328125, -2.08642578125, -1.9061279296875, -1.725830078125, -1.5455322265625, -1.365234375, -1.1849365234375, -1.004638671875, -0.8243408203125, -0.64404296875, -0.4637451171875, -0.283447265625, -0.1031494140625, 0.0771484375, 0.2574462890625, 0.437744140625, 0.6180419921875, 0.79833984375, 0.9786376953125, 1.158935546875, 1.3392333984375, 1.51953125, 1.6998291015625, 1.880126953125, 2.0604248046875, 2.24072265625, 2.4210205078125, 2.601318359375, 2.7816162109375, 2.9619140625, 3.1422119140625, 3.322509765625, 3.5028076171875, 3.68310546875, 3.8634033203125, 4.043701171875, 4.2239990234375, 4.404296875, 4.5845947265625, 4.764892578125, 4.9451904296875, 5.12548828125, 5.3057861328125, 5.486083984375, 5.6663818359375, 5.8466796875, 6.0269775390625, 6.207275390625, 6.3875732421875, 6.56787109375, 6.7481689453125, 6.928466796875, 7.1087646484375, 7.2890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 9.0, 21.0, 34.0, 50.0, 99.0, 179.0, 317.0, 832.0, 2916.0, 40003.0, 4038903.0, 104402.0, 4534.0, 1016.0, 445.0, 235.0, 123.0, 62.0, 31.0, 20.0, 18.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.640625, -28.7587890625, -27.876953125, -26.9951171875, -26.11328125, -25.2314453125, -24.349609375, -23.4677734375, -22.5859375, -21.7041015625, -20.822265625, -19.9404296875, -19.05859375, -18.1767578125, -17.294921875, -16.4130859375, -15.53125, -14.6494140625, -13.767578125, -12.8857421875, -12.00390625, -11.1220703125, -10.240234375, -9.3583984375, -8.4765625, -7.5947265625, -6.712890625, -5.8310546875, -4.94921875, -4.0673828125, -3.185546875, -2.3037109375, -1.421875, -0.5400390625, 0.341796875, 1.2236328125, 2.10546875, 2.9873046875, 3.869140625, 4.7509765625, 5.6328125, 6.5146484375, 7.396484375, 8.2783203125, 9.16015625, 10.0419921875, 10.923828125, 11.8056640625, 12.6875, 13.5693359375, 14.451171875, 15.3330078125, 16.21484375, 17.0966796875, 17.978515625, 18.8603515625, 19.7421875, 20.6240234375, 21.505859375, 22.3876953125, 23.26953125, 24.1513671875, 25.033203125, 25.9150390625, 26.796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 7.0, 16.0, 31.0, 41.0, 71.0, 153.0, 431.0, 939.0, 1214.0, 637.0, 272.0, 126.0, 53.0, 26.0, 16.0, 11.0, 9.0, 10.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.9375, -19.338623046875, -18.73974609375, -18.140869140625, -17.5419921875, -16.943115234375, -16.34423828125, -15.745361328125, -15.146484375, -14.547607421875, -13.94873046875, -13.349853515625, -12.7509765625, -12.152099609375, -11.55322265625, -10.954345703125, -10.35546875, -9.756591796875, -9.15771484375, -8.558837890625, -7.9599609375, -7.361083984375, -6.76220703125, -6.163330078125, -5.564453125, -4.965576171875, -4.36669921875, -3.767822265625, -3.1689453125, -2.570068359375, -1.97119140625, -1.372314453125, -0.7734375, -0.174560546875, 0.42431640625, 1.023193359375, 1.6220703125, 2.220947265625, 2.81982421875, 3.418701171875, 4.017578125, 4.616455078125, 5.21533203125, 5.814208984375, 6.4130859375, 7.011962890625, 7.61083984375, 8.209716796875, 8.80859375, 9.407470703125, 10.00634765625, 10.605224609375, 11.2041015625, 11.802978515625, 12.40185546875, 13.000732421875, 13.599609375, 14.198486328125, 14.79736328125, 15.396240234375, 15.9951171875, 16.593994140625, 17.19287109375, 17.791748046875, 18.390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 10.0, 10.0, 37.0, 78.0, 169.0, 262.0, 234.0, 109.0, 53.0, 16.0, 10.0, 11.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.4344940185547, -149.5614776611328, -144.68846130371094, -139.81544494628906, -134.9424285888672, -130.0694122314453, -125.19640350341797, -120.3233871459961, -115.45037078857422, -110.57735443115234, -105.70433807373047, -100.8313217163086, -95.95831298828125, -91.08529663085938, -86.2122802734375, -81.33926391601562, -76.46624755859375, -71.59323120117188, -66.72021484375, -61.84720230102539, -56.974185943603516, -52.10116958618164, -47.22815704345703, -42.355140686035156, -37.48212432861328, -32.609107971191406, -27.736093521118164, -22.863079071044922, -17.990062713623047, -13.117046356201172, -8.24403190612793, -3.3710174560546875, 1.50201416015625, 6.375029563903809, 11.248044967651367, 16.12105941772461, 20.994075775146484, 25.86709213256836, 30.7401065826416, 35.613121032714844, 40.48613739013672, 45.359153747558594, 50.23217010498047, 55.10518264770508, 59.97819900512695, 64.85121154785156, 69.72422790527344, 74.59724426269531, 79.47026062011719, 84.34327697753906, 89.21629333496094, 94.08930969238281, 98.96232604980469, 103.83534240722656, 108.7083511352539, 113.58136749267578, 118.45438385009766, 123.32740020751953, 128.20040893554688, 133.07342529296875, 137.94644165039062, 142.8194580078125, 147.69247436523438, 152.56549072265625, 157.43850708007812]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 7.0, 4.0, 6.0, 8.0, 9.0, 12.0, 8.0, 14.0, 23.0, 15.0, 17.0, 12.0, 23.0, 24.0, 24.0, 28.0, 44.0, 42.0, 51.0, 47.0, 47.0, 48.0, 40.0, 35.0, 42.0, 51.0, 42.0, 27.0, 33.0, 27.0, 30.0, 24.0, 24.0, 13.0, 19.0, 8.0, 12.0, 13.0, 12.0, 7.0, 4.0, 8.0, 6.0, 4.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.855377197265625, -44.46354675292969, -43.071712493896484, -41.67987823486328, -40.288047790527344, -38.896217346191406, -37.5043830871582, -36.112548828125, -34.72071838378906, -33.328887939453125, -31.937053680419922, -30.54522132873535, -29.15338897705078, -27.76155662536621, -26.36972427368164, -24.97789192199707, -23.5860595703125, -22.19422721862793, -20.80239486694336, -19.41056251525879, -18.01873016357422, -16.62689781188965, -15.235065460205078, -13.843233108520508, -12.451400756835938, -11.059568405151367, -9.667736053466797, -8.275903701782227, -6.884071350097656, -5.492238998413086, -4.100406646728516, -2.7085742950439453, -1.3167381286621094, 0.07509422302246094, 1.4669265747070312, 2.8587589263916016, 4.250591278076172, 5.642423629760742, 7.0342559814453125, 8.426088333129883, 9.817920684814453, 11.209753036499023, 12.601585388183594, 13.993417739868164, 15.385250091552734, 16.777082443237305, 18.168914794921875, 19.560747146606445, 20.952579498291016, 22.344411849975586, 23.736244201660156, 25.128076553344727, 26.519908905029297, 27.911741256713867, 29.303573608398438, 30.695405960083008, 32.08723831176758, 33.47907257080078, 34.87090301513672, 36.262733459472656, 37.65456771850586, 39.04640197753906, 40.438232421875, 41.83006286621094, 43.22189712524414]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 10.0, 21.0, 19.0, 28.0, 47.0, 47.0, 84.0, 117.0, 207.0, 342.0, 601.0, 1119.0, 2016.0, 3958.0, 8105.0, 18228.0, 44034.0, 116403.0, 302669.0, 330459.0, 131433.0, 49698.0, 20584.0, 9044.0, 4273.0, 2216.0, 1142.0, 635.0, 395.0, 228.0, 139.0, 103.0, 50.0, 24.0, 20.0, 17.0, 12.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.49615478515625, -5.2852783203125, -5.07440185546875, -4.863525390625, -4.65264892578125, -4.4417724609375, -4.23089599609375, -4.02001953125, -3.80914306640625, -3.5982666015625, -3.38739013671875, -3.176513671875, -2.96563720703125, -2.7547607421875, -2.54388427734375, -2.3330078125, -2.12213134765625, -1.9112548828125, -1.70037841796875, -1.489501953125, -1.27862548828125, -1.0677490234375, -0.85687255859375, -0.64599609375, -0.43511962890625, -0.2242431640625, -0.01336669921875, 0.197509765625, 0.40838623046875, 0.6192626953125, 0.83013916015625, 1.041015625, 1.25189208984375, 1.4627685546875, 1.67364501953125, 1.884521484375, 2.09539794921875, 2.3062744140625, 2.51715087890625, 2.72802734375, 2.93890380859375, 3.1497802734375, 3.36065673828125, 3.571533203125, 3.78240966796875, 3.9932861328125, 4.20416259765625, 4.4150390625, 4.62591552734375, 4.8367919921875, 5.04766845703125, 5.258544921875, 5.46942138671875, 5.6802978515625, 5.89117431640625, 6.10205078125, 6.31292724609375, 6.5238037109375, 6.73468017578125, 6.945556640625, 7.15643310546875, 7.3673095703125, 7.57818603515625, 7.7890625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 2.0, 7.0, 6.0, 13.0, 9.0, 17.0, 18.0, 23.0, 27.0, 33.0, 27.0, 30.0, 53.0, 54.0, 36.0, 67.0, 36.0, 62.0, 66.0, 53.0, 50.0, 29.0, 48.0, 40.0, 34.0, 34.0, 20.0, 25.0, 16.0, 15.0, 19.0, 11.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.736328125, -3.564178466796875, -3.39202880859375, -3.219879150390625, -3.0477294921875, -2.875579833984375, -2.70343017578125, -2.531280517578125, -2.359130859375, -2.186981201171875, -2.01483154296875, -1.842681884765625, -1.6705322265625, -1.498382568359375, -1.32623291015625, -1.154083251953125, -0.98193359375, -0.809783935546875, -0.63763427734375, -0.465484619140625, -0.2933349609375, -0.121185302734375, 0.05096435546875, 0.223114013671875, 0.395263671875, 0.567413330078125, 0.73956298828125, 0.911712646484375, 1.0838623046875, 1.256011962890625, 1.42816162109375, 1.600311279296875, 1.7724609375, 1.944610595703125, 2.11676025390625, 2.288909912109375, 2.4610595703125, 2.633209228515625, 2.80535888671875, 2.977508544921875, 3.149658203125, 3.321807861328125, 3.49395751953125, 3.666107177734375, 3.8382568359375, 4.010406494140625, 4.18255615234375, 4.354705810546875, 4.52685546875, 4.699005126953125, 4.87115478515625, 5.043304443359375, 5.2154541015625, 5.387603759765625, 5.55975341796875, 5.731903076171875, 5.904052734375, 6.076202392578125, 6.24835205078125, 6.420501708984375, 6.5926513671875, 6.764801025390625, 6.93695068359375, 7.109100341796875, 7.28125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 14.0, 13.0, 15.0, 22.0, 40.0, 43.0, 49.0, 76.0, 104.0, 167.0, 225.0, 333.0, 506.0, 813.0, 1433.0, 3047.0, 8825.0, 39702.0, 567602.0, 372852.0, 37637.0, 8285.0, 3057.0, 1386.0, 814.0, 477.0, 317.0, 198.0, 150.0, 106.0, 55.0, 53.0, 35.0, 25.0, 17.0, 19.0, 12.0, 8.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.390625, -11.963134765625, -11.53564453125, -11.108154296875, -10.6806640625, -10.253173828125, -9.82568359375, -9.398193359375, -8.970703125, -8.543212890625, -8.11572265625, -7.688232421875, -7.2607421875, -6.833251953125, -6.40576171875, -5.978271484375, -5.55078125, -5.123291015625, -4.69580078125, -4.268310546875, -3.8408203125, -3.413330078125, -2.98583984375, -2.558349609375, -2.130859375, -1.703369140625, -1.27587890625, -0.848388671875, -0.4208984375, 0.006591796875, 0.43408203125, 0.861572265625, 1.2890625, 1.716552734375, 2.14404296875, 2.571533203125, 2.9990234375, 3.426513671875, 3.85400390625, 4.281494140625, 4.708984375, 5.136474609375, 5.56396484375, 5.991455078125, 6.4189453125, 6.846435546875, 7.27392578125, 7.701416015625, 8.12890625, 8.556396484375, 8.98388671875, 9.411376953125, 9.8388671875, 10.266357421875, 10.69384765625, 11.121337890625, 11.548828125, 11.976318359375, 12.40380859375, 12.831298828125, 13.2587890625, 13.686279296875, 14.11376953125, 14.541259765625, 14.96875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 10.0, 11.0, 5.0, 12.0, 12.0, 27.0, 26.0, 31.0, 45.0, 45.0, 48.0, 52.0, 57.0, 76.0, 66.0, 57.0, 57.0, 62.0, 47.0, 42.0, 40.0, 29.0, 33.0, 21.0, 17.0, 9.0, 8.0, 12.0, 13.0, 10.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.301025390625, -17.61767578125, -16.934326171875, -16.2509765625, -15.567626953125, -14.88427734375, -14.200927734375, -13.517578125, -12.834228515625, -12.15087890625, -11.467529296875, -10.7841796875, -10.100830078125, -9.41748046875, -8.734130859375, -8.05078125, -7.367431640625, -6.68408203125, -6.000732421875, -5.3173828125, -4.634033203125, -3.95068359375, -3.267333984375, -2.583984375, -1.900634765625, -1.21728515625, -0.533935546875, 0.1494140625, 0.832763671875, 1.51611328125, 2.199462890625, 2.8828125, 3.566162109375, 4.24951171875, 4.932861328125, 5.6162109375, 6.299560546875, 6.98291015625, 7.666259765625, 8.349609375, 9.032958984375, 9.71630859375, 10.399658203125, 11.0830078125, 11.766357421875, 12.44970703125, 13.133056640625, 13.81640625, 14.499755859375, 15.18310546875, 15.866455078125, 16.5498046875, 17.233154296875, 17.91650390625, 18.599853515625, 19.283203125, 19.966552734375, 20.64990234375, 21.333251953125, 22.0166015625, 22.699951171875, 23.38330078125, 24.066650390625, 24.75]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 10.0, 13.0, 19.0, 31.0, 52.0, 70.0, 131.0, 283.0, 606.0, 2123.0, 11576.0, 183989.0, 821315.0, 23349.0, 3341.0, 871.0, 341.0, 167.0, 88.0, 56.0, 43.0, 24.0, 21.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.06463623046875, -5.8870849609375, -5.70953369140625, -5.531982421875, -5.35443115234375, -5.1768798828125, -4.99932861328125, -4.82177734375, -4.64422607421875, -4.4666748046875, -4.28912353515625, -4.111572265625, -3.93402099609375, -3.7564697265625, -3.57891845703125, -3.4013671875, -3.22381591796875, -3.0462646484375, -2.86871337890625, -2.691162109375, -2.51361083984375, -2.3360595703125, -2.15850830078125, -1.98095703125, -1.80340576171875, -1.6258544921875, -1.44830322265625, -1.270751953125, -1.09320068359375, -0.9156494140625, -0.73809814453125, -0.560546875, -0.38299560546875, -0.2054443359375, -0.02789306640625, 0.149658203125, 0.32720947265625, 0.5047607421875, 0.68231201171875, 0.85986328125, 1.03741455078125, 1.2149658203125, 1.39251708984375, 1.570068359375, 1.74761962890625, 1.9251708984375, 2.10272216796875, 2.2802734375, 2.45782470703125, 2.6353759765625, 2.81292724609375, 2.990478515625, 3.16802978515625, 3.3455810546875, 3.52313232421875, 3.70068359375, 3.87823486328125, 4.0557861328125, 4.23333740234375, 4.410888671875, 4.58843994140625, 4.7659912109375, 4.94354248046875, 5.12109375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 8.0, 11.0, 22.0, 45.0, 92.0, 355.0, 253.0, 82.0, 48.0, 24.0, 15.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002925872802734375, -0.0028340518474578857, -0.0027422308921813965, -0.0026504099369049072, -0.002558588981628418, -0.0024667680263519287, -0.0023749470710754395, -0.00228312611579895, -0.002191305160522461, -0.0020994842052459717, -0.0020076632499694824, -0.0019158422946929932, -0.001824021339416504, -0.0017322003841400146, -0.0016403794288635254, -0.0015485584735870361, -0.0014567375183105469, -0.0013649165630340576, -0.0012730956077575684, -0.001181274652481079, -0.0010894536972045898, -0.0009976327419281006, -0.0009058117866516113, -0.0008139908313751221, -0.0007221698760986328, -0.0006303489208221436, -0.0005385279655456543, -0.00044670701026916504, -0.0003548860549926758, -0.0002630650997161865, -0.00017124414443969727, -7.942318916320801e-05, 1.239776611328125e-05, 0.00010421872138977051, 0.00019603967666625977, 0.000287860631942749, 0.0003796815872192383, 0.00047150254249572754, 0.0005633234977722168, 0.0006551444530487061, 0.0007469654083251953, 0.0008387863636016846, 0.0009306073188781738, 0.001022428274154663, 0.0011142492294311523, 0.0012060701847076416, 0.0012978911399841309, 0.0013897120952606201, 0.0014815330505371094, 0.0015733540058135986, 0.0016651749610900879, 0.0017569959163665771, 0.0018488168716430664, 0.0019406378269195557, 0.002032458782196045, 0.002124279737472534, 0.0022161006927490234, 0.0023079216480255127, 0.002399742603302002, 0.002491563558578491, 0.0025833845138549805, 0.0026752054691314697, 0.002767026424407959, 0.0028588473796844482, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 12.0, 34.0, 45.0, 48.0, 82.0, 108.0, 210.0, 312.0, 537.0, 1038.0, 2166.0, 5757.0, 18507.0, 86569.0, 742341.0, 149409.0, 27861.0, 7715.0, 2833.0, 1264.0, 669.0, 386.0, 250.0, 131.0, 91.0, 53.0, 43.0, 25.0, 12.0, 10.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.417938232421875, -3.31634521484375, -3.214752197265625, -3.1131591796875, -3.011566162109375, -2.90997314453125, -2.808380126953125, -2.706787109375, -2.605194091796875, -2.50360107421875, -2.402008056640625, -2.3004150390625, -2.198822021484375, -2.09722900390625, -1.995635986328125, -1.89404296875, -1.792449951171875, -1.69085693359375, -1.589263916015625, -1.4876708984375, -1.386077880859375, -1.28448486328125, -1.182891845703125, -1.081298828125, -0.979705810546875, -0.87811279296875, -0.776519775390625, -0.6749267578125, -0.573333740234375, -0.47174072265625, -0.370147705078125, -0.2685546875, -0.166961669921875, -0.06536865234375, 0.036224365234375, 0.1378173828125, 0.239410400390625, 0.34100341796875, 0.442596435546875, 0.544189453125, 0.645782470703125, 0.74737548828125, 0.848968505859375, 0.9505615234375, 1.052154541015625, 1.15374755859375, 1.255340576171875, 1.35693359375, 1.458526611328125, 1.56011962890625, 1.661712646484375, 1.7633056640625, 1.864898681640625, 1.96649169921875, 2.068084716796875, 2.169677734375, 2.271270751953125, 2.37286376953125, 2.474456787109375, 2.5760498046875, 2.677642822265625, 2.77923583984375, 2.880828857421875, 2.982421875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 12.0, 5.0, 11.0, 14.0, 20.0, 25.0, 46.0, 56.0, 68.0, 89.0, 132.0, 139.0, 113.0, 69.0, 50.0, 23.0, 32.0, 26.0, 15.0, 21.0, 11.0, 12.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.875335693359375, -4.75067138671875, -4.626007080078125, -4.5013427734375, -4.376678466796875, -4.25201416015625, -4.127349853515625, -4.002685546875, -3.878021240234375, -3.75335693359375, -3.628692626953125, -3.5040283203125, -3.379364013671875, -3.25469970703125, -3.130035400390625, -3.00537109375, -2.880706787109375, -2.75604248046875, -2.631378173828125, -2.5067138671875, -2.382049560546875, -2.25738525390625, -2.132720947265625, -2.008056640625, -1.883392333984375, -1.75872802734375, -1.634063720703125, -1.5093994140625, -1.384735107421875, -1.26007080078125, -1.135406494140625, -1.0107421875, -0.886077880859375, -0.76141357421875, -0.636749267578125, -0.5120849609375, -0.387420654296875, -0.26275634765625, -0.138092041015625, -0.013427734375, 0.111236572265625, 0.23590087890625, 0.360565185546875, 0.4852294921875, 0.609893798828125, 0.73455810546875, 0.859222412109375, 0.98388671875, 1.108551025390625, 1.23321533203125, 1.357879638671875, 1.4825439453125, 1.607208251953125, 1.73187255859375, 1.856536865234375, 1.981201171875, 2.105865478515625, 2.23052978515625, 2.355194091796875, 2.4798583984375, 2.604522705078125, 2.72918701171875, 2.853851318359375, 2.978515625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 13.0, 36.0, 88.0, 422.0, 321.0, 79.0, 24.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.60452270507812, -99.35810852050781, -93.1116943359375, -86.86528015136719, -80.6188735961914, -74.3724594116211, -68.12604522705078, -61.879634857177734, -55.63322067260742, -49.38680648803711, -43.14039611816406, -36.89398193359375, -30.64756965637207, -24.40115737915039, -18.154743194580078, -11.908332824707031, -5.661918640136719, 0.5844941139221191, 6.830906867980957, 13.077320098876953, 19.323732376098633, 25.570144653320312, 31.816558837890625, 38.06296920776367, 44.309383392333984, 50.5557975769043, 56.802207946777344, 63.048622131347656, 69.29503631591797, 75.54144287109375, 81.78785705566406, 88.03427124023438, 94.28068542480469, 100.527099609375, 106.77351379394531, 113.01992797851562, 119.2663345336914, 125.51274871826172, 131.7591552734375, 138.0055694580078, 144.25198364257812, 150.49839782714844, 156.74481201171875, 162.99122619628906, 169.23764038085938, 175.48403930664062, 181.73046875, 187.97686767578125, 194.22329711914062, 200.46971130371094, 206.71612548828125, 212.96253967285156, 219.20895385742188, 225.45535278320312, 231.7017822265625, 237.94818115234375, 244.19459533691406, 250.44100952148438, 256.6874084472656, 262.933837890625, 269.18023681640625, 275.4266662597656, 281.6730651855469, 287.91949462890625, 294.1658935546875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 6.0, 13.0, 13.0, 12.0, 16.0, 17.0, 31.0, 24.0, 34.0, 34.0, 37.0, 41.0, 41.0, 112.0, 139.0, 80.0, 40.0, 35.0, 29.0, 20.0, 30.0, 20.0, 19.0, 28.0, 18.0, 14.0, 17.0, 10.0, 9.0, 10.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-90.8123550415039, -88.3792495727539, -85.94615173339844, -83.51304626464844, -81.07994842529297, -78.64684295654297, -76.2137451171875, -73.7806396484375, -71.3475341796875, -68.9144287109375, -66.48133087158203, -64.04822540283203, -61.61512756347656, -59.18202209472656, -56.74892044067383, -54.315818786621094, -51.882720947265625, -49.44961929321289, -47.016517639160156, -44.58341598510742, -42.15031433105469, -39.71720886230469, -37.28410720825195, -34.85100555419922, -32.417903900146484, -29.98480224609375, -27.551700592041016, -25.11859703063965, -22.685495376586914, -20.25239372253418, -17.819290161132812, -15.386188507080078, -12.953079223632812, -10.519977569580078, -8.086874961853027, -5.653772830963135, -3.220670700073242, -0.7875690460205078, 1.645533561706543, 4.078636169433594, 6.511737823486328, 8.944839477539062, 11.377942085266113, 13.811044692993164, 16.2441463470459, 18.677248001098633, 21.1103515625, 23.543453216552734, 25.97655487060547, 28.409656524658203, 30.842758178710938, 33.27585983276367, 35.708961486816406, 38.142066955566406, 40.57516860961914, 43.008270263671875, 45.44137191772461, 47.874473571777344, 50.30757522583008, 52.74067687988281, 55.17378234863281, 57.60688018798828, 60.03998565673828, 62.473087310791016, 64.90618896484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 9.0, 30.0, 30.0, 38.0, 66.0, 116.0, 196.0, 310.0, 463.0, 780.0, 1394.0, 2379.0, 5171.0, 10946.0, 29807.0, 123403.0, 683168.0, 2138630.0, 964113.0, 173154.0, 36361.0, 12033.0, 5245.0, 2577.0, 1480.0, 858.0, 555.0, 341.0, 225.0, 128.0, 87.0, 48.0, 45.0, 23.0, 20.0, 11.0, 8.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1796875, -5.955810546875, -5.73193359375, -5.508056640625, -5.2841796875, -5.060302734375, -4.83642578125, -4.612548828125, -4.388671875, -4.164794921875, -3.94091796875, -3.717041015625, -3.4931640625, -3.269287109375, -3.04541015625, -2.821533203125, -2.59765625, -2.373779296875, -2.14990234375, -1.926025390625, -1.7021484375, -1.478271484375, -1.25439453125, -1.030517578125, -0.806640625, -0.582763671875, -0.35888671875, -0.135009765625, 0.0888671875, 0.312744140625, 0.53662109375, 0.760498046875, 0.984375, 1.208251953125, 1.43212890625, 1.656005859375, 1.8798828125, 2.103759765625, 2.32763671875, 2.551513671875, 2.775390625, 2.999267578125, 3.22314453125, 3.447021484375, 3.6708984375, 3.894775390625, 4.11865234375, 4.342529296875, 4.56640625, 4.790283203125, 5.01416015625, 5.238037109375, 5.4619140625, 5.685791015625, 5.90966796875, 6.133544921875, 6.357421875, 6.581298828125, 6.80517578125, 7.029052734375, 7.2529296875, 7.476806640625, 7.70068359375, 7.924560546875, 8.1484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 9.0, 15.0, 20.0, 23.0, 29.0, 26.0, 29.0, 31.0, 54.0, 37.0, 56.0, 67.0, 65.0, 59.0, 63.0, 55.0, 50.0, 52.0, 47.0, 45.0, 28.0, 25.0, 14.0, 19.0, 14.0, 22.0, 8.0, 12.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.548431396484375, -3.37615966796875, -3.203887939453125, -3.0316162109375, -2.859344482421875, -2.68707275390625, -2.514801025390625, -2.342529296875, -2.170257568359375, -1.99798583984375, -1.825714111328125, -1.6534423828125, -1.481170654296875, -1.30889892578125, -1.136627197265625, -0.96435546875, -0.792083740234375, -0.61981201171875, -0.447540283203125, -0.2752685546875, -0.102996826171875, 0.06927490234375, 0.241546630859375, 0.413818359375, 0.586090087890625, 0.75836181640625, 0.930633544921875, 1.1029052734375, 1.275177001953125, 1.44744873046875, 1.619720458984375, 1.7919921875, 1.964263916015625, 2.13653564453125, 2.308807373046875, 2.4810791015625, 2.653350830078125, 2.82562255859375, 2.997894287109375, 3.170166015625, 3.342437744140625, 3.51470947265625, 3.686981201171875, 3.8592529296875, 4.031524658203125, 4.20379638671875, 4.376068115234375, 4.54833984375, 4.720611572265625, 4.89288330078125, 5.065155029296875, 5.2374267578125, 5.409698486328125, 5.58197021484375, 5.754241943359375, 5.926513671875, 6.098785400390625, 6.27105712890625, 6.443328857421875, 6.6156005859375, 6.787872314453125, 6.96014404296875, 7.132415771484375, 7.3046875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 18.0, 39.0, 58.0, 147.0, 308.0, 783.0, 6136.0, 4172055.0, 13003.0, 1059.0, 375.0, 157.0, 66.0, 31.0, 23.0, 11.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-96.75, -93.869140625, -90.98828125, -88.107421875, -85.2265625, -82.345703125, -79.46484375, -76.583984375, -73.703125, -70.822265625, -67.94140625, -65.060546875, -62.1796875, -59.298828125, -56.41796875, -53.537109375, -50.65625, -47.775390625, -44.89453125, -42.013671875, -39.1328125, -36.251953125, -33.37109375, -30.490234375, -27.609375, -24.728515625, -21.84765625, -18.966796875, -16.0859375, -13.205078125, -10.32421875, -7.443359375, -4.5625, -1.681640625, 1.19921875, 4.080078125, 6.9609375, 9.841796875, 12.72265625, 15.603515625, 18.484375, 21.365234375, 24.24609375, 27.126953125, 30.0078125, 32.888671875, 35.76953125, 38.650390625, 41.53125, 44.412109375, 47.29296875, 50.173828125, 53.0546875, 55.935546875, 58.81640625, 61.697265625, 64.578125, 67.458984375, 70.33984375, 73.220703125, 76.1015625, 78.982421875, 81.86328125, 84.744140625, 87.625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 15.0, 22.0, 65.0, 154.0, 337.0, 1228.0, 1524.0, 441.0, 143.0, 72.0, 37.0, 23.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.578125, -15.314208984375, -14.05029296875, -12.786376953125, -11.5224609375, -10.258544921875, -8.99462890625, -7.730712890625, -6.466796875, -5.202880859375, -3.93896484375, -2.675048828125, -1.4111328125, -0.147216796875, 1.11669921875, 2.380615234375, 3.64453125, 4.908447265625, 6.17236328125, 7.436279296875, 8.7001953125, 9.964111328125, 11.22802734375, 12.491943359375, 13.755859375, 15.019775390625, 16.28369140625, 17.547607421875, 18.8115234375, 20.075439453125, 21.33935546875, 22.603271484375, 23.8671875, 25.131103515625, 26.39501953125, 27.658935546875, 28.9228515625, 30.186767578125, 31.45068359375, 32.714599609375, 33.978515625, 35.242431640625, 36.50634765625, 37.770263671875, 39.0341796875, 40.298095703125, 41.56201171875, 42.825927734375, 44.08984375, 45.353759765625, 46.61767578125, 47.881591796875, 49.1455078125, 50.409423828125, 51.67333984375, 52.937255859375, 54.201171875, 55.465087890625, 56.72900390625, 57.992919921875, 59.2568359375, 60.520751953125, 61.78466796875, 63.048583984375, 64.3125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 11.0, 12.0, 25.0, 56.0, 104.0, 253.0, 262.0, 142.0, 54.0, 31.0, 17.0, 7.0, 4.0, 5.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.2028503417969, -248.6716766357422, -239.1405029296875, -229.6093292236328, -220.07815551757812, -210.54698181152344, -201.01580810546875, -191.48463439941406, -181.95346069335938, -172.4222869873047, -162.89111328125, -153.3599395751953, -143.82876586914062, -134.29759216308594, -124.76641845703125, -115.23524475097656, -105.70407104492188, -96.17289733886719, -86.6417236328125, -77.11054992675781, -67.57937622070312, -58.04820251464844, -48.51702880859375, -38.98585510253906, -29.454681396484375, -19.923507690429688, -10.392333984375, -0.8611602783203125, 8.670013427734375, 18.201187133789062, 27.73236083984375, 37.26353454589844, 46.794677734375, 56.32585144042969, 65.85702514648438, 75.38819885253906, 84.91937255859375, 94.45054626464844, 103.98171997070312, 113.51289367675781, 123.0440673828125, 132.5752410888672, 142.10641479492188, 151.63758850097656, 161.16876220703125, 170.69993591308594, 180.23110961914062, 189.7622833251953, 199.29345703125, 208.8246307373047, 218.35580444335938, 227.88697814941406, 237.41815185546875, 246.94932556152344, 256.4804992675781, 266.01165771484375, 275.5428466796875, 285.07403564453125, 294.6051940917969, 304.1363525390625, 313.66754150390625, 323.19873046875, 332.7298889160156, 342.26104736328125, 351.792236328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 4.0, 8.0, 10.0, 10.0, 15.0, 16.0, 26.0, 22.0, 35.0, 33.0, 36.0, 51.0, 49.0, 59.0, 57.0, 63.0, 70.0, 52.0, 55.0, 38.0, 41.0, 44.0, 27.0, 32.0, 31.0, 18.0, 8.0, 11.0, 16.0, 9.0, 6.0, 6.0, 7.0, 6.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-110.79570007324219, -107.67374420166016, -104.5517807006836, -101.42982482910156, -98.30786895751953, -95.18590545654297, -92.06394958496094, -88.94198608398438, -85.82003021240234, -82.69807434082031, -79.57611083984375, -76.45415496826172, -73.33219909667969, -70.21023559570312, -67.0882797241211, -63.9663200378418, -60.844364166259766, -57.72240447998047, -54.60044860839844, -51.47848892211914, -48.356529235839844, -45.23457336425781, -42.112613677978516, -38.99065399169922, -35.86869812011719, -32.74673843383789, -29.624780654907227, -26.502822875976562, -23.380863189697266, -20.2589054107666, -17.136947631835938, -14.01498794555664, -10.893028259277344, -7.771069526672363, -4.649111270904541, -1.5271530151367188, 1.5948057174682617, 4.716764450073242, 7.838722229003906, 10.960681915283203, 14.082639694213867, 17.20459747314453, 20.326557159423828, 23.448514938354492, 26.570472717285156, 29.692432403564453, 32.81439208984375, 35.93634796142578, 39.05830764770508, 42.180267333984375, 45.302223205566406, 48.4241828918457, 51.546142578125, 54.66809844970703, 57.79005813598633, 60.912017822265625, 64.03397369384766, 67.15592956542969, 70.27789306640625, 73.39984893798828, 76.52180480957031, 79.64376831054688, 82.7657241821289, 85.88768005371094, 89.0096435546875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 20.0, 15.0, 36.0, 64.0, 115.0, 185.0, 314.0, 572.0, 1275.0, 2944.0, 7417.0, 23731.0, 97618.0, 518671.0, 309803.0, 60109.0, 16073.0, 5306.0, 2155.0, 1025.0, 470.0, 262.0, 151.0, 81.0, 56.0, 22.0, 26.0, 11.0, 8.0, 3.0, 5.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.7010498046875, -9.386474609375, -9.0718994140625, -8.75732421875, -8.4427490234375, -8.128173828125, -7.8135986328125, -7.4990234375, -7.1844482421875, -6.869873046875, -6.5552978515625, -6.24072265625, -5.9261474609375, -5.611572265625, -5.2969970703125, -4.982421875, -4.6678466796875, -4.353271484375, -4.0386962890625, -3.72412109375, -3.4095458984375, -3.094970703125, -2.7803955078125, -2.4658203125, -2.1512451171875, -1.836669921875, -1.5220947265625, -1.20751953125, -0.8929443359375, -0.578369140625, -0.2637939453125, 0.05078125, 0.3653564453125, 0.679931640625, 0.9945068359375, 1.30908203125, 1.6236572265625, 1.938232421875, 2.2528076171875, 2.5673828125, 2.8819580078125, 3.196533203125, 3.5111083984375, 3.82568359375, 4.1402587890625, 4.454833984375, 4.7694091796875, 5.083984375, 5.3985595703125, 5.713134765625, 6.0277099609375, 6.34228515625, 6.6568603515625, 6.971435546875, 7.2860107421875, 7.6005859375, 7.9151611328125, 8.229736328125, 8.5443115234375, 8.85888671875, 9.1734619140625, 9.488037109375, 9.8026123046875, 10.1171875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 11.0, 8.0, 19.0, 16.0, 20.0, 32.0, 22.0, 28.0, 47.0, 42.0, 48.0, 56.0, 48.0, 54.0, 52.0, 44.0, 54.0, 48.0, 50.0, 40.0, 38.0, 38.0, 36.0, 20.0, 32.0, 23.0, 20.0, 8.0, 11.0, 4.0, 5.0, 5.0, 2.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.5528564453125, -4.363525390625, -4.1741943359375, -3.98486328125, -3.7955322265625, -3.606201171875, -3.4168701171875, -3.2275390625, -3.0382080078125, -2.848876953125, -2.6595458984375, -2.47021484375, -2.2808837890625, -2.091552734375, -1.9022216796875, -1.712890625, -1.5235595703125, -1.334228515625, -1.1448974609375, -0.95556640625, -0.7662353515625, -0.576904296875, -0.3875732421875, -0.1982421875, -0.0089111328125, 0.180419921875, 0.3697509765625, 0.55908203125, 0.7484130859375, 0.937744140625, 1.1270751953125, 1.31640625, 1.5057373046875, 1.695068359375, 1.8843994140625, 2.07373046875, 2.2630615234375, 2.452392578125, 2.6417236328125, 2.8310546875, 3.0203857421875, 3.209716796875, 3.3990478515625, 3.58837890625, 3.7777099609375, 3.967041015625, 4.1563720703125, 4.345703125, 4.5350341796875, 4.724365234375, 4.9136962890625, 5.10302734375, 5.2923583984375, 5.481689453125, 5.6710205078125, 5.8603515625, 6.0496826171875, 6.239013671875, 6.4283447265625, 6.61767578125, 6.8070068359375, 6.996337890625, 7.1856689453125, 7.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 15.0, 17.0, 27.0, 51.0, 92.0, 153.0, 301.0, 697.0, 2612.0, 31794.0, 976215.0, 32624.0, 2625.0, 702.0, 258.0, 142.0, 93.0, 51.0, 20.0, 19.0, 9.0, 7.0, 6.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.64599609375, -13.9951171875, -13.34423828125, -12.693359375, -12.04248046875, -11.3916015625, -10.74072265625, -10.08984375, -9.43896484375, -8.7880859375, -8.13720703125, -7.486328125, -6.83544921875, -6.1845703125, -5.53369140625, -4.8828125, -4.23193359375, -3.5810546875, -2.93017578125, -2.279296875, -1.62841796875, -0.9775390625, -0.32666015625, 0.32421875, 0.97509765625, 1.6259765625, 2.27685546875, 2.927734375, 3.57861328125, 4.2294921875, 4.88037109375, 5.53125, 6.18212890625, 6.8330078125, 7.48388671875, 8.134765625, 8.78564453125, 9.4365234375, 10.08740234375, 10.73828125, 11.38916015625, 12.0400390625, 12.69091796875, 13.341796875, 13.99267578125, 14.6435546875, 15.29443359375, 15.9453125, 16.59619140625, 17.2470703125, 17.89794921875, 18.548828125, 19.19970703125, 19.8505859375, 20.50146484375, 21.15234375, 21.80322265625, 22.4541015625, 23.10498046875, 23.755859375, 24.40673828125, 25.0576171875, 25.70849609375, 26.359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 12.0, 16.0, 18.0, 13.0, 27.0, 34.0, 25.0, 45.0, 56.0, 48.0, 78.0, 81.0, 84.0, 75.0, 64.0, 59.0, 53.0, 39.0, 32.0, 26.0, 15.0, 22.0, 8.0, 8.0, 12.0, 9.0, 5.0, 5.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.6005859375, -22.826171875, -22.0517578125, -21.27734375, -20.5029296875, -19.728515625, -18.9541015625, -18.1796875, -17.4052734375, -16.630859375, -15.8564453125, -15.08203125, -14.3076171875, -13.533203125, -12.7587890625, -11.984375, -11.2099609375, -10.435546875, -9.6611328125, -8.88671875, -8.1123046875, -7.337890625, -6.5634765625, -5.7890625, -5.0146484375, -4.240234375, -3.4658203125, -2.69140625, -1.9169921875, -1.142578125, -0.3681640625, 0.40625, 1.1806640625, 1.955078125, 2.7294921875, 3.50390625, 4.2783203125, 5.052734375, 5.8271484375, 6.6015625, 7.3759765625, 8.150390625, 8.9248046875, 9.69921875, 10.4736328125, 11.248046875, 12.0224609375, 12.796875, 13.5712890625, 14.345703125, 15.1201171875, 15.89453125, 16.6689453125, 17.443359375, 18.2177734375, 18.9921875, 19.7666015625, 20.541015625, 21.3154296875, 22.08984375, 22.8642578125, 23.638671875, 24.4130859375, 25.1875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 8.0, 9.0, 31.0, 32.0, 39.0, 93.0, 164.0, 365.0, 1178.0, 4209.0, 43470.0, 975733.0, 18897.0, 2793.0, 807.0, 328.0, 163.0, 69.0, 44.0, 26.0, 18.0, 11.0, 8.0, 6.0, 12.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.798828125, -3.677703857421875, -3.55657958984375, -3.435455322265625, -3.3143310546875, -3.193206787109375, -3.07208251953125, -2.950958251953125, -2.829833984375, -2.708709716796875, -2.58758544921875, -2.466461181640625, -2.3453369140625, -2.224212646484375, -2.10308837890625, -1.981964111328125, -1.86083984375, -1.739715576171875, -1.61859130859375, -1.497467041015625, -1.3763427734375, -1.255218505859375, -1.13409423828125, -1.012969970703125, -0.891845703125, -0.770721435546875, -0.64959716796875, -0.528472900390625, -0.4073486328125, -0.286224365234375, -0.16510009765625, -0.043975830078125, 0.0771484375, 0.198272705078125, 0.31939697265625, 0.440521240234375, 0.5616455078125, 0.682769775390625, 0.80389404296875, 0.925018310546875, 1.046142578125, 1.167266845703125, 1.28839111328125, 1.409515380859375, 1.5306396484375, 1.651763916015625, 1.77288818359375, 1.894012451171875, 2.01513671875, 2.136260986328125, 2.25738525390625, 2.378509521484375, 2.4996337890625, 2.620758056640625, 2.74188232421875, 2.863006591796875, 2.984130859375, 3.105255126953125, 3.22637939453125, 3.347503662109375, 3.4686279296875, 3.589752197265625, 3.71087646484375, 3.832000732421875, 3.953125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 9.0, 14.0, 20.0, 35.0, 55.0, 100.0, 214.0, 235.0, 126.0, 69.0, 35.0, 23.0, 19.0, 8.0, 2.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013141632080078125, -0.0012768208980560303, -0.001239478588104248, -0.0012021362781524658, -0.0011647939682006836, -0.0011274516582489014, -0.0010901093482971191, -0.001052767038345337, -0.0010154247283935547, -0.0009780824184417725, -0.0009407401084899902, -0.000903397798538208, -0.0008660554885864258, -0.0008287131786346436, -0.0007913708686828613, -0.0007540285587310791, -0.0007166862487792969, -0.0006793439388275146, -0.0006420016288757324, -0.0006046593189239502, -0.000567317008972168, -0.0005299746990203857, -0.0004926323890686035, -0.0004552900791168213, -0.00041794776916503906, -0.00038060545921325684, -0.0003432631492614746, -0.0003059208393096924, -0.00026857852935791016, -0.00023123621940612793, -0.0001938939094543457, -0.00015655159950256348, -0.00011920928955078125, -8.186697959899902e-05, -4.45246696472168e-05, -7.18235969543457e-06, 3.0159950256347656e-05, 6.750226020812988e-05, 0.00010484457015991211, 0.00014218688011169434, 0.00017952919006347656, 0.0002168715000152588, 0.000254213809967041, 0.00029155611991882324, 0.00032889842987060547, 0.0003662407398223877, 0.0004035830497741699, 0.00044092535972595215, 0.0004782676696777344, 0.0005156099796295166, 0.0005529522895812988, 0.0005902945995330811, 0.0006276369094848633, 0.0006649792194366455, 0.0007023215293884277, 0.00073966383934021, 0.0007770061492919922, 0.0008143484592437744, 0.0008516907691955566, 0.0008890330791473389, 0.0009263753890991211, 0.0009637176990509033, 0.0010010600090026855, 0.0010384023189544678, 0.00107574462890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 8.0, 7.0, 10.0, 10.0, 25.0, 37.0, 73.0, 117.0, 208.0, 348.0, 656.0, 1277.0, 2940.0, 8088.0, 35104.0, 828042.0, 145253.0, 17263.0, 5012.0, 1929.0, 974.0, 513.0, 259.0, 165.0, 86.0, 45.0, 35.0, 19.0, 13.0, 11.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.3984375, -2.32745361328125, -2.2564697265625, -2.18548583984375, -2.114501953125, -2.04351806640625, -1.9725341796875, -1.90155029296875, -1.83056640625, -1.75958251953125, -1.6885986328125, -1.61761474609375, -1.546630859375, -1.47564697265625, -1.4046630859375, -1.33367919921875, -1.2626953125, -1.19171142578125, -1.1207275390625, -1.04974365234375, -0.978759765625, -0.90777587890625, -0.8367919921875, -0.76580810546875, -0.69482421875, -0.62384033203125, -0.5528564453125, -0.48187255859375, -0.410888671875, -0.33990478515625, -0.2689208984375, -0.19793701171875, -0.126953125, -0.05596923828125, 0.0150146484375, 0.08599853515625, 0.156982421875, 0.22796630859375, 0.2989501953125, 0.36993408203125, 0.44091796875, 0.51190185546875, 0.5828857421875, 0.65386962890625, 0.724853515625, 0.79583740234375, 0.8668212890625, 0.93780517578125, 1.0087890625, 1.07977294921875, 1.1507568359375, 1.22174072265625, 1.292724609375, 1.36370849609375, 1.4346923828125, 1.50567626953125, 1.57666015625, 1.64764404296875, 1.7186279296875, 1.78961181640625, 1.860595703125, 1.93157958984375, 2.0025634765625, 2.07354736328125, 2.14453125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 12.0, 15.0, 16.0, 15.0, 30.0, 43.0, 66.0, 80.0, 102.0, 121.0, 92.0, 100.0, 80.0, 59.0, 24.0, 19.0, 22.0, 15.0, 15.0, 2.0, 8.0, 5.0, 2.0, 3.0, 1.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.005859375, -1.9481201171875, -1.890380859375, -1.8326416015625, -1.77490234375, -1.7171630859375, -1.659423828125, -1.6016845703125, -1.5439453125, -1.4862060546875, -1.428466796875, -1.3707275390625, -1.31298828125, -1.2552490234375, -1.197509765625, -1.1397705078125, -1.08203125, -1.0242919921875, -0.966552734375, -0.9088134765625, -0.85107421875, -0.7933349609375, -0.735595703125, -0.6778564453125, -0.6201171875, -0.5623779296875, -0.504638671875, -0.4468994140625, -0.38916015625, -0.3314208984375, -0.273681640625, -0.2159423828125, -0.158203125, -0.1004638671875, -0.042724609375, 0.0150146484375, 0.07275390625, 0.1304931640625, 0.188232421875, 0.2459716796875, 0.3037109375, 0.3614501953125, 0.419189453125, 0.4769287109375, 0.53466796875, 0.5924072265625, 0.650146484375, 0.7078857421875, 0.765625, 0.8233642578125, 0.881103515625, 0.9388427734375, 0.99658203125, 1.0543212890625, 1.112060546875, 1.1697998046875, 1.2275390625, 1.2852783203125, 1.343017578125, 1.4007568359375, 1.45849609375, 1.5162353515625, 1.573974609375, 1.6317138671875, 1.689453125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 32.0, 127.0, 701.0, 105.0, 25.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-204.4772186279297, -197.0380401611328, -189.59886169433594, -182.15968322753906, -174.7205047607422, -167.2813262939453, -159.84214782714844, -152.40296936035156, -144.9637908935547, -137.5246124267578, -130.08543395996094, -122.64625549316406, -115.20707702636719, -107.76789855957031, -100.32872009277344, -92.88954162597656, -85.45036315917969, -78.01118469238281, -70.57200622558594, -63.13282775878906, -55.69364929199219, -48.25447082519531, -40.81529235839844, -33.37611389160156, -25.936935424804688, -18.497756958007812, -11.058578491210938, -3.6194000244140625, 3.8197784423828125, 11.258956909179688, 18.698135375976562, 26.137313842773438, 33.57647705078125, 41.015655517578125, 48.454833984375, 55.894012451171875, 63.33319091796875, 70.77236938476562, 78.2115478515625, 85.65072631835938, 93.08990478515625, 100.52908325195312, 107.96826171875, 115.40744018554688, 122.84661865234375, 130.28579711914062, 137.7249755859375, 145.16415405273438, 152.60333251953125, 160.04251098632812, 167.481689453125, 174.92086791992188, 182.36004638671875, 189.79922485351562, 197.2384033203125, 204.67758178710938, 212.11676025390625, 219.55593872070312, 226.9951171875, 234.43429565429688, 241.87347412109375, 249.31265258789062, 256.7518310546875, 264.1910095214844, 271.63018798828125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 9.0, 10.0, 13.0, 10.0, 22.0, 28.0, 24.0, 30.0, 32.0, 59.0, 117.0, 299.0, 109.0, 36.0, 49.0, 23.0, 31.0, 12.0, 15.0, 19.0, 11.0, 10.0, 6.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.204261779785156, -53.45351791381836, -50.7027702331543, -47.9520263671875, -45.2012825012207, -42.450538635253906, -39.699790954589844, -36.94904708862305, -34.19830322265625, -31.44755744934082, -28.696813583374023, -25.946067810058594, -23.195323944091797, -20.444578170776367, -17.693832397460938, -14.94308853149414, -12.192340850830078, -9.441596031188965, -6.690850734710693, -3.940105438232422, -1.1893606185913086, 1.5613842010498047, 4.312129974365234, 7.062873840332031, 9.813619613647461, 12.564364433288574, 15.315109252929688, 18.065855026245117, 20.816600799560547, 23.567344665527344, 26.318090438842773, 29.06883430480957, 31.819580078125, 34.5703239440918, 37.32107162475586, 40.071815490722656, 42.82255935668945, 45.57330322265625, 48.32405090332031, 51.07479476928711, 53.825538635253906, 56.5762825012207, 59.327030181884766, 62.07777404785156, 64.82852172851562, 67.57926177978516, 70.33000946044922, 73.08074951171875, 75.83149719238281, 78.58224487304688, 81.3329849243164, 84.08373260498047, 86.83448028564453, 89.58522033691406, 92.33596801757812, 95.08671569824219, 97.83746337890625, 100.58821105957031, 103.33895111083984, 106.0896987915039, 108.84044647216797, 111.5911865234375, 114.34193420410156, 117.09268188476562, 119.84342193603516]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 10.0, 22.0, 38.0, 50.0, 56.0, 73.0, 390.0, 148.0, 77.0, 49.0, 26.0, 24.0, 14.0, 11.0, 9.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -5.841552734375, -5.38623046875, -4.930908203125, -4.4755859375, -4.020263671875, -3.56494140625, -3.109619140625, -2.654296875, -2.198974609375, -1.74365234375, -1.288330078125, -0.8330078125, -0.377685546875, 0.07763671875, 0.532958984375, 0.98828125, 1.443603515625, 1.89892578125, 2.354248046875, 2.8095703125, 3.264892578125, 3.72021484375, 4.175537109375, 4.630859375, 5.086181640625, 5.54150390625, 5.996826171875, 6.4521484375, 6.907470703125, 7.36279296875, 7.818115234375, 8.2734375, 8.728759765625, 9.18408203125, 9.639404296875, 10.0947265625, 10.550048828125, 11.00537109375, 11.460693359375, 11.916015625, 12.371337890625, 12.82666015625, 13.281982421875, 13.7373046875, 14.192626953125, 14.64794921875, 15.103271484375, 15.55859375, 16.013916015625, 16.46923828125, 16.924560546875, 17.3798828125, 17.835205078125, 18.29052734375, 18.745849609375, 19.201171875, 19.656494140625, 20.11181640625, 20.567138671875, 21.0224609375, 21.477783203125, 21.93310546875, 22.388427734375, 22.84375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 7.0, 7.0, 10.0, 19.0, 12.0, 12.0, 23.0, 31.0, 66.0, 85.0, 141.0, 260.0, 472.0, 1196.0, 3937.0, 26785.0, 8332886.0, 17267.0, 3247.0, 1051.0, 476.0, 221.0, 117.0, 68.0, 38.0, 36.0, 28.0, 23.0, 5.0, 10.0, 8.0, 4.0, 3.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.35891723632812, -72.37186431884766, -70.38480377197266, -68.39775085449219, -66.41069793701172, -64.42364501953125, -62.436588287353516, -60.44953155517578, -58.46247863769531, -56.47542190551758, -54.48836898803711, -52.501312255859375, -50.514259338378906, -48.52720260620117, -46.5401496887207, -44.55309295654297, -42.5660400390625, -40.578983306884766, -38.5919303894043, -36.60487365722656, -34.617820739746094, -32.63076400756836, -30.64371109008789, -28.656654357910156, -26.669597625732422, -24.68254280090332, -22.69548797607422, -20.708433151245117, -18.721378326416016, -16.73432159423828, -14.747267723083496, -12.760212898254395, -10.77315902709961, -8.786104202270508, -6.799049377441406, -4.8119940757751465, -2.824939250946045, -0.8378839492797852, 1.1491708755493164, 3.136225700378418, 5.1232805252075195, 7.110335350036621, 9.097390174865723, 11.08444595336914, 13.071500778198242, 15.058555603027344, 17.045610427856445, 19.032665252685547, 21.01972007751465, 23.00677490234375, 24.99382972717285, 26.980884552001953, 28.967939376831055, 30.954994201660156, 32.94205093383789, 34.92910385131836, 36.916160583496094, 38.90321731567383, 40.8902702331543, 42.87732696533203, 44.8643798828125, 46.851436614990234, 48.8384895324707, 50.82554626464844, 52.812599182128906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 7.0, 2.0, 12.0, 6.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.6932601928711, -101.4347915649414, -98.17632293701172, -94.9178466796875, -91.65937805175781, -88.40090942382812, -85.14244079589844, -81.88397216796875, -78.62550354003906, -75.36703491210938, -72.10856628417969, -68.85009765625, -65.59162139892578, -62.333152770996094, -59.074684143066406, -55.81621551513672, -52.5577392578125, -49.29927062988281, -46.04079818725586, -42.78232955932617, -39.52385711669922, -36.26538848876953, -33.006919860839844, -29.748449325561523, -26.489978790283203, -23.231508255004883, -19.973037719726562, -16.714569091796875, -13.456098556518555, -10.197628021240234, -6.939159393310547, -3.6806888580322266, -0.42221832275390625, 2.836251735687256, 6.094721794128418, 9.353191375732422, 12.611661911010742, 15.870132446289062, 19.12860107421875, 22.38707160949707, 25.64554214477539, 28.90401268005371, 32.16248321533203, 35.42095184326172, 38.679420471191406, 41.93789291381836, 45.19636154174805, 48.454833984375, 51.71330261230469, 54.971771240234375, 58.23024368286133, 61.488712310791016, 64.74718475341797, 68.00565338134766, 71.26412200927734, 74.52259063720703, 77.78106689453125, 81.03953552246094, 84.29800415039062, 87.55647277832031, 90.81494903564453, 94.07341766357422, 97.3318862915039, 100.5903549194336, 103.84882354736328]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 14.0, 14.0, 12.0, 25.0, 23.0, 30.0, 51.0, 61.0, 100.0, 157.0, 247.0, 389.0, 687.0, 1285.0, 2881.0, 6931.0, 20415.0, 70636.0, 216126.0, 142807.0, 40175.0, 12340.0, 4569.0, 2020.0, 951.0, 511.0, 298.0, 170.0, 108.0, 74.0, 47.0, 27.0, 23.0, 13.0, 8.0, 10.0, 5.0, 3.0, 2.0], "bins": [-84.125, -82.203125, -80.28125, -78.359375, -76.4375, -74.515625, -72.59375, -70.671875, -68.75, -66.828125, -64.90625, -62.984375, -61.0625, -59.140625, -57.21875, -55.296875, -53.375, -51.453125, -49.53125, -47.609375, -45.6875, -43.765625, -41.84375, -39.921875, -38.0, -36.078125, -34.15625, -32.234375, -30.3125, -28.390625, -26.46875, -24.546875, -22.625, -20.703125, -18.78125, -16.859375, -14.9375, -13.015625, -11.09375, -9.171875, -7.25, -5.328125, -3.40625, -1.484375, 0.4375, 2.359375, 4.28125, 6.203125, 8.125, 10.046875, 11.96875, 13.890625, 15.8125, 17.734375, 19.65625, 21.578125, 23.5, 25.421875, 27.34375, 29.265625, 31.1875, 33.109375, 35.03125, 36.953125, 38.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 13.0, 14.0, 22.0, 26.0, 45.0, 59.0, 72.0, 101.0, 112.0, 110.0, 110.0, 113.0, 72.0, 41.0, 47.0, 19.0, 15.0, 5.0, 8.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.4375, -16.0570068359375, -15.676513671875, -15.2960205078125, -14.91552734375, -14.5350341796875, -14.154541015625, -13.7740478515625, -13.3935546875, -13.0130615234375, -12.632568359375, -12.2520751953125, -11.87158203125, -11.4910888671875, -11.110595703125, -10.7301025390625, -10.349609375, -9.9691162109375, -9.588623046875, -9.2081298828125, -8.82763671875, -8.4471435546875, -8.066650390625, -7.6861572265625, -7.3056640625, -6.9251708984375, -6.544677734375, -6.1641845703125, -5.78369140625, -5.4031982421875, -5.022705078125, -4.6422119140625, -4.26171875, -3.8812255859375, -3.500732421875, -3.1202392578125, -2.73974609375, -2.3592529296875, -1.978759765625, -1.5982666015625, -1.2177734375, -0.8372802734375, -0.456787109375, -0.0762939453125, 0.30419921875, 0.6846923828125, 1.065185546875, 1.4456787109375, 1.826171875, 2.2066650390625, 2.587158203125, 2.9676513671875, 3.34814453125, 3.7286376953125, 4.109130859375, 4.4896240234375, 4.8701171875, 5.2506103515625, 5.631103515625, 6.0115966796875, 6.39208984375, 6.7725830078125, 7.153076171875, 7.5335693359375, 7.9140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 5.0, 4.0, 5.0, 14.0, 13.0, 20.0, 18.0, 38.0, 55.0, 78.0, 77.0, 54.0, 35.0, 14.0, 13.0, 16.0, 7.0, 4.0, 1.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.44195556640625, -64.41422271728516, -62.3864860534668, -60.3587532043457, -58.33102035522461, -56.30328369140625, -54.275550842285156, -52.24781799316406, -50.22008514404297, -48.192352294921875, -46.164615631103516, -44.13688278198242, -42.10914993286133, -40.08141326904297, -38.053680419921875, -36.02594757080078, -33.99821090698242, -31.970476150512695, -29.9427433013916, -27.915008544921875, -25.88727569580078, -23.859540939331055, -21.831806182861328, -19.804073333740234, -17.776338577270508, -15.748604774475098, -13.720870971679688, -11.693136215209961, -9.66540241241455, -7.637668609619141, -5.609933853149414, -3.582200050354004, -1.5544700622558594, 0.4732639789581299, 2.500998020172119, 4.5287322998046875, 6.556466102600098, 8.584199905395508, 10.611934661865234, 12.639668464660645, 14.667402267456055, 16.69513702392578, 18.722869873046875, 20.7506046295166, 22.778339385986328, 24.806072235107422, 26.83380699157715, 28.861541748046875, 30.88927459716797, 32.91700744628906, 34.94474411010742, 36.972476959228516, 39.00020980834961, 41.02794647216797, 43.05567932128906, 45.083412170410156, 47.11114501953125, 49.138877868652344, 51.1666145324707, 53.1943473815918, 55.22208023071289, 57.24981689453125, 59.277549743652344, 61.30528259277344, 63.3330192565918]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 14.0, 15.0, 25.0, 34.0, 39.0, 54.0, 60.0, 75.0, 54.0, 34.0, 17.0, 13.0, 5.0, 5.0, 1.0, 4.0, 0.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.305160522460938, -28.190046310424805, -27.074932098388672, -25.959819793701172, -24.84470558166504, -23.729591369628906, -22.614479064941406, -21.499364852905273, -20.38425064086914, -19.269136428833008, -18.154022216796875, -17.038909912109375, -15.923795700073242, -14.80868148803711, -13.693568229675293, -12.578454971313477, -11.463340759277344, -10.348226547241211, -9.233113288879395, -8.118000030517578, -7.002885818481445, -5.887772083282471, -4.772658348083496, -3.6575446128845215, -2.542430877685547, -1.4273171424865723, -0.31220340728759766, 0.802910327911377, 1.9180240631103516, 3.033137798309326, 4.148251533508301, 5.263365268707275, 6.378482818603516, 7.49359655380249, 8.608710289001465, 9.723823547363281, 10.838937759399414, 11.954051971435547, 13.069165229797363, 14.18427848815918, 15.299392700195312, 16.414506912231445, 17.529621124267578, 18.644733428955078, 19.75984764099121, 20.874961853027344, 21.990074157714844, 23.105188369750977, 24.22030258178711, 25.335416793823242, 26.450531005859375, 27.565643310546875, 28.680757522583008, 29.79587173461914, 30.91098403930664, 32.026100158691406, 33.141212463378906, 34.256324768066406, 35.37144088745117, 36.48655319213867, 37.60166931152344, 38.71678161621094, 39.83189392089844, 40.9470100402832, 42.0621223449707]}, "eval/loss": 0.8383785486221313, "eval/wer": 0.1366748020715519, "eval/runtime": 1219.9567, "eval/samples_per_second": 2.166, "eval/steps_per_second": 0.271, "train/train_runtime": 122857.9097, "train/train_samples_per_second": 4.646, "train/train_steps_per_second": 0.145, "train/total_flos": 0.0, "train/train_loss": 2.2609593777487165} \ No newline at end of file