diff --git "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" --- "a/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" +++ "b/wandb/run-20220315_195757-3ex43zbl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.4212, "train/learning_rate": 5.066508313539193e-06, "train/epoch": 16.82, "train/global_step": 15000, "_runtime": 104132, "_timestamp": 1647478409, "_step": 15009, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 7.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 15.0, 44.0, 30345.0, 34.0, 13.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-203.375, -198.9697265625, -194.564453125, -190.1591796875, -185.75390625, -181.3486328125, -176.943359375, -172.5380859375, -168.1328125, -163.7275390625, -159.322265625, -154.9169921875, -150.51171875, -146.1064453125, -141.701171875, -137.2958984375, -132.890625, -128.4853515625, -124.080078125, -119.6748046875, -115.26953125, -110.8642578125, -106.458984375, -102.0537109375, -97.6484375, -93.2431640625, -88.837890625, -84.4326171875, -80.02734375, -75.6220703125, -71.216796875, -66.8115234375, -62.40625, -58.0009765625, -53.595703125, -49.1904296875, -44.78515625, -40.3798828125, -35.974609375, -31.5693359375, -27.1640625, -22.7587890625, -18.353515625, -13.9482421875, -9.54296875, -5.1376953125, -0.732421875, 3.6728515625, 8.078125, 12.4833984375, 16.888671875, 21.2939453125, 25.69921875, 30.1044921875, 34.509765625, 38.9150390625, 43.3203125, 47.7255859375, 52.130859375, 56.5361328125, 60.94140625, 65.3466796875, 69.751953125, 74.1572265625, 78.5625]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 8.0, 1.0, 3.0, 4.0, 10.0, 7.0, 10.0, 9.0, 12.0, 7.0, 13.0, 24.0, 20.0, 24.0, 29.0, 28.0, 33.0, 34.0, 31.0, 37.0, 42.0, 46.0, 41.0, 33.0, 30.0, 37.0, 42.0, 46.0, 29.0, 42.0, 34.0, 31.0, 25.0, 27.0, 28.0, 23.0, 17.0, 16.0, 15.0, 11.0, 7.0, 13.0, 6.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.40045166015625, -48.178958892822266, -46.957462310791016, -45.73596954345703, -44.51447677612305, -43.29298400878906, -42.07148742675781, -40.84999465942383, -39.628501892089844, -38.40700912475586, -37.18551254272461, -35.964019775390625, -34.74252700805664, -33.521034240722656, -32.299537658691406, -31.078044891357422, -29.856548309326172, -28.635053634643555, -27.41356086730957, -26.192066192626953, -24.97057342529297, -23.74907875061035, -22.527584075927734, -21.30609130859375, -20.084596633911133, -18.863101959228516, -17.64160919189453, -16.420114517211914, -15.198620796203613, -13.977127075195312, -12.755632400512695, -11.534138679504395, -10.312644958496094, -9.091151237487793, -7.869657039642334, -6.648162841796875, -5.426669120788574, -4.205175399780273, -2.9836812019348145, -1.7621870040893555, -0.5406932830810547, 0.6808006763458252, 1.902294635772705, 3.123788595199585, 4.345282554626465, 5.566776275634766, 6.788270473480225, 8.009764671325684, 9.231258392333984, 10.452752113342285, 11.674245834350586, 12.895740509033203, 14.117234230041504, 15.338727951049805, 16.560222625732422, 17.781715393066406, 19.003210067749023, 20.22470474243164, 21.446197509765625, 22.667692184448242, 23.88918685913086, 25.110679626464844, 26.33217430114746, 27.553668975830078, 28.775161743164062]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 8.0, 7.0, 3.0, 14.0, 9.0, 9.0, 15.0, 18.0, 15.0, 16.0, 15.0, 26.0, 16.0, 30.0, 32.0, 31.0, 39.0, 43.0, 47.0, 39.0, 41.0, 30.0, 37.0, 38.0, 41.0, 48.0, 50.0, 39.0, 32.0, 38.0, 28.0, 26.0, 12.0, 20.0, 25.0, 14.0, 13.0, 8.0, 5.0, 6.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.58970642089844, -40.332950592041016, -39.076194763183594, -37.81943893432617, -36.56268310546875, -35.30592727661133, -34.049171447753906, -32.792415618896484, -31.535659790039062, -30.27890396118164, -29.02214813232422, -27.765392303466797, -26.508636474609375, -25.251880645751953, -23.99512481689453, -22.73836898803711, -21.481611251831055, -20.224855422973633, -18.96809959411621, -17.71134376525879, -16.454587936401367, -15.197832107543945, -13.941075325012207, -12.684319496154785, -11.427563667297363, -10.170807838439941, -8.91405200958252, -7.6572957038879395, -6.400539875030518, -5.143784046173096, -3.8870277404785156, -2.6302719116210938, -1.3735160827636719, -0.11676013469696045, 1.139995813369751, 2.396751880645752, 3.653507709503174, 4.910263538360596, 6.167019844055176, 7.423775672912598, 8.68053150177002, 9.937287330627441, 11.194043159484863, 12.450799942016602, 13.707555770874023, 14.964311599731445, 16.221067428588867, 17.47782325744629, 18.73457908630371, 19.991334915161133, 21.248090744018555, 22.504846572875977, 23.7616024017334, 25.01835823059082, 26.275115966796875, 27.531871795654297, 28.78862762451172, 30.04538345336914, 31.302139282226562, 32.558895111083984, 33.815650939941406, 35.07240676879883, 36.32916259765625, 37.58591842651367, 38.842674255371094]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 16.0, 21.0, 41.0, 40.0, 83.0, 118.0, 208.0, 365.0, 555.0, 845.0, 1351.0, 2216.0, 3385.0, 5149.0, 8024.0, 12072.0, 17691.0, 26098.0, 36285.0, 48779.0, 63932.0, 78808.0, 92226.0, 104872.0, 122125.0, 95017.0, 81935.0, 67546.0, 52848.0, 39303.0, 28409.0, 19720.0, 13437.0, 8768.0, 5945.0, 3736.0, 2412.0, 1540.0, 1004.0, 633.0, 388.0, 222.0, 131.0, 117.0, 45.0, 31.0, 35.0, 13.0, 9.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-128.75, -124.4765625, -120.203125, -115.9296875, -111.65625, -107.3828125, -103.109375, -98.8359375, -94.5625, -90.2890625, -86.015625, -81.7421875, -77.46875, -73.1953125, -68.921875, -64.6484375, -60.375, -56.1015625, -51.828125, -47.5546875, -43.28125, -39.0078125, -34.734375, -30.4609375, -26.1875, -21.9140625, -17.640625, -13.3671875, -9.09375, -4.8203125, -0.546875, 3.7265625, 8.0, 12.2734375, 16.546875, 20.8203125, 25.09375, 29.3671875, 33.640625, 37.9140625, 42.1875, 46.4609375, 50.734375, 55.0078125, 59.28125, 63.5546875, 67.828125, 72.1015625, 76.375, 80.6484375, 84.921875, 89.1953125, 93.46875, 97.7421875, 102.015625, 106.2890625, 110.5625, 114.8359375, 119.109375, 123.3828125, 127.65625, 131.9296875, 136.203125, 140.4765625, 144.75]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 7.0, 11.0, 10.0, 11.0, 16.0, 12.0, 25.0, 17.0, 15.0, 18.0, 29.0, 31.0, 33.0, 30.0, 30.0, 44.0, 36.0, 46.0, 47.0, 66.0, 30.0, 35.0, 43.0, 37.0, 19.0, 33.0, 34.0, 32.0, 21.0, 30.0, 19.0, 22.0, 24.0, 15.0, 15.0, 9.0, 11.0, 5.0, 1.0, 2.0, 5.0, 6.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-60.375, -58.544921875, -56.71484375, -54.884765625, -53.0546875, -51.224609375, -49.39453125, -47.564453125, -45.734375, -43.904296875, -42.07421875, -40.244140625, -38.4140625, -36.583984375, -34.75390625, -32.923828125, -31.09375, -29.263671875, -27.43359375, -25.603515625, -23.7734375, -21.943359375, -20.11328125, -18.283203125, -16.453125, -14.623046875, -12.79296875, -10.962890625, -9.1328125, -7.302734375, -5.47265625, -3.642578125, -1.8125, 0.017578125, 1.84765625, 3.677734375, 5.5078125, 7.337890625, 9.16796875, 10.998046875, 12.828125, 14.658203125, 16.48828125, 18.318359375, 20.1484375, 21.978515625, 23.80859375, 25.638671875, 27.46875, 29.298828125, 31.12890625, 32.958984375, 34.7890625, 36.619140625, 38.44921875, 40.279296875, 42.109375, 43.939453125, 45.76953125, 47.599609375, 49.4296875, 51.259765625, 53.08984375, 54.919921875, 56.75]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 5.0, 7.0, 13.0, 10.0, 18.0, 22.0, 25.0, 13.0, 20.0, 29.0, 34.0, 32.0, 53.0, 36.0, 41.0, 38.0, 39.0, 40.0, 36.0, 43.0, 43.0, 32.0, 37.0, 32.0, 34.0, 26.0, 35.0, 28.0, 16.0, 23.0, 29.0, 22.0, 16.0, 14.0, 12.0, 4.0, 10.0, 10.0, 4.0, 4.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.2568359375, -35.010318756103516, -33.76380157470703, -32.51728057861328, -31.270763397216797, -30.024246215820312, -28.777729034423828, -27.531211853027344, -26.284692764282227, -25.038175582885742, -23.791656494140625, -22.54513931274414, -21.298622131347656, -20.05210304260254, -18.805585861206055, -17.559066772460938, -16.312549591064453, -15.066031455993652, -13.819513320922852, -12.572996139526367, -11.326478004455566, -10.079959869384766, -8.833442687988281, -7.5869245529174805, -6.34040641784668, -5.093888282775879, -3.8473706245422363, -2.6008527278900146, -1.354334831237793, -0.10781669616699219, 1.1387009620666504, 2.385218620300293, 3.6317405700683594, 4.87825870513916, 6.124776363372803, 7.371294021606445, 8.617812156677246, 9.864330291748047, 11.110847473144531, 12.357365608215332, 13.603883743286133, 14.850401878356934, 16.096920013427734, 17.34343719482422, 18.589954376220703, 19.83647346496582, 21.082990646362305, 22.329509735107422, 23.576026916503906, 24.82254409790039, 26.069063186645508, 27.315580368041992, 28.56209945678711, 29.808616638183594, 31.055133819580078, 32.30165100097656, 33.54817199707031, 34.7946891784668, 36.04120635986328, 37.28772735595703, 38.534244537353516, 39.78076171875, 41.027278900146484, 42.27379608154297, 43.52031326293945]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 10.0, 3.0, 7.0, 17.0, 15.0, 13.0, 19.0, 15.0, 16.0, 23.0, 28.0, 35.0, 33.0, 44.0, 40.0, 36.0, 50.0, 42.0, 42.0, 45.0, 44.0, 54.0, 47.0, 37.0, 34.0, 34.0, 35.0, 17.0, 28.0, 26.0, 18.0, 15.0, 15.0, 16.0, 10.0, 4.0, 10.0, 8.0, 5.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.45900344848633, -47.047386169433594, -45.63576889038086, -44.224151611328125, -42.812538146972656, -41.40092086791992, -39.98930358886719, -38.57768630981445, -37.16606903076172, -35.754451751708984, -34.34283447265625, -32.931217193603516, -31.519601821899414, -30.10798454284668, -28.696369171142578, -27.284751892089844, -25.87313461303711, -24.461517333984375, -23.04990005493164, -21.63828468322754, -20.226667404174805, -18.81505012512207, -17.40343475341797, -15.991817474365234, -14.5802001953125, -13.168582916259766, -11.756966590881348, -10.34535026550293, -8.933732986450195, -7.522116184234619, -6.110499382019043, -4.698883056640625, -3.2872695922851562, -1.87565279006958, -0.4640359878540039, 0.9475808143615723, 2.3591976165771484, 3.7708144187927246, 5.182431221008301, 6.594047546386719, 8.005664825439453, 9.417282104492188, 10.828898429870605, 12.240514755249023, 13.652132034301758, 15.063749313354492, 16.475364685058594, 17.886981964111328, 19.298599243164062, 20.710216522216797, 22.12183380126953, 23.533449172973633, 24.945066452026367, 26.3566837310791, 27.768299102783203, 29.179916381835938, 30.591533660888672, 32.003150939941406, 33.41476821899414, 34.826385498046875, 36.237998962402344, 37.64961624145508, 39.06123352050781, 40.47285079956055, 41.88446807861328]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 9.0, 6.0, 12.0, 17.0, 31.0, 63.0, 99.0, 139.0, 201.0, 332.0, 502.0, 824.0, 1190.0, 1895.0, 2922.0, 4621.0, 7246.0, 11634.0, 18119.0, 28335.0, 44816.0, 70871.0, 111981.0, 176124.0, 276669.0, 426654.0, 627248.0, 729612.0, 580540.0, 387644.0, 250077.0, 159445.0, 101226.0, 63926.0, 40044.0, 25419.0, 16209.0, 10215.0, 6529.0, 4060.0, 2491.0, 1630.0, 1000.0, 646.0, 386.0, 251.0, 150.0, 84.0, 74.0, 30.0, 26.0, 12.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.78125, -58.8447265625, -56.908203125, -54.9716796875, -53.03515625, -51.0986328125, -49.162109375, -47.2255859375, -45.2890625, -43.3525390625, -41.416015625, -39.4794921875, -37.54296875, -35.6064453125, -33.669921875, -31.7333984375, -29.796875, -27.8603515625, -25.923828125, -23.9873046875, -22.05078125, -20.1142578125, -18.177734375, -16.2412109375, -14.3046875, -12.3681640625, -10.431640625, -8.4951171875, -6.55859375, -4.6220703125, -2.685546875, -0.7490234375, 1.1875, 3.1240234375, 5.060546875, 6.9970703125, 8.93359375, 10.8701171875, 12.806640625, 14.7431640625, 16.6796875, 18.6162109375, 20.552734375, 22.4892578125, 24.42578125, 26.3623046875, 28.298828125, 30.2353515625, 32.171875, 34.1083984375, 36.044921875, 37.9814453125, 39.91796875, 41.8544921875, 43.791015625, 45.7275390625, 47.6640625, 49.6005859375, 51.537109375, 53.4736328125, 55.41015625, 57.3466796875, 59.283203125, 61.2197265625, 63.15625]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 9.0, 11.0, 11.0, 9.0, 12.0, 16.0, 23.0, 13.0, 14.0, 28.0, 34.0, 37.0, 38.0, 37.0, 33.0, 38.0, 26.0, 48.0, 37.0, 45.0, 31.0, 36.0, 43.0, 38.0, 32.0, 32.0, 31.0, 31.0, 25.0, 20.0, 24.0, 20.0, 16.0, 20.0, 14.0, 5.0, 6.0, 6.0, 10.0, 5.0, 10.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-36.875, -35.76171875, -34.6484375, -33.53515625, -32.421875, -31.30859375, -30.1953125, -29.08203125, -27.96875, -26.85546875, -25.7421875, -24.62890625, -23.515625, -22.40234375, -21.2890625, -20.17578125, -19.0625, -17.94921875, -16.8359375, -15.72265625, -14.609375, -13.49609375, -12.3828125, -11.26953125, -10.15625, -9.04296875, -7.9296875, -6.81640625, -5.703125, -4.58984375, -3.4765625, -2.36328125, -1.25, -0.13671875, 0.9765625, 2.08984375, 3.203125, 4.31640625, 5.4296875, 6.54296875, 7.65625, 8.76953125, 9.8828125, 10.99609375, 12.109375, 13.22265625, 14.3359375, 15.44921875, 16.5625, 17.67578125, 18.7890625, 19.90234375, 21.015625, 22.12890625, 23.2421875, 24.35546875, 25.46875, 26.58203125, 27.6953125, 28.80859375, 29.921875, 31.03515625, 32.1484375, 33.26171875, 34.375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 15.0, 31.0, 49.0, 91.0, 131.0, 203.0, 330.0, 519.0, 830.0, 1367.0, 2374.0, 3840.0, 6691.0, 11177.0, 19026.0, 32785.0, 55054.0, 93905.0, 157167.0, 254428.0, 397502.0, 574862.0, 707779.0, 640556.0, 462624.0, 303612.0, 188856.0, 113366.0, 67773.0, 39720.0, 23529.0, 13839.0, 8196.0, 4781.0, 2881.0, 1729.0, 1047.0, 607.0, 397.0, 229.0, 138.0, 107.0, 51.0, 22.0, 26.0, 14.0, 10.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-51.59375, -50.1064453125, -48.619140625, -47.1318359375, -45.64453125, -44.1572265625, -42.669921875, -41.1826171875, -39.6953125, -38.2080078125, -36.720703125, -35.2333984375, -33.74609375, -32.2587890625, -30.771484375, -29.2841796875, -27.796875, -26.3095703125, -24.822265625, -23.3349609375, -21.84765625, -20.3603515625, -18.873046875, -17.3857421875, -15.8984375, -14.4111328125, -12.923828125, -11.4365234375, -9.94921875, -8.4619140625, -6.974609375, -5.4873046875, -4.0, -2.5126953125, -1.025390625, 0.4619140625, 1.94921875, 3.4365234375, 4.923828125, 6.4111328125, 7.8984375, 9.3857421875, 10.873046875, 12.3603515625, 13.84765625, 15.3349609375, 16.822265625, 18.3095703125, 19.796875, 21.2841796875, 22.771484375, 24.2587890625, 25.74609375, 27.2333984375, 28.720703125, 30.2080078125, 31.6953125, 33.1826171875, 34.669921875, 36.1572265625, 37.64453125, 39.1318359375, 40.619140625, 42.1064453125, 43.59375]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 2.0, 6.0, 4.0, 11.0, 17.0, 14.0, 8.0, 28.0, 19.0, 33.0, 53.0, 50.0, 66.0, 85.0, 96.0, 138.0, 152.0, 175.0, 193.0, 195.0, 231.0, 238.0, 256.0, 233.0, 244.0, 217.0, 190.0, 205.0, 187.0, 121.0, 136.0, 102.0, 71.0, 72.0, 68.0, 37.0, 34.0, 23.0, 18.0, 13.0, 10.0, 7.0, 3.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.203125, -19.58544921875, -18.9677734375, -18.35009765625, -17.732421875, -17.11474609375, -16.4970703125, -15.87939453125, -15.26171875, -14.64404296875, -14.0263671875, -13.40869140625, -12.791015625, -12.17333984375, -11.5556640625, -10.93798828125, -10.3203125, -9.70263671875, -9.0849609375, -8.46728515625, -7.849609375, -7.23193359375, -6.6142578125, -5.99658203125, -5.37890625, -4.76123046875, -4.1435546875, -3.52587890625, -2.908203125, -2.29052734375, -1.6728515625, -1.05517578125, -0.4375, 0.18017578125, 0.7978515625, 1.41552734375, 2.033203125, 2.65087890625, 3.2685546875, 3.88623046875, 4.50390625, 5.12158203125, 5.7392578125, 6.35693359375, 6.974609375, 7.59228515625, 8.2099609375, 8.82763671875, 9.4453125, 10.06298828125, 10.6806640625, 11.29833984375, 11.916015625, 12.53369140625, 13.1513671875, 13.76904296875, 14.38671875, 15.00439453125, 15.6220703125, 16.23974609375, 16.857421875, 17.47509765625, 18.0927734375, 18.71044921875, 19.328125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 11.0, 12.0, 9.0, 8.0, 18.0, 21.0, 19.0, 19.0, 33.0, 29.0, 27.0, 31.0, 40.0, 41.0, 41.0, 43.0, 50.0, 42.0, 43.0, 46.0, 42.0, 46.0, 45.0, 40.0, 34.0, 34.0, 22.0, 30.0, 18.0, 12.0, 19.0, 10.0, 7.0, 8.0, 11.0, 8.0, 2.0, 9.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-44.83341598510742, -43.50592803955078, -42.17844009399414, -40.8509521484375, -39.52346420288086, -38.19597625732422, -36.86848831176758, -35.54100036621094, -34.2135124206543, -32.886024475097656, -31.558536529541016, -30.231048583984375, -28.903560638427734, -27.576072692871094, -26.248584747314453, -24.921096801757812, -23.593608856201172, -22.26612091064453, -20.93863296508789, -19.61114501953125, -18.28365707397461, -16.95616912841797, -15.628681182861328, -14.301193237304688, -12.973705291748047, -11.646217346191406, -10.318729400634766, -8.991241455078125, -7.663753509521484, -6.336265563964844, -5.008777618408203, -3.6812896728515625, -2.3537979125976562, -1.0263099670410156, 0.301177978515625, 1.6286659240722656, 2.9561538696289062, 4.283641815185547, 5.6111297607421875, 6.938617706298828, 8.266105651855469, 9.59359359741211, 10.92108154296875, 12.24856948852539, 13.576057434082031, 14.903545379638672, 16.231033325195312, 17.558521270751953, 18.886009216308594, 20.213497161865234, 21.540985107421875, 22.868473052978516, 24.195960998535156, 25.523448944091797, 26.850936889648438, 28.178424835205078, 29.50591278076172, 30.83340072631836, 32.160888671875, 33.48837661743164, 34.81586456298828, 36.14335250854492, 37.47084045410156, 38.7983283996582, 40.125816345214844]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 12.0, 10.0, 19.0, 19.0, 13.0, 19.0, 14.0, 26.0, 18.0, 20.0, 30.0, 29.0, 31.0, 34.0, 34.0, 34.0, 32.0, 46.0, 42.0, 41.0, 40.0, 34.0, 35.0, 30.0, 38.0, 36.0, 26.0, 24.0, 19.0, 27.0, 28.0, 14.0, 21.0, 15.0, 9.0, 8.0, 11.0, 5.0, 8.0, 5.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.27363586425781, -37.102352142333984, -35.931068420410156, -34.759788513183594, -33.588504791259766, -32.41722106933594, -31.24593734741211, -30.07465362548828, -28.903371810913086, -27.732088088989258, -26.560806274414062, -25.389522552490234, -24.218238830566406, -23.04695701599121, -21.875673294067383, -20.704391479492188, -19.53310775756836, -18.36182403564453, -17.190542221069336, -16.019258499145508, -14.847975730895996, -13.676692962646484, -12.505409240722656, -11.334126472473145, -10.162843704223633, -8.991560935974121, -7.820277690887451, -6.648994445800781, -5.4777116775512695, -4.306428909301758, -3.135145664215088, -1.963862419128418, -0.7925758361816406, 0.3787071704864502, 1.549990177154541, 2.721273183822632, 3.8925561904907227, 5.063838958740234, 6.235122203826904, 7.406405448913574, 8.577688217163086, 9.748970985412598, 10.92025375366211, 12.091537475585938, 13.26282024383545, 14.434103012084961, 15.605386734008789, 16.776668548583984, 17.947952270507812, 19.11923599243164, 20.290517807006836, 21.461801528930664, 22.63308334350586, 23.804367065429688, 24.975650787353516, 26.146934509277344, 27.31821632385254, 28.489500045776367, 29.660781860351562, 30.83206558227539, 32.00334930419922, 33.17462921142578, 34.34591293334961, 35.51719665527344, 36.688480377197266]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 17.0, 21.0, 32.0, 69.0, 89.0, 179.0, 274.0, 423.0, 722.0, 1193.0, 1916.0, 2947.0, 5045.0, 7977.0, 12205.0, 19200.0, 29194.0, 44095.0, 65501.0, 92051.0, 121551.0, 141160.0, 136795.0, 112581.0, 83028.0, 58782.0, 39442.0, 26163.0, 17052.0, 10782.0, 6673.0, 4320.0, 2684.0, 1765.0, 1055.0, 633.0, 377.0, 224.0, 130.0, 80.0, 53.0, 32.0, 20.0, 13.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.328125, -23.587646484375, -22.84716796875, -22.106689453125, -21.3662109375, -20.625732421875, -19.88525390625, -19.144775390625, -18.404296875, -17.663818359375, -16.92333984375, -16.182861328125, -15.4423828125, -14.701904296875, -13.96142578125, -13.220947265625, -12.48046875, -11.739990234375, -10.99951171875, -10.259033203125, -9.5185546875, -8.778076171875, -8.03759765625, -7.297119140625, -6.556640625, -5.816162109375, -5.07568359375, -4.335205078125, -3.5947265625, -2.854248046875, -2.11376953125, -1.373291015625, -0.6328125, 0.107666015625, 0.84814453125, 1.588623046875, 2.3291015625, 3.069580078125, 3.81005859375, 4.550537109375, 5.291015625, 6.031494140625, 6.77197265625, 7.512451171875, 8.2529296875, 8.993408203125, 9.73388671875, 10.474365234375, 11.21484375, 11.955322265625, 12.69580078125, 13.436279296875, 14.1767578125, 14.917236328125, 15.65771484375, 16.398193359375, 17.138671875, 17.879150390625, 18.61962890625, 19.360107421875, 20.1005859375, 20.841064453125, 21.58154296875, 22.322021484375, 23.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 9.0, 14.0, 22.0, 22.0, 16.0, 21.0, 21.0, 19.0, 24.0, 34.0, 27.0, 26.0, 38.0, 31.0, 39.0, 34.0, 40.0, 46.0, 30.0, 40.0, 40.0, 39.0, 35.0, 32.0, 32.0, 31.0, 22.0, 23.0, 31.0, 16.0, 19.0, 15.0, 15.0, 9.0, 13.0, 11.0, 5.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-35.34375, -34.2568359375, -33.169921875, -32.0830078125, -30.99609375, -29.9091796875, -28.822265625, -27.7353515625, -26.6484375, -25.5615234375, -24.474609375, -23.3876953125, -22.30078125, -21.2138671875, -20.126953125, -19.0400390625, -17.953125, -16.8662109375, -15.779296875, -14.6923828125, -13.60546875, -12.5185546875, -11.431640625, -10.3447265625, -9.2578125, -8.1708984375, -7.083984375, -5.9970703125, -4.91015625, -3.8232421875, -2.736328125, -1.6494140625, -0.5625, 0.5244140625, 1.611328125, 2.6982421875, 3.78515625, 4.8720703125, 5.958984375, 7.0458984375, 8.1328125, 9.2197265625, 10.306640625, 11.3935546875, 12.48046875, 13.5673828125, 14.654296875, 15.7412109375, 16.828125, 17.9150390625, 19.001953125, 20.0888671875, 21.17578125, 22.2626953125, 23.349609375, 24.4365234375, 25.5234375, 26.6103515625, 27.697265625, 28.7841796875, 29.87109375, 30.9580078125, 32.044921875, 33.1318359375, 34.21875]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 4.0, 9.0, 22.0, 31.0, 27.0, 52.0, 54.0, 84.0, 113.0, 168.0, 282.0, 374.0, 536.0, 761.0, 1196.0, 1772.0, 2793.0, 4246.0, 7030.0, 11909.0, 22305.0, 88388.0, 822736.0, 39757.0, 17461.0, 9742.0, 5813.0, 3798.0, 2248.0, 1546.0, 1037.0, 729.0, 425.0, 306.0, 231.0, 177.0, 107.0, 72.0, 60.0, 42.0, 32.0, 22.0, 22.0, 11.0, 6.0, 6.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-57.90625, -56.16796875, -54.4296875, -52.69140625, -50.953125, -49.21484375, -47.4765625, -45.73828125, -44.0, -42.26171875, -40.5234375, -38.78515625, -37.046875, -35.30859375, -33.5703125, -31.83203125, -30.09375, -28.35546875, -26.6171875, -24.87890625, -23.140625, -21.40234375, -19.6640625, -17.92578125, -16.1875, -14.44921875, -12.7109375, -10.97265625, -9.234375, -7.49609375, -5.7578125, -4.01953125, -2.28125, -0.54296875, 1.1953125, 2.93359375, 4.671875, 6.41015625, 8.1484375, 9.88671875, 11.625, 13.36328125, 15.1015625, 16.83984375, 18.578125, 20.31640625, 22.0546875, 23.79296875, 25.53125, 27.26953125, 29.0078125, 30.74609375, 32.484375, 34.22265625, 35.9609375, 37.69921875, 39.4375, 41.17578125, 42.9140625, 44.65234375, 46.390625, 48.12890625, 49.8671875, 51.60546875, 53.34375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 2.0, 11.0, 11.0, 15.0, 14.0, 23.0, 30.0, 39.0, 19.0, 41.0, 46.0, 43.0, 62.0, 59.0, 54.0, 58.0, 66.0, 57.0, 50.0, 50.0, 51.0, 32.0, 32.0, 31.0, 35.0, 11.0, 12.0, 11.0, 11.0, 6.0, 9.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-55.09375, -53.49755859375, -51.9013671875, -50.30517578125, -48.708984375, -47.11279296875, -45.5166015625, -43.92041015625, -42.32421875, -40.72802734375, -39.1318359375, -37.53564453125, -35.939453125, -34.34326171875, -32.7470703125, -31.15087890625, -29.5546875, -27.95849609375, -26.3623046875, -24.76611328125, -23.169921875, -21.57373046875, -19.9775390625, -18.38134765625, -16.78515625, -15.18896484375, -13.5927734375, -11.99658203125, -10.400390625, -8.80419921875, -7.2080078125, -5.61181640625, -4.015625, -2.41943359375, -0.8232421875, 0.77294921875, 2.369140625, 3.96533203125, 5.5615234375, 7.15771484375, 8.75390625, 10.35009765625, 11.9462890625, 13.54248046875, 15.138671875, 16.73486328125, 18.3310546875, 19.92724609375, 21.5234375, 23.11962890625, 24.7158203125, 26.31201171875, 27.908203125, 29.50439453125, 31.1005859375, 32.69677734375, 34.29296875, 35.88916015625, 37.4853515625, 39.08154296875, 40.677734375, 42.27392578125, 43.8701171875, 45.46630859375, 47.0625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 7.0, 8.0, 12.0, 18.0, 10.0, 21.0, 19.0, 18.0, 30.0, 19.0, 51.0, 53.0, 64.0, 113.0, 172.0, 214.0, 368.0, 570.0, 1190.0, 2655.0, 7820.0, 40832.0, 944400.0, 37082.0, 7448.0, 2493.0, 1105.0, 632.0, 325.0, 218.0, 140.0, 105.0, 78.0, 59.0, 52.0, 36.0, 24.0, 13.0, 10.0, 12.0, 12.0, 13.0, 8.0, 13.0, 5.0, 1.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.625, -38.3662109375, -37.107421875, -35.8486328125, -34.58984375, -33.3310546875, -32.072265625, -30.8134765625, -29.5546875, -28.2958984375, -27.037109375, -25.7783203125, -24.51953125, -23.2607421875, -22.001953125, -20.7431640625, -19.484375, -18.2255859375, -16.966796875, -15.7080078125, -14.44921875, -13.1904296875, -11.931640625, -10.6728515625, -9.4140625, -8.1552734375, -6.896484375, -5.6376953125, -4.37890625, -3.1201171875, -1.861328125, -0.6025390625, 0.65625, 1.9150390625, 3.173828125, 4.4326171875, 5.69140625, 6.9501953125, 8.208984375, 9.4677734375, 10.7265625, 11.9853515625, 13.244140625, 14.5029296875, 15.76171875, 17.0205078125, 18.279296875, 19.5380859375, 20.796875, 22.0556640625, 23.314453125, 24.5732421875, 25.83203125, 27.0908203125, 28.349609375, 29.6083984375, 30.8671875, 32.1259765625, 33.384765625, 34.6435546875, 35.90234375, 37.1611328125, 38.419921875, 39.6787109375, 40.9375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 11.0, 16.0, 20.0, 43.0, 119.0, 327.0, 275.0, 100.0, 31.0, 20.0, 10.0, 5.0, 11.0, 4.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007183074951171875, -0.0068686604499816895, -0.006554245948791504, -0.006239831447601318, -0.005925416946411133, -0.005611002445220947, -0.005296587944030762, -0.004982173442840576, -0.004667758941650391, -0.004353344440460205, -0.0040389299392700195, -0.003724515438079834, -0.0034101009368896484, -0.003095686435699463, -0.0027812719345092773, -0.002466857433319092, -0.0021524429321289062, -0.0018380284309387207, -0.0015236139297485352, -0.0012091994285583496, -0.0008947849273681641, -0.0005803704261779785, -0.00026595592498779297, 4.845857620239258e-05, 0.0003628730773925781, 0.0006772875785827637, 0.0009917020797729492, 0.0013061165809631348, 0.0016205310821533203, 0.0019349455833435059, 0.0022493600845336914, 0.002563774585723877, 0.0028781890869140625, 0.003192603588104248, 0.0035070180892944336, 0.003821432590484619, 0.004135847091674805, 0.00445026159286499, 0.004764676094055176, 0.005079090595245361, 0.005393505096435547, 0.005707919597625732, 0.006022334098815918, 0.0063367486000061035, 0.006651163101196289, 0.006965577602386475, 0.00727999210357666, 0.007594406604766846, 0.007908821105957031, 0.008223235607147217, 0.008537650108337402, 0.008852064609527588, 0.009166479110717773, 0.009480893611907959, 0.009795308113098145, 0.01010972261428833, 0.010424137115478516, 0.010738551616668701, 0.011052966117858887, 0.011367380619049072, 0.011681795120239258, 0.011996209621429443, 0.012310624122619629, 0.012625038623809814, 0.012939453125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 10.0, 9.0, 15.0, 13.0, 19.0, 23.0, 24.0, 33.0, 46.0, 85.0, 102.0, 144.0, 218.0, 267.0, 380.0, 545.0, 768.0, 1202.0, 2012.0, 3354.0, 6591.0, 14075.0, 33585.0, 84819.0, 199560.0, 323179.0, 216071.0, 92692.0, 36589.0, 15223.0, 7165.0, 3603.0, 2067.0, 1262.0, 821.0, 550.0, 402.0, 270.0, 193.0, 152.0, 113.0, 63.0, 58.0, 59.0, 37.0, 24.0, 18.0, 9.0, 10.0, 13.0, 2.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0], "bins": [-11.1015625, -10.760498046875, -10.41943359375, -10.078369140625, -9.7373046875, -9.396240234375, -9.05517578125, -8.714111328125, -8.373046875, -8.031982421875, -7.69091796875, -7.349853515625, -7.0087890625, -6.667724609375, -6.32666015625, -5.985595703125, -5.64453125, -5.303466796875, -4.96240234375, -4.621337890625, -4.2802734375, -3.939208984375, -3.59814453125, -3.257080078125, -2.916015625, -2.574951171875, -2.23388671875, -1.892822265625, -1.5517578125, -1.210693359375, -0.86962890625, -0.528564453125, -0.1875, 0.153564453125, 0.49462890625, 0.835693359375, 1.1767578125, 1.517822265625, 1.85888671875, 2.199951171875, 2.541015625, 2.882080078125, 3.22314453125, 3.564208984375, 3.9052734375, 4.246337890625, 4.58740234375, 4.928466796875, 5.26953125, 5.610595703125, 5.95166015625, 6.292724609375, 6.6337890625, 6.974853515625, 7.31591796875, 7.656982421875, 7.998046875, 8.339111328125, 8.68017578125, 9.021240234375, 9.3623046875, 9.703369140625, 10.04443359375, 10.385498046875, 10.7265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 11.0, 9.0, 17.0, 27.0, 42.0, 34.0, 37.0, 46.0, 60.0, 54.0, 73.0, 83.0, 74.0, 83.0, 58.0, 48.0, 51.0, 51.0, 30.0, 22.0, 18.0, 13.0, 6.0, 6.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.40234375, -3.3011474609375, -3.199951171875, -3.0987548828125, -2.99755859375, -2.8963623046875, -2.795166015625, -2.6939697265625, -2.5927734375, -2.4915771484375, -2.390380859375, -2.2891845703125, -2.18798828125, -2.0867919921875, -1.985595703125, -1.8843994140625, -1.783203125, -1.6820068359375, -1.580810546875, -1.4796142578125, -1.37841796875, -1.2772216796875, -1.176025390625, -1.0748291015625, -0.9736328125, -0.8724365234375, -0.771240234375, -0.6700439453125, -0.56884765625, -0.4676513671875, -0.366455078125, -0.2652587890625, -0.1640625, -0.0628662109375, 0.038330078125, 0.1395263671875, 0.24072265625, 0.3419189453125, 0.443115234375, 0.5443115234375, 0.6455078125, 0.7467041015625, 0.847900390625, 0.9490966796875, 1.05029296875, 1.1514892578125, 1.252685546875, 1.3538818359375, 1.455078125, 1.5562744140625, 1.657470703125, 1.7586669921875, 1.85986328125, 1.9610595703125, 2.062255859375, 2.1634521484375, 2.2646484375, 2.3658447265625, 2.467041015625, 2.5682373046875, 2.66943359375, 2.7706298828125, 2.871826171875, 2.9730224609375, 3.07421875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 8.0, 4.0, 10.0, 11.0, 15.0, 15.0, 15.0, 27.0, 19.0, 25.0, 28.0, 29.0, 37.0, 38.0, 28.0, 38.0, 41.0, 47.0, 41.0, 61.0, 56.0, 35.0, 47.0, 40.0, 32.0, 38.0, 41.0, 27.0, 24.0, 18.0, 19.0, 14.0, 12.0, 6.0, 14.0, 7.0, 12.0, 3.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.39250946044922, -39.21043014526367, -38.02834701538086, -36.84626770019531, -35.664188385009766, -34.48210906982422, -33.300025939941406, -32.11794662475586, -30.935867309570312, -29.753786087036133, -28.571706771850586, -27.389625549316406, -26.20754623413086, -25.02546501159668, -23.8433837890625, -22.661304473876953, -21.479223251342773, -20.297142028808594, -19.115062713623047, -17.932981491088867, -16.75090217590332, -15.56882095336914, -14.386740684509277, -13.204660415649414, -12.02258014678955, -10.840499877929688, -9.658419609069824, -8.476339340209961, -7.2942585945129395, -6.112178325653076, -4.930097579956055, -3.7480173110961914, -2.565937042236328, -1.3838566541671753, -0.20177626609802246, 0.9803042411804199, 2.162384510040283, 3.3444647789001465, 4.526545524597168, 5.708625793457031, 6.8907060623168945, 8.072786331176758, 9.254866600036621, 10.436946868896484, 11.619028091430664, 12.801107406616211, 13.98318862915039, 15.165268898010254, 16.347349166870117, 17.529430389404297, 18.711509704589844, 19.893590927124023, 21.07567024230957, 22.25775146484375, 23.439830780029297, 24.621912002563477, 25.803993225097656, 26.986074447631836, 28.168153762817383, 29.350234985351562, 30.53231430053711, 31.71439552307129, 32.89647674560547, 34.078556060791016, 35.26063537597656]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 13.0, 5.0, 14.0, 18.0, 18.0, 22.0, 11.0, 22.0, 23.0, 20.0, 34.0, 27.0, 38.0, 29.0, 45.0, 25.0, 47.0, 37.0, 47.0, 51.0, 35.0, 38.0, 39.0, 34.0, 37.0, 33.0, 25.0, 22.0, 32.0, 22.0, 26.0, 13.0, 16.0, 7.0, 10.0, 10.0, 8.0, 8.0, 7.0, 5.0, 2.0, 1.0, 8.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-38.83957290649414, -37.71359634399414, -36.58761978149414, -35.46164321899414, -34.33566665649414, -33.209693908691406, -32.083717346191406, -30.957738876342773, -29.831764221191406, -28.705787658691406, -27.579811096191406, -26.453834533691406, -25.32785987854004, -24.20188331604004, -23.07590675354004, -21.94993019104004, -20.82395362854004, -19.69797706604004, -18.57200050354004, -17.446025848388672, -16.320049285888672, -15.194072723388672, -14.068096160888672, -12.942119598388672, -11.816143989562988, -10.690167427062988, -9.564191818237305, -8.438215255737305, -7.312239170074463, -6.186263084411621, -5.060286521911621, -3.9343104362487793, -2.8083343505859375, -1.6823581457138062, -0.5563819408416748, 0.5695943832397461, 1.695570468902588, 2.8215465545654297, 3.9475231170654297, 5.0734992027282715, 6.199475288391113, 7.325451374053955, 8.451427459716797, 9.577404022216797, 10.703380584716797, 11.82935619354248, 12.95533275604248, 14.081308364868164, 15.207284927368164, 16.333261489868164, 17.459238052368164, 18.58521270751953, 19.71118927001953, 20.83716583251953, 21.96314239501953, 23.08911895751953, 24.21509552001953, 25.34107208251953, 26.46704864501953, 27.59302520751953, 28.7189998626709, 29.8449764251709, 30.9709529876709, 32.096927642822266, 33.222904205322266]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 13.0, 26.0, 38.0, 58.0, 103.0, 134.0, 221.0, 334.0, 547.0, 904.0, 1390.0, 2316.0, 3746.0, 6233.0, 10358.0, 17691.0, 28490.0, 46923.0, 74316.0, 109449.0, 143681.0, 158993.0, 143084.0, 108116.0, 73474.0, 46220.0, 28513.0, 17204.0, 10203.0, 6242.0, 3681.0, 2227.0, 1369.0, 821.0, 566.0, 309.0, 186.0, 131.0, 80.0, 67.0, 35.0, 18.0, 14.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-52.40625, -50.79296875, -49.1796875, -47.56640625, -45.953125, -44.33984375, -42.7265625, -41.11328125, -39.5, -37.88671875, -36.2734375, -34.66015625, -33.046875, -31.43359375, -29.8203125, -28.20703125, -26.59375, -24.98046875, -23.3671875, -21.75390625, -20.140625, -18.52734375, -16.9140625, -15.30078125, -13.6875, -12.07421875, -10.4609375, -8.84765625, -7.234375, -5.62109375, -4.0078125, -2.39453125, -0.78125, 0.83203125, 2.4453125, 4.05859375, 5.671875, 7.28515625, 8.8984375, 10.51171875, 12.125, 13.73828125, 15.3515625, 16.96484375, 18.578125, 20.19140625, 21.8046875, 23.41796875, 25.03125, 26.64453125, 28.2578125, 29.87109375, 31.484375, 33.09765625, 34.7109375, 36.32421875, 37.9375, 39.55078125, 41.1640625, 42.77734375, 44.390625, 46.00390625, 47.6171875, 49.23046875, 50.84375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 6.0, 8.0, 8.0, 9.0, 8.0, 18.0, 21.0, 16.0, 16.0, 18.0, 21.0, 29.0, 16.0, 29.0, 46.0, 44.0, 40.0, 36.0, 32.0, 42.0, 46.0, 51.0, 46.0, 35.0, 40.0, 41.0, 28.0, 34.0, 32.0, 26.0, 36.0, 19.0, 20.0, 18.0, 13.0, 10.0, 9.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-39.84375, -38.6884765625, -37.533203125, -36.3779296875, -35.22265625, -34.0673828125, -32.912109375, -31.7568359375, -30.6015625, -29.4462890625, -28.291015625, -27.1357421875, -25.98046875, -24.8251953125, -23.669921875, -22.5146484375, -21.359375, -20.2041015625, -19.048828125, -17.8935546875, -16.73828125, -15.5830078125, -14.427734375, -13.2724609375, -12.1171875, -10.9619140625, -9.806640625, -8.6513671875, -7.49609375, -6.3408203125, -5.185546875, -4.0302734375, -2.875, -1.7197265625, -0.564453125, 0.5908203125, 1.74609375, 2.9013671875, 4.056640625, 5.2119140625, 6.3671875, 7.5224609375, 8.677734375, 9.8330078125, 10.98828125, 12.1435546875, 13.298828125, 14.4541015625, 15.609375, 16.7646484375, 17.919921875, 19.0751953125, 20.23046875, 21.3857421875, 22.541015625, 23.6962890625, 24.8515625, 26.0068359375, 27.162109375, 28.3173828125, 29.47265625, 30.6279296875, 31.783203125, 32.9384765625, 34.09375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 9.0, 8.0, 24.0, 23.0, 42.0, 64.0, 103.0, 191.0, 266.0, 430.0, 616.0, 972.0, 1535.0, 2276.0, 3489.0, 5232.0, 7630.0, 11320.0, 17083.0, 24417.0, 35395.0, 48740.0, 65661.0, 83032.0, 100162.0, 109730.0, 109827.0, 101052.0, 85867.0, 67442.0, 50471.0, 36477.0, 25559.0, 17485.0, 11883.0, 8062.0, 5409.0, 3701.0, 2305.0, 1563.0, 1046.0, 692.0, 442.0, 287.0, 197.0, 121.0, 80.0, 51.0, 28.0, 25.0, 10.0, 10.0, 7.0, 6.0, 2.0, 1.0], "bins": [-39.625, -38.46142578125, -37.2978515625, -36.13427734375, -34.970703125, -33.80712890625, -32.6435546875, -31.47998046875, -30.31640625, -29.15283203125, -27.9892578125, -26.82568359375, -25.662109375, -24.49853515625, -23.3349609375, -22.17138671875, -21.0078125, -19.84423828125, -18.6806640625, -17.51708984375, -16.353515625, -15.18994140625, -14.0263671875, -12.86279296875, -11.69921875, -10.53564453125, -9.3720703125, -8.20849609375, -7.044921875, -5.88134765625, -4.7177734375, -3.55419921875, -2.390625, -1.22705078125, -0.0634765625, 1.10009765625, 2.263671875, 3.42724609375, 4.5908203125, 5.75439453125, 6.91796875, 8.08154296875, 9.2451171875, 10.40869140625, 11.572265625, 12.73583984375, 13.8994140625, 15.06298828125, 16.2265625, 17.39013671875, 18.5537109375, 19.71728515625, 20.880859375, 22.04443359375, 23.2080078125, 24.37158203125, 25.53515625, 26.69873046875, 27.8623046875, 29.02587890625, 30.189453125, 31.35302734375, 32.5166015625, 33.68017578125, 34.84375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 7.0, 10.0, 12.0, 14.0, 17.0, 17.0, 19.0, 16.0, 37.0, 31.0, 27.0, 28.0, 37.0, 35.0, 37.0, 35.0, 40.0, 37.0, 39.0, 52.0, 30.0, 42.0, 29.0, 41.0, 34.0, 34.0, 37.0, 18.0, 28.0, 25.0, 20.0, 15.0, 20.0, 11.0, 13.0, 8.0, 8.0, 8.0, 6.0, 3.0, 8.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-25.859375, -25.11376953125, -24.3681640625, -23.62255859375, -22.876953125, -22.13134765625, -21.3857421875, -20.64013671875, -19.89453125, -19.14892578125, -18.4033203125, -17.65771484375, -16.912109375, -16.16650390625, -15.4208984375, -14.67529296875, -13.9296875, -13.18408203125, -12.4384765625, -11.69287109375, -10.947265625, -10.20166015625, -9.4560546875, -8.71044921875, -7.96484375, -7.21923828125, -6.4736328125, -5.72802734375, -4.982421875, -4.23681640625, -3.4912109375, -2.74560546875, -2.0, -1.25439453125, -0.5087890625, 0.23681640625, 0.982421875, 1.72802734375, 2.4736328125, 3.21923828125, 3.96484375, 4.71044921875, 5.4560546875, 6.20166015625, 6.947265625, 7.69287109375, 8.4384765625, 9.18408203125, 9.9296875, 10.67529296875, 11.4208984375, 12.16650390625, 12.912109375, 13.65771484375, 14.4033203125, 15.14892578125, 15.89453125, 16.64013671875, 17.3857421875, 18.13134765625, 18.876953125, 19.62255859375, 20.3681640625, 21.11376953125, 21.859375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 9.0, 15.0, 30.0, 22.0, 65.0, 92.0, 110.0, 190.0, 266.0, 437.0, 779.0, 1202.0, 1946.0, 3357.0, 5651.0, 9665.0, 16654.0, 29130.0, 51202.0, 86339.0, 135675.0, 179255.0, 179173.0, 137241.0, 88032.0, 51805.0, 29079.0, 16991.0, 9621.0, 5857.0, 3384.0, 2009.0, 1291.0, 721.0, 464.0, 247.0, 206.0, 121.0, 74.0, 55.0, 30.0, 20.0, 16.0, 10.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.708251953125, -19.07275390625, -18.437255859375, -17.8017578125, -17.166259765625, -16.53076171875, -15.895263671875, -15.259765625, -14.624267578125, -13.98876953125, -13.353271484375, -12.7177734375, -12.082275390625, -11.44677734375, -10.811279296875, -10.17578125, -9.540283203125, -8.90478515625, -8.269287109375, -7.6337890625, -6.998291015625, -6.36279296875, -5.727294921875, -5.091796875, -4.456298828125, -3.82080078125, -3.185302734375, -2.5498046875, -1.914306640625, -1.27880859375, -0.643310546875, -0.0078125, 0.627685546875, 1.26318359375, 1.898681640625, 2.5341796875, 3.169677734375, 3.80517578125, 4.440673828125, 5.076171875, 5.711669921875, 6.34716796875, 6.982666015625, 7.6181640625, 8.253662109375, 8.88916015625, 9.524658203125, 10.16015625, 10.795654296875, 11.43115234375, 12.066650390625, 12.7021484375, 13.337646484375, 13.97314453125, 14.608642578125, 15.244140625, 15.879638671875, 16.51513671875, 17.150634765625, 17.7861328125, 18.421630859375, 19.05712890625, 19.692626953125, 20.328125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 12.0, 18.0, 27.0, 32.0, 49.0, 56.0, 99.0, 110.0, 127.0, 109.0, 100.0, 58.0, 65.0, 37.0, 29.0, 19.0, 14.0, 9.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002574920654296875, -0.0024664998054504395, -0.002358078956604004, -0.0022496581077575684, -0.002141237258911133, -0.0020328164100646973, -0.0019243955612182617, -0.0018159747123718262, -0.0017075538635253906, -0.001599133014678955, -0.0014907121658325195, -0.001382291316986084, -0.0012738704681396484, -0.0011654496192932129, -0.0010570287704467773, -0.0009486079216003418, -0.0008401870727539062, -0.0007317662239074707, -0.0006233453750610352, -0.0005149245262145996, -0.00040650367736816406, -0.0002980828285217285, -0.00018966197967529297, -8.124113082885742e-05, 2.7179718017578125e-05, 0.00013560056686401367, 0.00024402141571044922, 0.00035244226455688477, 0.0004608631134033203, 0.0005692839622497559, 0.0006777048110961914, 0.000786125659942627, 0.0008945465087890625, 0.001002967357635498, 0.0011113882064819336, 0.0012198090553283691, 0.0013282299041748047, 0.0014366507530212402, 0.0015450716018676758, 0.0016534924507141113, 0.0017619132995605469, 0.0018703341484069824, 0.001978754997253418, 0.0020871758460998535, 0.002195596694946289, 0.0023040175437927246, 0.00241243839263916, 0.0025208592414855957, 0.0026292800903320312, 0.002737700939178467, 0.0028461217880249023, 0.002954542636871338, 0.0030629634857177734, 0.003171384334564209, 0.0032798051834106445, 0.00338822603225708, 0.0034966468811035156, 0.003605067729949951, 0.0037134885787963867, 0.0038219094276428223, 0.003930330276489258, 0.004038751125335693, 0.004147171974182129, 0.0042555928230285645, 0.004364013671875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 12.0, 10.0, 9.0, 18.0, 16.0, 32.0, 54.0, 68.0, 102.0, 152.0, 241.0, 329.0, 565.0, 935.0, 1531.0, 2475.0, 4315.0, 7622.0, 13397.0, 23470.0, 40660.0, 69200.0, 109146.0, 153520.0, 176783.0, 157214.0, 113848.0, 72212.0, 42788.0, 24465.0, 14050.0, 7961.0, 4605.0, 2624.0, 1577.0, 914.0, 576.0, 339.0, 226.0, 148.0, 94.0, 78.0, 53.0, 38.0, 36.0, 19.0, 19.0, 7.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.71875, -16.17138671875, -15.6240234375, -15.07666015625, -14.529296875, -13.98193359375, -13.4345703125, -12.88720703125, -12.33984375, -11.79248046875, -11.2451171875, -10.69775390625, -10.150390625, -9.60302734375, -9.0556640625, -8.50830078125, -7.9609375, -7.41357421875, -6.8662109375, -6.31884765625, -5.771484375, -5.22412109375, -4.6767578125, -4.12939453125, -3.58203125, -3.03466796875, -2.4873046875, -1.93994140625, -1.392578125, -0.84521484375, -0.2978515625, 0.24951171875, 0.796875, 1.34423828125, 1.8916015625, 2.43896484375, 2.986328125, 3.53369140625, 4.0810546875, 4.62841796875, 5.17578125, 5.72314453125, 6.2705078125, 6.81787109375, 7.365234375, 7.91259765625, 8.4599609375, 9.00732421875, 9.5546875, 10.10205078125, 10.6494140625, 11.19677734375, 11.744140625, 12.29150390625, 12.8388671875, 13.38623046875, 13.93359375, 14.48095703125, 15.0283203125, 15.57568359375, 16.123046875, 16.67041015625, 17.2177734375, 17.76513671875, 18.3125]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 2.0, 4.0, 13.0, 14.0, 18.0, 14.0, 15.0, 22.0, 36.0, 30.0, 34.0, 40.0, 40.0, 49.0, 67.0, 63.0, 59.0, 68.0, 50.0, 44.0, 46.0, 45.0, 39.0, 35.0, 22.0, 22.0, 19.0, 20.0, 17.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.43359375, -5.23406982421875, -5.0345458984375, -4.83502197265625, -4.635498046875, -4.43597412109375, -4.2364501953125, -4.03692626953125, -3.83740234375, -3.63787841796875, -3.4383544921875, -3.23883056640625, -3.039306640625, -2.83978271484375, -2.6402587890625, -2.44073486328125, -2.2412109375, -2.04168701171875, -1.8421630859375, -1.64263916015625, -1.443115234375, -1.24359130859375, -1.0440673828125, -0.84454345703125, -0.64501953125, -0.44549560546875, -0.2459716796875, -0.04644775390625, 0.153076171875, 0.35260009765625, 0.5521240234375, 0.75164794921875, 0.951171875, 1.15069580078125, 1.3502197265625, 1.54974365234375, 1.749267578125, 1.94879150390625, 2.1483154296875, 2.34783935546875, 2.54736328125, 2.74688720703125, 2.9464111328125, 3.14593505859375, 3.345458984375, 3.54498291015625, 3.7445068359375, 3.94403076171875, 4.1435546875, 4.34307861328125, 4.5426025390625, 4.74212646484375, 4.941650390625, 5.14117431640625, 5.3406982421875, 5.54022216796875, 5.73974609375, 5.93927001953125, 6.1387939453125, 6.33831787109375, 6.537841796875, 6.73736572265625, 6.9368896484375, 7.13641357421875, 7.3359375]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 6.0, 4.0, 6.0, 9.0, 19.0, 20.0, 20.0, 20.0, 27.0, 35.0, 35.0, 30.0, 41.0, 41.0, 56.0, 46.0, 46.0, 41.0, 42.0, 54.0, 32.0, 49.0, 38.0, 32.0, 32.0, 30.0, 35.0, 23.0, 19.0, 20.0, 16.0, 16.0, 10.0, 15.0, 7.0, 7.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.89065933227539, -36.71190643310547, -35.53314971923828, -34.35439682006836, -33.17564010620117, -31.99688720703125, -30.818132400512695, -29.63937759399414, -28.460622787475586, -27.28186798095703, -26.103113174438477, -24.924358367919922, -23.74560546875, -22.566848754882812, -21.38809585571289, -20.209341049194336, -19.03058624267578, -17.851831436157227, -16.673076629638672, -15.494322776794434, -14.315567970275879, -13.136813163757324, -11.958059310913086, -10.779304504394531, -9.600549697875977, -8.421794891357422, -7.243040561676025, -6.064286231994629, -4.885531425476074, -3.7067766189575195, -2.528022289276123, -1.3492679595947266, -0.1705169677734375, 1.008237600326538, 2.1869921684265137, 3.3657467365264893, 4.544501304626465, 5.7232561111450195, 6.902010440826416, 8.080764770507812, 9.259519577026367, 10.438274383544922, 11.617029190063477, 12.795783042907715, 13.97453784942627, 15.153292655944824, 16.332046508789062, 17.510801315307617, 18.689556121826172, 19.868310928344727, 21.04706573486328, 22.225820541381836, 23.40457534790039, 24.583328247070312, 25.762083053588867, 26.940837860107422, 28.119592666625977, 29.29834747314453, 30.477102279663086, 31.65585708618164, 32.83460998535156, 34.01336669921875, 35.19211959838867, 36.370872497558594, 37.54962921142578]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 6.0, 12.0, 11.0, 17.0, 18.0, 22.0, 21.0, 25.0, 23.0, 22.0, 32.0, 26.0, 45.0, 31.0, 38.0, 37.0, 45.0, 37.0, 38.0, 32.0, 47.0, 33.0, 43.0, 47.0, 44.0, 19.0, 38.0, 29.0, 23.0, 29.0, 13.0, 13.0, 19.0, 12.0, 8.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.39418411254883, -34.238304138183594, -33.08242416381836, -31.926542282104492, -30.770662307739258, -29.614782333374023, -28.458900451660156, -27.303020477294922, -26.147140502929688, -24.991260528564453, -23.83538055419922, -22.67949867248535, -21.523618698120117, -20.367738723754883, -19.211856842041016, -18.05597686767578, -16.900096893310547, -15.744216918945312, -14.588335990905762, -13.432455062866211, -12.276575088500977, -11.120695114135742, -9.964814186096191, -8.80893325805664, -7.653053283691406, -6.497172832489014, -5.341292381286621, -4.1854119300842285, -3.029531478881836, -1.8736510276794434, -0.7177705764770508, 0.4381103515625, 1.5939903259277344, 2.749870777130127, 3.9057512283325195, 5.061631679534912, 6.217512130737305, 7.373392581939697, 8.52927303314209, 9.68515396118164, 10.841033935546875, 11.99691390991211, 13.15279483795166, 14.308675765991211, 15.464555740356445, 16.62043571472168, 17.776317596435547, 18.93219757080078, 20.088077545166016, 21.24395751953125, 22.399837493896484, 23.55571937561035, 24.711599349975586, 25.86747932434082, 27.023361206054688, 28.179241180419922, 29.335121154785156, 30.49100112915039, 31.646881103515625, 32.80276107788086, 33.958641052246094, 35.114524841308594, 36.27040481567383, 37.42628479003906, 38.5821647644043]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 10.0, 8.0, 23.0, 30.0, 47.0, 64.0, 112.0, 159.0, 230.0, 339.0, 543.0, 836.0, 1381.0, 2220.0, 3483.0, 5559.0, 9139.0, 15024.0, 25209.0, 41975.0, 71998.0, 125369.0, 219065.0, 375589.0, 600925.0, 779186.0, 717245.0, 494545.0, 296553.0, 170174.0, 97680.0, 56773.0, 32763.0, 19467.0, 11603.0, 7192.0, 4347.0, 2829.0, 1691.0, 1084.0, 662.0, 404.0, 258.0, 179.0, 107.0, 79.0, 53.0, 28.0, 25.0, 10.0, 8.0, 8.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.78125, -35.5859375, -34.390625, -33.1953125, -32.0, -30.8046875, -29.609375, -28.4140625, -27.21875, -26.0234375, -24.828125, -23.6328125, -22.4375, -21.2421875, -20.046875, -18.8515625, -17.65625, -16.4609375, -15.265625, -14.0703125, -12.875, -11.6796875, -10.484375, -9.2890625, -8.09375, -6.8984375, -5.703125, -4.5078125, -3.3125, -2.1171875, -0.921875, 0.2734375, 1.46875, 2.6640625, 3.859375, 5.0546875, 6.25, 7.4453125, 8.640625, 9.8359375, 11.03125, 12.2265625, 13.421875, 14.6171875, 15.8125, 17.0078125, 18.203125, 19.3984375, 20.59375, 21.7890625, 22.984375, 24.1796875, 25.375, 26.5703125, 27.765625, 28.9609375, 30.15625, 31.3515625, 32.546875, 33.7421875, 34.9375, 36.1328125, 37.328125, 38.5234375, 39.71875]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 8.0, 12.0, 14.0, 15.0, 15.0, 26.0, 23.0, 18.0, 29.0, 26.0, 24.0, 34.0, 27.0, 44.0, 33.0, 36.0, 37.0, 54.0, 35.0, 51.0, 34.0, 41.0, 32.0, 34.0, 40.0, 37.0, 37.0, 24.0, 19.0, 21.0, 20.0, 11.0, 12.0, 10.0, 15.0, 6.0, 7.0, 6.0, 8.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.734375, -26.890869140625, -26.04736328125, -25.203857421875, -24.3603515625, -23.516845703125, -22.67333984375, -21.829833984375, -20.986328125, -20.142822265625, -19.29931640625, -18.455810546875, -17.6123046875, -16.768798828125, -15.92529296875, -15.081787109375, -14.23828125, -13.394775390625, -12.55126953125, -11.707763671875, -10.8642578125, -10.020751953125, -9.17724609375, -8.333740234375, -7.490234375, -6.646728515625, -5.80322265625, -4.959716796875, -4.1162109375, -3.272705078125, -2.42919921875, -1.585693359375, -0.7421875, 0.101318359375, 0.94482421875, 1.788330078125, 2.6318359375, 3.475341796875, 4.31884765625, 5.162353515625, 6.005859375, 6.849365234375, 7.69287109375, 8.536376953125, 9.3798828125, 10.223388671875, 11.06689453125, 11.910400390625, 12.75390625, 13.597412109375, 14.44091796875, 15.284423828125, 16.1279296875, 16.971435546875, 17.81494140625, 18.658447265625, 19.501953125, 20.345458984375, 21.18896484375, 22.032470703125, 22.8759765625, 23.719482421875, 24.56298828125, 25.406494140625, 26.25]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 10.0, 13.0, 19.0, 31.0, 32.0, 55.0, 83.0, 124.0, 177.0, 304.0, 412.0, 688.0, 1089.0, 1729.0, 2978.0, 4860.0, 8044.0, 14085.0, 25128.0, 44196.0, 80050.0, 142981.0, 250810.0, 414594.0, 619745.0, 754549.0, 673734.0, 474232.0, 293210.0, 168406.0, 94935.0, 52492.0, 29487.0, 16936.0, 9413.0, 5707.0, 3423.0, 1978.0, 1264.0, 795.0, 520.0, 297.0, 217.0, 144.0, 94.0, 69.0, 51.0, 31.0, 23.0, 18.0, 9.0, 5.0, 4.0, 6.0, 1.0, 2.0, 2.0], "bins": [-35.5, -34.41259765625, -33.3251953125, -32.23779296875, -31.150390625, -30.06298828125, -28.9755859375, -27.88818359375, -26.80078125, -25.71337890625, -24.6259765625, -23.53857421875, -22.451171875, -21.36376953125, -20.2763671875, -19.18896484375, -18.1015625, -17.01416015625, -15.9267578125, -14.83935546875, -13.751953125, -12.66455078125, -11.5771484375, -10.48974609375, -9.40234375, -8.31494140625, -7.2275390625, -6.14013671875, -5.052734375, -3.96533203125, -2.8779296875, -1.79052734375, -0.703125, 0.38427734375, 1.4716796875, 2.55908203125, 3.646484375, 4.73388671875, 5.8212890625, 6.90869140625, 7.99609375, 9.08349609375, 10.1708984375, 11.25830078125, 12.345703125, 13.43310546875, 14.5205078125, 15.60791015625, 16.6953125, 17.78271484375, 18.8701171875, 19.95751953125, 21.044921875, 22.13232421875, 23.2197265625, 24.30712890625, 25.39453125, 26.48193359375, 27.5693359375, 28.65673828125, 29.744140625, 30.83154296875, 31.9189453125, 33.00634765625, 34.09375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 11.0, 8.0, 13.0, 8.0, 15.0, 20.0, 24.0, 50.0, 55.0, 72.0, 69.0, 93.0, 109.0, 163.0, 175.0, 203.0, 229.0, 257.0, 285.0, 261.0, 256.0, 261.0, 222.0, 224.0, 199.0, 165.0, 126.0, 100.0, 93.0, 76.0, 62.0, 45.0, 36.0, 25.0, 18.0, 12.0, 8.0, 10.0, 5.0, 0.0, 6.0, 3.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-16.359375, -15.899169921875, -15.43896484375, -14.978759765625, -14.5185546875, -14.058349609375, -13.59814453125, -13.137939453125, -12.677734375, -12.217529296875, -11.75732421875, -11.297119140625, -10.8369140625, -10.376708984375, -9.91650390625, -9.456298828125, -8.99609375, -8.535888671875, -8.07568359375, -7.615478515625, -7.1552734375, -6.695068359375, -6.23486328125, -5.774658203125, -5.314453125, -4.854248046875, -4.39404296875, -3.933837890625, -3.4736328125, -3.013427734375, -2.55322265625, -2.093017578125, -1.6328125, -1.172607421875, -0.71240234375, -0.252197265625, 0.2080078125, 0.668212890625, 1.12841796875, 1.588623046875, 2.048828125, 2.509033203125, 2.96923828125, 3.429443359375, 3.8896484375, 4.349853515625, 4.81005859375, 5.270263671875, 5.73046875, 6.190673828125, 6.65087890625, 7.111083984375, 7.5712890625, 8.031494140625, 8.49169921875, 8.951904296875, 9.412109375, 9.872314453125, 10.33251953125, 10.792724609375, 11.2529296875, 11.713134765625, 12.17333984375, 12.633544921875, 13.09375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 9.0, 15.0, 15.0, 17.0, 17.0, 24.0, 32.0, 30.0, 23.0, 34.0, 28.0, 38.0, 50.0, 47.0, 54.0, 33.0, 60.0, 47.0, 50.0, 44.0, 36.0, 38.0, 35.0, 24.0, 25.0, 26.0, 28.0, 12.0, 21.0, 9.0, 11.0, 12.0, 8.0, 8.0, 6.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-32.47420883178711, -31.481689453125, -30.489171981811523, -29.496652603149414, -28.504133224487305, -27.511615753173828, -26.51909637451172, -25.52657699584961, -24.5340576171875, -23.54153823852539, -22.549020767211914, -21.556501388549805, -20.563982009887695, -19.57146453857422, -18.57894515991211, -17.58642578125, -16.593908309936523, -15.60138988494873, -14.608870506286621, -13.616352081298828, -12.623832702636719, -11.631314277648926, -10.638795852661133, -9.646276473999023, -8.65375804901123, -7.661239147186279, -6.668720245361328, -5.676201820373535, -4.683682918548584, -3.691164016723633, -2.69864559173584, -1.7061266899108887, -0.7136077880859375, 0.2789109945297241, 1.2714297771453857, 2.263948440551758, 3.256467342376709, 4.24898624420166, 5.241504669189453, 6.234023571014404, 7.2265424728393555, 8.219060897827148, 9.211580276489258, 10.20409870147705, 11.196617126464844, 12.189136505126953, 13.181654930114746, 14.174173355102539, 15.166692733764648, 16.159212112426758, 17.151729583740234, 18.144248962402344, 19.136768341064453, 20.129287719726562, 21.12180519104004, 22.11432456970215, 23.106842041015625, 24.099361419677734, 25.09187889099121, 26.08439826965332, 27.07691764831543, 28.069435119628906, 29.061954498291016, 30.054473876953125, 31.046993255615234]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 9.0, 6.0, 9.0, 16.0, 24.0, 17.0, 12.0, 20.0, 18.0, 26.0, 20.0, 36.0, 34.0, 41.0, 37.0, 29.0, 46.0, 50.0, 41.0, 41.0, 47.0, 42.0, 36.0, 28.0, 40.0, 45.0, 37.0, 22.0, 25.0, 25.0, 21.0, 15.0, 20.0, 14.0, 11.0, 6.0, 9.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-35.72895050048828, -34.707271575927734, -33.68559265136719, -32.66391372680664, -31.64223289489746, -30.620553970336914, -29.598873138427734, -28.577194213867188, -27.55551528930664, -26.533836364746094, -25.512157440185547, -24.490476608276367, -23.46879768371582, -22.447118759155273, -21.425437927246094, -20.403759002685547, -19.382080078125, -18.360401153564453, -17.338722229003906, -16.317041397094727, -15.29536247253418, -14.273683547973633, -13.25200366973877, -12.230323791503906, -11.20864486694336, -10.186965942382812, -9.16528606414795, -8.143606185913086, -7.121927261352539, -6.100247859954834, -5.078568458557129, -4.056889057159424, -3.035207748413086, -2.013528347015381, -0.9918489456176758, 0.029830455780029297, 1.0515098571777344, 2.0731892585754395, 3.0948686599731445, 4.11654806137085, 5.138227462768555, 6.15990686416626, 7.181586265563965, 8.203266143798828, 9.224945068359375, 10.246623992919922, 11.268303871154785, 12.289983749389648, 13.311662673950195, 14.333341598510742, 15.355021476745605, 16.37670135498047, 17.398380279541016, 18.420059204101562, 19.44173812866211, 20.46341896057129, 21.485097885131836, 22.506776809692383, 23.528457641601562, 24.55013656616211, 25.571815490722656, 26.593494415283203, 27.61517333984375, 28.63685417175293, 29.658533096313477]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 9.0, 12.0, 15.0, 25.0, 28.0, 56.0, 75.0, 116.0, 182.0, 282.0, 423.0, 607.0, 944.0, 1441.0, 2083.0, 3301.0, 4944.0, 7235.0, 10689.0, 15480.0, 21761.0, 30805.0, 41569.0, 54927.0, 69506.0, 83273.0, 94838.0, 102586.0, 100023.0, 91254.0, 76943.0, 62543.0, 48480.0, 36175.0, 26959.0, 18990.0, 13046.0, 8974.0, 6080.0, 4023.0, 2717.0, 1760.0, 1140.0, 763.0, 525.0, 345.0, 212.0, 124.0, 95.0, 64.0, 43.0, 23.0, 19.0, 13.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.8203125, -15.3062744140625, -14.792236328125, -14.2781982421875, -13.76416015625, -13.2501220703125, -12.736083984375, -12.2220458984375, -11.7080078125, -11.1939697265625, -10.679931640625, -10.1658935546875, -9.65185546875, -9.1378173828125, -8.623779296875, -8.1097412109375, -7.595703125, -7.0816650390625, -6.567626953125, -6.0535888671875, -5.53955078125, -5.0255126953125, -4.511474609375, -3.9974365234375, -3.4833984375, -2.9693603515625, -2.455322265625, -1.9412841796875, -1.42724609375, -0.9132080078125, -0.399169921875, 0.1148681640625, 0.62890625, 1.1429443359375, 1.656982421875, 2.1710205078125, 2.68505859375, 3.1990966796875, 3.713134765625, 4.2271728515625, 4.7412109375, 5.2552490234375, 5.769287109375, 6.2833251953125, 6.79736328125, 7.3114013671875, 7.825439453125, 8.3394775390625, 8.853515625, 9.3675537109375, 9.881591796875, 10.3956298828125, 10.90966796875, 11.4237060546875, 11.937744140625, 12.4517822265625, 12.9658203125, 13.4798583984375, 13.993896484375, 14.5079345703125, 15.02197265625, 15.5360107421875, 16.050048828125, 16.5640869140625, 17.078125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 5.0, 4.0, 1.0, 3.0, 8.0, 6.0, 7.0, 15.0, 9.0, 11.0, 18.0, 19.0, 23.0, 27.0, 19.0, 28.0, 29.0, 24.0, 45.0, 35.0, 39.0, 46.0, 34.0, 47.0, 44.0, 45.0, 38.0, 38.0, 38.0, 41.0, 37.0, 32.0, 30.0, 23.0, 27.0, 23.0, 16.0, 11.0, 14.0, 13.0, 7.0, 10.0, 5.0, 4.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.171875, -28.310791015625, -27.44970703125, -26.588623046875, -25.7275390625, -24.866455078125, -24.00537109375, -23.144287109375, -22.283203125, -21.422119140625, -20.56103515625, -19.699951171875, -18.8388671875, -17.977783203125, -17.11669921875, -16.255615234375, -15.39453125, -14.533447265625, -13.67236328125, -12.811279296875, -11.9501953125, -11.089111328125, -10.22802734375, -9.366943359375, -8.505859375, -7.644775390625, -6.78369140625, -5.922607421875, -5.0615234375, -4.200439453125, -3.33935546875, -2.478271484375, -1.6171875, -0.756103515625, 0.10498046875, 0.966064453125, 1.8271484375, 2.688232421875, 3.54931640625, 4.410400390625, 5.271484375, 6.132568359375, 6.99365234375, 7.854736328125, 8.7158203125, 9.576904296875, 10.43798828125, 11.299072265625, 12.16015625, 13.021240234375, 13.88232421875, 14.743408203125, 15.6044921875, 16.465576171875, 17.32666015625, 18.187744140625, 19.048828125, 19.909912109375, 20.77099609375, 21.632080078125, 22.4931640625, 23.354248046875, 24.21533203125, 25.076416015625, 25.9375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 7.0, 10.0, 12.0, 14.0, 28.0, 44.0, 62.0, 111.0, 176.0, 227.0, 418.0, 671.0, 1065.0, 1799.0, 2831.0, 4547.0, 7684.0, 13817.0, 27386.0, 322946.0, 599362.0, 29994.0, 14704.0, 7976.0, 4857.0, 2893.0, 1842.0, 1126.0, 682.0, 471.0, 281.0, 175.0, 110.0, 83.0, 42.0, 35.0, 18.0, 17.0, 13.0, 5.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-91.125, -88.59765625, -86.0703125, -83.54296875, -81.015625, -78.48828125, -75.9609375, -73.43359375, -70.90625, -68.37890625, -65.8515625, -63.32421875, -60.796875, -58.26953125, -55.7421875, -53.21484375, -50.6875, -48.16015625, -45.6328125, -43.10546875, -40.578125, -38.05078125, -35.5234375, -32.99609375, -30.46875, -27.94140625, -25.4140625, -22.88671875, -20.359375, -17.83203125, -15.3046875, -12.77734375, -10.25, -7.72265625, -5.1953125, -2.66796875, -0.140625, 2.38671875, 4.9140625, 7.44140625, 9.96875, 12.49609375, 15.0234375, 17.55078125, 20.078125, 22.60546875, 25.1328125, 27.66015625, 30.1875, 32.71484375, 35.2421875, 37.76953125, 40.296875, 42.82421875, 45.3515625, 47.87890625, 50.40625, 52.93359375, 55.4609375, 57.98828125, 60.515625, 63.04296875, 65.5703125, 68.09765625, 70.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 4.0, 4.0, 17.0, 9.0, 11.0, 18.0, 19.0, 23.0, 28.0, 31.0, 34.0, 37.0, 30.0, 39.0, 36.0, 41.0, 36.0, 40.0, 47.0, 41.0, 45.0, 57.0, 39.0, 36.0, 36.0, 18.0, 43.0, 29.0, 23.0, 17.0, 19.0, 15.0, 9.0, 13.0, 11.0, 6.0, 11.0, 8.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-34.625, -33.43603515625, -32.2470703125, -31.05810546875, -29.869140625, -28.68017578125, -27.4912109375, -26.30224609375, -25.11328125, -23.92431640625, -22.7353515625, -21.54638671875, -20.357421875, -19.16845703125, -17.9794921875, -16.79052734375, -15.6015625, -14.41259765625, -13.2236328125, -12.03466796875, -10.845703125, -9.65673828125, -8.4677734375, -7.27880859375, -6.08984375, -4.90087890625, -3.7119140625, -2.52294921875, -1.333984375, -0.14501953125, 1.0439453125, 2.23291015625, 3.421875, 4.61083984375, 5.7998046875, 6.98876953125, 8.177734375, 9.36669921875, 10.5556640625, 11.74462890625, 12.93359375, 14.12255859375, 15.3115234375, 16.50048828125, 17.689453125, 18.87841796875, 20.0673828125, 21.25634765625, 22.4453125, 23.63427734375, 24.8232421875, 26.01220703125, 27.201171875, 28.39013671875, 29.5791015625, 30.76806640625, 31.95703125, 33.14599609375, 34.3349609375, 35.52392578125, 36.712890625, 37.90185546875, 39.0908203125, 40.27978515625, 41.46875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 6.0, 12.0, 8.0, 16.0, 19.0, 22.0, 21.0, 21.0, 31.0, 58.0, 51.0, 70.0, 117.0, 151.0, 150.0, 225.0, 291.0, 385.0, 592.0, 884.0, 1344.0, 2231.0, 3771.0, 7365.0, 17219.0, 64577.0, 865522.0, 51121.0, 15374.0, 6947.0, 3561.0, 2037.0, 1261.0, 857.0, 550.0, 411.0, 328.0, 222.0, 175.0, 109.0, 97.0, 76.0, 68.0, 48.0, 33.0, 16.0, 18.0, 25.0, 12.0, 17.0, 10.0, 9.0, 2.0, 8.0, 6.0, 3.0, 0.0, 2.0], "bins": [-43.53125, -42.189453125, -40.84765625, -39.505859375, -38.1640625, -36.822265625, -35.48046875, -34.138671875, -32.796875, -31.455078125, -30.11328125, -28.771484375, -27.4296875, -26.087890625, -24.74609375, -23.404296875, -22.0625, -20.720703125, -19.37890625, -18.037109375, -16.6953125, -15.353515625, -14.01171875, -12.669921875, -11.328125, -9.986328125, -8.64453125, -7.302734375, -5.9609375, -4.619140625, -3.27734375, -1.935546875, -0.59375, 0.748046875, 2.08984375, 3.431640625, 4.7734375, 6.115234375, 7.45703125, 8.798828125, 10.140625, 11.482421875, 12.82421875, 14.166015625, 15.5078125, 16.849609375, 18.19140625, 19.533203125, 20.875, 22.216796875, 23.55859375, 24.900390625, 26.2421875, 27.583984375, 28.92578125, 30.267578125, 31.609375, 32.951171875, 34.29296875, 35.634765625, 36.9765625, 38.318359375, 39.66015625, 41.001953125, 42.34375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 12.0, 9.0, 20.0, 21.0, 23.0, 52.0, 61.0, 79.0, 82.0, 174.0, 126.0, 74.0, 74.0, 59.0, 27.0, 22.0, 25.0, 10.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0105743408203125, -0.010204792022705078, -0.009835243225097656, -0.009465694427490234, -0.009096145629882812, -0.00872659683227539, -0.008357048034667969, -0.007987499237060547, -0.007617950439453125, -0.007248401641845703, -0.006878852844238281, -0.006509304046630859, -0.0061397552490234375, -0.005770206451416016, -0.005400657653808594, -0.005031108856201172, -0.00466156005859375, -0.004292011260986328, -0.003922462463378906, -0.0035529136657714844, -0.0031833648681640625, -0.0028138160705566406, -0.0024442672729492188, -0.002074718475341797, -0.001705169677734375, -0.0013356208801269531, -0.0009660720825195312, -0.0005965232849121094, -0.0002269744873046875, 0.00014257431030273438, 0.0005121231079101562, 0.0008816719055175781, 0.001251220703125, 0.0016207695007324219, 0.0019903182983398438, 0.0023598670959472656, 0.0027294158935546875, 0.0030989646911621094, 0.0034685134887695312, 0.003838062286376953, 0.004207611083984375, 0.004577159881591797, 0.004946708679199219, 0.005316257476806641, 0.0056858062744140625, 0.006055355072021484, 0.006424903869628906, 0.006794452667236328, 0.00716400146484375, 0.007533550262451172, 0.007903099060058594, 0.008272647857666016, 0.008642196655273438, 0.00901174545288086, 0.009381294250488281, 0.009750843048095703, 0.010120391845703125, 0.010489940643310547, 0.010859489440917969, 0.01122903823852539, 0.011598587036132812, 0.011968135833740234, 0.012337684631347656, 0.012707233428955078, 0.0130767822265625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 11.0, 11.0, 16.0, 28.0, 28.0, 38.0, 44.0, 75.0, 124.0, 155.0, 213.0, 307.0, 458.0, 651.0, 1014.0, 1686.0, 2826.0, 5117.0, 10186.0, 22524.0, 56883.0, 165838.0, 391499.0, 245944.0, 82663.0, 30979.0, 13417.0, 6446.0, 3537.0, 2089.0, 1238.0, 777.0, 543.0, 349.0, 262.0, 178.0, 117.0, 91.0, 51.0, 33.0, 32.0, 23.0, 19.0, 14.0, 7.0, 9.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3125, -10.9554443359375, -10.598388671875, -10.2413330078125, -9.88427734375, -9.5272216796875, -9.170166015625, -8.8131103515625, -8.4560546875, -8.0989990234375, -7.741943359375, -7.3848876953125, -7.02783203125, -6.6707763671875, -6.313720703125, -5.9566650390625, -5.599609375, -5.2425537109375, -4.885498046875, -4.5284423828125, -4.17138671875, -3.8143310546875, -3.457275390625, -3.1002197265625, -2.7431640625, -2.3861083984375, -2.029052734375, -1.6719970703125, -1.31494140625, -0.9578857421875, -0.600830078125, -0.2437744140625, 0.11328125, 0.4703369140625, 0.827392578125, 1.1844482421875, 1.54150390625, 1.8985595703125, 2.255615234375, 2.6126708984375, 2.9697265625, 3.3267822265625, 3.683837890625, 4.0408935546875, 4.39794921875, 4.7550048828125, 5.112060546875, 5.4691162109375, 5.826171875, 6.1832275390625, 6.540283203125, 6.8973388671875, 7.25439453125, 7.6114501953125, 7.968505859375, 8.3255615234375, 8.6826171875, 9.0396728515625, 9.396728515625, 9.7537841796875, 10.11083984375, 10.4678955078125, 10.824951171875, 11.1820068359375, 11.5390625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 6.0, 7.0, 2.0, 11.0, 10.0, 7.0, 14.0, 23.0, 24.0, 20.0, 35.0, 54.0, 66.0, 61.0, 73.0, 91.0, 84.0, 87.0, 72.0, 53.0, 46.0, 31.0, 22.0, 21.0, 21.0, 15.0, 12.0, 8.0, 9.0, 5.0, 4.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9140625, -2.81317138671875, -2.7122802734375, -2.61138916015625, -2.510498046875, -2.40960693359375, -2.3087158203125, -2.20782470703125, -2.10693359375, -2.00604248046875, -1.9051513671875, -1.80426025390625, -1.703369140625, -1.60247802734375, -1.5015869140625, -1.40069580078125, -1.2998046875, -1.19891357421875, -1.0980224609375, -0.99713134765625, -0.896240234375, -0.79534912109375, -0.6944580078125, -0.59356689453125, -0.49267578125, -0.39178466796875, -0.2908935546875, -0.19000244140625, -0.089111328125, 0.01177978515625, 0.1126708984375, 0.21356201171875, 0.314453125, 0.41534423828125, 0.5162353515625, 0.61712646484375, 0.718017578125, 0.81890869140625, 0.9197998046875, 1.02069091796875, 1.12158203125, 1.22247314453125, 1.3233642578125, 1.42425537109375, 1.525146484375, 1.62603759765625, 1.7269287109375, 1.82781982421875, 1.9287109375, 2.02960205078125, 2.1304931640625, 2.23138427734375, 2.332275390625, 2.43316650390625, 2.5340576171875, 2.63494873046875, 2.73583984375, 2.83673095703125, 2.9376220703125, 3.03851318359375, 3.139404296875, 3.24029541015625, 3.3411865234375, 3.44207763671875, 3.54296875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 9.0, 13.0, 8.0, 13.0, 9.0, 12.0, 19.0, 22.0, 32.0, 41.0, 60.0, 42.0, 49.0, 60.0, 54.0, 68.0, 65.0, 58.0, 49.0, 52.0, 48.0, 42.0, 32.0, 26.0, 32.0, 20.0, 15.0, 11.0, 11.0, 11.0, 7.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.658294677734375, -34.57943344116211, -33.500572204589844, -32.42171096801758, -31.342851638793945, -30.26399040222168, -29.185131072998047, -28.10626983642578, -27.027408599853516, -25.94854736328125, -24.869686126708984, -23.79082679748535, -22.711965560913086, -21.63310432434082, -20.554244995117188, -19.475383758544922, -18.396522521972656, -17.31766128540039, -16.238800048828125, -15.159940719604492, -14.081079483032227, -13.002218246459961, -11.923357963562012, -10.844497680664062, -9.765636444091797, -8.686775207519531, -7.607914924621582, -6.529054164886475, -5.450193405151367, -4.37133264541626, -3.2924718856811523, -2.213611125946045, -1.1347465515136719, -0.05588579177856445, 1.022974967956543, 2.1018357276916504, 3.180696487426758, 4.259557247161865, 5.338418006896973, 6.41727876663208, 7.4961395263671875, 8.575000762939453, 9.653861045837402, 10.732721328735352, 11.811582565307617, 12.890443801879883, 13.969304084777832, 15.048164367675781, 16.127025604248047, 17.205886840820312, 18.284748077392578, 19.36360740661621, 20.442468643188477, 21.521329879760742, 22.600189208984375, 23.67905044555664, 24.757911682128906, 25.836772918701172, 26.915634155273438, 27.99449348449707, 29.073354721069336, 30.1522159576416, 31.231075286865234, 32.3099365234375, 33.388797760009766]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 8.0, 6.0, 16.0, 10.0, 18.0, 17.0, 17.0, 19.0, 20.0, 31.0, 25.0, 38.0, 31.0, 35.0, 37.0, 41.0, 33.0, 43.0, 47.0, 38.0, 53.0, 47.0, 38.0, 43.0, 40.0, 28.0, 26.0, 28.0, 31.0, 19.0, 18.0, 24.0, 10.0, 14.0, 7.0, 7.0, 5.0, 3.0, 8.0, 4.0, 4.0, 1.0, 2.0, 5.0, 0.0, 3.0], "bins": [-34.17149353027344, -33.2392692565918, -32.307044982910156, -31.37482261657715, -30.44260025024414, -29.5103759765625, -28.57815170288086, -27.64592742919922, -26.71370506286621, -25.78148078918457, -24.849258422851562, -23.917034149169922, -22.98480987548828, -22.052587509155273, -21.120363235473633, -20.188140869140625, -19.255916595458984, -18.323692321777344, -17.391469955444336, -16.459245681762695, -15.527022361755371, -14.594799041748047, -13.662574768066406, -12.730351448059082, -11.798128128051758, -10.865904808044434, -9.93368148803711, -9.001457214355469, -8.069233894348145, -7.13701057434082, -6.204786777496338, -5.2725629806518555, -4.340339660644531, -3.408116102218628, -2.4758925437927246, -1.5436689853668213, -0.611445426940918, 0.32077789306640625, 1.2530016899108887, 2.185225486755371, 3.1174488067626953, 4.0496721267700195, 4.981895923614502, 5.914119720458984, 6.846343040466309, 7.778566360473633, 8.710790634155273, 9.643013954162598, 10.575237274169922, 11.507460594177246, 12.43968391418457, 13.371908187866211, 14.304131507873535, 15.23635482788086, 16.1685791015625, 17.10080337524414, 18.03302574157715, 18.96525001525879, 19.897472381591797, 20.829696655273438, 21.761920928955078, 22.694143295288086, 23.626367568969727, 24.558589935302734, 25.490814208984375]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 10.0, 5.0, 20.0, 20.0, 46.0, 39.0, 93.0, 130.0, 195.0, 334.0, 483.0, 756.0, 1132.0, 1703.0, 2723.0, 4384.0, 6541.0, 10367.0, 15705.0, 24494.0, 39427.0, 59802.0, 87510.0, 121709.0, 146453.0, 146741.0, 121627.0, 88275.0, 59575.0, 38773.0, 24859.0, 15831.0, 10215.0, 6678.0, 4147.0, 2690.0, 1790.0, 1138.0, 752.0, 497.0, 321.0, 202.0, 117.0, 84.0, 55.0, 45.0, 19.0, 20.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-25.515625, -24.71826171875, -23.9208984375, -23.12353515625, -22.326171875, -21.52880859375, -20.7314453125, -19.93408203125, -19.13671875, -18.33935546875, -17.5419921875, -16.74462890625, -15.947265625, -15.14990234375, -14.3525390625, -13.55517578125, -12.7578125, -11.96044921875, -11.1630859375, -10.36572265625, -9.568359375, -8.77099609375, -7.9736328125, -7.17626953125, -6.37890625, -5.58154296875, -4.7841796875, -3.98681640625, -3.189453125, -2.39208984375, -1.5947265625, -0.79736328125, 0.0, 0.79736328125, 1.5947265625, 2.39208984375, 3.189453125, 3.98681640625, 4.7841796875, 5.58154296875, 6.37890625, 7.17626953125, 7.9736328125, 8.77099609375, 9.568359375, 10.36572265625, 11.1630859375, 11.96044921875, 12.7578125, 13.55517578125, 14.3525390625, 15.14990234375, 15.947265625, 16.74462890625, 17.5419921875, 18.33935546875, 19.13671875, 19.93408203125, 20.7314453125, 21.52880859375, 22.326171875, 23.12353515625, 23.9208984375, 24.71826171875, 25.515625]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 5.0, 3.0, 11.0, 13.0, 12.0, 12.0, 16.0, 26.0, 24.0, 18.0, 26.0, 33.0, 31.0, 28.0, 31.0, 28.0, 46.0, 50.0, 37.0, 48.0, 44.0, 38.0, 41.0, 47.0, 37.0, 29.0, 38.0, 41.0, 28.0, 25.0, 23.0, 18.0, 21.0, 14.0, 12.0, 12.0, 9.0, 5.0, 5.0, 2.0, 4.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-29.46875, -28.650146484375, -27.83154296875, -27.012939453125, -26.1943359375, -25.375732421875, -24.55712890625, -23.738525390625, -22.919921875, -22.101318359375, -21.28271484375, -20.464111328125, -19.6455078125, -18.826904296875, -18.00830078125, -17.189697265625, -16.37109375, -15.552490234375, -14.73388671875, -13.915283203125, -13.0966796875, -12.278076171875, -11.45947265625, -10.640869140625, -9.822265625, -9.003662109375, -8.18505859375, -7.366455078125, -6.5478515625, -5.729248046875, -4.91064453125, -4.092041015625, -3.2734375, -2.454833984375, -1.63623046875, -0.817626953125, 0.0009765625, 0.819580078125, 1.63818359375, 2.456787109375, 3.275390625, 4.093994140625, 4.91259765625, 5.731201171875, 6.5498046875, 7.368408203125, 8.18701171875, 9.005615234375, 9.82421875, 10.642822265625, 11.46142578125, 12.280029296875, 13.0986328125, 13.917236328125, 14.73583984375, 15.554443359375, 16.373046875, 17.191650390625, 18.01025390625, 18.828857421875, 19.6474609375, 20.466064453125, 21.28466796875, 22.103271484375, 22.921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 8.0, 5.0, 5.0, 14.0, 16.0, 23.0, 32.0, 75.0, 86.0, 140.0, 251.0, 355.0, 599.0, 994.0, 1504.0, 2494.0, 4427.0, 7434.0, 12360.0, 21647.0, 38624.0, 67165.0, 112576.0, 165476.0, 188997.0, 161706.0, 108966.0, 64824.0, 37165.0, 20989.0, 11969.0, 6821.0, 4206.0, 2588.0, 1526.0, 908.0, 570.0, 360.0, 249.0, 151.0, 83.0, 67.0, 31.0, 26.0, 13.0, 12.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-35.09375, -34.104248046875, -33.11474609375, -32.125244140625, -31.1357421875, -30.146240234375, -29.15673828125, -28.167236328125, -27.177734375, -26.188232421875, -25.19873046875, -24.209228515625, -23.2197265625, -22.230224609375, -21.24072265625, -20.251220703125, -19.26171875, -18.272216796875, -17.28271484375, -16.293212890625, -15.3037109375, -14.314208984375, -13.32470703125, -12.335205078125, -11.345703125, -10.356201171875, -9.36669921875, -8.377197265625, -7.3876953125, -6.398193359375, -5.40869140625, -4.419189453125, -3.4296875, -2.440185546875, -1.45068359375, -0.461181640625, 0.5283203125, 1.517822265625, 2.50732421875, 3.496826171875, 4.486328125, 5.475830078125, 6.46533203125, 7.454833984375, 8.4443359375, 9.433837890625, 10.42333984375, 11.412841796875, 12.40234375, 13.391845703125, 14.38134765625, 15.370849609375, 16.3603515625, 17.349853515625, 18.33935546875, 19.328857421875, 20.318359375, 21.307861328125, 22.29736328125, 23.286865234375, 24.2763671875, 25.265869140625, 26.25537109375, 27.244873046875, 28.234375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 5.0, 6.0, 10.0, 8.0, 17.0, 18.0, 16.0, 21.0, 27.0, 21.0, 27.0, 44.0, 41.0, 47.0, 38.0, 38.0, 41.0, 53.0, 46.0, 42.0, 45.0, 53.0, 45.0, 41.0, 46.0, 25.0, 28.0, 26.0, 23.0, 12.0, 22.0, 11.0, 10.0, 10.0, 12.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.296875, -19.651123046875, -19.00537109375, -18.359619140625, -17.7138671875, -17.068115234375, -16.42236328125, -15.776611328125, -15.130859375, -14.485107421875, -13.83935546875, -13.193603515625, -12.5478515625, -11.902099609375, -11.25634765625, -10.610595703125, -9.96484375, -9.319091796875, -8.67333984375, -8.027587890625, -7.3818359375, -6.736083984375, -6.09033203125, -5.444580078125, -4.798828125, -4.153076171875, -3.50732421875, -2.861572265625, -2.2158203125, -1.570068359375, -0.92431640625, -0.278564453125, 0.3671875, 1.012939453125, 1.65869140625, 2.304443359375, 2.9501953125, 3.595947265625, 4.24169921875, 4.887451171875, 5.533203125, 6.178955078125, 6.82470703125, 7.470458984375, 8.1162109375, 8.761962890625, 9.40771484375, 10.053466796875, 10.69921875, 11.344970703125, 11.99072265625, 12.636474609375, 13.2822265625, 13.927978515625, 14.57373046875, 15.219482421875, 15.865234375, 16.510986328125, 17.15673828125, 17.802490234375, 18.4482421875, 19.093994140625, 19.73974609375, 20.385498046875, 21.03125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 11.0, 20.0, 29.0, 42.0, 71.0, 95.0, 152.0, 206.0, 323.0, 499.0, 749.0, 1143.0, 1954.0, 3267.0, 5683.0, 10393.0, 20067.0, 41494.0, 89711.0, 190349.0, 288821.0, 204212.0, 96559.0, 44986.0, 21580.0, 11024.0, 6075.0, 3368.0, 2063.0, 1273.0, 772.0, 523.0, 338.0, 241.0, 144.0, 87.0, 77.0, 45.0, 34.0, 20.0, 15.0, 7.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-25.203125, -24.378173828125, -23.55322265625, -22.728271484375, -21.9033203125, -21.078369140625, -20.25341796875, -19.428466796875, -18.603515625, -17.778564453125, -16.95361328125, -16.128662109375, -15.3037109375, -14.478759765625, -13.65380859375, -12.828857421875, -12.00390625, -11.178955078125, -10.35400390625, -9.529052734375, -8.7041015625, -7.879150390625, -7.05419921875, -6.229248046875, -5.404296875, -4.579345703125, -3.75439453125, -2.929443359375, -2.1044921875, -1.279541015625, -0.45458984375, 0.370361328125, 1.1953125, 2.020263671875, 2.84521484375, 3.670166015625, 4.4951171875, 5.320068359375, 6.14501953125, 6.969970703125, 7.794921875, 8.619873046875, 9.44482421875, 10.269775390625, 11.0947265625, 11.919677734375, 12.74462890625, 13.569580078125, 14.39453125, 15.219482421875, 16.04443359375, 16.869384765625, 17.6943359375, 18.519287109375, 19.34423828125, 20.169189453125, 20.994140625, 21.819091796875, 22.64404296875, 23.468994140625, 24.2939453125, 25.118896484375, 25.94384765625, 26.768798828125, 27.59375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 4.0, 12.0, 8.0, 24.0, 33.0, 57.0, 76.0, 109.0, 125.0, 134.0, 120.0, 89.0, 58.0, 44.0, 30.0, 22.0, 16.0, 11.0, 8.0, 5.0, 1.0, 5.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002590179443359375, -0.0024836063385009766, -0.002377033233642578, -0.0022704601287841797, -0.0021638870239257812, -0.002057313919067383, -0.0019507408142089844, -0.001844167709350586, -0.0017375946044921875, -0.001631021499633789, -0.0015244483947753906, -0.0014178752899169922, -0.0013113021850585938, -0.0012047290802001953, -0.0010981559753417969, -0.0009915828704833984, -0.000885009765625, -0.0007784366607666016, -0.0006718635559082031, -0.0005652904510498047, -0.00045871734619140625, -0.0003521442413330078, -0.0002455711364746094, -0.00013899803161621094, -3.24249267578125e-05, 7.414817810058594e-05, 0.00018072128295898438, 0.0002872943878173828, 0.00039386749267578125, 0.0005004405975341797, 0.0006070137023925781, 0.0007135868072509766, 0.000820159912109375, 0.0009267330169677734, 0.0010333061218261719, 0.0011398792266845703, 0.0012464523315429688, 0.0013530254364013672, 0.0014595985412597656, 0.001566171646118164, 0.0016727447509765625, 0.001779317855834961, 0.0018858909606933594, 0.001992464065551758, 0.0020990371704101562, 0.0022056102752685547, 0.002312183380126953, 0.0024187564849853516, 0.00252532958984375, 0.0026319026947021484, 0.002738475799560547, 0.0028450489044189453, 0.0029516220092773438, 0.003058195114135742, 0.0031647682189941406, 0.003271341323852539, 0.0033779144287109375, 0.003484487533569336, 0.0035910606384277344, 0.003697633743286133, 0.0038042068481445312, 0.00391077995300293, 0.004017353057861328, 0.0041239261627197266, 0.004230499267578125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 5.0, 6.0, 1.0, 6.0, 12.0, 17.0, 19.0, 32.0, 48.0, 78.0, 105.0, 141.0, 209.0, 323.0, 468.0, 690.0, 1026.0, 1604.0, 2387.0, 3575.0, 5874.0, 9337.0, 16181.0, 27793.0, 50707.0, 92231.0, 157194.0, 212652.0, 189293.0, 119928.0, 67178.0, 36514.0, 20645.0, 11987.0, 7213.0, 4503.0, 2865.0, 1883.0, 1252.0, 807.0, 550.0, 408.0, 235.0, 171.0, 109.0, 96.0, 70.0, 47.0, 23.0, 24.0, 15.0, 13.0, 1.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0], "bins": [-19.234375, -18.646728515625, -18.05908203125, -17.471435546875, -16.8837890625, -16.296142578125, -15.70849609375, -15.120849609375, -14.533203125, -13.945556640625, -13.35791015625, -12.770263671875, -12.1826171875, -11.594970703125, -11.00732421875, -10.419677734375, -9.83203125, -9.244384765625, -8.65673828125, -8.069091796875, -7.4814453125, -6.893798828125, -6.30615234375, -5.718505859375, -5.130859375, -4.543212890625, -3.95556640625, -3.367919921875, -2.7802734375, -2.192626953125, -1.60498046875, -1.017333984375, -0.4296875, 0.157958984375, 0.74560546875, 1.333251953125, 1.9208984375, 2.508544921875, 3.09619140625, 3.683837890625, 4.271484375, 4.859130859375, 5.44677734375, 6.034423828125, 6.6220703125, 7.209716796875, 7.79736328125, 8.385009765625, 8.97265625, 9.560302734375, 10.14794921875, 10.735595703125, 11.3232421875, 11.910888671875, 12.49853515625, 13.086181640625, 13.673828125, 14.261474609375, 14.84912109375, 15.436767578125, 16.0244140625, 16.612060546875, 17.19970703125, 17.787353515625, 18.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 13.0, 4.0, 8.0, 13.0, 15.0, 17.0, 23.0, 23.0, 30.0, 43.0, 38.0, 44.0, 43.0, 55.0, 58.0, 51.0, 45.0, 59.0, 52.0, 56.0, 37.0, 52.0, 28.0, 26.0, 27.0, 17.0, 26.0, 13.0, 17.0, 5.0, 4.0, 8.0, 8.0, 6.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.265625, -6.06243896484375, -5.8592529296875, -5.65606689453125, -5.452880859375, -5.24969482421875, -5.0465087890625, -4.84332275390625, -4.64013671875, -4.43695068359375, -4.2337646484375, -4.03057861328125, -3.827392578125, -3.62420654296875, -3.4210205078125, -3.21783447265625, -3.0146484375, -2.81146240234375, -2.6082763671875, -2.40509033203125, -2.201904296875, -1.99871826171875, -1.7955322265625, -1.59234619140625, -1.38916015625, -1.18597412109375, -0.9827880859375, -0.77960205078125, -0.576416015625, -0.37322998046875, -0.1700439453125, 0.03314208984375, 0.236328125, 0.43951416015625, 0.6427001953125, 0.84588623046875, 1.049072265625, 1.25225830078125, 1.4554443359375, 1.65863037109375, 1.86181640625, 2.06500244140625, 2.2681884765625, 2.47137451171875, 2.674560546875, 2.87774658203125, 3.0809326171875, 3.28411865234375, 3.4873046875, 3.69049072265625, 3.8936767578125, 4.09686279296875, 4.300048828125, 4.50323486328125, 4.7064208984375, 4.90960693359375, 5.11279296875, 5.31597900390625, 5.5191650390625, 5.72235107421875, 5.925537109375, 6.12872314453125, 6.3319091796875, 6.53509521484375, 6.73828125]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 4.0, 7.0, 8.0, 13.0, 13.0, 13.0, 22.0, 33.0, 23.0, 30.0, 30.0, 39.0, 38.0, 36.0, 64.0, 49.0, 46.0, 52.0, 46.0, 48.0, 40.0, 39.0, 40.0, 40.0, 31.0, 25.0, 23.0, 38.0, 13.0, 15.0, 11.0, 10.0, 11.0, 11.0, 8.0, 7.0, 1.0, 6.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.8775691986084, -21.08901023864746, -20.30044937133789, -19.511890411376953, -18.723331451416016, -17.934772491455078, -17.14621353149414, -16.35765266418457, -15.569093704223633, -14.780534744262695, -13.991974830627441, -13.203414916992188, -12.41485595703125, -11.626296997070312, -10.837737083435059, -10.049177169799805, -9.260618209838867, -8.47205924987793, -7.683499336242676, -6.89493989944458, -6.106380462646484, -5.317821025848389, -4.529261589050293, -3.7407021522521973, -2.9521427154541016, -2.163583278656006, -1.3750238418579102, -0.5864644050598145, 0.20209503173828125, 0.990654468536377, 1.7792139053344727, 2.5677733421325684, 3.3563308715820312, 4.144890308380127, 4.933449745178223, 5.722009181976318, 6.510568618774414, 7.29912805557251, 8.087687492370605, 8.87624740600586, 9.664806365966797, 10.453365325927734, 11.241925239562988, 12.030485153198242, 12.81904411315918, 13.607603073120117, 14.396162986755371, 15.184722900390625, 15.973281860351562, 16.7618408203125, 17.550399780273438, 18.338960647583008, 19.127519607543945, 19.916078567504883, 20.704639434814453, 21.49319839477539, 22.281757354736328, 23.070316314697266, 23.858875274658203, 24.647436141967773, 25.43599510192871, 26.22455406188965, 27.01311492919922, 27.801673889160156, 28.590232849121094]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 9.0, 6.0, 7.0, 9.0, 14.0, 14.0, 17.0, 22.0, 27.0, 28.0, 21.0, 34.0, 34.0, 45.0, 49.0, 36.0, 61.0, 52.0, 51.0, 55.0, 50.0, 37.0, 52.0, 40.0, 31.0, 37.0, 30.0, 27.0, 30.0, 20.0, 8.0, 11.0, 6.0, 6.0, 8.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.469696044921875, -33.427268981933594, -32.38484573364258, -31.342418670654297, -30.29999351501465, -29.257568359375, -28.21514129638672, -27.17271614074707, -26.130290985107422, -25.087865829467773, -24.045440673828125, -23.003013610839844, -21.960588455200195, -20.918163299560547, -19.875736236572266, -18.833311080932617, -17.79088592529297, -16.74846076965332, -15.706034660339355, -14.66360855102539, -13.621183395385742, -12.578758239746094, -11.536332130432129, -10.493906021118164, -9.451480865478516, -8.409055709838867, -7.366629600524902, -6.324203968048096, -5.281778335571289, -4.239352703094482, -3.196927070617676, -2.154501438140869, -1.1120796203613281, -0.06965398788452148, 0.9727716445922852, 2.015197277069092, 3.0576229095458984, 4.100048542022705, 5.142474174499512, 6.184899806976318, 7.227325439453125, 8.269750595092773, 9.312176704406738, 10.354602813720703, 11.397027969360352, 12.439453125, 13.481879234313965, 14.52430534362793, 15.566730499267578, 16.609155654907227, 17.651580810546875, 18.694007873535156, 19.736433029174805, 20.778858184814453, 21.821285247802734, 22.863710403442383, 23.90613555908203, 24.94856071472168, 25.990985870361328, 27.03341293334961, 28.075838088989258, 29.118263244628906, 30.160690307617188, 31.203115463256836, 32.245540618896484]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 21.0, 31.0, 38.0, 63.0, 75.0, 119.0, 183.0, 289.0, 428.0, 600.0, 888.0, 1487.0, 2245.0, 3507.0, 5619.0, 9403.0, 15728.0, 27666.0, 50640.0, 98307.0, 200167.0, 402778.0, 709382.0, 913228.0, 777000.0, 474155.0, 241934.0, 120016.0, 60774.0, 32364.0, 17976.0, 10412.0, 6308.0, 3722.0, 2386.0, 1504.0, 965.0, 621.0, 438.0, 274.0, 166.0, 126.0, 87.0, 43.0, 45.0, 28.0, 16.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-21.828125, -21.1591796875, -20.490234375, -19.8212890625, -19.15234375, -18.4833984375, -17.814453125, -17.1455078125, -16.4765625, -15.8076171875, -15.138671875, -14.4697265625, -13.80078125, -13.1318359375, -12.462890625, -11.7939453125, -11.125, -10.4560546875, -9.787109375, -9.1181640625, -8.44921875, -7.7802734375, -7.111328125, -6.4423828125, -5.7734375, -5.1044921875, -4.435546875, -3.7666015625, -3.09765625, -2.4287109375, -1.759765625, -1.0908203125, -0.421875, 0.2470703125, 0.916015625, 1.5849609375, 2.25390625, 2.9228515625, 3.591796875, 4.2607421875, 4.9296875, 5.5986328125, 6.267578125, 6.9365234375, 7.60546875, 8.2744140625, 8.943359375, 9.6123046875, 10.28125, 10.9501953125, 11.619140625, 12.2880859375, 12.95703125, 13.6259765625, 14.294921875, 14.9638671875, 15.6328125, 16.3017578125, 16.970703125, 17.6396484375, 18.30859375, 18.9775390625, 19.646484375, 20.3154296875, 20.984375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 3.0, 7.0, 5.0, 11.0, 14.0, 21.0, 15.0, 25.0, 22.0, 23.0, 28.0, 27.0, 25.0, 32.0, 36.0, 44.0, 29.0, 62.0, 51.0, 55.0, 45.0, 36.0, 44.0, 46.0, 36.0, 34.0, 34.0, 32.0, 26.0, 25.0, 19.0, 23.0, 7.0, 12.0, 11.0, 6.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.390625, -22.68359375, -21.9765625, -21.26953125, -20.5625, -19.85546875, -19.1484375, -18.44140625, -17.734375, -17.02734375, -16.3203125, -15.61328125, -14.90625, -14.19921875, -13.4921875, -12.78515625, -12.078125, -11.37109375, -10.6640625, -9.95703125, -9.25, -8.54296875, -7.8359375, -7.12890625, -6.421875, -5.71484375, -5.0078125, -4.30078125, -3.59375, -2.88671875, -2.1796875, -1.47265625, -0.765625, -0.05859375, 0.6484375, 1.35546875, 2.0625, 2.76953125, 3.4765625, 4.18359375, 4.890625, 5.59765625, 6.3046875, 7.01171875, 7.71875, 8.42578125, 9.1328125, 9.83984375, 10.546875, 11.25390625, 11.9609375, 12.66796875, 13.375, 14.08203125, 14.7890625, 15.49609375, 16.203125, 16.91015625, 17.6171875, 18.32421875, 19.03125, 19.73828125, 20.4453125, 21.15234375, 21.859375]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 10.0, 12.0, 14.0, 18.0, 39.0, 58.0, 69.0, 129.0, 214.0, 342.0, 534.0, 950.0, 1684.0, 2819.0, 5263.0, 10001.0, 20349.0, 42286.0, 95077.0, 220227.0, 508363.0, 1003312.0, 1122877.0, 646781.0, 284708.0, 122260.0, 54006.0, 24972.0, 12225.0, 6467.0, 3526.0, 1904.0, 1076.0, 662.0, 364.0, 248.0, 156.0, 90.0, 63.0, 34.0, 35.0, 18.0, 15.0, 12.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -32.064453125, -31.03515625, -30.005859375, -28.9765625, -27.947265625, -26.91796875, -25.888671875, -24.859375, -23.830078125, -22.80078125, -21.771484375, -20.7421875, -19.712890625, -18.68359375, -17.654296875, -16.625, -15.595703125, -14.56640625, -13.537109375, -12.5078125, -11.478515625, -10.44921875, -9.419921875, -8.390625, -7.361328125, -6.33203125, -5.302734375, -4.2734375, -3.244140625, -2.21484375, -1.185546875, -0.15625, 0.873046875, 1.90234375, 2.931640625, 3.9609375, 4.990234375, 6.01953125, 7.048828125, 8.078125, 9.107421875, 10.13671875, 11.166015625, 12.1953125, 13.224609375, 14.25390625, 15.283203125, 16.3125, 17.341796875, 18.37109375, 19.400390625, 20.4296875, 21.458984375, 22.48828125, 23.517578125, 24.546875, 25.576171875, 26.60546875, 27.634765625, 28.6640625, 29.693359375, 30.72265625, 31.751953125, 32.78125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 16.0, 10.0, 9.0, 23.0, 23.0, 21.0, 30.0, 29.0, 39.0, 62.0, 95.0, 109.0, 118.0, 152.0, 161.0, 176.0, 250.0, 262.0, 263.0, 295.0, 265.0, 239.0, 244.0, 201.0, 195.0, 140.0, 126.0, 88.0, 78.0, 79.0, 52.0, 52.0, 42.0, 20.0, 23.0, 13.0, 15.0, 9.0, 9.0, 8.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 3.0], "bins": [-10.8203125, -10.5238037109375, -10.227294921875, -9.9307861328125, -9.63427734375, -9.3377685546875, -9.041259765625, -8.7447509765625, -8.4482421875, -8.1517333984375, -7.855224609375, -7.5587158203125, -7.26220703125, -6.9656982421875, -6.669189453125, -6.3726806640625, -6.076171875, -5.7796630859375, -5.483154296875, -5.1866455078125, -4.89013671875, -4.5936279296875, -4.297119140625, -4.0006103515625, -3.7041015625, -3.4075927734375, -3.111083984375, -2.8145751953125, -2.51806640625, -2.2215576171875, -1.925048828125, -1.6285400390625, -1.33203125, -1.0355224609375, -0.739013671875, -0.4425048828125, -0.14599609375, 0.1505126953125, 0.447021484375, 0.7435302734375, 1.0400390625, 1.3365478515625, 1.633056640625, 1.9295654296875, 2.22607421875, 2.5225830078125, 2.819091796875, 3.1156005859375, 3.412109375, 3.7086181640625, 4.005126953125, 4.3016357421875, 4.59814453125, 4.8946533203125, 5.191162109375, 5.4876708984375, 5.7841796875, 6.0806884765625, 6.377197265625, 6.6737060546875, 6.97021484375, 7.2667236328125, 7.563232421875, 7.8597412109375, 8.15625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 10.0, 6.0, 9.0, 11.0, 8.0, 12.0, 16.0, 27.0, 29.0, 30.0, 40.0, 42.0, 60.0, 67.0, 64.0, 67.0, 49.0, 65.0, 70.0, 56.0, 47.0, 39.0, 32.0, 34.0, 28.0, 22.0, 9.0, 14.0, 7.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.321521759033203, -26.465770721435547, -25.61001968383789, -24.754268646240234, -23.898517608642578, -23.042766571044922, -22.187015533447266, -21.33126449584961, -20.475513458251953, -19.619762420654297, -18.76401138305664, -17.908260345458984, -17.052509307861328, -16.196758270263672, -15.341007232666016, -14.48525619506836, -13.629505157470703, -12.773754119873047, -11.91800308227539, -11.062252044677734, -10.206501007080078, -9.350749969482422, -8.494998931884766, -7.639247894287109, -6.783496856689453, -5.927745819091797, -5.071994781494141, -4.216243743896484, -3.360492706298828, -2.504741668701172, -1.6489906311035156, -0.7932395935058594, 0.06251144409179688, 0.9182624816894531, 1.7740135192871094, 2.6297645568847656, 3.485515594482422, 4.341266632080078, 5.197017669677734, 6.052768707275391, 6.908519744873047, 7.764270782470703, 8.62002182006836, 9.475772857666016, 10.331523895263672, 11.187274932861328, 12.043025970458984, 12.89877700805664, 13.754528045654297, 14.610279083251953, 15.46603012084961, 16.321781158447266, 17.177532196044922, 18.033283233642578, 18.889034271240234, 19.74478530883789, 20.600536346435547, 21.456287384033203, 22.31203842163086, 23.167789459228516, 24.023540496826172, 24.879291534423828, 25.735042572021484, 26.59079360961914, 27.446544647216797]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 7.0, 5.0, 9.0, 8.0, 7.0, 13.0, 17.0, 18.0, 13.0, 19.0, 23.0, 23.0, 23.0, 23.0, 46.0, 44.0, 48.0, 53.0, 44.0, 43.0, 46.0, 42.0, 47.0, 44.0, 31.0, 37.0, 35.0, 24.0, 32.0, 30.0, 28.0, 17.0, 25.0, 16.0, 12.0, 5.0, 15.0, 7.0, 5.0, 7.0, 1.0, 1.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.815170288085938, -24.001041412353516, -23.186914443969727, -22.372787475585938, -21.558658599853516, -20.744529724121094, -19.930402755737305, -19.116275787353516, -18.302146911621094, -17.488018035888672, -16.673891067504883, -15.859763145446777, -15.045635223388672, -14.231507301330566, -13.417379379272461, -12.603251457214355, -11.78912353515625, -10.974995613098145, -10.160867691040039, -9.346739768981934, -8.532611846923828, -7.718483924865723, -6.904356002807617, -6.090228080749512, -5.276100158691406, -4.461972236633301, -3.6478443145751953, -2.83371639251709, -2.0195884704589844, -1.205460548400879, -0.39133262634277344, 0.42279529571533203, 1.2369251251220703, 2.051053047180176, 2.8651809692382812, 3.6793088912963867, 4.493436813354492, 5.307564735412598, 6.121692657470703, 6.935820579528809, 7.749948501586914, 8.56407642364502, 9.378204345703125, 10.19233226776123, 11.006460189819336, 11.820588111877441, 12.634716033935547, 13.448843955993652, 14.262971878051758, 15.077099800109863, 15.891227722167969, 16.70535659790039, 17.51948356628418, 18.33361053466797, 19.14773941040039, 19.961868286132812, 20.7759952545166, 21.59012222290039, 22.404251098632812, 23.218379974365234, 24.032506942749023, 24.846633911132812, 25.660762786865234, 26.474891662597656, 27.289018630981445]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 14.0, 26.0, 27.0, 48.0, 70.0, 108.0, 170.0, 213.0, 318.0, 461.0, 687.0, 956.0, 1348.0, 1953.0, 2788.0, 3870.0, 6079.0, 8853.0, 13804.0, 21290.0, 33434.0, 54060.0, 86726.0, 136387.0, 183367.0, 171258.0, 117694.0, 73733.0, 45464.0, 28736.0, 18363.0, 11795.0, 7667.0, 5177.0, 3526.0, 2385.0, 1697.0, 1195.0, 857.0, 568.0, 429.0, 303.0, 233.0, 130.0, 103.0, 63.0, 43.0, 22.0, 21.0, 22.0, 8.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.859375, -17.280029296875, -16.70068359375, -16.121337890625, -15.5419921875, -14.962646484375, -14.38330078125, -13.803955078125, -13.224609375, -12.645263671875, -12.06591796875, -11.486572265625, -10.9072265625, -10.327880859375, -9.74853515625, -9.169189453125, -8.58984375, -8.010498046875, -7.43115234375, -6.851806640625, -6.2724609375, -5.693115234375, -5.11376953125, -4.534423828125, -3.955078125, -3.375732421875, -2.79638671875, -2.217041015625, -1.6376953125, -1.058349609375, -0.47900390625, 0.100341796875, 0.6796875, 1.259033203125, 1.83837890625, 2.417724609375, 2.9970703125, 3.576416015625, 4.15576171875, 4.735107421875, 5.314453125, 5.893798828125, 6.47314453125, 7.052490234375, 7.6318359375, 8.211181640625, 8.79052734375, 9.369873046875, 9.94921875, 10.528564453125, 11.10791015625, 11.687255859375, 12.2666015625, 12.845947265625, 13.42529296875, 14.004638671875, 14.583984375, 15.163330078125, 15.74267578125, 16.322021484375, 16.9013671875, 17.480712890625, 18.06005859375, 18.639404296875, 19.21875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 6.0, 5.0, 7.0, 13.0, 9.0, 8.0, 16.0, 17.0, 26.0, 16.0, 27.0, 22.0, 23.0, 36.0, 39.0, 50.0, 47.0, 39.0, 55.0, 47.0, 42.0, 45.0, 37.0, 41.0, 33.0, 29.0, 32.0, 24.0, 32.0, 20.0, 32.0, 23.0, 20.0, 13.0, 8.0, 10.0, 12.0, 2.0, 7.0, 7.0, 2.0, 3.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.671875, -21.9375, -21.203125, -20.46875, -19.734375, -19.0, -18.265625, -17.53125, -16.796875, -16.0625, -15.328125, -14.59375, -13.859375, -13.125, -12.390625, -11.65625, -10.921875, -10.1875, -9.453125, -8.71875, -7.984375, -7.25, -6.515625, -5.78125, -5.046875, -4.3125, -3.578125, -2.84375, -2.109375, -1.375, -0.640625, 0.09375, 0.828125, 1.5625, 2.296875, 3.03125, 3.765625, 4.5, 5.234375, 5.96875, 6.703125, 7.4375, 8.171875, 8.90625, 9.640625, 10.375, 11.109375, 11.84375, 12.578125, 13.3125, 14.046875, 14.78125, 15.515625, 16.25, 16.984375, 17.71875, 18.453125, 19.1875, 19.921875, 20.65625, 21.390625, 22.125, 22.859375, 23.59375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 12.0, 9.0, 10.0, 15.0, 25.0, 30.0, 48.0, 48.0, 80.0, 106.0, 132.0, 166.0, 232.0, 320.0, 418.0, 520.0, 722.0, 1075.0, 1591.0, 2275.0, 3430.0, 5306.0, 8645.0, 15906.0, 34668.0, 772410.0, 141542.0, 24536.0, 12684.0, 7275.0, 4512.0, 2941.0, 1940.0, 1305.0, 921.0, 695.0, 512.0, 393.0, 285.0, 229.0, 169.0, 120.0, 71.0, 60.0, 44.0, 37.0, 23.0, 15.0, 15.0, 13.0, 11.0, 1.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0], "bins": [-32.96875, -31.93212890625, -30.8955078125, -29.85888671875, -28.822265625, -27.78564453125, -26.7490234375, -25.71240234375, -24.67578125, -23.63916015625, -22.6025390625, -21.56591796875, -20.529296875, -19.49267578125, -18.4560546875, -17.41943359375, -16.3828125, -15.34619140625, -14.3095703125, -13.27294921875, -12.236328125, -11.19970703125, -10.1630859375, -9.12646484375, -8.08984375, -7.05322265625, -6.0166015625, -4.97998046875, -3.943359375, -2.90673828125, -1.8701171875, -0.83349609375, 0.203125, 1.23974609375, 2.2763671875, 3.31298828125, 4.349609375, 5.38623046875, 6.4228515625, 7.45947265625, 8.49609375, 9.53271484375, 10.5693359375, 11.60595703125, 12.642578125, 13.67919921875, 14.7158203125, 15.75244140625, 16.7890625, 17.82568359375, 18.8623046875, 19.89892578125, 20.935546875, 21.97216796875, 23.0087890625, 24.04541015625, 25.08203125, 26.11865234375, 27.1552734375, 28.19189453125, 29.228515625, 30.26513671875, 31.3017578125, 32.33837890625, 33.375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 6.0, 2.0, 7.0, 4.0, 16.0, 13.0, 16.0, 23.0, 23.0, 36.0, 36.0, 47.0, 47.0, 57.0, 53.0, 67.0, 49.0, 54.0, 67.0, 63.0, 56.0, 39.0, 31.0, 30.0, 31.0, 25.0, 18.0, 10.0, 12.0, 8.0, 11.0, 5.0, 5.0, 6.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.62158203125, -30.6181640625, -29.61474609375, -28.611328125, -27.60791015625, -26.6044921875, -25.60107421875, -24.59765625, -23.59423828125, -22.5908203125, -21.58740234375, -20.583984375, -19.58056640625, -18.5771484375, -17.57373046875, -16.5703125, -15.56689453125, -14.5634765625, -13.56005859375, -12.556640625, -11.55322265625, -10.5498046875, -9.54638671875, -8.54296875, -7.53955078125, -6.5361328125, -5.53271484375, -4.529296875, -3.52587890625, -2.5224609375, -1.51904296875, -0.515625, 0.48779296875, 1.4912109375, 2.49462890625, 3.498046875, 4.50146484375, 5.5048828125, 6.50830078125, 7.51171875, 8.51513671875, 9.5185546875, 10.52197265625, 11.525390625, 12.52880859375, 13.5322265625, 14.53564453125, 15.5390625, 16.54248046875, 17.5458984375, 18.54931640625, 19.552734375, 20.55615234375, 21.5595703125, 22.56298828125, 23.56640625, 24.56982421875, 25.5732421875, 26.57666015625, 27.580078125, 28.58349609375, 29.5869140625, 30.59033203125, 31.59375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 8.0, 5.0, 11.0, 19.0, 16.0, 20.0, 25.0, 42.0, 34.0, 46.0, 58.0, 71.0, 90.0, 138.0, 203.0, 268.0, 427.0, 697.0, 1213.0, 2157.0, 5332.0, 19824.0, 881520.0, 114926.0, 12687.0, 4005.0, 1821.0, 988.0, 564.0, 357.0, 257.0, 181.0, 136.0, 89.0, 72.0, 56.0, 43.0, 29.0, 18.0, 18.0, 18.0, 12.0, 14.0, 8.0, 8.0, 7.0, 6.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-34.875, -33.8134765625, -32.751953125, -31.6904296875, -30.62890625, -29.5673828125, -28.505859375, -27.4443359375, -26.3828125, -25.3212890625, -24.259765625, -23.1982421875, -22.13671875, -21.0751953125, -20.013671875, -18.9521484375, -17.890625, -16.8291015625, -15.767578125, -14.7060546875, -13.64453125, -12.5830078125, -11.521484375, -10.4599609375, -9.3984375, -8.3369140625, -7.275390625, -6.2138671875, -5.15234375, -4.0908203125, -3.029296875, -1.9677734375, -0.90625, 0.1552734375, 1.216796875, 2.2783203125, 3.33984375, 4.4013671875, 5.462890625, 6.5244140625, 7.5859375, 8.6474609375, 9.708984375, 10.7705078125, 11.83203125, 12.8935546875, 13.955078125, 15.0166015625, 16.078125, 17.1396484375, 18.201171875, 19.2626953125, 20.32421875, 21.3857421875, 22.447265625, 23.5087890625, 24.5703125, 25.6318359375, 26.693359375, 27.7548828125, 28.81640625, 29.8779296875, 30.939453125, 32.0009765625, 33.0625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 5.0, 15.0, 23.0, 41.0, 113.0, 606.0, 103.0, 39.0, 25.0, 12.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0181427001953125, -0.01769411563873291, -0.01724553108215332, -0.01679694652557373, -0.01634836196899414, -0.01589977741241455, -0.015451192855834961, -0.015002608299255371, -0.014554023742675781, -0.014105439186096191, -0.013656854629516602, -0.013208270072937012, -0.012759685516357422, -0.012311100959777832, -0.011862516403198242, -0.011413931846618652, -0.010965347290039062, -0.010516762733459473, -0.010068178176879883, -0.009619593620300293, -0.009171009063720703, -0.008722424507141113, -0.008273839950561523, -0.007825255393981934, -0.007376670837402344, -0.006928086280822754, -0.006479501724243164, -0.006030917167663574, -0.005582332611083984, -0.0051337480545043945, -0.004685163497924805, -0.004236578941345215, -0.003787994384765625, -0.003339409828186035, -0.0028908252716064453, -0.0024422407150268555, -0.0019936561584472656, -0.0015450716018676758, -0.001096487045288086, -0.0006479024887084961, -0.00019931793212890625, 0.0002492666244506836, 0.0006978511810302734, 0.0011464357376098633, 0.0015950202941894531, 0.002043604850769043, 0.002492189407348633, 0.0029407739639282227, 0.0033893585205078125, 0.0038379430770874023, 0.004286527633666992, 0.004735112190246582, 0.005183696746826172, 0.005632281303405762, 0.0060808658599853516, 0.006529450416564941, 0.006978034973144531, 0.007426619529724121, 0.007875204086303711, 0.0083237886428833, 0.00877237319946289, 0.00922095775604248, 0.00966954231262207, 0.01011812686920166, 0.01056671142578125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 9.0, 11.0, 17.0, 17.0, 28.0, 24.0, 35.0, 50.0, 78.0, 103.0, 144.0, 162.0, 243.0, 349.0, 471.0, 652.0, 972.0, 1549.0, 2548.0, 4377.0, 8564.0, 18395.0, 44951.0, 130348.0, 358929.0, 303968.0, 101996.0, 36224.0, 15204.0, 7394.0, 3943.0, 2259.0, 1446.0, 901.0, 570.0, 452.0, 308.0, 243.0, 163.0, 130.0, 87.0, 58.0, 45.0, 39.0, 27.0, 24.0, 13.0, 11.0, 6.0, 2.0, 5.0, 5.0, 4.0, 5.0, 4.0, 1.0], "bins": [-7.1484375, -6.93109130859375, -6.7137451171875, -6.49639892578125, -6.279052734375, -6.06170654296875, -5.8443603515625, -5.62701416015625, -5.40966796875, -5.19232177734375, -4.9749755859375, -4.75762939453125, -4.540283203125, -4.32293701171875, -4.1055908203125, -3.88824462890625, -3.6708984375, -3.45355224609375, -3.2362060546875, -3.01885986328125, -2.801513671875, -2.58416748046875, -2.3668212890625, -2.14947509765625, -1.93212890625, -1.71478271484375, -1.4974365234375, -1.28009033203125, -1.062744140625, -0.84539794921875, -0.6280517578125, -0.41070556640625, -0.193359375, 0.02398681640625, 0.2413330078125, 0.45867919921875, 0.676025390625, 0.89337158203125, 1.1107177734375, 1.32806396484375, 1.54541015625, 1.76275634765625, 1.9801025390625, 2.19744873046875, 2.414794921875, 2.63214111328125, 2.8494873046875, 3.06683349609375, 3.2841796875, 3.50152587890625, 3.7188720703125, 3.93621826171875, 4.153564453125, 4.37091064453125, 4.5882568359375, 4.80560302734375, 5.02294921875, 5.24029541015625, 5.4576416015625, 5.67498779296875, 5.892333984375, 6.10968017578125, 6.3270263671875, 6.54437255859375, 6.76171875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 10.0, 3.0, 9.0, 9.0, 14.0, 14.0, 11.0, 28.0, 25.0, 35.0, 45.0, 72.0, 79.0, 112.0, 101.0, 108.0, 82.0, 56.0, 48.0, 33.0, 25.0, 26.0, 8.0, 8.0, 6.0, 7.0, 7.0, 1.0, 5.0, 2.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3984375, -2.328521728515625, -2.25860595703125, -2.188690185546875, -2.1187744140625, -2.048858642578125, -1.97894287109375, -1.909027099609375, -1.839111328125, -1.769195556640625, -1.69927978515625, -1.629364013671875, -1.5594482421875, -1.489532470703125, -1.41961669921875, -1.349700927734375, -1.27978515625, -1.209869384765625, -1.13995361328125, -1.070037841796875, -1.0001220703125, -0.930206298828125, -0.86029052734375, -0.790374755859375, -0.720458984375, -0.650543212890625, -0.58062744140625, -0.510711669921875, -0.4407958984375, -0.370880126953125, -0.30096435546875, -0.231048583984375, -0.1611328125, -0.091217041015625, -0.02130126953125, 0.048614501953125, 0.1185302734375, 0.188446044921875, 0.25836181640625, 0.328277587890625, 0.398193359375, 0.468109130859375, 0.53802490234375, 0.607940673828125, 0.6778564453125, 0.747772216796875, 0.81768798828125, 0.887603759765625, 0.95751953125, 1.027435302734375, 1.09735107421875, 1.167266845703125, 1.2371826171875, 1.307098388671875, 1.37701416015625, 1.446929931640625, 1.516845703125, 1.586761474609375, 1.65667724609375, 1.726593017578125, 1.7965087890625, 1.866424560546875, 1.93634033203125, 2.006256103515625, 2.076171875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 7.0, 8.0, 13.0, 6.0, 13.0, 8.0, 17.0, 12.0, 25.0, 21.0, 29.0, 32.0, 41.0, 53.0, 66.0, 58.0, 56.0, 61.0, 56.0, 46.0, 69.0, 40.0, 46.0, 34.0, 40.0, 18.0, 22.0, 18.0, 12.0, 14.0, 13.0, 6.0, 3.0, 4.0, 3.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.470121383666992, -18.742862701416016, -18.015602111816406, -17.28834342956543, -16.561084747314453, -15.833826065063477, -15.106566429138184, -14.37930679321289, -13.652048110961914, -12.924789428710938, -12.197529792785645, -11.470270156860352, -10.743011474609375, -10.015752792358398, -9.288493156433105, -8.561233520507812, -7.833974838256836, -7.106715679168701, -6.379456520080566, -5.652197360992432, -4.924938201904297, -4.197679042816162, -3.4704198837280273, -2.7431607246398926, -2.015901565551758, -1.288642406463623, -0.5613832473754883, 0.16587591171264648, 0.8931350708007812, 1.620394229888916, 2.347653388977051, 3.0749125480651855, 3.802173614501953, 4.529432773590088, 5.256691932678223, 5.983951091766357, 6.711210250854492, 7.438469409942627, 8.165728569030762, 8.892988204956055, 9.620246887207031, 10.347505569458008, 11.0747652053833, 11.802024841308594, 12.52928352355957, 13.256542205810547, 13.98380184173584, 14.711061477661133, 15.43832015991211, 16.165578842163086, 16.892837524414062, 17.620098114013672, 18.34735679626465, 19.074615478515625, 19.801876068115234, 20.52913475036621, 21.256393432617188, 21.983652114868164, 22.71091079711914, 23.43817138671875, 24.165430068969727, 24.892688751220703, 25.619949340820312, 26.34720802307129, 27.074466705322266]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 5.0, 9.0, 9.0, 8.0, 12.0, 12.0, 19.0, 14.0, 21.0, 22.0, 25.0, 23.0, 27.0, 39.0, 42.0, 43.0, 45.0, 37.0, 48.0, 63.0, 35.0, 61.0, 36.0, 31.0, 29.0, 27.0, 39.0, 34.0, 24.0, 25.0, 25.0, 18.0, 12.0, 16.0, 12.0, 10.0, 6.0, 7.0, 9.0, 2.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.00201988220215, -23.241886138916016, -22.48175048828125, -21.721616744995117, -20.96148109436035, -20.20134735107422, -19.441211700439453, -18.68107795715332, -17.920944213867188, -17.160810470581055, -16.40067481994629, -15.640541076660156, -14.880406379699707, -14.120271682739258, -13.360136985778809, -12.60000228881836, -11.83986759185791, -11.079732894897461, -10.319598197937012, -9.559463500976562, -8.79932975769043, -8.03919506072998, -7.279060363769531, -6.51892614364624, -5.758791446685791, -4.998656749725342, -4.238522529602051, -3.4783878326416016, -2.7182533740997314, -1.9581189155578613, -1.197984218597412, -0.4378499984741211, 0.3222846984863281, 1.0824191570281982, 1.842553734779358, 2.6026883125305176, 3.3628227710723877, 4.122957229614258, 4.883091926574707, 5.643226146697998, 6.403360843658447, 7.1634955406188965, 7.9236297607421875, 8.683764457702637, 9.443899154663086, 10.204032897949219, 10.964168548583984, 11.724302291870117, 12.484436988830566, 13.244571685791016, 14.004706382751465, 14.764841079711914, 15.524974822998047, 16.285110473632812, 17.045244216918945, 17.805377960205078, 18.565513610839844, 19.325647354125977, 20.085783004760742, 20.845916748046875, 21.60605239868164, 22.366186141967773, 23.126319885253906, 23.886455535888672, 24.646589279174805]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 7.0, 14.0, 16.0, 23.0, 30.0, 39.0, 52.0, 103.0, 137.0, 167.0, 262.0, 387.0, 533.0, 808.0, 1179.0, 1714.0, 2567.0, 3584.0, 5547.0, 7967.0, 11882.0, 17811.0, 26587.0, 39171.0, 56168.0, 78554.0, 102681.0, 122187.0, 128695.0, 117273.0, 94243.0, 70901.0, 50627.0, 34585.0, 23581.0, 15718.0, 10554.0, 6981.0, 4724.0, 3257.0, 2319.0, 1519.0, 1075.0, 751.0, 486.0, 338.0, 254.0, 177.0, 107.0, 81.0, 39.0, 30.0, 26.0, 13.0, 12.0, 9.0, 0.0, 7.0, 6.0, 1.0], "bins": [-16.359375, -15.853515625, -15.34765625, -14.841796875, -14.3359375, -13.830078125, -13.32421875, -12.818359375, -12.3125, -11.806640625, -11.30078125, -10.794921875, -10.2890625, -9.783203125, -9.27734375, -8.771484375, -8.265625, -7.759765625, -7.25390625, -6.748046875, -6.2421875, -5.736328125, -5.23046875, -4.724609375, -4.21875, -3.712890625, -3.20703125, -2.701171875, -2.1953125, -1.689453125, -1.18359375, -0.677734375, -0.171875, 0.333984375, 0.83984375, 1.345703125, 1.8515625, 2.357421875, 2.86328125, 3.369140625, 3.875, 4.380859375, 4.88671875, 5.392578125, 5.8984375, 6.404296875, 6.91015625, 7.416015625, 7.921875, 8.427734375, 8.93359375, 9.439453125, 9.9453125, 10.451171875, 10.95703125, 11.462890625, 11.96875, 12.474609375, 12.98046875, 13.486328125, 13.9921875, 14.498046875, 15.00390625, 15.509765625, 16.015625]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 9.0, 11.0, 10.0, 11.0, 13.0, 14.0, 25.0, 13.0, 25.0, 22.0, 29.0, 25.0, 27.0, 31.0, 36.0, 41.0, 53.0, 58.0, 49.0, 47.0, 36.0, 41.0, 43.0, 32.0, 28.0, 36.0, 23.0, 35.0, 22.0, 27.0, 24.0, 14.0, 13.0, 7.0, 14.0, 7.0, 12.0, 8.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.1591796875, -20.474609375, -19.7900390625, -19.10546875, -18.4208984375, -17.736328125, -17.0517578125, -16.3671875, -15.6826171875, -14.998046875, -14.3134765625, -13.62890625, -12.9443359375, -12.259765625, -11.5751953125, -10.890625, -10.2060546875, -9.521484375, -8.8369140625, -8.15234375, -7.4677734375, -6.783203125, -6.0986328125, -5.4140625, -4.7294921875, -4.044921875, -3.3603515625, -2.67578125, -1.9912109375, -1.306640625, -0.6220703125, 0.0625, 0.7470703125, 1.431640625, 2.1162109375, 2.80078125, 3.4853515625, 4.169921875, 4.8544921875, 5.5390625, 6.2236328125, 6.908203125, 7.5927734375, 8.27734375, 8.9619140625, 9.646484375, 10.3310546875, 11.015625, 11.7001953125, 12.384765625, 13.0693359375, 13.75390625, 14.4384765625, 15.123046875, 15.8076171875, 16.4921875, 17.1767578125, 17.861328125, 18.5458984375, 19.23046875, 19.9150390625, 20.599609375, 21.2841796875, 21.96875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 2.0, 7.0, 7.0, 4.0, 6.0, 15.0, 23.0, 42.0, 58.0, 73.0, 128.0, 205.0, 366.0, 575.0, 983.0, 1727.0, 3036.0, 5858.0, 11059.0, 20823.0, 39333.0, 72953.0, 125941.0, 184171.0, 203313.0, 159138.0, 99506.0, 55420.0, 29715.0, 15619.0, 8258.0, 4389.0, 2461.0, 1366.0, 775.0, 460.0, 276.0, 180.0, 96.0, 68.0, 49.0, 25.0, 15.0, 10.0, 10.0, 10.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.171875, -20.423095703125, -19.67431640625, -18.925537109375, -18.1767578125, -17.427978515625, -16.67919921875, -15.930419921875, -15.181640625, -14.432861328125, -13.68408203125, -12.935302734375, -12.1865234375, -11.437744140625, -10.68896484375, -9.940185546875, -9.19140625, -8.442626953125, -7.69384765625, -6.945068359375, -6.1962890625, -5.447509765625, -4.69873046875, -3.949951171875, -3.201171875, -2.452392578125, -1.70361328125, -0.954833984375, -0.2060546875, 0.542724609375, 1.29150390625, 2.040283203125, 2.7890625, 3.537841796875, 4.28662109375, 5.035400390625, 5.7841796875, 6.532958984375, 7.28173828125, 8.030517578125, 8.779296875, 9.528076171875, 10.27685546875, 11.025634765625, 11.7744140625, 12.523193359375, 13.27197265625, 14.020751953125, 14.76953125, 15.518310546875, 16.26708984375, 17.015869140625, 17.7646484375, 18.513427734375, 19.26220703125, 20.010986328125, 20.759765625, 21.508544921875, 22.25732421875, 23.006103515625, 23.7548828125, 24.503662109375, 25.25244140625, 26.001220703125, 26.75]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 5.0, 10.0, 9.0, 15.0, 7.0, 19.0, 16.0, 27.0, 30.0, 28.0, 27.0, 35.0, 31.0, 29.0, 46.0, 33.0, 41.0, 27.0, 35.0, 40.0, 41.0, 44.0, 52.0, 31.0, 49.0, 30.0, 38.0, 39.0, 22.0, 17.0, 24.0, 22.0, 16.0, 17.0, 9.0, 8.0, 4.0, 6.0, 7.0, 2.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.921875, -16.4346923828125, -15.947509765625, -15.4603271484375, -14.97314453125, -14.4859619140625, -13.998779296875, -13.5115966796875, -13.0244140625, -12.5372314453125, -12.050048828125, -11.5628662109375, -11.07568359375, -10.5885009765625, -10.101318359375, -9.6141357421875, -9.126953125, -8.6397705078125, -8.152587890625, -7.6654052734375, -7.17822265625, -6.6910400390625, -6.203857421875, -5.7166748046875, -5.2294921875, -4.7423095703125, -4.255126953125, -3.7679443359375, -3.28076171875, -2.7935791015625, -2.306396484375, -1.8192138671875, -1.33203125, -0.8448486328125, -0.357666015625, 0.1295166015625, 0.61669921875, 1.1038818359375, 1.591064453125, 2.0782470703125, 2.5654296875, 3.0526123046875, 3.539794921875, 4.0269775390625, 4.51416015625, 5.0013427734375, 5.488525390625, 5.9757080078125, 6.462890625, 6.9500732421875, 7.437255859375, 7.9244384765625, 8.41162109375, 8.8988037109375, 9.385986328125, 9.8731689453125, 10.3603515625, 10.8475341796875, 11.334716796875, 11.8218994140625, 12.30908203125, 12.7962646484375, 13.283447265625, 13.7706298828125, 14.2578125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 7.0, 16.0, 18.0, 34.0, 55.0, 75.0, 138.0, 198.0, 324.0, 553.0, 946.0, 1668.0, 3008.0, 5679.0, 11235.0, 23246.0, 51424.0, 117020.0, 238166.0, 285713.0, 167663.0, 75156.0, 33460.0, 15648.0, 7766.0, 4009.0, 2262.0, 1220.0, 723.0, 432.0, 257.0, 159.0, 118.0, 52.0, 35.0, 20.0, 15.0, 10.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.8125, -23.095947265625, -22.37939453125, -21.662841796875, -20.9462890625, -20.229736328125, -19.51318359375, -18.796630859375, -18.080078125, -17.363525390625, -16.64697265625, -15.930419921875, -15.2138671875, -14.497314453125, -13.78076171875, -13.064208984375, -12.34765625, -11.631103515625, -10.91455078125, -10.197998046875, -9.4814453125, -8.764892578125, -8.04833984375, -7.331787109375, -6.615234375, -5.898681640625, -5.18212890625, -4.465576171875, -3.7490234375, -3.032470703125, -2.31591796875, -1.599365234375, -0.8828125, -0.166259765625, 0.55029296875, 1.266845703125, 1.9833984375, 2.699951171875, 3.41650390625, 4.133056640625, 4.849609375, 5.566162109375, 6.28271484375, 6.999267578125, 7.7158203125, 8.432373046875, 9.14892578125, 9.865478515625, 10.58203125, 11.298583984375, 12.01513671875, 12.731689453125, 13.4482421875, 14.164794921875, 14.88134765625, 15.597900390625, 16.314453125, 17.031005859375, 17.74755859375, 18.464111328125, 19.1806640625, 19.897216796875, 20.61376953125, 21.330322265625, 22.046875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 15.0, 13.0, 17.0, 26.0, 31.0, 65.0, 53.0, 68.0, 73.0, 97.0, 75.0, 78.0, 77.0, 50.0, 54.0, 50.0, 37.0, 22.0, 29.0, 18.0, 12.0, 9.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002227783203125, -0.0021683424711227417, -0.0021089017391204834, -0.002049461007118225, -0.001990020275115967, -0.0019305795431137085, -0.0018711388111114502, -0.001811698079109192, -0.0017522573471069336, -0.0016928166151046753, -0.001633375883102417, -0.0015739351511001587, -0.0015144944190979004, -0.001455053687095642, -0.0013956129550933838, -0.0013361722230911255, -0.0012767314910888672, -0.0012172907590866089, -0.0011578500270843506, -0.0010984092950820923, -0.001038968563079834, -0.0009795278310775757, -0.0009200870990753174, -0.0008606463670730591, -0.0008012056350708008, -0.0007417649030685425, -0.0006823241710662842, -0.0006228834390640259, -0.0005634427070617676, -0.0005040019750595093, -0.000444561243057251, -0.0003851205110549927, -0.0003256797790527344, -0.0002662390470504761, -0.00020679831504821777, -0.00014735758304595947, -8.791685104370117e-05, -2.847611904144287e-05, 3.096461296081543e-05, 9.040534496307373e-05, 0.00014984607696533203, 0.00020928680896759033, 0.00026872754096984863, 0.00032816827297210693, 0.00038760900497436523, 0.00044704973697662354, 0.0005064904689788818, 0.0005659312009811401, 0.0006253719329833984, 0.0006848126649856567, 0.000744253396987915, 0.0008036941289901733, 0.0008631348609924316, 0.0009225755929946899, 0.0009820163249969482, 0.0010414570569992065, 0.0011008977890014648, 0.0011603385210037231, 0.0012197792530059814, 0.0012792199850082397, 0.001338660717010498, 0.0013981014490127563, 0.0014575421810150146, 0.001516982913017273, 0.0015764236450195312]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 9.0, 16.0, 26.0, 33.0, 44.0, 67.0, 103.0, 138.0, 206.0, 284.0, 435.0, 613.0, 972.0, 1438.0, 2259.0, 3514.0, 5722.0, 9362.0, 15683.0, 27630.0, 48551.0, 87761.0, 150158.0, 207444.0, 191981.0, 126129.0, 71424.0, 39545.0, 22361.0, 13243.0, 7706.0, 4936.0, 2989.0, 1905.0, 1235.0, 793.0, 602.0, 371.0, 249.0, 186.0, 141.0, 82.0, 66.0, 46.0, 26.0, 17.0, 13.0, 6.0, 7.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-15.6640625, -15.1558837890625, -14.647705078125, -14.1395263671875, -13.63134765625, -13.1231689453125, -12.614990234375, -12.1068115234375, -11.5986328125, -11.0904541015625, -10.582275390625, -10.0740966796875, -9.56591796875, -9.0577392578125, -8.549560546875, -8.0413818359375, -7.533203125, -7.0250244140625, -6.516845703125, -6.0086669921875, -5.50048828125, -4.9923095703125, -4.484130859375, -3.9759521484375, -3.4677734375, -2.9595947265625, -2.451416015625, -1.9432373046875, -1.43505859375, -0.9268798828125, -0.418701171875, 0.0894775390625, 0.59765625, 1.1058349609375, 1.614013671875, 2.1221923828125, 2.63037109375, 3.1385498046875, 3.646728515625, 4.1549072265625, 4.6630859375, 5.1712646484375, 5.679443359375, 6.1876220703125, 6.69580078125, 7.2039794921875, 7.712158203125, 8.2203369140625, 8.728515625, 9.2366943359375, 9.744873046875, 10.2530517578125, 10.76123046875, 11.2694091796875, 11.777587890625, 12.2857666015625, 12.7939453125, 13.3021240234375, 13.810302734375, 14.3184814453125, 14.82666015625, 15.3348388671875, 15.843017578125, 16.3511962890625, 16.859375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 9.0, 8.0, 17.0, 11.0, 25.0, 24.0, 34.0, 39.0, 52.0, 59.0, 78.0, 69.0, 81.0, 70.0, 68.0, 53.0, 61.0, 48.0, 31.0, 23.0, 34.0, 21.0, 13.0, 17.0, 13.0, 11.0, 3.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.16015625, -6.92730712890625, -6.6944580078125, -6.46160888671875, -6.228759765625, -5.99591064453125, -5.7630615234375, -5.53021240234375, -5.29736328125, -5.06451416015625, -4.8316650390625, -4.59881591796875, -4.365966796875, -4.13311767578125, -3.9002685546875, -3.66741943359375, -3.4345703125, -3.20172119140625, -2.9688720703125, -2.73602294921875, -2.503173828125, -2.27032470703125, -2.0374755859375, -1.80462646484375, -1.57177734375, -1.33892822265625, -1.1060791015625, -0.87322998046875, -0.640380859375, -0.40753173828125, -0.1746826171875, 0.05816650390625, 0.291015625, 0.52386474609375, 0.7567138671875, 0.98956298828125, 1.222412109375, 1.45526123046875, 1.6881103515625, 1.92095947265625, 2.15380859375, 2.38665771484375, 2.6195068359375, 2.85235595703125, 3.085205078125, 3.31805419921875, 3.5509033203125, 3.78375244140625, 4.0166015625, 4.24945068359375, 4.4822998046875, 4.71514892578125, 4.947998046875, 5.18084716796875, 5.4136962890625, 5.64654541015625, 5.87939453125, 6.11224365234375, 6.3450927734375, 6.57794189453125, 6.810791015625, 7.04364013671875, 7.2764892578125, 7.50933837890625, 7.7421875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 3.0, 7.0, 5.0, 3.0, 4.0, 10.0, 9.0, 10.0, 12.0, 14.0, 28.0, 23.0, 26.0, 23.0, 46.0, 43.0, 43.0, 45.0, 56.0, 69.0, 67.0, 64.0, 65.0, 48.0, 42.0, 45.0, 30.0, 20.0, 32.0, 18.0, 17.0, 17.0, 7.0, 9.0, 12.0, 12.0, 8.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.8347110748291, -23.13792610168457, -22.44114112854004, -21.744356155395508, -21.047569274902344, -20.350784301757812, -19.65399932861328, -18.95721435546875, -18.26042938232422, -17.563644409179688, -16.866859436035156, -16.170074462890625, -15.473288536071777, -14.776503562927246, -14.079717636108398, -13.382932662963867, -12.686147689819336, -11.989362716674805, -11.292577743530273, -10.595791816711426, -9.899006843566895, -9.202221870422363, -8.505435943603516, -7.808650970458984, -7.111865997314453, -6.415081024169922, -5.718295574188232, -5.021510124206543, -4.324725151062012, -3.6279399394989014, -2.931154727935791, -2.2343692779541016, -1.5375843048095703, -0.84079909324646, -0.1440138816833496, 0.5527713298797607, 1.249556541442871, 1.9463417530059814, 2.643126964569092, 3.3399124145507812, 4.0366973876953125, 4.733482360839844, 5.430267810821533, 6.127053260803223, 6.823838233947754, 7.520623207092285, 8.217409133911133, 8.914194107055664, 9.610979080200195, 10.307764053344727, 11.004549026489258, 11.701334953308105, 12.398119926452637, 13.094904899597168, 13.791690826416016, 14.488475799560547, 15.185260772705078, 15.88204574584961, 16.57883071899414, 17.275615692138672, 17.972400665283203, 18.669187545776367, 19.3659725189209, 20.06275749206543, 20.75954246520996]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 1.0, 9.0, 8.0, 11.0, 17.0, 16.0, 14.0, 22.0, 14.0, 14.0, 22.0, 26.0, 36.0, 38.0, 32.0, 48.0, 44.0, 53.0, 47.0, 50.0, 65.0, 61.0, 40.0, 44.0, 43.0, 35.0, 32.0, 22.0, 26.0, 19.0, 19.0, 11.0, 11.0, 16.0, 8.0, 10.0, 6.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.293254852294922, -23.51689338684082, -22.74053192138672, -21.964170455932617, -21.187808990478516, -20.41144561767578, -19.63508415222168, -18.858722686767578, -18.082361221313477, -17.305999755859375, -16.529638290405273, -15.753275871276855, -14.976914405822754, -14.200552940368652, -13.424190521240234, -12.647829055786133, -11.871467590332031, -11.09510612487793, -10.318744659423828, -9.54238224029541, -8.766020774841309, -7.989659309387207, -7.213297367095947, -6.4369354248046875, -5.660573959350586, -4.884212493896484, -4.107850551605225, -3.331488847732544, -2.5551271438598633, -1.7787654399871826, -1.002403736114502, -0.2260417938232422, 0.5503215789794922, 1.3266832828521729, 2.1030449867248535, 2.879406690597534, 3.655768394470215, 4.432129859924316, 5.208491802215576, 5.984853744506836, 6.7612152099609375, 7.537576675415039, 8.31393814086914, 9.090300559997559, 9.86666202545166, 10.643023490905762, 11.41938591003418, 12.195747375488281, 12.972108840942383, 13.748470306396484, 14.524831771850586, 15.301194190979004, 16.077556610107422, 16.853918075561523, 17.630279541015625, 18.406641006469727, 19.183002471923828, 19.95936393737793, 20.73572540283203, 21.512086868286133, 22.288448333740234, 23.06481170654297, 23.84117317199707, 24.617534637451172, 25.393896102905273]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 10.0, 9.0, 9.0, 14.0, 21.0, 26.0, 34.0, 53.0, 74.0, 103.0, 142.0, 208.0, 269.0, 379.0, 515.0, 717.0, 1051.0, 1516.0, 2124.0, 3222.0, 4773.0, 7328.0, 11940.0, 20218.0, 35805.0, 68188.0, 136529.0, 279687.0, 533218.0, 817028.0, 882747.0, 646911.0, 358819.0, 178548.0, 88605.0, 45848.0, 25520.0, 15021.0, 9099.0, 5677.0, 3849.0, 2585.0, 1776.0, 1222.0, 856.0, 571.0, 436.0, 306.0, 231.0, 151.0, 95.0, 66.0, 53.0, 35.0, 23.0, 16.0, 8.0, 8.0, 1.0, 3.0], "bins": [-17.375, -16.8668212890625, -16.358642578125, -15.8504638671875, -15.34228515625, -14.8341064453125, -14.325927734375, -13.8177490234375, -13.3095703125, -12.8013916015625, -12.293212890625, -11.7850341796875, -11.27685546875, -10.7686767578125, -10.260498046875, -9.7523193359375, -9.244140625, -8.7359619140625, -8.227783203125, -7.7196044921875, -7.21142578125, -6.7032470703125, -6.195068359375, -5.6868896484375, -5.1787109375, -4.6705322265625, -4.162353515625, -3.6541748046875, -3.14599609375, -2.6378173828125, -2.129638671875, -1.6214599609375, -1.11328125, -0.6051025390625, -0.096923828125, 0.4112548828125, 0.91943359375, 1.4276123046875, 1.935791015625, 2.4439697265625, 2.9521484375, 3.4603271484375, 3.968505859375, 4.4766845703125, 4.98486328125, 5.4930419921875, 6.001220703125, 6.5093994140625, 7.017578125, 7.5257568359375, 8.033935546875, 8.5421142578125, 9.05029296875, 9.5584716796875, 10.066650390625, 10.5748291015625, 11.0830078125, 11.5911865234375, 12.099365234375, 12.6075439453125, 13.11572265625, 13.6239013671875, 14.132080078125, 14.6402587890625, 15.1484375]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 12.0, 8.0, 11.0, 6.0, 13.0, 12.0, 18.0, 16.0, 10.0, 22.0, 20.0, 24.0, 24.0, 26.0, 45.0, 32.0, 36.0, 30.0, 36.0, 47.0, 44.0, 52.0, 48.0, 46.0, 40.0, 33.0, 34.0, 29.0, 30.0, 36.0, 20.0, 26.0, 19.0, 18.0, 19.0, 11.0, 11.0, 9.0, 6.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.18408203125, -12.7119140625, -12.23974609375, -11.767578125, -11.29541015625, -10.8232421875, -10.35107421875, -9.87890625, -9.40673828125, -8.9345703125, -8.46240234375, -7.990234375, -7.51806640625, -7.0458984375, -6.57373046875, -6.1015625, -5.62939453125, -5.1572265625, -4.68505859375, -4.212890625, -3.74072265625, -3.2685546875, -2.79638671875, -2.32421875, -1.85205078125, -1.3798828125, -0.90771484375, -0.435546875, 0.03662109375, 0.5087890625, 0.98095703125, 1.453125, 1.92529296875, 2.3974609375, 2.86962890625, 3.341796875, 3.81396484375, 4.2861328125, 4.75830078125, 5.23046875, 5.70263671875, 6.1748046875, 6.64697265625, 7.119140625, 7.59130859375, 8.0634765625, 8.53564453125, 9.0078125, 9.47998046875, 9.9521484375, 10.42431640625, 10.896484375, 11.36865234375, 11.8408203125, 12.31298828125, 12.78515625, 13.25732421875, 13.7294921875, 14.20166015625, 14.673828125, 15.14599609375, 15.6181640625, 16.09033203125, 16.5625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 9.0, 6.0, 2.0, 12.0, 26.0, 37.0, 50.0, 80.0, 103.0, 147.0, 253.0, 321.0, 484.0, 748.0, 1082.0, 1628.0, 2424.0, 3726.0, 5554.0, 9015.0, 14515.0, 24867.0, 44359.0, 85044.0, 174078.0, 367107.0, 728045.0, 1042976.0, 822279.0, 434450.0, 206061.0, 100060.0, 51530.0, 28386.0, 16375.0, 10035.0, 6233.0, 4095.0, 2658.0, 1720.0, 1181.0, 810.0, 546.0, 383.0, 250.0, 187.0, 115.0, 84.0, 51.0, 40.0, 26.0, 16.0, 10.0, 8.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.203125, -18.5546875, -17.90625, -17.2578125, -16.609375, -15.9609375, -15.3125, -14.6640625, -14.015625, -13.3671875, -12.71875, -12.0703125, -11.421875, -10.7734375, -10.125, -9.4765625, -8.828125, -8.1796875, -7.53125, -6.8828125, -6.234375, -5.5859375, -4.9375, -4.2890625, -3.640625, -2.9921875, -2.34375, -1.6953125, -1.046875, -0.3984375, 0.25, 0.8984375, 1.546875, 2.1953125, 2.84375, 3.4921875, 4.140625, 4.7890625, 5.4375, 6.0859375, 6.734375, 7.3828125, 8.03125, 8.6796875, 9.328125, 9.9765625, 10.625, 11.2734375, 11.921875, 12.5703125, 13.21875, 13.8671875, 14.515625, 15.1640625, 15.8125, 16.4609375, 17.109375, 17.7578125, 18.40625, 19.0546875, 19.703125, 20.3515625, 21.0, 21.6484375, 22.296875]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 5.0, 5.0, 3.0, 9.0, 8.0, 16.0, 17.0, 19.0, 25.0, 31.0, 33.0, 53.0, 72.0, 66.0, 94.0, 119.0, 156.0, 173.0, 199.0, 237.0, 250.0, 266.0, 296.0, 259.0, 271.0, 224.0, 194.0, 151.0, 160.0, 139.0, 99.0, 79.0, 67.0, 62.0, 47.0, 25.0, 26.0, 29.0, 18.0, 17.0, 8.0, 15.0, 3.0, 11.0, 6.0, 2.0, 4.0, 4.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.60345458984375, -6.3865966796875, -6.16973876953125, -5.952880859375, -5.73602294921875, -5.5191650390625, -5.30230712890625, -5.08544921875, -4.86859130859375, -4.6517333984375, -4.43487548828125, -4.218017578125, -4.00115966796875, -3.7843017578125, -3.56744384765625, -3.3505859375, -3.13372802734375, -2.9168701171875, -2.70001220703125, -2.483154296875, -2.26629638671875, -2.0494384765625, -1.83258056640625, -1.61572265625, -1.39886474609375, -1.1820068359375, -0.96514892578125, -0.748291015625, -0.53143310546875, -0.3145751953125, -0.09771728515625, 0.119140625, 0.33599853515625, 0.5528564453125, 0.76971435546875, 0.986572265625, 1.20343017578125, 1.4202880859375, 1.63714599609375, 1.85400390625, 2.07086181640625, 2.2877197265625, 2.50457763671875, 2.721435546875, 2.93829345703125, 3.1551513671875, 3.37200927734375, 3.5888671875, 3.80572509765625, 4.0225830078125, 4.23944091796875, 4.456298828125, 4.67315673828125, 4.8900146484375, 5.10687255859375, 5.32373046875, 5.54058837890625, 5.7574462890625, 5.97430419921875, 6.191162109375, 6.40802001953125, 6.6248779296875, 6.84173583984375, 7.05859375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 11.0, 7.0, 7.0, 9.0, 14.0, 15.0, 26.0, 33.0, 46.0, 60.0, 68.0, 59.0, 62.0, 63.0, 77.0, 68.0, 79.0, 58.0, 39.0, 35.0, 34.0, 23.0, 25.0, 14.0, 14.0, 12.0, 12.0, 5.0, 8.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.976797103881836, -24.220048904418945, -23.463302612304688, -22.706554412841797, -21.949806213378906, -21.19305992126465, -20.436311721801758, -19.6795654296875, -18.92281723022461, -18.16606903076172, -17.40932273864746, -16.65257453918457, -15.895827293395996, -15.139080047607422, -14.382331848144531, -13.625584602355957, -12.868837356567383, -12.112090110778809, -11.355342864990234, -10.598594665527344, -9.84184741973877, -9.085100173950195, -8.328351974487305, -7.5716047286987305, -6.814857482910156, -6.058110237121582, -5.30136251449585, -4.544614791870117, -3.787867546081543, -3.0311200618743896, -2.2743725776672363, -1.517624855041504, -0.7608795166015625, -0.00413203239440918, 0.7526154518127441, 1.5093629360198975, 2.266110420227051, 3.022857904434204, 3.7796053886413574, 4.53635311126709, 5.293100357055664, 6.049847602844238, 6.806595325469971, 7.563343048095703, 8.320090293884277, 9.076837539672852, 9.833585739135742, 10.590332984924316, 11.34708023071289, 12.103827476501465, 12.860574722290039, 13.61732292175293, 14.374070167541504, 15.130817413330078, 15.887565612792969, 16.64431381225586, 17.401060104370117, 18.157808303833008, 18.914554595947266, 19.671302795410156, 20.428050994873047, 21.184797286987305, 21.941545486450195, 22.698291778564453, 23.455039978027344]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 13.0, 15.0, 16.0, 14.0, 11.0, 26.0, 17.0, 25.0, 21.0, 44.0, 28.0, 31.0, 45.0, 29.0, 30.0, 47.0, 40.0, 40.0, 46.0, 41.0, 51.0, 38.0, 44.0, 30.0, 24.0, 22.0, 30.0, 22.0, 23.0, 19.0, 20.0, 13.0, 14.0, 14.0, 8.0, 2.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.06035614013672, -16.4949893951416, -15.929620742797852, -15.364253997802734, -14.7988862991333, -14.233518600463867, -13.66815185546875, -13.102784156799316, -12.537416458129883, -11.97204875946045, -11.406681060791016, -10.841314315795898, -10.275946617126465, -9.710578918457031, -9.145212173461914, -8.57984447479248, -8.014476776123047, -7.449109077453613, -6.883741855621338, -6.3183746337890625, -5.753006935119629, -5.187639236450195, -4.62227201461792, -4.0569047927856445, -3.491537094116211, -2.9261696338653564, -2.360802173614502, -1.7954347133636475, -1.230067253112793, -0.6646997928619385, -0.09933233261108398, 0.4660351276397705, 1.031402587890625, 1.5967700481414795, 2.162137508392334, 2.7275049686431885, 3.292872428894043, 3.8582398891448975, 4.423607349395752, 4.988974571228027, 5.554342269897461, 6.1197099685668945, 6.68507719039917, 7.250444412231445, 7.815812110900879, 8.381179809570312, 8.94654655456543, 9.511914253234863, 10.077281951904297, 10.64264965057373, 11.208017349243164, 11.773384094238281, 12.338751792907715, 12.904119491577148, 13.469486236572266, 14.0348539352417, 14.600221633911133, 15.165589332580566, 15.73095703125, 16.296323776245117, 16.861690521240234, 17.427059173583984, 17.9924259185791, 18.55779457092285, 19.12316131591797]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 13.0, 12.0, 14.0, 29.0, 46.0, 49.0, 54.0, 62.0, 113.0, 172.0, 194.0, 261.0, 393.0, 472.0, 672.0, 952.0, 1395.0, 2010.0, 3000.0, 4942.0, 8189.0, 15720.0, 34633.0, 89435.0, 232819.0, 345467.0, 180161.0, 67120.0, 27201.0, 12670.0, 7042.0, 4260.0, 2701.0, 1824.0, 1244.0, 896.0, 615.0, 464.0, 329.0, 224.0, 173.0, 129.0, 92.0, 83.0, 49.0, 43.0, 34.0, 17.0, 23.0, 14.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.625, -19.987548828125, -19.35009765625, -18.712646484375, -18.0751953125, -17.437744140625, -16.80029296875, -16.162841796875, -15.525390625, -14.887939453125, -14.25048828125, -13.613037109375, -12.9755859375, -12.338134765625, -11.70068359375, -11.063232421875, -10.42578125, -9.788330078125, -9.15087890625, -8.513427734375, -7.8759765625, -7.238525390625, -6.60107421875, -5.963623046875, -5.326171875, -4.688720703125, -4.05126953125, -3.413818359375, -2.7763671875, -2.138916015625, -1.50146484375, -0.864013671875, -0.2265625, 0.410888671875, 1.04833984375, 1.685791015625, 2.3232421875, 2.960693359375, 3.59814453125, 4.235595703125, 4.873046875, 5.510498046875, 6.14794921875, 6.785400390625, 7.4228515625, 8.060302734375, 8.69775390625, 9.335205078125, 9.97265625, 10.610107421875, 11.24755859375, 11.885009765625, 12.5224609375, 13.159912109375, 13.79736328125, 14.434814453125, 15.072265625, 15.709716796875, 16.34716796875, 16.984619140625, 17.6220703125, 18.259521484375, 18.89697265625, 19.534423828125, 20.171875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 8.0, 7.0, 12.0, 24.0, 11.0, 9.0, 20.0, 25.0, 19.0, 19.0, 25.0, 34.0, 44.0, 35.0, 47.0, 34.0, 53.0, 32.0, 41.0, 38.0, 47.0, 46.0, 47.0, 36.0, 32.0, 32.0, 30.0, 25.0, 33.0, 31.0, 17.0, 14.0, 14.0, 11.0, 11.0, 9.0, 2.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-18.234375, -17.6416015625, -17.048828125, -16.4560546875, -15.86328125, -15.2705078125, -14.677734375, -14.0849609375, -13.4921875, -12.8994140625, -12.306640625, -11.7138671875, -11.12109375, -10.5283203125, -9.935546875, -9.3427734375, -8.75, -8.1572265625, -7.564453125, -6.9716796875, -6.37890625, -5.7861328125, -5.193359375, -4.6005859375, -4.0078125, -3.4150390625, -2.822265625, -2.2294921875, -1.63671875, -1.0439453125, -0.451171875, 0.1416015625, 0.734375, 1.3271484375, 1.919921875, 2.5126953125, 3.10546875, 3.6982421875, 4.291015625, 4.8837890625, 5.4765625, 6.0693359375, 6.662109375, 7.2548828125, 7.84765625, 8.4404296875, 9.033203125, 9.6259765625, 10.21875, 10.8115234375, 11.404296875, 11.9970703125, 12.58984375, 13.1826171875, 13.775390625, 14.3681640625, 14.9609375, 15.5537109375, 16.146484375, 16.7392578125, 17.33203125, 17.9248046875, 18.517578125, 19.1103515625, 19.703125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 4.0, 4.0, 3.0, 7.0, 10.0, 17.0, 13.0, 35.0, 38.0, 55.0, 60.0, 114.0, 199.0, 280.0, 447.0, 718.0, 1196.0, 2069.0, 3732.0, 7378.0, 16057.0, 49850.0, 895490.0, 41250.0, 14483.0, 6691.0, 3529.0, 1866.0, 1110.0, 651.0, 381.0, 257.0, 162.0, 113.0, 80.0, 67.0, 39.0, 33.0, 15.0, 10.0, 9.0, 10.0, 8.0, 5.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.6875, -24.677734375, -23.66796875, -22.658203125, -21.6484375, -20.638671875, -19.62890625, -18.619140625, -17.609375, -16.599609375, -15.58984375, -14.580078125, -13.5703125, -12.560546875, -11.55078125, -10.541015625, -9.53125, -8.521484375, -7.51171875, -6.501953125, -5.4921875, -4.482421875, -3.47265625, -2.462890625, -1.453125, -0.443359375, 0.56640625, 1.576171875, 2.5859375, 3.595703125, 4.60546875, 5.615234375, 6.625, 7.634765625, 8.64453125, 9.654296875, 10.6640625, 11.673828125, 12.68359375, 13.693359375, 14.703125, 15.712890625, 16.72265625, 17.732421875, 18.7421875, 19.751953125, 20.76171875, 21.771484375, 22.78125, 23.791015625, 24.80078125, 25.810546875, 26.8203125, 27.830078125, 28.83984375, 29.849609375, 30.859375, 31.869140625, 32.87890625, 33.888671875, 34.8984375, 35.908203125, 36.91796875, 37.927734375, 38.9375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 9.0, 7.0, 11.0, 6.0, 7.0, 7.0, 9.0, 20.0, 21.0, 16.0, 20.0, 28.0, 27.0, 37.0, 33.0, 38.0, 51.0, 45.0, 39.0, 44.0, 41.0, 42.0, 45.0, 42.0, 34.0, 49.0, 39.0, 36.0, 20.0, 30.0, 22.0, 20.0, 18.0, 17.0, 15.0, 14.0, 11.0, 8.0, 7.0, 4.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-18.28125, -17.7923583984375, -17.303466796875, -16.8145751953125, -16.32568359375, -15.8367919921875, -15.347900390625, -14.8590087890625, -14.3701171875, -13.8812255859375, -13.392333984375, -12.9034423828125, -12.41455078125, -11.9256591796875, -11.436767578125, -10.9478759765625, -10.458984375, -9.9700927734375, -9.481201171875, -8.9923095703125, -8.50341796875, -8.0145263671875, -7.525634765625, -7.0367431640625, -6.5478515625, -6.0589599609375, -5.570068359375, -5.0811767578125, -4.59228515625, -4.1033935546875, -3.614501953125, -3.1256103515625, -2.63671875, -2.1478271484375, -1.658935546875, -1.1700439453125, -0.68115234375, -0.1922607421875, 0.296630859375, 0.7855224609375, 1.2744140625, 1.7633056640625, 2.252197265625, 2.7410888671875, 3.22998046875, 3.7188720703125, 4.207763671875, 4.6966552734375, 5.185546875, 5.6744384765625, 6.163330078125, 6.6522216796875, 7.14111328125, 7.6300048828125, 8.118896484375, 8.6077880859375, 9.0966796875, 9.5855712890625, 10.074462890625, 10.5633544921875, 11.05224609375, 11.5411376953125, 12.030029296875, 12.5189208984375, 13.0078125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 13.0, 15.0, 36.0, 43.0, 72.0, 62.0, 111.0, 132.0, 170.0, 276.0, 420.0, 543.0, 822.0, 1257.0, 2079.0, 3445.0, 6301.0, 12406.0, 30539.0, 810606.0, 134311.0, 21852.0, 9750.0, 5064.0, 2927.0, 1707.0, 1148.0, 700.0, 488.0, 341.0, 245.0, 178.0, 126.0, 75.0, 75.0, 49.0, 38.0, 26.0, 36.0, 19.0, 10.0, 3.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.358154296875, -10.98974609375, -10.621337890625, -10.2529296875, -9.884521484375, -9.51611328125, -9.147705078125, -8.779296875, -8.410888671875, -8.04248046875, -7.674072265625, -7.3056640625, -6.937255859375, -6.56884765625, -6.200439453125, -5.83203125, -5.463623046875, -5.09521484375, -4.726806640625, -4.3583984375, -3.989990234375, -3.62158203125, -3.253173828125, -2.884765625, -2.516357421875, -2.14794921875, -1.779541015625, -1.4111328125, -1.042724609375, -0.67431640625, -0.305908203125, 0.0625, 0.430908203125, 0.79931640625, 1.167724609375, 1.5361328125, 1.904541015625, 2.27294921875, 2.641357421875, 3.009765625, 3.378173828125, 3.74658203125, 4.114990234375, 4.4833984375, 4.851806640625, 5.22021484375, 5.588623046875, 5.95703125, 6.325439453125, 6.69384765625, 7.062255859375, 7.4306640625, 7.799072265625, 8.16748046875, 8.535888671875, 8.904296875, 9.272705078125, 9.64111328125, 10.009521484375, 10.3779296875, 10.746337890625, 11.11474609375, 11.483154296875, 11.8515625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 6.0, 11.0, 9.0, 17.0, 47.0, 101.0, 274.0, 281.0, 114.0, 59.0, 22.0, 15.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0029811859130859375, -0.0028819143772125244, -0.0027826428413391113, -0.0026833713054656982, -0.002584099769592285, -0.002484828233718872, -0.002385556697845459, -0.002286285161972046, -0.002187013626098633, -0.0020877420902252197, -0.0019884705543518066, -0.0018891990184783936, -0.0017899274826049805, -0.0016906559467315674, -0.0015913844108581543, -0.0014921128749847412, -0.0013928413391113281, -0.001293569803237915, -0.001194298267364502, -0.0010950267314910889, -0.0009957551956176758, -0.0008964836597442627, -0.0007972121238708496, -0.0006979405879974365, -0.0005986690521240234, -0.0004993975162506104, -0.00040012598037719727, -0.0003008544445037842, -0.0002015829086303711, -0.00010231137275695801, -3.039836883544922e-06, 9.623169898986816e-05, 0.00019550323486328125, 0.00029477477073669434, 0.0003940463066101074, 0.0004933178424835205, 0.0005925893783569336, 0.0006918609142303467, 0.0007911324501037598, 0.0008904039859771729, 0.000989675521850586, 0.001088947057723999, 0.0011882185935974121, 0.0012874901294708252, 0.0013867616653442383, 0.0014860332012176514, 0.0015853047370910645, 0.0016845762729644775, 0.0017838478088378906, 0.0018831193447113037, 0.001982390880584717, 0.00208166241645813, 0.002180933952331543, 0.002280205488204956, 0.002379477024078369, 0.0024787485599517822, 0.0025780200958251953, 0.0026772916316986084, 0.0027765631675720215, 0.0028758347034454346, 0.0029751062393188477, 0.0030743777751922607, 0.003173649311065674, 0.003272920846939087, 0.0033721923828125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 3.0, 9.0, 16.0, 25.0, 33.0, 36.0, 46.0, 66.0, 78.0, 124.0, 130.0, 197.0, 251.0, 333.0, 468.0, 675.0, 965.0, 1412.0, 2282.0, 3593.0, 5870.0, 9916.0, 17830.0, 32530.0, 62974.0, 123765.0, 218905.0, 242909.0, 152136.0, 78364.0, 39954.0, 21291.0, 12106.0, 7019.0, 4176.0, 2508.0, 1678.0, 1092.0, 777.0, 503.0, 403.0, 284.0, 219.0, 149.0, 116.0, 98.0, 66.0, 42.0, 40.0, 32.0, 19.0, 14.0, 11.0, 10.0, 8.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.15704345703125, -3.0523681640625, -2.94769287109375, -2.843017578125, -2.73834228515625, -2.6336669921875, -2.52899169921875, -2.42431640625, -2.31964111328125, -2.2149658203125, -2.11029052734375, -2.005615234375, -1.90093994140625, -1.7962646484375, -1.69158935546875, -1.5869140625, -1.48223876953125, -1.3775634765625, -1.27288818359375, -1.168212890625, -1.06353759765625, -0.9588623046875, -0.85418701171875, -0.74951171875, -0.64483642578125, -0.5401611328125, -0.43548583984375, -0.330810546875, -0.22613525390625, -0.1214599609375, -0.01678466796875, 0.087890625, 0.19256591796875, 0.2972412109375, 0.40191650390625, 0.506591796875, 0.61126708984375, 0.7159423828125, 0.82061767578125, 0.92529296875, 1.02996826171875, 1.1346435546875, 1.23931884765625, 1.343994140625, 1.44866943359375, 1.5533447265625, 1.65802001953125, 1.7626953125, 1.86737060546875, 1.9720458984375, 2.07672119140625, 2.181396484375, 2.28607177734375, 2.3907470703125, 2.49542236328125, 2.60009765625, 2.70477294921875, 2.8094482421875, 2.91412353515625, 3.018798828125, 3.12347412109375, 3.2281494140625, 3.33282470703125, 3.4375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 5.0, 7.0, 15.0, 8.0, 20.0, 18.0, 34.0, 28.0, 33.0, 27.0, 50.0, 48.0, 48.0, 51.0, 67.0, 71.0, 66.0, 79.0, 51.0, 36.0, 37.0, 37.0, 27.0, 29.0, 17.0, 19.0, 16.0, 13.0, 8.0, 3.0, 12.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0734710693359375, -1.036590576171875, -0.9997100830078125, -0.96282958984375, -0.9259490966796875, -0.889068603515625, -0.8521881103515625, -0.8153076171875, -0.7784271240234375, -0.741546630859375, -0.7046661376953125, -0.66778564453125, -0.6309051513671875, -0.594024658203125, -0.5571441650390625, -0.520263671875, -0.4833831787109375, -0.446502685546875, -0.4096221923828125, -0.37274169921875, -0.3358612060546875, -0.298980712890625, -0.2621002197265625, -0.2252197265625, -0.1883392333984375, -0.151458740234375, -0.1145782470703125, -0.07769775390625, -0.0408172607421875, -0.003936767578125, 0.0329437255859375, 0.06982421875, 0.1067047119140625, 0.143585205078125, 0.1804656982421875, 0.21734619140625, 0.2542266845703125, 0.291107177734375, 0.3279876708984375, 0.3648681640625, 0.4017486572265625, 0.438629150390625, 0.4755096435546875, 0.51239013671875, 0.5492706298828125, 0.586151123046875, 0.6230316162109375, 0.659912109375, 0.6967926025390625, 0.733673095703125, 0.7705535888671875, 0.80743408203125, 0.8443145751953125, 0.881195068359375, 0.9180755615234375, 0.9549560546875, 0.9918365478515625, 1.028717041015625, 1.0655975341796875, 1.10247802734375, 1.1393585205078125, 1.176239013671875, 1.2131195068359375, 1.25]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 9.0, 8.0, 6.0, 14.0, 11.0, 28.0, 21.0, 36.0, 48.0, 53.0, 64.0, 67.0, 86.0, 62.0, 89.0, 56.0, 61.0, 62.0, 42.0, 29.0, 35.0, 24.0, 20.0, 13.0, 13.0, 14.0, 5.0, 3.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.154644012451172, -23.38775634765625, -22.62087059020996, -21.85398292541504, -21.087095260620117, -20.320207595825195, -19.553321838378906, -18.786434173583984, -18.019546508789062, -17.25265884399414, -16.48577308654785, -15.71888542175293, -14.951997756958008, -14.185111045837402, -13.418224334716797, -12.651336669921875, -11.88444995880127, -11.117563247680664, -10.350675582885742, -9.583788871765137, -8.816901206970215, -8.05001449584961, -7.283127307891846, -6.516240119934082, -5.749352931976318, -4.982465744018555, -4.215578556060791, -3.4486916065216064, -2.6818044185638428, -1.914917230606079, -1.1480302810668945, -0.38114309310913086, 0.3857440948486328, 1.1526312828063965, 1.9195183515548706, 2.6864054203033447, 3.4532926082611084, 4.220179557800293, 4.987066745758057, 5.75395393371582, 6.520841121673584, 7.287728309631348, 8.054615020751953, 8.821502685546875, 9.58838939666748, 10.355277061462402, 11.122163772583008, 11.88905143737793, 12.655938148498535, 13.42282485961914, 14.189712524414062, 14.956599235534668, 15.72348690032959, 16.490373611450195, 17.257261276245117, 18.024147033691406, 18.791034698486328, 19.55792236328125, 20.32480812072754, 21.09169578552246, 21.858583450317383, 22.625471115112305, 23.392356872558594, 24.159244537353516, 24.926132202148438]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 9.0, 8.0, 12.0, 18.0, 18.0, 12.0, 14.0, 20.0, 25.0, 18.0, 26.0, 30.0, 37.0, 29.0, 42.0, 33.0, 38.0, 40.0, 43.0, 42.0, 38.0, 55.0, 36.0, 41.0, 39.0, 27.0, 34.0, 31.0, 22.0, 22.0, 23.0, 19.0, 13.0, 13.0, 18.0, 10.0, 10.0, 5.0, 4.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-16.22251319885254, -15.682835578918457, -15.143157958984375, -14.603480339050293, -14.063802719116211, -13.524124145507812, -12.98444652557373, -12.444768905639648, -11.905091285705566, -11.365413665771484, -10.825736045837402, -10.28605842590332, -9.746379852294922, -9.206703186035156, -8.667024612426758, -8.127346992492676, -7.587669372558594, -7.047991752624512, -6.50831413269043, -5.9686360359191895, -5.428958415985107, -4.889280796051025, -4.349602699279785, -3.809925079345703, -3.270247459411621, -2.730569839477539, -2.190891981124878, -1.6512142419815063, -1.1115365028381348, -0.5718588829040527, -0.0321810245513916, 0.5074968338012695, 1.0471763610839844, 1.586854100227356, 2.1265318393707275, 2.6662096977233887, 3.2058873176574707, 3.7455649375915527, 4.285243034362793, 4.824920654296875, 5.364598274230957, 5.904275894165039, 6.443953514099121, 6.983631610870361, 7.523309230804443, 8.062986373901367, 8.602664947509766, 9.142342567443848, 9.68202018737793, 10.221697807312012, 10.761375427246094, 11.301053047180176, 11.840730667114258, 12.380409240722656, 12.920086860656738, 13.45976448059082, 13.999442100524902, 14.539119720458984, 15.078797340393066, 15.618474960327148, 16.158153533935547, 16.697830200195312, 17.23750877380371, 17.77718734741211, 18.316864013671875]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 14.0, 15.0, 16.0, 28.0, 39.0, 53.0, 87.0, 125.0, 182.0, 249.0, 365.0, 507.0, 781.0, 1173.0, 1771.0, 2567.0, 3972.0, 6089.0, 9496.0, 15019.0, 24791.0, 40826.0, 68961.0, 113057.0, 164119.0, 185393.0, 151599.0, 100437.0, 60779.0, 36172.0, 21741.0, 13537.0, 8419.0, 5390.0, 3622.0, 2263.0, 1611.0, 1083.0, 708.0, 480.0, 322.0, 211.0, 143.0, 114.0, 74.0, 58.0, 33.0, 21.0, 17.0, 12.0, 2.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-22.71875, -21.99462890625, -21.2705078125, -20.54638671875, -19.822265625, -19.09814453125, -18.3740234375, -17.64990234375, -16.92578125, -16.20166015625, -15.4775390625, -14.75341796875, -14.029296875, -13.30517578125, -12.5810546875, -11.85693359375, -11.1328125, -10.40869140625, -9.6845703125, -8.96044921875, -8.236328125, -7.51220703125, -6.7880859375, -6.06396484375, -5.33984375, -4.61572265625, -3.8916015625, -3.16748046875, -2.443359375, -1.71923828125, -0.9951171875, -0.27099609375, 0.453125, 1.17724609375, 1.9013671875, 2.62548828125, 3.349609375, 4.07373046875, 4.7978515625, 5.52197265625, 6.24609375, 6.97021484375, 7.6943359375, 8.41845703125, 9.142578125, 9.86669921875, 10.5908203125, 11.31494140625, 12.0390625, 12.76318359375, 13.4873046875, 14.21142578125, 14.935546875, 15.65966796875, 16.3837890625, 17.10791015625, 17.83203125, 18.55615234375, 19.2802734375, 20.00439453125, 20.728515625, 21.45263671875, 22.1767578125, 22.90087890625, 23.625]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 14.0, 11.0, 6.0, 14.0, 24.0, 13.0, 18.0, 24.0, 20.0, 28.0, 19.0, 31.0, 43.0, 38.0, 47.0, 34.0, 41.0, 50.0, 36.0, 40.0, 44.0, 50.0, 46.0, 28.0, 28.0, 33.0, 24.0, 35.0, 34.0, 18.0, 18.0, 13.0, 13.0, 10.0, 8.0, 10.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-15.9765625, -15.4630126953125, -14.949462890625, -14.4359130859375, -13.92236328125, -13.4088134765625, -12.895263671875, -12.3817138671875, -11.8681640625, -11.3546142578125, -10.841064453125, -10.3275146484375, -9.81396484375, -9.3004150390625, -8.786865234375, -8.2733154296875, -7.759765625, -7.2462158203125, -6.732666015625, -6.2191162109375, -5.70556640625, -5.1920166015625, -4.678466796875, -4.1649169921875, -3.6513671875, -3.1378173828125, -2.624267578125, -2.1107177734375, -1.59716796875, -1.0836181640625, -0.570068359375, -0.0565185546875, 0.45703125, 0.9705810546875, 1.484130859375, 1.9976806640625, 2.51123046875, 3.0247802734375, 3.538330078125, 4.0518798828125, 4.5654296875, 5.0789794921875, 5.592529296875, 6.1060791015625, 6.61962890625, 7.1331787109375, 7.646728515625, 8.1602783203125, 8.673828125, 9.1873779296875, 9.700927734375, 10.2144775390625, 10.72802734375, 11.2415771484375, 11.755126953125, 12.2686767578125, 12.7822265625, 13.2957763671875, 13.809326171875, 14.3228759765625, 14.83642578125, 15.3499755859375, 15.863525390625, 16.3770751953125, 16.890625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 6.0, 13.0, 15.0, 28.0, 38.0, 59.0, 97.0, 122.0, 181.0, 246.0, 354.0, 528.0, 803.0, 1204.0, 1836.0, 2828.0, 4387.0, 6859.0, 11268.0, 17869.0, 29736.0, 49050.0, 79823.0, 125026.0, 169171.0, 175689.0, 136624.0, 90340.0, 55398.0, 33867.0, 20215.0, 12711.0, 7862.0, 4998.0, 3196.0, 2050.0, 1422.0, 903.0, 553.0, 392.0, 246.0, 181.0, 125.0, 78.0, 56.0, 27.0, 19.0, 16.0, 11.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 3.0, 1.0], "bins": [-21.890625, -21.209228515625, -20.52783203125, -19.846435546875, -19.1650390625, -18.483642578125, -17.80224609375, -17.120849609375, -16.439453125, -15.758056640625, -15.07666015625, -14.395263671875, -13.7138671875, -13.032470703125, -12.35107421875, -11.669677734375, -10.98828125, -10.306884765625, -9.62548828125, -8.944091796875, -8.2626953125, -7.581298828125, -6.89990234375, -6.218505859375, -5.537109375, -4.855712890625, -4.17431640625, -3.492919921875, -2.8115234375, -2.130126953125, -1.44873046875, -0.767333984375, -0.0859375, 0.595458984375, 1.27685546875, 1.958251953125, 2.6396484375, 3.321044921875, 4.00244140625, 4.683837890625, 5.365234375, 6.046630859375, 6.72802734375, 7.409423828125, 8.0908203125, 8.772216796875, 9.45361328125, 10.135009765625, 10.81640625, 11.497802734375, 12.17919921875, 12.860595703125, 13.5419921875, 14.223388671875, 14.90478515625, 15.586181640625, 16.267578125, 16.948974609375, 17.63037109375, 18.311767578125, 18.9931640625, 19.674560546875, 20.35595703125, 21.037353515625, 21.71875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 6.0, 6.0, 7.0, 4.0, 8.0, 12.0, 6.0, 14.0, 12.0, 20.0, 20.0, 20.0, 22.0, 25.0, 32.0, 44.0, 39.0, 42.0, 39.0, 40.0, 47.0, 37.0, 43.0, 46.0, 47.0, 37.0, 39.0, 34.0, 30.0, 30.0, 25.0, 33.0, 30.0, 17.0, 20.0, 19.0, 17.0, 11.0, 5.0, 4.0, 6.0, 6.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2890625, -9.936279296875, -9.58349609375, -9.230712890625, -8.8779296875, -8.525146484375, -8.17236328125, -7.819580078125, -7.466796875, -7.114013671875, -6.76123046875, -6.408447265625, -6.0556640625, -5.702880859375, -5.35009765625, -4.997314453125, -4.64453125, -4.291748046875, -3.93896484375, -3.586181640625, -3.2333984375, -2.880615234375, -2.52783203125, -2.175048828125, -1.822265625, -1.469482421875, -1.11669921875, -0.763916015625, -0.4111328125, -0.058349609375, 0.29443359375, 0.647216796875, 1.0, 1.352783203125, 1.70556640625, 2.058349609375, 2.4111328125, 2.763916015625, 3.11669921875, 3.469482421875, 3.822265625, 4.175048828125, 4.52783203125, 4.880615234375, 5.2333984375, 5.586181640625, 5.93896484375, 6.291748046875, 6.64453125, 6.997314453125, 7.35009765625, 7.702880859375, 8.0556640625, 8.408447265625, 8.76123046875, 9.114013671875, 9.466796875, 9.819580078125, 10.17236328125, 10.525146484375, 10.8779296875, 11.230712890625, 11.58349609375, 11.936279296875, 12.2890625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 14.0, 13.0, 21.0, 29.0, 30.0, 37.0, 51.0, 64.0, 86.0, 124.0, 153.0, 219.0, 307.0, 412.0, 539.0, 818.0, 1213.0, 2074.0, 3638.0, 8036.0, 20050.0, 66663.0, 306822.0, 469870.0, 113978.0, 30276.0, 10802.0, 4890.0, 2488.0, 1535.0, 964.0, 614.0, 427.0, 337.0, 249.0, 164.0, 118.0, 95.0, 77.0, 51.0, 45.0, 40.0, 18.0, 25.0, 17.0, 14.0, 15.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-40.625, -39.322265625, -38.01953125, -36.716796875, -35.4140625, -34.111328125, -32.80859375, -31.505859375, -30.203125, -28.900390625, -27.59765625, -26.294921875, -24.9921875, -23.689453125, -22.38671875, -21.083984375, -19.78125, -18.478515625, -17.17578125, -15.873046875, -14.5703125, -13.267578125, -11.96484375, -10.662109375, -9.359375, -8.056640625, -6.75390625, -5.451171875, -4.1484375, -2.845703125, -1.54296875, -0.240234375, 1.0625, 2.365234375, 3.66796875, 4.970703125, 6.2734375, 7.576171875, 8.87890625, 10.181640625, 11.484375, 12.787109375, 14.08984375, 15.392578125, 16.6953125, 17.998046875, 19.30078125, 20.603515625, 21.90625, 23.208984375, 24.51171875, 25.814453125, 27.1171875, 28.419921875, 29.72265625, 31.025390625, 32.328125, 33.630859375, 34.93359375, 36.236328125, 37.5390625, 38.841796875, 40.14453125, 41.447265625, 42.75]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 29.0, 39.0, 39.0, 71.0, 99.0, 152.0, 146.0, 112.0, 73.0, 54.0, 39.0, 22.0, 20.0, 18.0, 11.0, 9.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002361297607421875, -0.0022593140602111816, -0.0021573305130004883, -0.002055346965789795, -0.0019533634185791016, -0.0018513798713684082, -0.0017493963241577148, -0.0016474127769470215, -0.0015454292297363281, -0.0014434456825256348, -0.0013414621353149414, -0.001239478588104248, -0.0011374950408935547, -0.0010355114936828613, -0.000933527946472168, -0.0008315443992614746, -0.0007295608520507812, -0.0006275773048400879, -0.0005255937576293945, -0.00042361021041870117, -0.0003216266632080078, -0.00021964311599731445, -0.0001176595687866211, -1.5676021575927734e-05, 8.630752563476562e-05, 0.00018829107284545898, 0.00029027462005615234, 0.0003922581672668457, 0.0004942417144775391, 0.0005962252616882324, 0.0006982088088989258, 0.0008001923561096191, 0.0009021759033203125, 0.0010041594505310059, 0.0011061429977416992, 0.0012081265449523926, 0.001310110092163086, 0.0014120936393737793, 0.0015140771865844727, 0.001616060733795166, 0.0017180442810058594, 0.0018200278282165527, 0.001922011375427246, 0.0020239949226379395, 0.002125978469848633, 0.002227962017059326, 0.0023299455642700195, 0.002431929111480713, 0.0025339126586914062, 0.0026358962059020996, 0.002737879753112793, 0.0028398633003234863, 0.0029418468475341797, 0.003043830394744873, 0.0031458139419555664, 0.0032477974891662598, 0.003349781036376953, 0.0034517645835876465, 0.00355374813079834, 0.003655731678009033, 0.0037577152252197266, 0.00385969877243042, 0.003961682319641113, 0.004063665866851807, 0.0041656494140625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 14.0, 7.0, 11.0, 22.0, 18.0, 28.0, 32.0, 58.0, 59.0, 100.0, 122.0, 158.0, 267.0, 340.0, 542.0, 883.0, 1586.0, 2819.0, 5644.0, 12243.0, 31305.0, 98488.0, 332127.0, 377146.0, 119648.0, 36643.0, 14143.0, 6316.0, 3156.0, 1716.0, 1037.0, 558.0, 375.0, 279.0, 189.0, 126.0, 87.0, 66.0, 49.0, 35.0, 23.0, 25.0, 14.0, 16.0, 8.0, 7.0, 5.0, 2.0, 7.0, 1.0, 4.0, 2.0, 1.0], "bins": [-31.28125, -30.36328125, -29.4453125, -28.52734375, -27.609375, -26.69140625, -25.7734375, -24.85546875, -23.9375, -23.01953125, -22.1015625, -21.18359375, -20.265625, -19.34765625, -18.4296875, -17.51171875, -16.59375, -15.67578125, -14.7578125, -13.83984375, -12.921875, -12.00390625, -11.0859375, -10.16796875, -9.25, -8.33203125, -7.4140625, -6.49609375, -5.578125, -4.66015625, -3.7421875, -2.82421875, -1.90625, -0.98828125, -0.0703125, 0.84765625, 1.765625, 2.68359375, 3.6015625, 4.51953125, 5.4375, 6.35546875, 7.2734375, 8.19140625, 9.109375, 10.02734375, 10.9453125, 11.86328125, 12.78125, 13.69921875, 14.6171875, 15.53515625, 16.453125, 17.37109375, 18.2890625, 19.20703125, 20.125, 21.04296875, 21.9609375, 22.87890625, 23.796875, 24.71484375, 25.6328125, 26.55078125, 27.46875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 6.0, 7.0, 15.0, 12.0, 16.0, 14.0, 27.0, 27.0, 32.0, 61.0, 55.0, 72.0, 73.0, 114.0, 87.0, 82.0, 66.0, 68.0, 33.0, 31.0, 27.0, 22.0, 15.0, 11.0, 9.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.57257080078125, -4.3521728515625, -4.13177490234375, -3.911376953125, -3.69097900390625, -3.4705810546875, -3.25018310546875, -3.02978515625, -2.80938720703125, -2.5889892578125, -2.36859130859375, -2.148193359375, -1.92779541015625, -1.7073974609375, -1.48699951171875, -1.2666015625, -1.04620361328125, -0.8258056640625, -0.60540771484375, -0.385009765625, -0.16461181640625, 0.0557861328125, 0.27618408203125, 0.49658203125, 0.71697998046875, 0.9373779296875, 1.15777587890625, 1.378173828125, 1.59857177734375, 1.8189697265625, 2.03936767578125, 2.259765625, 2.48016357421875, 2.7005615234375, 2.92095947265625, 3.141357421875, 3.36175537109375, 3.5821533203125, 3.80255126953125, 4.02294921875, 4.24334716796875, 4.4637451171875, 4.68414306640625, 4.904541015625, 5.12493896484375, 5.3453369140625, 5.56573486328125, 5.7861328125, 6.00653076171875, 6.2269287109375, 6.44732666015625, 6.667724609375, 6.88812255859375, 7.1085205078125, 7.32891845703125, 7.54931640625, 7.76971435546875, 7.9901123046875, 8.21051025390625, 8.430908203125, 8.65130615234375, 8.8717041015625, 9.09210205078125, 9.3125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 5.0, 10.0, 3.0, 6.0, 10.0, 9.0, 15.0, 13.0, 24.0, 29.0, 38.0, 34.0, 50.0, 56.0, 75.0, 72.0, 54.0, 80.0, 64.0, 54.0, 66.0, 49.0, 45.0, 36.0, 24.0, 16.0, 13.0, 14.0, 14.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.554733276367188, -23.836198806762695, -23.117664337158203, -22.39912986755371, -21.68059539794922, -20.96206283569336, -20.243528366088867, -19.524993896484375, -18.806459426879883, -18.08792495727539, -17.3693904876709, -16.650856018066406, -15.93232250213623, -15.213788032531738, -14.495254516601562, -13.77672004699707, -13.058185577392578, -12.339651107788086, -11.621116638183594, -10.902583122253418, -10.184048652648926, -9.465514183044434, -8.746980667114258, -8.028446197509766, -7.309911727905273, -6.591377258300781, -5.872843265533447, -5.154309272766113, -4.435774803161621, -3.717240571975708, -2.998706340789795, -2.280172348022461, -1.5616378784179688, -0.8431036472320557, -0.12456941604614258, 0.5939648151397705, 1.3124990463256836, 2.0310332775115967, 2.7495675086975098, 3.4681015014648438, 4.186635971069336, 4.905170440673828, 5.623704433441162, 6.342238426208496, 7.060772895812988, 7.7793073654174805, 8.497840881347656, 9.216375350952148, 9.93490982055664, 10.653444290161133, 11.371978759765625, 12.0905122756958, 12.809046745300293, 13.527581214904785, 14.246114730834961, 14.964649200439453, 15.683183670043945, 16.401718139648438, 17.12025260925293, 17.838787078857422, 18.55731964111328, 19.275854110717773, 19.994388580322266, 20.712923049926758, 21.43145751953125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 11.0, 2.0, 12.0, 9.0, 17.0, 11.0, 13.0, 27.0, 22.0, 26.0, 30.0, 24.0, 40.0, 32.0, 45.0, 27.0, 33.0, 35.0, 53.0, 43.0, 50.0, 41.0, 44.0, 35.0, 29.0, 36.0, 36.0, 31.0, 22.0, 25.0, 22.0, 22.0, 17.0, 19.0, 15.0, 13.0, 7.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.47252655029297, -16.934345245361328, -16.396163940429688, -15.857982635498047, -15.319801330566406, -14.781620025634766, -14.243437767028809, -13.705256462097168, -13.167075157165527, -12.628893852233887, -12.090712547302246, -11.552531242370605, -11.014348983764648, -10.476167678833008, -9.937986373901367, -9.399805068969727, -8.861623764038086, -8.323442459106445, -7.785261154174805, -7.247079372406006, -6.708898067474365, -6.170716762542725, -5.632534980773926, -5.094353675842285, -4.5561723709106445, -4.017991065979004, -3.479809522628784, -2.9416279792785645, -2.403446674346924, -1.8652653694152832, -1.3270838260650635, -0.7889022827148438, -0.2507190704345703, 0.28746235370635986, 0.82564377784729, 1.3638252019882202, 1.9020066261291504, 2.440187931060791, 2.9783694744110107, 3.5165510177612305, 4.054732322692871, 4.592913627624512, 5.131094932556152, 5.669276714324951, 6.207458019256592, 6.745639324188232, 7.283821105957031, 7.822002410888672, 8.360183715820312, 8.898365020751953, 9.436546325683594, 9.974727630615234, 10.512908935546875, 11.051090240478516, 11.589272499084473, 12.127453804016113, 12.665635108947754, 13.203816413879395, 13.741997718811035, 14.280179023742676, 14.818361282348633, 15.356542587280273, 15.894723892211914, 16.432905197143555, 16.971086502075195]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 5.0, 8.0, 13.0, 18.0, 21.0, 38.0, 42.0, 47.0, 79.0, 104.0, 135.0, 206.0, 298.0, 449.0, 588.0, 897.0, 1352.0, 2101.0, 3218.0, 5135.0, 8505.0, 14722.0, 26095.0, 50439.0, 105853.0, 238844.0, 522270.0, 902423.0, 1003259.0, 681320.0, 330820.0, 147003.0, 67629.0, 34318.0, 18488.0, 10468.0, 6377.0, 3702.0, 2383.0, 1475.0, 1013.0, 627.0, 455.0, 320.0, 213.0, 147.0, 107.0, 82.0, 67.0, 36.0, 22.0, 25.0, 14.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-15.5625, -15.063720703125, -14.56494140625, -14.066162109375, -13.5673828125, -13.068603515625, -12.56982421875, -12.071044921875, -11.572265625, -11.073486328125, -10.57470703125, -10.075927734375, -9.5771484375, -9.078369140625, -8.57958984375, -8.080810546875, -7.58203125, -7.083251953125, -6.58447265625, -6.085693359375, -5.5869140625, -5.088134765625, -4.58935546875, -4.090576171875, -3.591796875, -3.093017578125, -2.59423828125, -2.095458984375, -1.5966796875, -1.097900390625, -0.59912109375, -0.100341796875, 0.3984375, 0.897216796875, 1.39599609375, 1.894775390625, 2.3935546875, 2.892333984375, 3.39111328125, 3.889892578125, 4.388671875, 4.887451171875, 5.38623046875, 5.885009765625, 6.3837890625, 6.882568359375, 7.38134765625, 7.880126953125, 8.37890625, 8.877685546875, 9.37646484375, 9.875244140625, 10.3740234375, 10.872802734375, 11.37158203125, 11.870361328125, 12.369140625, 12.867919921875, 13.36669921875, 13.865478515625, 14.3642578125, 14.863037109375, 15.36181640625, 15.860595703125, 16.359375]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 9.0, 8.0, 10.0, 8.0, 18.0, 19.0, 20.0, 15.0, 35.0, 18.0, 35.0, 35.0, 26.0, 39.0, 36.0, 48.0, 39.0, 36.0, 29.0, 45.0, 44.0, 52.0, 49.0, 33.0, 43.0, 23.0, 28.0, 25.0, 28.0, 22.0, 14.0, 20.0, 19.0, 16.0, 15.0, 8.0, 13.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.0416259765625, -11.637939453125, -11.2342529296875, -10.83056640625, -10.4268798828125, -10.023193359375, -9.6195068359375, -9.2158203125, -8.8121337890625, -8.408447265625, -8.0047607421875, -7.60107421875, -7.1973876953125, -6.793701171875, -6.3900146484375, -5.986328125, -5.5826416015625, -5.178955078125, -4.7752685546875, -4.37158203125, -3.9678955078125, -3.564208984375, -3.1605224609375, -2.7568359375, -2.3531494140625, -1.949462890625, -1.5457763671875, -1.14208984375, -0.7384033203125, -0.334716796875, 0.0689697265625, 0.47265625, 0.8763427734375, 1.280029296875, 1.6837158203125, 2.08740234375, 2.4910888671875, 2.894775390625, 3.2984619140625, 3.7021484375, 4.1058349609375, 4.509521484375, 4.9132080078125, 5.31689453125, 5.7205810546875, 6.124267578125, 6.5279541015625, 6.931640625, 7.3353271484375, 7.739013671875, 8.1427001953125, 8.54638671875, 8.9500732421875, 9.353759765625, 9.7574462890625, 10.1611328125, 10.5648193359375, 10.968505859375, 11.3721923828125, 11.77587890625, 12.1795654296875, 12.583251953125, 12.9869384765625, 13.390625]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 6.0, 11.0, 23.0, 34.0, 38.0, 46.0, 80.0, 113.0, 159.0, 261.0, 352.0, 529.0, 792.0, 1121.0, 1589.0, 2379.0, 4013.0, 6112.0, 9868.0, 17360.0, 31192.0, 60609.0, 126407.0, 279536.0, 621375.0, 1123482.0, 987334.0, 490009.0, 217164.0, 99216.0, 49247.0, 25749.0, 14409.0, 8503.0, 5197.0, 3232.0, 2173.0, 1436.0, 963.0, 693.0, 454.0, 312.0, 242.0, 131.0, 109.0, 67.0, 52.0, 37.0, 23.0, 12.0, 8.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0], "bins": [-20.359375, -19.739501953125, -19.11962890625, -18.499755859375, -17.8798828125, -17.260009765625, -16.64013671875, -16.020263671875, -15.400390625, -14.780517578125, -14.16064453125, -13.540771484375, -12.9208984375, -12.301025390625, -11.68115234375, -11.061279296875, -10.44140625, -9.821533203125, -9.20166015625, -8.581787109375, -7.9619140625, -7.342041015625, -6.72216796875, -6.102294921875, -5.482421875, -4.862548828125, -4.24267578125, -3.622802734375, -3.0029296875, -2.383056640625, -1.76318359375, -1.143310546875, -0.5234375, 0.096435546875, 0.71630859375, 1.336181640625, 1.9560546875, 2.575927734375, 3.19580078125, 3.815673828125, 4.435546875, 5.055419921875, 5.67529296875, 6.295166015625, 6.9150390625, 7.534912109375, 8.15478515625, 8.774658203125, 9.39453125, 10.014404296875, 10.63427734375, 11.254150390625, 11.8740234375, 12.493896484375, 13.11376953125, 13.733642578125, 14.353515625, 14.973388671875, 15.59326171875, 16.213134765625, 16.8330078125, 17.452880859375, 18.07275390625, 18.692626953125, 19.3125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 8.0, 8.0, 7.0, 13.0, 12.0, 18.0, 22.0, 30.0, 38.0, 33.0, 53.0, 77.0, 96.0, 116.0, 147.0, 178.0, 243.0, 235.0, 270.0, 326.0, 282.0, 287.0, 286.0, 244.0, 184.0, 156.0, 161.0, 117.0, 80.0, 56.0, 46.0, 53.0, 38.0, 42.0, 18.0, 19.0, 15.0, 18.0, 14.0, 7.0, 6.0, 0.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.08203125, -5.88873291015625, -5.6954345703125, -5.50213623046875, -5.308837890625, -5.11553955078125, -4.9222412109375, -4.72894287109375, -4.53564453125, -4.34234619140625, -4.1490478515625, -3.95574951171875, -3.762451171875, -3.56915283203125, -3.3758544921875, -3.18255615234375, -2.9892578125, -2.79595947265625, -2.6026611328125, -2.40936279296875, -2.216064453125, -2.02276611328125, -1.8294677734375, -1.63616943359375, -1.44287109375, -1.24957275390625, -1.0562744140625, -0.86297607421875, -0.669677734375, -0.47637939453125, -0.2830810546875, -0.08978271484375, 0.103515625, 0.29681396484375, 0.4901123046875, 0.68341064453125, 0.876708984375, 1.07000732421875, 1.2633056640625, 1.45660400390625, 1.64990234375, 1.84320068359375, 2.0364990234375, 2.22979736328125, 2.423095703125, 2.61639404296875, 2.8096923828125, 3.00299072265625, 3.1962890625, 3.38958740234375, 3.5828857421875, 3.77618408203125, 3.969482421875, 4.16278076171875, 4.3560791015625, 4.54937744140625, 4.74267578125, 4.93597412109375, 5.1292724609375, 5.32257080078125, 5.515869140625, 5.70916748046875, 5.9024658203125, 6.09576416015625, 6.2890625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 5.0, 7.0, 14.0, 11.0, 21.0, 18.0, 25.0, 39.0, 35.0, 48.0, 51.0, 67.0, 66.0, 67.0, 85.0, 74.0, 67.0, 57.0, 52.0, 48.0, 44.0, 15.0, 17.0, 16.0, 11.0, 6.0, 4.0, 5.0, 2.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.09061622619629, -20.388193130493164, -19.68577003479004, -18.983346939086914, -18.28092384338379, -17.578502655029297, -16.876079559326172, -16.173656463623047, -15.471233367919922, -14.768810272216797, -14.066387176513672, -13.363964080810547, -12.661541938781738, -11.959118843078613, -11.256695747375488, -10.55427360534668, -9.851849555969238, -9.149426460266113, -8.447003364562988, -7.7445807456970215, -7.042158126831055, -6.33973503112793, -5.637311935424805, -4.934889316558838, -4.232466220855713, -3.530043363571167, -2.827620506286621, -2.125197410583496, -1.4227745532989502, -0.7203516960144043, -0.017928600311279297, 0.6844940185546875, 1.3869171142578125, 2.0893399715423584, 2.7917628288269043, 3.4941859245300293, 4.196608543395996, 4.899031639099121, 5.601454734802246, 6.303877353668213, 7.006300449371338, 7.708723545074463, 8.41114616394043, 9.113569259643555, 9.81599235534668, 10.518415451049805, 11.22083854675293, 11.923260688781738, 12.625683784484863, 13.328106880187988, 14.030529975891113, 14.732952117919922, 15.435375213623047, 16.137798309326172, 16.840221405029297, 17.542644500732422, 18.245067596435547, 18.947490692138672, 19.649913787841797, 20.352336883544922, 21.054759979248047, 21.757183074951172, 22.459606170654297, 23.16202735900879, 23.864450454711914]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 7.0, 7.0, 5.0, 10.0, 16.0, 17.0, 15.0, 18.0, 17.0, 38.0, 37.0, 46.0, 39.0, 33.0, 44.0, 55.0, 44.0, 40.0, 46.0, 50.0, 35.0, 37.0, 47.0, 34.0, 50.0, 23.0, 24.0, 35.0, 24.0, 22.0, 23.0, 19.0, 9.0, 5.0, 12.0, 5.0, 3.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.85476303100586, -18.307764053344727, -17.760765075683594, -17.21376609802246, -16.666767120361328, -16.119768142700195, -15.572769165039062, -15.02577018737793, -14.478771209716797, -13.931772232055664, -13.384773254394531, -12.837774276733398, -12.290775299072266, -11.743776321411133, -11.19677734375, -10.649778366088867, -10.102779388427734, -9.555780410766602, -9.008781433105469, -8.461782455444336, -7.914783477783203, -7.36778450012207, -6.8207855224609375, -6.273786544799805, -5.726787567138672, -5.179788589477539, -4.632789611816406, -4.085790634155273, -3.5387916564941406, -2.991792678833008, -2.444793701171875, -1.8977947235107422, -1.3507938385009766, -0.8037948608398438, -0.25679588317871094, 0.2902030944824219, 0.8372020721435547, 1.3842010498046875, 1.9312000274658203, 2.478199005126953, 3.025197982788086, 3.5721969604492188, 4.119195938110352, 4.666194915771484, 5.213193893432617, 5.76019287109375, 6.307191848754883, 6.854190826416016, 7.401189804077148, 7.948188781738281, 8.495187759399414, 9.042186737060547, 9.58918571472168, 10.136184692382812, 10.683183670043945, 11.230182647705078, 11.777181625366211, 12.324180603027344, 12.871179580688477, 13.41817855834961, 13.965177536010742, 14.512176513671875, 15.059175491333008, 15.60617446899414, 16.153173446655273]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 2.0, 9.0, 13.0, 16.0, 18.0, 24.0, 47.0, 61.0, 82.0, 107.0, 152.0, 266.0, 329.0, 484.0, 690.0, 1103.0, 1539.0, 2471.0, 3800.0, 6092.0, 10224.0, 17452.0, 30273.0, 55875.0, 105671.0, 190598.0, 241624.0, 170599.0, 92394.0, 49293.0, 26879.0, 15401.0, 8982.0, 5589.0, 3522.0, 2286.0, 1461.0, 965.0, 652.0, 476.0, 298.0, 221.0, 162.0, 95.0, 84.0, 58.0, 24.0, 27.0, 22.0, 14.0, 10.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-8.5546875, -8.29852294921875, -8.0423583984375, -7.78619384765625, -7.530029296875, -7.27386474609375, -7.0177001953125, -6.76153564453125, -6.50537109375, -6.24920654296875, -5.9930419921875, -5.73687744140625, -5.480712890625, -5.22454833984375, -4.9683837890625, -4.71221923828125, -4.4560546875, -4.19989013671875, -3.9437255859375, -3.68756103515625, -3.431396484375, -3.17523193359375, -2.9190673828125, -2.66290283203125, -2.40673828125, -2.15057373046875, -1.8944091796875, -1.63824462890625, -1.382080078125, -1.12591552734375, -0.8697509765625, -0.61358642578125, -0.357421875, -0.10125732421875, 0.1549072265625, 0.41107177734375, 0.667236328125, 0.92340087890625, 1.1795654296875, 1.43572998046875, 1.69189453125, 1.94805908203125, 2.2042236328125, 2.46038818359375, 2.716552734375, 2.97271728515625, 3.2288818359375, 3.48504638671875, 3.7412109375, 3.99737548828125, 4.2535400390625, 4.50970458984375, 4.765869140625, 5.02203369140625, 5.2781982421875, 5.53436279296875, 5.79052734375, 6.04669189453125, 6.3028564453125, 6.55902099609375, 6.815185546875, 7.07135009765625, 7.3275146484375, 7.58367919921875, 7.83984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 5.0, 1.0, 10.0, 14.0, 6.0, 14.0, 16.0, 23.0, 26.0, 27.0, 20.0, 28.0, 39.0, 50.0, 43.0, 38.0, 42.0, 46.0, 41.0, 45.0, 47.0, 47.0, 33.0, 37.0, 37.0, 46.0, 32.0, 23.0, 24.0, 34.0, 21.0, 20.0, 12.0, 9.0, 11.0, 9.0, 6.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.671875, -17.12353515625, -16.5751953125, -16.02685546875, -15.478515625, -14.93017578125, -14.3818359375, -13.83349609375, -13.28515625, -12.73681640625, -12.1884765625, -11.64013671875, -11.091796875, -10.54345703125, -9.9951171875, -9.44677734375, -8.8984375, -8.35009765625, -7.8017578125, -7.25341796875, -6.705078125, -6.15673828125, -5.6083984375, -5.06005859375, -4.51171875, -3.96337890625, -3.4150390625, -2.86669921875, -2.318359375, -1.77001953125, -1.2216796875, -0.67333984375, -0.125, 0.42333984375, 0.9716796875, 1.52001953125, 2.068359375, 2.61669921875, 3.1650390625, 3.71337890625, 4.26171875, 4.81005859375, 5.3583984375, 5.90673828125, 6.455078125, 7.00341796875, 7.5517578125, 8.10009765625, 8.6484375, 9.19677734375, 9.7451171875, 10.29345703125, 10.841796875, 11.39013671875, 11.9384765625, 12.48681640625, 13.03515625, 13.58349609375, 14.1318359375, 14.68017578125, 15.228515625, 15.77685546875, 16.3251953125, 16.87353515625, 17.421875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 0.0, 5.0, 5.0, 9.0, 19.0, 18.0, 29.0, 40.0, 67.0, 96.0, 188.0, 203.0, 298.0, 431.0, 636.0, 956.0, 1433.0, 2180.0, 3640.0, 6086.0, 10809.0, 21578.0, 87040.0, 840977.0, 35270.0, 15217.0, 8162.0, 4752.0, 2831.0, 1794.0, 1201.0, 816.0, 577.0, 347.0, 266.0, 177.0, 101.0, 80.0, 61.0, 38.0, 27.0, 28.0, 14.0, 15.0, 16.0, 4.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.4375, -16.861328125, -16.28515625, -15.708984375, -15.1328125, -14.556640625, -13.98046875, -13.404296875, -12.828125, -12.251953125, -11.67578125, -11.099609375, -10.5234375, -9.947265625, -9.37109375, -8.794921875, -8.21875, -7.642578125, -7.06640625, -6.490234375, -5.9140625, -5.337890625, -4.76171875, -4.185546875, -3.609375, -3.033203125, -2.45703125, -1.880859375, -1.3046875, -0.728515625, -0.15234375, 0.423828125, 1.0, 1.576171875, 2.15234375, 2.728515625, 3.3046875, 3.880859375, 4.45703125, 5.033203125, 5.609375, 6.185546875, 6.76171875, 7.337890625, 7.9140625, 8.490234375, 9.06640625, 9.642578125, 10.21875, 10.794921875, 11.37109375, 11.947265625, 12.5234375, 13.099609375, 13.67578125, 14.251953125, 14.828125, 15.404296875, 15.98046875, 16.556640625, 17.1328125, 17.708984375, 18.28515625, 18.861328125, 19.4375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 9.0, 12.0, 14.0, 24.0, 12.0, 28.0, 26.0, 35.0, 27.0, 39.0, 40.0, 34.0, 32.0, 43.0, 48.0, 44.0, 47.0, 41.0, 44.0, 42.0, 40.0, 30.0, 36.0, 34.0, 28.0, 37.0, 22.0, 18.0, 18.0, 14.0, 12.0, 10.0, 6.0, 4.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.5186767578125, -13.123291015625, -12.7279052734375, -12.33251953125, -11.9371337890625, -11.541748046875, -11.1463623046875, -10.7509765625, -10.3555908203125, -9.960205078125, -9.5648193359375, -9.16943359375, -8.7740478515625, -8.378662109375, -7.9832763671875, -7.587890625, -7.1925048828125, -6.797119140625, -6.4017333984375, -6.00634765625, -5.6109619140625, -5.215576171875, -4.8201904296875, -4.4248046875, -4.0294189453125, -3.634033203125, -3.2386474609375, -2.84326171875, -2.4478759765625, -2.052490234375, -1.6571044921875, -1.26171875, -0.8663330078125, -0.470947265625, -0.0755615234375, 0.31982421875, 0.7152099609375, 1.110595703125, 1.5059814453125, 1.9013671875, 2.2967529296875, 2.692138671875, 3.0875244140625, 3.48291015625, 3.8782958984375, 4.273681640625, 4.6690673828125, 5.064453125, 5.4598388671875, 5.855224609375, 6.2506103515625, 6.64599609375, 7.0413818359375, 7.436767578125, 7.8321533203125, 8.2275390625, 8.6229248046875, 9.018310546875, 9.4136962890625, 9.80908203125, 10.2044677734375, 10.599853515625, 10.9952392578125, 11.390625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 12.0, 11.0, 25.0, 44.0, 54.0, 83.0, 126.0, 209.0, 302.0, 536.0, 875.0, 1666.0, 3280.0, 7112.0, 19142.0, 280948.0, 697602.0, 21227.0, 7755.0, 3436.0, 1742.0, 928.0, 537.0, 311.0, 209.0, 115.0, 99.0, 48.0, 32.0, 24.0, 29.0, 9.0, 5.0, 5.0, 8.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.9375, -9.5953369140625, -9.253173828125, -8.9110107421875, -8.56884765625, -8.2266845703125, -7.884521484375, -7.5423583984375, -7.2001953125, -6.8580322265625, -6.515869140625, -6.1737060546875, -5.83154296875, -5.4893798828125, -5.147216796875, -4.8050537109375, -4.462890625, -4.1207275390625, -3.778564453125, -3.4364013671875, -3.09423828125, -2.7520751953125, -2.409912109375, -2.0677490234375, -1.7255859375, -1.3834228515625, -1.041259765625, -0.6990966796875, -0.35693359375, -0.0147705078125, 0.327392578125, 0.6695556640625, 1.01171875, 1.3538818359375, 1.696044921875, 2.0382080078125, 2.38037109375, 2.7225341796875, 3.064697265625, 3.4068603515625, 3.7490234375, 4.0911865234375, 4.433349609375, 4.7755126953125, 5.11767578125, 5.4598388671875, 5.802001953125, 6.1441650390625, 6.486328125, 6.8284912109375, 7.170654296875, 7.5128173828125, 7.85498046875, 8.1971435546875, 8.539306640625, 8.8814697265625, 9.2236328125, 9.5657958984375, 9.907958984375, 10.2501220703125, 10.59228515625, 10.9344482421875, 11.276611328125, 11.6187744140625, 11.9609375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 8.0, 8.0, 9.0, 11.0, 16.0, 22.0, 26.0, 39.0, 43.0, 58.0, 76.0, 149.0, 156.0, 95.0, 60.0, 46.0, 41.0, 27.0, 16.0, 14.0, 12.0, 15.0, 5.0, 6.0, 2.0, 8.0, 2.0, 9.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0008363723754882812, -0.0008103474974632263, -0.0007843226194381714, -0.0007582977414131165, -0.0007322728633880615, -0.0007062479853630066, -0.0006802231073379517, -0.0006541982293128967, -0.0006281733512878418, -0.0006021484732627869, -0.0005761235952377319, -0.000550098717212677, -0.0005240738391876221, -0.0004980489611625671, -0.0004720240831375122, -0.0004459992051124573, -0.00041997432708740234, -0.0003939494490623474, -0.0003679245710372925, -0.00034189969301223755, -0.0003158748149871826, -0.0002898499369621277, -0.00026382505893707275, -0.00023780018091201782, -0.0002117753028869629, -0.00018575042486190796, -0.00015972554683685303, -0.0001337006688117981, -0.00010767579078674316, -8.165091276168823e-05, -5.56260347366333e-05, -2.960115671157837e-05, -3.5762786865234375e-06, 2.2448599338531494e-05, 4.8473477363586426e-05, 7.449835538864136e-05, 0.00010052323341369629, 0.00012654811143875122, 0.00015257298946380615, 0.00017859786748886108, 0.00020462274551391602, 0.00023064762353897095, 0.0002566725015640259, 0.0002826973795890808, 0.00030872225761413574, 0.0003347471356391907, 0.0003607720136642456, 0.00038679689168930054, 0.00041282176971435547, 0.0004388466477394104, 0.00046487152576446533, 0.0004908964037895203, 0.0005169212818145752, 0.0005429461598396301, 0.0005689710378646851, 0.00059499591588974, 0.0006210207939147949, 0.0006470456719398499, 0.0006730705499649048, 0.0006990954279899597, 0.0007251203060150146, 0.0007511451840400696, 0.0007771700620651245, 0.0008031949400901794, 0.0008292198181152344]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 18.0, 24.0, 43.0, 44.0, 64.0, 73.0, 170.0, 188.0, 259.0, 396.0, 505.0, 647.0, 1003.0, 1376.0, 2207.0, 3298.0, 5014.0, 8232.0, 13592.0, 23360.0, 41796.0, 78212.0, 143545.0, 225865.0, 212067.0, 126674.0, 68395.0, 37054.0, 20824.0, 12090.0, 7363.0, 4618.0, 3030.0, 1917.0, 1352.0, 959.0, 644.0, 465.0, 353.0, 220.0, 174.0, 129.0, 93.0, 58.0, 40.0, 32.0, 18.0, 12.0, 15.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.0703125, -2.005401611328125, -1.94049072265625, -1.875579833984375, -1.8106689453125, -1.745758056640625, -1.68084716796875, -1.615936279296875, -1.551025390625, -1.486114501953125, -1.42120361328125, -1.356292724609375, -1.2913818359375, -1.226470947265625, -1.16156005859375, -1.096649169921875, -1.03173828125, -0.966827392578125, -0.90191650390625, -0.837005615234375, -0.7720947265625, -0.707183837890625, -0.64227294921875, -0.577362060546875, -0.512451171875, -0.447540283203125, -0.38262939453125, -0.317718505859375, -0.2528076171875, -0.187896728515625, -0.12298583984375, -0.058074951171875, 0.0068359375, 0.071746826171875, 0.13665771484375, 0.201568603515625, 0.2664794921875, 0.331390380859375, 0.39630126953125, 0.461212158203125, 0.526123046875, 0.591033935546875, 0.65594482421875, 0.720855712890625, 0.7857666015625, 0.850677490234375, 0.91558837890625, 0.980499267578125, 1.04541015625, 1.110321044921875, 1.17523193359375, 1.240142822265625, 1.3050537109375, 1.369964599609375, 1.43487548828125, 1.499786376953125, 1.564697265625, 1.629608154296875, 1.69451904296875, 1.759429931640625, 1.8243408203125, 1.889251708984375, 1.95416259765625, 2.019073486328125, 2.083984375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 0.0, 7.0, 5.0, 9.0, 6.0, 8.0, 11.0, 20.0, 16.0, 21.0, 33.0, 32.0, 36.0, 38.0, 57.0, 62.0, 64.0, 78.0, 64.0, 67.0, 51.0, 45.0, 41.0, 54.0, 24.0, 25.0, 29.0, 15.0, 12.0, 13.0, 7.0, 9.0, 10.0, 5.0, 4.0, 7.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47607421875, -0.45957183837890625, -0.4430694580078125, -0.42656707763671875, -0.410064697265625, -0.39356231689453125, -0.3770599365234375, -0.36055755615234375, -0.34405517578125, -0.32755279541015625, -0.3110504150390625, -0.29454803466796875, -0.278045654296875, -0.26154327392578125, -0.2450408935546875, -0.22853851318359375, -0.2120361328125, -0.19553375244140625, -0.1790313720703125, -0.16252899169921875, -0.146026611328125, -0.12952423095703125, -0.1130218505859375, -0.09651947021484375, -0.08001708984375, -0.06351470947265625, -0.0470123291015625, -0.03050994873046875, -0.014007568359375, 0.00249481201171875, 0.0189971923828125, 0.03549957275390625, 0.052001953125, 0.06850433349609375, 0.0850067138671875, 0.10150909423828125, 0.118011474609375, 0.13451385498046875, 0.1510162353515625, 0.16751861572265625, 0.18402099609375, 0.20052337646484375, 0.2170257568359375, 0.23352813720703125, 0.250030517578125, 0.26653289794921875, 0.2830352783203125, 0.29953765869140625, 0.3160400390625, 0.33254241943359375, 0.3490447998046875, 0.36554718017578125, 0.382049560546875, 0.39855194091796875, 0.4150543212890625, 0.43155670166015625, 0.44805908203125, 0.46456146240234375, 0.4810638427734375, 0.49756622314453125, 0.514068603515625, 0.5305709838867188, 0.5470733642578125, 0.5635757446289062, 0.580078125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 3.0, 5.0, 12.0, 17.0, 20.0, 25.0, 30.0, 34.0, 44.0, 49.0, 59.0, 57.0, 61.0, 68.0, 77.0, 79.0, 72.0, 53.0, 47.0, 39.0, 34.0, 24.0, 16.0, 13.0, 9.0, 8.0, 5.0, 5.0, 1.0, 6.0, 4.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.875024795532227, -19.204059600830078, -18.533092498779297, -17.86212730407715, -17.191160202026367, -16.52019500732422, -15.849228858947754, -15.178262710571289, -14.507296562194824, -13.83633041381836, -13.165364265441895, -12.49439811706543, -11.823432922363281, -11.1524658203125, -10.481500625610352, -9.810534477233887, -9.139568328857422, -8.468602180480957, -7.797636032104492, -7.1266703605651855, -6.455704212188721, -5.784738063812256, -5.113772392272949, -4.442806243896484, -3.7718400955200195, -3.1008739471435547, -2.429908037185669, -1.7589421272277832, -1.0879759788513184, -0.4170098304748535, 0.2539558410644531, 0.924921989440918, 1.5958900451660156, 2.2668561935424805, 2.937822103500366, 3.608788013458252, 4.279754161834717, 4.950720310211182, 5.621685981750488, 6.292652130126953, 6.963618278503418, 7.634584426879883, 8.305550575256348, 8.976516723632812, 9.647481918334961, 10.318449020385742, 10.98941421508789, 11.660380363464355, 12.33134651184082, 13.002312660217285, 13.67327880859375, 14.344244003295898, 15.01521110534668, 15.686176300048828, 16.35714340209961, 17.028108596801758, 17.699073791503906, 18.370038986206055, 19.041006088256836, 19.711971282958984, 20.382938385009766, 21.053903579711914, 21.724868774414062, 22.395835876464844, 23.066802978515625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 8.0, 6.0, 8.0, 7.0, 18.0, 17.0, 14.0, 21.0, 20.0, 33.0, 37.0, 49.0, 36.0, 36.0, 47.0, 51.0, 49.0, 36.0, 49.0, 43.0, 41.0, 35.0, 50.0, 34.0, 44.0, 24.0, 29.0, 35.0, 24.0, 19.0, 23.0, 17.0, 7.0, 8.0, 8.0, 7.0, 3.0, 6.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.524703979492188, -17.98550796508789, -17.446311950683594, -16.907114028930664, -16.367918014526367, -15.82872200012207, -15.289525985717773, -14.75032901763916, -14.211132049560547, -13.67193603515625, -13.132739067077637, -12.59354305267334, -12.054346084594727, -11.51515007019043, -10.975954055786133, -10.43675708770752, -9.897561073303223, -9.358365058898926, -8.819168090820312, -8.279972076416016, -7.740775108337402, -7.2015790939331055, -6.66238260269165, -6.123186111450195, -5.58398962020874, -5.044793128967285, -4.50559663772583, -3.966400384902954, -3.427203893661499, -2.888007402420044, -2.348811149597168, -1.809614658355713, -1.2704191207885742, -0.7312226891517639, -0.1920262575149536, 0.3471701145172119, 0.886366605758667, 1.425563097000122, 1.964759349822998, 2.503955841064453, 3.043152332305908, 3.5823488235473633, 4.121545314788818, 4.660741806030273, 5.19993782043457, 5.739134788513184, 6.2783308029174805, 6.8175272941589355, 7.356723785400391, 7.895920276641846, 8.4351167678833, 8.974312782287598, 9.513509750366211, 10.052705764770508, 10.591901779174805, 11.131098747253418, 11.670295715332031, 12.209491729736328, 12.748688697814941, 13.287884712219238, 13.827081680297852, 14.366277694702148, 14.905473709106445, 15.444670677185059, 15.983866691589355]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 1.0, 8.0, 11.0, 16.0, 24.0, 34.0, 36.0, 57.0, 77.0, 113.0, 181.0, 244.0, 353.0, 502.0, 722.0, 1067.0, 1544.0, 2336.0, 3322.0, 5320.0, 8171.0, 12864.0, 20739.0, 34090.0, 57875.0, 99114.0, 159452.0, 200428.0, 169798.0, 107308.0, 63192.0, 37346.0, 22292.0, 13979.0, 8713.0, 5757.0, 3698.0, 2506.0, 1691.0, 1069.0, 762.0, 493.0, 378.0, 258.0, 174.0, 138.0, 90.0, 66.0, 45.0, 28.0, 25.0, 18.0, 14.0, 7.0, 2.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-17.875, -17.29052734375, -16.7060546875, -16.12158203125, -15.537109375, -14.95263671875, -14.3681640625, -13.78369140625, -13.19921875, -12.61474609375, -12.0302734375, -11.44580078125, -10.861328125, -10.27685546875, -9.6923828125, -9.10791015625, -8.5234375, -7.93896484375, -7.3544921875, -6.77001953125, -6.185546875, -5.60107421875, -5.0166015625, -4.43212890625, -3.84765625, -3.26318359375, -2.6787109375, -2.09423828125, -1.509765625, -0.92529296875, -0.3408203125, 0.24365234375, 0.828125, 1.41259765625, 1.9970703125, 2.58154296875, 3.166015625, 3.75048828125, 4.3349609375, 4.91943359375, 5.50390625, 6.08837890625, 6.6728515625, 7.25732421875, 7.841796875, 8.42626953125, 9.0107421875, 9.59521484375, 10.1796875, 10.76416015625, 11.3486328125, 11.93310546875, 12.517578125, 13.10205078125, 13.6865234375, 14.27099609375, 14.85546875, 15.43994140625, 16.0244140625, 16.60888671875, 17.193359375, 17.77783203125, 18.3623046875, 18.94677734375, 19.53125]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 17.0, 15.0, 15.0, 18.0, 22.0, 23.0, 32.0, 41.0, 31.0, 36.0, 53.0, 42.0, 46.0, 37.0, 47.0, 54.0, 44.0, 33.0, 46.0, 39.0, 27.0, 48.0, 29.0, 25.0, 27.0, 20.0, 31.0, 14.0, 19.0, 12.0, 10.0, 10.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.4375, -15.9610595703125, -15.484619140625, -15.0081787109375, -14.53173828125, -14.0552978515625, -13.578857421875, -13.1024169921875, -12.6259765625, -12.1495361328125, -11.673095703125, -11.1966552734375, -10.72021484375, -10.2437744140625, -9.767333984375, -9.2908935546875, -8.814453125, -8.3380126953125, -7.861572265625, -7.3851318359375, -6.90869140625, -6.4322509765625, -5.955810546875, -5.4793701171875, -5.0029296875, -4.5264892578125, -4.050048828125, -3.5736083984375, -3.09716796875, -2.6207275390625, -2.144287109375, -1.6678466796875, -1.19140625, -0.7149658203125, -0.238525390625, 0.2379150390625, 0.71435546875, 1.1907958984375, 1.667236328125, 2.1436767578125, 2.6201171875, 3.0965576171875, 3.572998046875, 4.0494384765625, 4.52587890625, 5.0023193359375, 5.478759765625, 5.9552001953125, 6.431640625, 6.9080810546875, 7.384521484375, 7.8609619140625, 8.33740234375, 8.8138427734375, 9.290283203125, 9.7667236328125, 10.2431640625, 10.7196044921875, 11.196044921875, 11.6724853515625, 12.14892578125, 12.6253662109375, 13.101806640625, 13.5782470703125, 14.0546875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 8.0, 9.0, 18.0, 23.0, 25.0, 54.0, 102.0, 154.0, 245.0, 389.0, 637.0, 1073.0, 1884.0, 3086.0, 5115.0, 8857.0, 15747.0, 28307.0, 51468.0, 94340.0, 158699.0, 212492.0, 189929.0, 121725.0, 68136.0, 37574.0, 20766.0, 11515.0, 6506.0, 3883.0, 2271.0, 1360.0, 823.0, 487.0, 339.0, 196.0, 123.0, 55.0, 54.0, 29.0, 23.0, 10.0, 11.0, 2.0, 3.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.03125, -17.5120849609375, -16.992919921875, -16.4737548828125, -15.95458984375, -15.4354248046875, -14.916259765625, -14.3970947265625, -13.8779296875, -13.3587646484375, -12.839599609375, -12.3204345703125, -11.80126953125, -11.2821044921875, -10.762939453125, -10.2437744140625, -9.724609375, -9.2054443359375, -8.686279296875, -8.1671142578125, -7.64794921875, -7.1287841796875, -6.609619140625, -6.0904541015625, -5.5712890625, -5.0521240234375, -4.532958984375, -4.0137939453125, -3.49462890625, -2.9754638671875, -2.456298828125, -1.9371337890625, -1.41796875, -0.8988037109375, -0.379638671875, 0.1395263671875, 0.65869140625, 1.1778564453125, 1.697021484375, 2.2161865234375, 2.7353515625, 3.2545166015625, 3.773681640625, 4.2928466796875, 4.81201171875, 5.3311767578125, 5.850341796875, 6.3695068359375, 6.888671875, 7.4078369140625, 7.927001953125, 8.4461669921875, 8.96533203125, 9.4844970703125, 10.003662109375, 10.5228271484375, 11.0419921875, 11.5611572265625, 12.080322265625, 12.5994873046875, 13.11865234375, 13.6378173828125, 14.156982421875, 14.6761474609375, 15.1953125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 8.0, 13.0, 13.0, 10.0, 18.0, 17.0, 31.0, 40.0, 26.0, 30.0, 34.0, 35.0, 43.0, 49.0, 32.0, 30.0, 52.0, 25.0, 42.0, 39.0, 37.0, 39.0, 46.0, 30.0, 43.0, 27.0, 25.0, 22.0, 23.0, 14.0, 19.0, 21.0, 11.0, 7.0, 7.0, 4.0, 4.0, 9.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3671875, -9.0867919921875, -8.806396484375, -8.5260009765625, -8.24560546875, -7.9652099609375, -7.684814453125, -7.4044189453125, -7.1240234375, -6.8436279296875, -6.563232421875, -6.2828369140625, -6.00244140625, -5.7220458984375, -5.441650390625, -5.1612548828125, -4.880859375, -4.6004638671875, -4.320068359375, -4.0396728515625, -3.75927734375, -3.4788818359375, -3.198486328125, -2.9180908203125, -2.6376953125, -2.3572998046875, -2.076904296875, -1.7965087890625, -1.51611328125, -1.2357177734375, -0.955322265625, -0.6749267578125, -0.39453125, -0.1141357421875, 0.166259765625, 0.4466552734375, 0.72705078125, 1.0074462890625, 1.287841796875, 1.5682373046875, 1.8486328125, 2.1290283203125, 2.409423828125, 2.6898193359375, 2.97021484375, 3.2506103515625, 3.531005859375, 3.8114013671875, 4.091796875, 4.3721923828125, 4.652587890625, 4.9329833984375, 5.21337890625, 5.4937744140625, 5.774169921875, 6.0545654296875, 6.3349609375, 6.6153564453125, 6.895751953125, 7.1761474609375, 7.45654296875, 7.7369384765625, 8.017333984375, 8.2977294921875, 8.578125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 18.0, 15.0, 23.0, 20.0, 50.0, 57.0, 95.0, 119.0, 241.0, 386.0, 671.0, 1324.0, 2468.0, 5339.0, 12977.0, 38287.0, 151302.0, 468241.0, 268411.0, 64346.0, 19547.0, 7576.0, 3272.0, 1688.0, 861.0, 463.0, 264.0, 155.0, 115.0, 64.0, 37.0, 34.0, 30.0, 23.0, 9.0, 7.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-40.8125, -39.700439453125, -38.58837890625, -37.476318359375, -36.3642578125, -35.252197265625, -34.14013671875, -33.028076171875, -31.916015625, -30.803955078125, -29.69189453125, -28.579833984375, -27.4677734375, -26.355712890625, -25.24365234375, -24.131591796875, -23.01953125, -21.907470703125, -20.79541015625, -19.683349609375, -18.5712890625, -17.459228515625, -16.34716796875, -15.235107421875, -14.123046875, -13.010986328125, -11.89892578125, -10.786865234375, -9.6748046875, -8.562744140625, -7.45068359375, -6.338623046875, -5.2265625, -4.114501953125, -3.00244140625, -1.890380859375, -0.7783203125, 0.333740234375, 1.44580078125, 2.557861328125, 3.669921875, 4.781982421875, 5.89404296875, 7.006103515625, 8.1181640625, 9.230224609375, 10.34228515625, 11.454345703125, 12.56640625, 13.678466796875, 14.79052734375, 15.902587890625, 17.0146484375, 18.126708984375, 19.23876953125, 20.350830078125, 21.462890625, 22.574951171875, 23.68701171875, 24.799072265625, 25.9111328125, 27.023193359375, 28.13525390625, 29.247314453125, 30.359375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 6.0, 18.0, 13.0, 28.0, 43.0, 54.0, 75.0, 103.0, 111.0, 89.0, 111.0, 79.0, 61.0, 43.0, 36.0, 29.0, 14.0, 12.0, 12.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028171539306640625, -0.0027351677417755127, -0.002653181552886963, -0.002571195363998413, -0.0024892091751098633, -0.0024072229862213135, -0.0023252367973327637, -0.002243250608444214, -0.002161264419555664, -0.0020792782306671143, -0.0019972920417785645, -0.0019153058528900146, -0.0018333196640014648, -0.001751333475112915, -0.0016693472862243652, -0.0015873610973358154, -0.0015053749084472656, -0.0014233887195587158, -0.001341402530670166, -0.0012594163417816162, -0.0011774301528930664, -0.0010954439640045166, -0.0010134577751159668, -0.000931471586227417, -0.0008494853973388672, -0.0007674992084503174, -0.0006855130195617676, -0.0006035268306732178, -0.000521540641784668, -0.00043955445289611816, -0.00035756826400756836, -0.00027558207511901855, -0.00019359588623046875, -0.00011160969734191895, -2.962350845336914e-05, 5.2362680435180664e-05, 0.00013434886932373047, 0.00021633505821228027, 0.0002983212471008301, 0.0003803074359893799, 0.0004622936248779297, 0.0005442798137664795, 0.0006262660026550293, 0.0007082521915435791, 0.0007902383804321289, 0.0008722245693206787, 0.0009542107582092285, 0.0010361969470977783, 0.0011181831359863281, 0.001200169324874878, 0.0012821555137634277, 0.0013641417026519775, 0.0014461278915405273, 0.0015281140804290771, 0.001610100269317627, 0.0016920864582061768, 0.0017740726470947266, 0.0018560588359832764, 0.0019380450248718262, 0.002020031213760376, 0.0021020174026489258, 0.0021840035915374756, 0.0022659897804260254, 0.002347975969314575, 0.002429962158203125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 7.0, 10.0, 19.0, 14.0, 22.0, 36.0, 38.0, 41.0, 57.0, 77.0, 117.0, 170.0, 255.0, 420.0, 711.0, 1299.0, 2656.0, 6356.0, 16951.0, 55664.0, 200505.0, 428738.0, 234670.0, 66208.0, 19896.0, 7014.0, 3016.0, 1464.0, 781.0, 410.0, 256.0, 172.0, 118.0, 82.0, 61.0, 55.0, 42.0, 35.0, 25.0, 14.0, 14.0, 14.0, 12.0, 6.0, 5.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-30.765625, -29.791015625, -28.81640625, -27.841796875, -26.8671875, -25.892578125, -24.91796875, -23.943359375, -22.96875, -21.994140625, -21.01953125, -20.044921875, -19.0703125, -18.095703125, -17.12109375, -16.146484375, -15.171875, -14.197265625, -13.22265625, -12.248046875, -11.2734375, -10.298828125, -9.32421875, -8.349609375, -7.375, -6.400390625, -5.42578125, -4.451171875, -3.4765625, -2.501953125, -1.52734375, -0.552734375, 0.421875, 1.396484375, 2.37109375, 3.345703125, 4.3203125, 5.294921875, 6.26953125, 7.244140625, 8.21875, 9.193359375, 10.16796875, 11.142578125, 12.1171875, 13.091796875, 14.06640625, 15.041015625, 16.015625, 16.990234375, 17.96484375, 18.939453125, 19.9140625, 20.888671875, 21.86328125, 22.837890625, 23.8125, 24.787109375, 25.76171875, 26.736328125, 27.7109375, 28.685546875, 29.66015625, 30.634765625, 31.609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 7.0, 3.0, 3.0, 4.0, 12.0, 5.0, 11.0, 14.0, 17.0, 27.0, 22.0, 38.0, 42.0, 49.0, 49.0, 37.0, 60.0, 64.0, 64.0, 66.0, 48.0, 52.0, 48.0, 39.0, 33.0, 37.0, 28.0, 24.0, 15.0, 16.0, 13.0, 14.0, 11.0, 6.0, 7.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.86328125, -3.7313232421875, -3.599365234375, -3.4674072265625, -3.33544921875, -3.2034912109375, -3.071533203125, -2.9395751953125, -2.8076171875, -2.6756591796875, -2.543701171875, -2.4117431640625, -2.27978515625, -2.1478271484375, -2.015869140625, -1.8839111328125, -1.751953125, -1.6199951171875, -1.488037109375, -1.3560791015625, -1.22412109375, -1.0921630859375, -0.960205078125, -0.8282470703125, -0.6962890625, -0.5643310546875, -0.432373046875, -0.3004150390625, -0.16845703125, -0.0364990234375, 0.095458984375, 0.2274169921875, 0.359375, 0.4913330078125, 0.623291015625, 0.7552490234375, 0.88720703125, 1.0191650390625, 1.151123046875, 1.2830810546875, 1.4150390625, 1.5469970703125, 1.678955078125, 1.8109130859375, 1.94287109375, 2.0748291015625, 2.206787109375, 2.3387451171875, 2.470703125, 2.6026611328125, 2.734619140625, 2.8665771484375, 2.99853515625, 3.1304931640625, 3.262451171875, 3.3944091796875, 3.5263671875, 3.6583251953125, 3.790283203125, 3.9222412109375, 4.05419921875, 4.1861572265625, 4.318115234375, 4.4500732421875, 4.58203125]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 4.0, 7.0, 8.0, 13.0, 16.0, 17.0, 27.0, 26.0, 33.0, 54.0, 56.0, 67.0, 71.0, 75.0, 67.0, 59.0, 52.0, 62.0, 60.0, 38.0, 45.0, 27.0, 21.0, 21.0, 25.0, 11.0, 8.0, 10.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.250307083129883, -18.629356384277344, -18.008403778076172, -17.387453079223633, -16.766502380371094, -16.145551681518555, -15.524599075317383, -14.903648376464844, -14.282697677612305, -13.66174602508545, -13.04079532623291, -12.419843673706055, -11.798892974853516, -11.17794132232666, -10.556989669799805, -9.936038970947266, -9.31508731842041, -8.694135665893555, -8.073184967041016, -7.45223331451416, -6.831282615661621, -6.210330963134766, -5.589379787445068, -4.968428611755371, -4.347477436065674, -3.7265262603759766, -3.1055750846862793, -2.484623670578003, -1.8636724948883057, -1.2427213191986084, -0.621769905090332, -0.0008187294006347656, 0.6201324462890625, 1.2410836219787598, 1.8620349168777466, 2.4829862117767334, 3.1039373874664307, 3.724888563156128, 4.345839977264404, 4.966791152954102, 5.587742328643799, 6.208693504333496, 6.829644680023193, 7.450595855712891, 8.071547508239746, 8.692498207092285, 9.31344985961914, 9.93440055847168, 10.555352210998535, 11.17630386352539, 11.79725456237793, 12.418206214904785, 13.039156913757324, 13.66010856628418, 14.281059265136719, 14.902010917663574, 15.52296257019043, 16.14391326904297, 16.76486587524414, 17.38581657409668, 18.00676727294922, 18.627717971801758, 19.24867057800293, 19.86962127685547, 20.490571975708008]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 0.0, 4.0, 8.0, 1.0, 8.0, 9.0, 12.0, 10.0, 14.0, 23.0, 13.0, 19.0, 31.0, 29.0, 27.0, 26.0, 44.0, 38.0, 33.0, 36.0, 34.0, 39.0, 56.0, 40.0, 40.0, 38.0, 39.0, 34.0, 30.0, 33.0, 32.0, 27.0, 25.0, 27.0, 19.0, 14.0, 26.0, 16.0, 6.0, 9.0, 7.0, 4.0, 4.0, 3.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-14.2223482131958, -13.786551475524902, -13.35075569152832, -12.914958953857422, -12.479162216186523, -12.043366432189941, -11.607569694519043, -11.171773910522461, -10.735977172851562, -10.300180435180664, -9.864384651184082, -9.428587913513184, -8.992792129516602, -8.556995391845703, -8.121198654174805, -7.6854023933410645, -7.249606132507324, -6.813809871673584, -6.378013610839844, -5.942216873168945, -5.506420612335205, -5.070624351501465, -4.634827613830566, -4.199031352996826, -3.763235092163086, -3.3274388313293457, -2.8916423320770264, -2.455845832824707, -2.020049571990967, -1.5842533111572266, -1.1484568119049072, -0.7126603126525879, -0.27686500549316406, 0.15893137454986572, 0.5947277545928955, 1.0305241346359253, 1.466320514678955, 1.9021167755126953, 2.3379132747650146, 2.773709774017334, 3.209506034851074, 3.6453022956848145, 4.081098556518555, 4.516895294189453, 4.952691555023193, 5.388487815856934, 5.824284553527832, 6.260080814361572, 6.6958770751953125, 7.131673336029053, 7.567469596862793, 8.003266334533691, 8.439062118530273, 8.874858856201172, 9.31065559387207, 9.746452331542969, 10.18224811553955, 10.61804485321045, 11.053840637207031, 11.48963737487793, 11.925434112548828, 12.36122989654541, 12.797026634216309, 13.23282241821289, 13.668619155883789]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 12.0, 10.0, 12.0, 13.0, 22.0, 31.0, 54.0, 49.0, 80.0, 107.0, 117.0, 180.0, 252.0, 350.0, 601.0, 898.0, 1229.0, 2072.0, 3323.0, 5505.0, 9981.0, 18981.0, 38196.0, 89105.0, 232238.0, 632572.0, 1208463.0, 1100142.0, 516235.0, 189167.0, 73783.0, 33079.0, 16215.0, 8708.0, 4796.0, 2879.0, 1633.0, 1071.0, 656.0, 431.0, 312.0, 216.0, 154.0, 106.0, 67.0, 50.0, 39.0, 35.0, 23.0, 20.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.9765625, -15.4593505859375, -14.942138671875, -14.4249267578125, -13.90771484375, -13.3905029296875, -12.873291015625, -12.3560791015625, -11.8388671875, -11.3216552734375, -10.804443359375, -10.2872314453125, -9.77001953125, -9.2528076171875, -8.735595703125, -8.2183837890625, -7.701171875, -7.1839599609375, -6.666748046875, -6.1495361328125, -5.63232421875, -5.1151123046875, -4.597900390625, -4.0806884765625, -3.5634765625, -3.0462646484375, -2.529052734375, -2.0118408203125, -1.49462890625, -0.9774169921875, -0.460205078125, 0.0570068359375, 0.57421875, 1.0914306640625, 1.608642578125, 2.1258544921875, 2.64306640625, 3.1602783203125, 3.677490234375, 4.1947021484375, 4.7119140625, 5.2291259765625, 5.746337890625, 6.2635498046875, 6.78076171875, 7.2979736328125, 7.815185546875, 8.3323974609375, 8.849609375, 9.3668212890625, 9.884033203125, 10.4012451171875, 10.91845703125, 11.4356689453125, 11.952880859375, 12.4700927734375, 12.9873046875, 13.5045166015625, 14.021728515625, 14.5389404296875, 15.05615234375, 15.5733642578125, 16.090576171875, 16.6077880859375, 17.125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 6.0, 6.0, 2.0, 9.0, 9.0, 12.0, 9.0, 7.0, 28.0, 27.0, 21.0, 33.0, 18.0, 20.0, 26.0, 32.0, 42.0, 33.0, 37.0, 36.0, 43.0, 47.0, 40.0, 35.0, 43.0, 41.0, 34.0, 31.0, 29.0, 34.0, 27.0, 17.0, 28.0, 22.0, 15.0, 16.0, 22.0, 12.0, 9.0, 9.0, 6.0, 9.0, 2.0, 4.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.8828125, -8.5960693359375, -8.309326171875, -8.0225830078125, -7.73583984375, -7.4490966796875, -7.162353515625, -6.8756103515625, -6.5888671875, -6.3021240234375, -6.015380859375, -5.7286376953125, -5.44189453125, -5.1551513671875, -4.868408203125, -4.5816650390625, -4.294921875, -4.0081787109375, -3.721435546875, -3.4346923828125, -3.14794921875, -2.8612060546875, -2.574462890625, -2.2877197265625, -2.0009765625, -1.7142333984375, -1.427490234375, -1.1407470703125, -0.85400390625, -0.5672607421875, -0.280517578125, 0.0062255859375, 0.29296875, 0.5797119140625, 0.866455078125, 1.1531982421875, 1.43994140625, 1.7266845703125, 2.013427734375, 2.3001708984375, 2.5869140625, 2.8736572265625, 3.160400390625, 3.4471435546875, 3.73388671875, 4.0206298828125, 4.307373046875, 4.5941162109375, 4.880859375, 5.1676025390625, 5.454345703125, 5.7410888671875, 6.02783203125, 6.3145751953125, 6.601318359375, 6.8880615234375, 7.1748046875, 7.4615478515625, 7.748291015625, 8.0350341796875, 8.32177734375, 8.6085205078125, 8.895263671875, 9.1820068359375, 9.46875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 17.0, 10.0, 26.0, 28.0, 57.0, 60.0, 112.0, 146.0, 230.0, 367.0, 543.0, 801.0, 1321.0, 2291.0, 3931.0, 6802.0, 13416.0, 28259.0, 68379.0, 191808.0, 593143.0, 1461263.0, 1179929.0, 409931.0, 134297.0, 50411.0, 22016.0, 10541.0, 5724.0, 3278.0, 1860.0, 1147.0, 749.0, 463.0, 293.0, 200.0, 137.0, 103.0, 61.0, 41.0, 28.0, 23.0, 8.0, 7.0, 7.0, 9.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.765625, -21.102783203125, -20.43994140625, -19.777099609375, -19.1142578125, -18.451416015625, -17.78857421875, -17.125732421875, -16.462890625, -15.800048828125, -15.13720703125, -14.474365234375, -13.8115234375, -13.148681640625, -12.48583984375, -11.822998046875, -11.16015625, -10.497314453125, -9.83447265625, -9.171630859375, -8.5087890625, -7.845947265625, -7.18310546875, -6.520263671875, -5.857421875, -5.194580078125, -4.53173828125, -3.868896484375, -3.2060546875, -2.543212890625, -1.88037109375, -1.217529296875, -0.5546875, 0.108154296875, 0.77099609375, 1.433837890625, 2.0966796875, 2.759521484375, 3.42236328125, 4.085205078125, 4.748046875, 5.410888671875, 6.07373046875, 6.736572265625, 7.3994140625, 8.062255859375, 8.72509765625, 9.387939453125, 10.05078125, 10.713623046875, 11.37646484375, 12.039306640625, 12.7021484375, 13.364990234375, 14.02783203125, 14.690673828125, 15.353515625, 16.016357421875, 16.67919921875, 17.342041015625, 18.0048828125, 18.667724609375, 19.33056640625, 19.993408203125, 20.65625]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 3.0, 11.0, 11.0, 18.0, 21.0, 28.0, 25.0, 48.0, 67.0, 101.0, 129.0, 164.0, 211.0, 278.0, 312.0, 332.0, 378.0, 358.0, 304.0, 294.0, 220.0, 192.0, 128.0, 90.0, 77.0, 71.0, 53.0, 25.0, 28.0, 16.0, 23.0, 15.0, 13.0, 9.0, 6.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.88671875, -4.703369140625, -4.52001953125, -4.336669921875, -4.1533203125, -3.969970703125, -3.78662109375, -3.603271484375, -3.419921875, -3.236572265625, -3.05322265625, -2.869873046875, -2.6865234375, -2.503173828125, -2.31982421875, -2.136474609375, -1.953125, -1.769775390625, -1.58642578125, -1.403076171875, -1.2197265625, -1.036376953125, -0.85302734375, -0.669677734375, -0.486328125, -0.302978515625, -0.11962890625, 0.063720703125, 0.2470703125, 0.430419921875, 0.61376953125, 0.797119140625, 0.98046875, 1.163818359375, 1.34716796875, 1.530517578125, 1.7138671875, 1.897216796875, 2.08056640625, 2.263916015625, 2.447265625, 2.630615234375, 2.81396484375, 2.997314453125, 3.1806640625, 3.364013671875, 3.54736328125, 3.730712890625, 3.9140625, 4.097412109375, 4.28076171875, 4.464111328125, 4.6474609375, 4.830810546875, 5.01416015625, 5.197509765625, 5.380859375, 5.564208984375, 5.74755859375, 5.930908203125, 6.1142578125, 6.297607421875, 6.48095703125, 6.664306640625, 6.84765625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 8.0, 9.0, 10.0, 10.0, 14.0, 15.0, 26.0, 39.0, 39.0, 51.0, 71.0, 75.0, 77.0, 67.0, 77.0, 74.0, 63.0, 65.0, 49.0, 33.0, 29.0, 19.0, 14.0, 16.0, 16.0, 10.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.141576766967773, -18.553462982177734, -17.965351104736328, -17.37723731994629, -16.78912353515625, -16.20100975036621, -15.612896919250488, -15.024784088134766, -14.436670303344727, -13.848556518554688, -13.260443687438965, -12.672330856323242, -12.084217071533203, -11.496103286743164, -10.907990455627441, -10.319877624511719, -9.73176383972168, -9.14365005493164, -8.555537223815918, -7.967423915863037, -7.379310607910156, -6.791197299957275, -6.2030839920043945, -5.614970684051514, -5.026857376098633, -4.438744068145752, -3.850630760192871, -3.2625174522399902, -2.6744041442871094, -2.0862908363342285, -1.4981775283813477, -0.9100642204284668, -0.32195091247558594, 0.2661623954772949, 0.8542757034301758, 1.4423890113830566, 2.0305023193359375, 2.6186156272888184, 3.206728935241699, 3.79484224319458, 4.382955551147461, 4.971068859100342, 5.559182167053223, 6.1472954750061035, 6.735408782958984, 7.323522090911865, 7.911635398864746, 8.499748229980469, 9.087862014770508, 9.675975799560547, 10.26408863067627, 10.852201461791992, 11.440315246582031, 12.02842903137207, 12.616541862487793, 13.204654693603516, 13.792768478393555, 14.380882263183594, 14.968995094299316, 15.557107925415039, 16.145221710205078, 16.733335494995117, 17.321449279785156, 17.909561157226562, 18.4976749420166]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 4.0, 7.0, 6.0, 6.0, 15.0, 7.0, 16.0, 14.0, 10.0, 15.0, 20.0, 21.0, 27.0, 28.0, 25.0, 30.0, 41.0, 33.0, 26.0, 27.0, 45.0, 27.0, 30.0, 33.0, 42.0, 36.0, 40.0, 48.0, 24.0, 25.0, 33.0, 27.0, 26.0, 27.0, 19.0, 24.0, 19.0, 17.0, 17.0, 9.0, 8.0, 5.0, 12.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-11.562013626098633, -11.219781875610352, -10.87755012512207, -10.535318374633789, -10.193086624145508, -9.850854873657227, -9.508623123168945, -9.166391372680664, -8.824159622192383, -8.481927871704102, -8.13969612121582, -7.797464370727539, -7.455232620239258, -7.113000869750977, -6.770769119262695, -6.428537368774414, -6.086305618286133, -5.744073867797852, -5.40184211730957, -5.059610366821289, -4.717378616333008, -4.375146865844727, -4.032915115356445, -3.690683364868164, -3.348451614379883, -3.0062198638916016, -2.6639881134033203, -2.321756362915039, -1.9795246124267578, -1.6372928619384766, -1.2950611114501953, -0.9528293609619141, -0.6105976104736328, -0.26836585998535156, 0.07386589050292969, 0.41609764099121094, 0.7583293914794922, 1.1005611419677734, 1.4427928924560547, 1.785024642944336, 2.127256393432617, 2.4694881439208984, 2.8117198944091797, 3.153951644897461, 3.496183395385742, 3.8384151458740234, 4.180646896362305, 4.522878646850586, 4.865110397338867, 5.207342147827148, 5.54957389831543, 5.891805648803711, 6.234037399291992, 6.576269149780273, 6.918500900268555, 7.260732650756836, 7.602964401245117, 7.945196151733398, 8.28742790222168, 8.629659652709961, 8.971891403198242, 9.314123153686523, 9.656354904174805, 9.998586654663086, 10.340818405151367]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 8.0, 5.0, 12.0, 10.0, 22.0, 24.0, 32.0, 41.0, 66.0, 89.0, 113.0, 163.0, 226.0, 314.0, 449.0, 682.0, 882.0, 1215.0, 1693.0, 2637.0, 3965.0, 6249.0, 9757.0, 15831.0, 26127.0, 45075.0, 76938.0, 129896.0, 195571.0, 197638.0, 134342.0, 79725.0, 46196.0, 26801.0, 16455.0, 10000.0, 6253.0, 4057.0, 2702.0, 1864.0, 1219.0, 890.0, 660.0, 471.0, 374.0, 209.0, 153.0, 126.0, 93.0, 77.0, 40.0, 36.0, 31.0, 22.0, 13.0, 10.0, 7.0, 4.0, 5.0, 2.0, 4.0], "bins": [-4.359375, -4.2232666015625, -4.087158203125, -3.9510498046875, -3.81494140625, -3.6788330078125, -3.542724609375, -3.4066162109375, -3.2705078125, -3.1343994140625, -2.998291015625, -2.8621826171875, -2.72607421875, -2.5899658203125, -2.453857421875, -2.3177490234375, -2.181640625, -2.0455322265625, -1.909423828125, -1.7733154296875, -1.63720703125, -1.5010986328125, -1.364990234375, -1.2288818359375, -1.0927734375, -0.9566650390625, -0.820556640625, -0.6844482421875, -0.54833984375, -0.4122314453125, -0.276123046875, -0.1400146484375, -0.00390625, 0.1322021484375, 0.268310546875, 0.4044189453125, 0.54052734375, 0.6766357421875, 0.812744140625, 0.9488525390625, 1.0849609375, 1.2210693359375, 1.357177734375, 1.4932861328125, 1.62939453125, 1.7655029296875, 1.901611328125, 2.0377197265625, 2.173828125, 2.3099365234375, 2.446044921875, 2.5821533203125, 2.71826171875, 2.8543701171875, 2.990478515625, 3.1265869140625, 3.2626953125, 3.3988037109375, 3.534912109375, 3.6710205078125, 3.80712890625, 3.9432373046875, 4.079345703125, 4.2154541015625, 4.3515625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 4.0, 3.0, 4.0, 8.0, 12.0, 7.0, 9.0, 19.0, 13.0, 15.0, 19.0, 23.0, 15.0, 36.0, 31.0, 41.0, 28.0, 29.0, 33.0, 31.0, 32.0, 33.0, 32.0, 32.0, 47.0, 36.0, 33.0, 32.0, 47.0, 30.0, 38.0, 28.0, 31.0, 15.0, 17.0, 12.0, 25.0, 15.0, 9.0, 12.0, 13.0, 10.0, 9.0, 8.0, 6.0, 3.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-12.5, -12.1417236328125, -11.783447265625, -11.4251708984375, -11.06689453125, -10.7086181640625, -10.350341796875, -9.9920654296875, -9.6337890625, -9.2755126953125, -8.917236328125, -8.5589599609375, -8.20068359375, -7.8424072265625, -7.484130859375, -7.1258544921875, -6.767578125, -6.4093017578125, -6.051025390625, -5.6927490234375, -5.33447265625, -4.9761962890625, -4.617919921875, -4.2596435546875, -3.9013671875, -3.5430908203125, -3.184814453125, -2.8265380859375, -2.46826171875, -2.1099853515625, -1.751708984375, -1.3934326171875, -1.03515625, -0.6768798828125, -0.318603515625, 0.0396728515625, 0.39794921875, 0.7562255859375, 1.114501953125, 1.4727783203125, 1.8310546875, 2.1893310546875, 2.547607421875, 2.9058837890625, 3.26416015625, 3.6224365234375, 3.980712890625, 4.3389892578125, 4.697265625, 5.0555419921875, 5.413818359375, 5.7720947265625, 6.13037109375, 6.4886474609375, 6.846923828125, 7.2052001953125, 7.5634765625, 7.9217529296875, 8.280029296875, 8.6383056640625, 8.99658203125, 9.3548583984375, 9.713134765625, 10.0714111328125, 10.4296875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 8.0, 4.0, 10.0, 27.0, 18.0, 35.0, 46.0, 74.0, 70.0, 119.0, 169.0, 246.0, 365.0, 447.0, 698.0, 994.0, 1486.0, 2230.0, 3444.0, 5553.0, 9717.0, 18915.0, 54032.0, 858167.0, 48031.0, 18065.0, 9686.0, 5515.0, 3393.0, 2135.0, 1379.0, 979.0, 656.0, 498.0, 348.0, 254.0, 184.0, 133.0, 103.0, 90.0, 60.0, 47.0, 30.0, 27.0, 17.0, 14.0, 8.0, 5.0, 5.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-10.4765625, -10.1326904296875, -9.788818359375, -9.4449462890625, -9.10107421875, -8.7572021484375, -8.413330078125, -8.0694580078125, -7.7255859375, -7.3817138671875, -7.037841796875, -6.6939697265625, -6.35009765625, -6.0062255859375, -5.662353515625, -5.3184814453125, -4.974609375, -4.6307373046875, -4.286865234375, -3.9429931640625, -3.59912109375, -3.2552490234375, -2.911376953125, -2.5675048828125, -2.2236328125, -1.8797607421875, -1.535888671875, -1.1920166015625, -0.84814453125, -0.5042724609375, -0.160400390625, 0.1834716796875, 0.52734375, 0.8712158203125, 1.215087890625, 1.5589599609375, 1.90283203125, 2.2467041015625, 2.590576171875, 2.9344482421875, 3.2783203125, 3.6221923828125, 3.966064453125, 4.3099365234375, 4.65380859375, 4.9976806640625, 5.341552734375, 5.6854248046875, 6.029296875, 6.3731689453125, 6.717041015625, 7.0609130859375, 7.40478515625, 7.7486572265625, 8.092529296875, 8.4364013671875, 8.7802734375, 9.1241455078125, 9.468017578125, 9.8118896484375, 10.15576171875, 10.4996337890625, 10.843505859375, 11.1873779296875, 11.53125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 11.0, 6.0, 9.0, 16.0, 16.0, 16.0, 20.0, 16.0, 22.0, 30.0, 36.0, 32.0, 24.0, 32.0, 34.0, 35.0, 45.0, 40.0, 46.0, 29.0, 45.0, 52.0, 39.0, 37.0, 36.0, 30.0, 32.0, 27.0, 32.0, 21.0, 30.0, 18.0, 23.0, 8.0, 13.0, 13.0, 5.0, 7.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.46875, -10.178955078125, -9.88916015625, -9.599365234375, -9.3095703125, -9.019775390625, -8.72998046875, -8.440185546875, -8.150390625, -7.860595703125, -7.57080078125, -7.281005859375, -6.9912109375, -6.701416015625, -6.41162109375, -6.121826171875, -5.83203125, -5.542236328125, -5.25244140625, -4.962646484375, -4.6728515625, -4.383056640625, -4.09326171875, -3.803466796875, -3.513671875, -3.223876953125, -2.93408203125, -2.644287109375, -2.3544921875, -2.064697265625, -1.77490234375, -1.485107421875, -1.1953125, -0.905517578125, -0.61572265625, -0.325927734375, -0.0361328125, 0.253662109375, 0.54345703125, 0.833251953125, 1.123046875, 1.412841796875, 1.70263671875, 1.992431640625, 2.2822265625, 2.572021484375, 2.86181640625, 3.151611328125, 3.44140625, 3.731201171875, 4.02099609375, 4.310791015625, 4.6005859375, 4.890380859375, 5.18017578125, 5.469970703125, 5.759765625, 6.049560546875, 6.33935546875, 6.629150390625, 6.9189453125, 7.208740234375, 7.49853515625, 7.788330078125, 8.078125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 10.0, 11.0, 11.0, 11.0, 15.0, 14.0, 15.0, 28.0, 36.0, 59.0, 55.0, 74.0, 101.0, 124.0, 179.0, 317.0, 420.0, 737.0, 1290.0, 2740.0, 6685.0, 23530.0, 928989.0, 63397.0, 11418.0, 4007.0, 1708.0, 893.0, 550.0, 299.0, 211.0, 150.0, 102.0, 85.0, 76.0, 41.0, 41.0, 25.0, 13.0, 13.0, 7.0, 8.0, 10.0, 14.0, 7.0, 2.0, 2.0, 7.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-7.5, -7.2708740234375, -7.041748046875, -6.8126220703125, -6.58349609375, -6.3543701171875, -6.125244140625, -5.8961181640625, -5.6669921875, -5.4378662109375, -5.208740234375, -4.9796142578125, -4.75048828125, -4.5213623046875, -4.292236328125, -4.0631103515625, -3.833984375, -3.6048583984375, -3.375732421875, -3.1466064453125, -2.91748046875, -2.6883544921875, -2.459228515625, -2.2301025390625, -2.0009765625, -1.7718505859375, -1.542724609375, -1.3135986328125, -1.08447265625, -0.8553466796875, -0.626220703125, -0.3970947265625, -0.16796875, 0.0611572265625, 0.290283203125, 0.5194091796875, 0.74853515625, 0.9776611328125, 1.206787109375, 1.4359130859375, 1.6650390625, 1.8941650390625, 2.123291015625, 2.3524169921875, 2.58154296875, 2.8106689453125, 3.039794921875, 3.2689208984375, 3.498046875, 3.7271728515625, 3.956298828125, 4.1854248046875, 4.41455078125, 4.6436767578125, 4.872802734375, 5.1019287109375, 5.3310546875, 5.5601806640625, 5.789306640625, 6.0184326171875, 6.24755859375, 6.4766845703125, 6.705810546875, 6.9349365234375, 7.1640625]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 4.0, 7.0, 9.0, 12.0, 14.0, 24.0, 55.0, 124.0, 232.0, 223.0, 130.0, 66.0, 30.0, 18.0, 14.0, 17.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004839897155761719, -0.0004684031009674072, -0.0004528164863586426, -0.00043722987174987793, -0.0004216432571411133, -0.00040605664253234863, -0.000390470027923584, -0.00037488341331481934, -0.0003592967987060547, -0.00034371018409729004, -0.0003281235694885254, -0.00031253695487976074, -0.0002969503402709961, -0.00028136372566223145, -0.0002657771110534668, -0.00025019049644470215, -0.0002346038818359375, -0.00021901726722717285, -0.0002034306526184082, -0.00018784403800964355, -0.0001722574234008789, -0.00015667080879211426, -0.0001410841941833496, -0.00012549757957458496, -0.00010991096496582031, -9.432435035705566e-05, -7.873773574829102e-05, -6.315112113952637e-05, -4.756450653076172e-05, -3.197789192199707e-05, -1.6391277313232422e-05, -8.046627044677734e-07, 1.4781951904296875e-05, 3.0368566513061523e-05, 4.595518112182617e-05, 6.154179573059082e-05, 7.712841033935547e-05, 9.271502494812012e-05, 0.00010830163955688477, 0.00012388825416564941, 0.00013947486877441406, 0.0001550614833831787, 0.00017064809799194336, 0.000186234712600708, 0.00020182132720947266, 0.0002174079418182373, 0.00023299455642700195, 0.0002485811710357666, 0.00026416778564453125, 0.0002797544002532959, 0.00029534101486206055, 0.0003109276294708252, 0.00032651424407958984, 0.0003421008586883545, 0.00035768747329711914, 0.0003732740879058838, 0.00038886070251464844, 0.0004044473171234131, 0.00042003393173217773, 0.0004356205463409424, 0.00045120716094970703, 0.0004667937755584717, 0.00048238039016723633, 0.000497967004776001, 0.0005135536193847656]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 12.0, 14.0, 15.0, 29.0, 47.0, 62.0, 101.0, 178.0, 242.0, 424.0, 713.0, 1267.0, 2510.0, 5396.0, 13287.0, 38150.0, 126506.0, 418255.0, 308858.0, 86430.0, 27272.0, 9871.0, 4139.0, 2081.0, 1112.0, 608.0, 339.0, 232.0, 135.0, 71.0, 61.0, 41.0, 29.0, 21.0, 12.0, 8.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.66015625, -2.576629638671875, -2.49310302734375, -2.409576416015625, -2.3260498046875, -2.242523193359375, -2.15899658203125, -2.075469970703125, -1.991943359375, -1.908416748046875, -1.82489013671875, -1.741363525390625, -1.6578369140625, -1.574310302734375, -1.49078369140625, -1.407257080078125, -1.32373046875, -1.240203857421875, -1.15667724609375, -1.073150634765625, -0.9896240234375, -0.906097412109375, -0.82257080078125, -0.739044189453125, -0.655517578125, -0.571990966796875, -0.48846435546875, -0.404937744140625, -0.3214111328125, -0.237884521484375, -0.15435791015625, -0.070831298828125, 0.0126953125, 0.096221923828125, 0.17974853515625, 0.263275146484375, 0.3468017578125, 0.430328369140625, 0.51385498046875, 0.597381591796875, 0.680908203125, 0.764434814453125, 0.84796142578125, 0.931488037109375, 1.0150146484375, 1.098541259765625, 1.18206787109375, 1.265594482421875, 1.34912109375, 1.432647705078125, 1.51617431640625, 1.599700927734375, 1.6832275390625, 1.766754150390625, 1.85028076171875, 1.933807373046875, 2.017333984375, 2.100860595703125, 2.18438720703125, 2.267913818359375, 2.3514404296875, 2.434967041015625, 2.51849365234375, 2.602020263671875, 2.685546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 14.0, 16.0, 19.0, 17.0, 37.0, 44.0, 49.0, 69.0, 94.0, 121.0, 111.0, 100.0, 67.0, 62.0, 47.0, 33.0, 21.0, 24.0, 11.0, 13.0, 7.0, 3.0, 3.0, 7.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88134765625, -0.8582687377929688, -0.8351898193359375, -0.8121109008789062, -0.789031982421875, -0.7659530639648438, -0.7428741455078125, -0.7197952270507812, -0.69671630859375, -0.6736373901367188, -0.6505584716796875, -0.6274795532226562, -0.604400634765625, -0.5813217163085938, -0.5582427978515625, -0.5351638793945312, -0.5120849609375, -0.48900604248046875, -0.4659271240234375, -0.44284820556640625, -0.419769287109375, -0.39669036865234375, -0.3736114501953125, -0.35053253173828125, -0.32745361328125, -0.30437469482421875, -0.2812957763671875, -0.25821685791015625, -0.235137939453125, -0.21205902099609375, -0.1889801025390625, -0.16590118408203125, -0.142822265625, -0.11974334716796875, -0.0966644287109375, -0.07358551025390625, -0.050506591796875, -0.02742767333984375, -0.0043487548828125, 0.01873016357421875, 0.04180908203125, 0.06488800048828125, 0.0879669189453125, 0.11104583740234375, 0.134124755859375, 0.15720367431640625, 0.1802825927734375, 0.20336151123046875, 0.2264404296875, 0.24951934814453125, 0.2725982666015625, 0.29567718505859375, 0.318756103515625, 0.34183502197265625, 0.3649139404296875, 0.38799285888671875, 0.41107177734375, 0.43415069580078125, 0.4572296142578125, 0.48030853271484375, 0.503387451171875, 0.5264663696289062, 0.5495452880859375, 0.5726242065429688, 0.595703125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 8.0, 8.0, 10.0, 10.0, 14.0, 32.0, 31.0, 35.0, 54.0, 49.0, 83.0, 65.0, 85.0, 65.0, 76.0, 73.0, 64.0, 44.0, 47.0, 29.0, 21.0, 17.0, 18.0, 17.0, 10.0, 7.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.477375030517578, -18.905975341796875, -18.334575653076172, -17.763174057006836, -17.191774368286133, -16.62037467956543, -16.048974990844727, -15.477575302124023, -14.906174659729004, -14.3347749710083, -13.763374328613281, -13.191974639892578, -12.620574951171875, -12.049174308776855, -11.477774620056152, -10.906373977661133, -10.33497428894043, -9.763574600219727, -9.192173957824707, -8.620774269104004, -8.049373626708984, -7.477973937988281, -6.906574249267578, -6.335174083709717, -5.7637739181518555, -5.192373752593994, -4.620973587036133, -4.04957389831543, -3.4781737327575684, -2.906773567199707, -2.335373640060425, -1.7639737129211426, -1.1925735473632812, -0.6211735010147095, -0.049773454666137695, 0.5216265916824341, 1.0930266380310059, 1.6644268035888672, 2.2358267307281494, 2.8072266578674316, 3.378626823425293, 3.9500269889831543, 4.521427154541016, 5.092826843261719, 5.66422700881958, 6.235627174377441, 6.8070268630981445, 7.378427028656006, 7.949827194213867, 8.52122688293457, 9.09262752532959, 9.664027214050293, 10.235427856445312, 10.806827545166016, 11.378227233886719, 11.949626922607422, 12.521027565002441, 13.092427253723145, 13.663827896118164, 14.235227584838867, 14.80662727355957, 15.37802791595459, 15.949427604675293, 16.520828247070312, 17.092227935791016]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 5.0, 7.0, 9.0, 11.0, 10.0, 11.0, 16.0, 16.0, 17.0, 17.0, 23.0, 31.0, 24.0, 25.0, 31.0, 45.0, 28.0, 31.0, 39.0, 34.0, 22.0, 39.0, 33.0, 34.0, 43.0, 43.0, 34.0, 32.0, 26.0, 30.0, 28.0, 23.0, 28.0, 18.0, 26.0, 16.0, 16.0, 13.0, 9.0, 7.0, 7.0, 6.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-11.280834197998047, -10.943718910217285, -10.606603622436523, -10.269489288330078, -9.932374000549316, -9.595258712768555, -9.25814437866211, -8.921029090881348, -8.583913803100586, -8.246798515319824, -7.909683704376221, -7.572568893432617, -7.2354536056518555, -6.898338317871094, -6.56122350692749, -6.224108695983887, -5.886993408203125, -5.549878120422363, -5.21276330947876, -4.875648498535156, -4.5385332107543945, -4.201417922973633, -3.8643031120300293, -3.5271880626678467, -3.190073013305664, -2.8529579639434814, -2.515842914581299, -2.178727865219116, -1.8416128158569336, -1.504497766494751, -1.1673827171325684, -0.8302676677703857, -0.4931526184082031, -0.1560375690460205, 0.1810774803161621, 0.5181925296783447, 0.8553075790405273, 1.19242262840271, 1.5295376777648926, 1.8666527271270752, 2.203767776489258, 2.5408828258514404, 2.877997875213623, 3.2151129245758057, 3.5522279739379883, 3.889343023300171, 4.2264580726623535, 4.563572883605957, 4.900688171386719, 5.2378034591674805, 5.574918270111084, 5.9120330810546875, 6.249148368835449, 6.586263656616211, 6.9233784675598145, 7.260493278503418, 7.59760856628418, 7.934723854064941, 8.271839141845703, 8.608953475952148, 8.94606876373291, 9.283184051513672, 9.620298385620117, 9.957413673400879, 10.29452896118164]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 1.0, 4.0, 5.0, 8.0, 7.0, 16.0, 19.0, 36.0, 31.0, 48.0, 84.0, 112.0, 192.0, 295.0, 512.0, 765.0, 1372.0, 2329.0, 4144.0, 7684.0, 14785.0, 30246.0, 65166.0, 142278.0, 254883.0, 255372.0, 141103.0, 65002.0, 29751.0, 14806.0, 7556.0, 4150.0, 2305.0, 1338.0, 794.0, 468.0, 262.0, 211.0, 142.0, 97.0, 57.0, 25.0, 37.0, 15.0, 14.0, 10.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.359375, -17.747314453125, -17.13525390625, -16.523193359375, -15.9111328125, -15.299072265625, -14.68701171875, -14.074951171875, -13.462890625, -12.850830078125, -12.23876953125, -11.626708984375, -11.0146484375, -10.402587890625, -9.79052734375, -9.178466796875, -8.56640625, -7.954345703125, -7.34228515625, -6.730224609375, -6.1181640625, -5.506103515625, -4.89404296875, -4.281982421875, -3.669921875, -3.057861328125, -2.44580078125, -1.833740234375, -1.2216796875, -0.609619140625, 0.00244140625, 0.614501953125, 1.2265625, 1.838623046875, 2.45068359375, 3.062744140625, 3.6748046875, 4.286865234375, 4.89892578125, 5.510986328125, 6.123046875, 6.735107421875, 7.34716796875, 7.959228515625, 8.5712890625, 9.183349609375, 9.79541015625, 10.407470703125, 11.01953125, 11.631591796875, 12.24365234375, 12.855712890625, 13.4677734375, 14.079833984375, 14.69189453125, 15.303955078125, 15.916015625, 16.528076171875, 17.14013671875, 17.752197265625, 18.3642578125, 18.976318359375, 19.58837890625, 20.200439453125, 20.8125]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 4.0, 10.0, 10.0, 11.0, 9.0, 14.0, 7.0, 16.0, 25.0, 27.0, 19.0, 23.0, 31.0, 33.0, 27.0, 37.0, 31.0, 29.0, 34.0, 37.0, 30.0, 41.0, 44.0, 36.0, 45.0, 42.0, 28.0, 29.0, 30.0, 31.0, 28.0, 25.0, 21.0, 31.0, 16.0, 10.0, 13.0, 14.0, 7.0, 6.0, 8.0, 6.0, 5.0, 3.0, 8.0, 4.0, 3.0, 1.0, 2.0], "bins": [-11.8359375, -11.50830078125, -11.1806640625, -10.85302734375, -10.525390625, -10.19775390625, -9.8701171875, -9.54248046875, -9.21484375, -8.88720703125, -8.5595703125, -8.23193359375, -7.904296875, -7.57666015625, -7.2490234375, -6.92138671875, -6.59375, -6.26611328125, -5.9384765625, -5.61083984375, -5.283203125, -4.95556640625, -4.6279296875, -4.30029296875, -3.97265625, -3.64501953125, -3.3173828125, -2.98974609375, -2.662109375, -2.33447265625, -2.0068359375, -1.67919921875, -1.3515625, -1.02392578125, -0.6962890625, -0.36865234375, -0.041015625, 0.28662109375, 0.6142578125, 0.94189453125, 1.26953125, 1.59716796875, 1.9248046875, 2.25244140625, 2.580078125, 2.90771484375, 3.2353515625, 3.56298828125, 3.890625, 4.21826171875, 4.5458984375, 4.87353515625, 5.201171875, 5.52880859375, 5.8564453125, 6.18408203125, 6.51171875, 6.83935546875, 7.1669921875, 7.49462890625, 7.822265625, 8.14990234375, 8.4775390625, 8.80517578125, 9.1328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 3.0, 2.0, 10.0, 12.0, 16.0, 16.0, 32.0, 47.0, 57.0, 85.0, 138.0, 232.0, 378.0, 729.0, 1225.0, 2353.0, 4394.0, 8962.0, 18935.0, 40694.0, 91925.0, 187236.0, 269691.0, 214915.0, 111161.0, 50178.0, 22901.0, 10722.0, 5294.0, 2788.0, 1407.0, 824.0, 430.0, 276.0, 162.0, 99.0, 66.0, 48.0, 31.0, 25.0, 13.0, 13.0, 7.0, 10.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-15.7109375, -15.2572021484375, -14.803466796875, -14.3497314453125, -13.89599609375, -13.4422607421875, -12.988525390625, -12.5347900390625, -12.0810546875, -11.6273193359375, -11.173583984375, -10.7198486328125, -10.26611328125, -9.8123779296875, -9.358642578125, -8.9049072265625, -8.451171875, -7.9974365234375, -7.543701171875, -7.0899658203125, -6.63623046875, -6.1824951171875, -5.728759765625, -5.2750244140625, -4.8212890625, -4.3675537109375, -3.913818359375, -3.4600830078125, -3.00634765625, -2.5526123046875, -2.098876953125, -1.6451416015625, -1.19140625, -0.7376708984375, -0.283935546875, 0.1697998046875, 0.62353515625, 1.0772705078125, 1.531005859375, 1.9847412109375, 2.4384765625, 2.8922119140625, 3.345947265625, 3.7996826171875, 4.25341796875, 4.7071533203125, 5.160888671875, 5.6146240234375, 6.068359375, 6.5220947265625, 6.975830078125, 7.4295654296875, 7.88330078125, 8.3370361328125, 8.790771484375, 9.2445068359375, 9.6982421875, 10.1519775390625, 10.605712890625, 11.0594482421875, 11.51318359375, 11.9669189453125, 12.420654296875, 12.8743896484375, 13.328125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 12.0, 6.0, 7.0, 10.0, 13.0, 18.0, 13.0, 19.0, 21.0, 31.0, 29.0, 39.0, 48.0, 42.0, 40.0, 56.0, 50.0, 46.0, 42.0, 56.0, 41.0, 50.0, 36.0, 33.0, 43.0, 27.0, 29.0, 30.0, 20.0, 22.0, 16.0, 11.0, 16.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7109375, -8.46038818359375, -8.2098388671875, -7.95928955078125, -7.708740234375, -7.45819091796875, -7.2076416015625, -6.95709228515625, -6.70654296875, -6.45599365234375, -6.2054443359375, -5.95489501953125, -5.704345703125, -5.45379638671875, -5.2032470703125, -4.95269775390625, -4.7021484375, -4.45159912109375, -4.2010498046875, -3.95050048828125, -3.699951171875, -3.44940185546875, -3.1988525390625, -2.94830322265625, -2.69775390625, -2.44720458984375, -2.1966552734375, -1.94610595703125, -1.695556640625, -1.44500732421875, -1.1944580078125, -0.94390869140625, -0.693359375, -0.44281005859375, -0.1922607421875, 0.05828857421875, 0.308837890625, 0.55938720703125, 0.8099365234375, 1.06048583984375, 1.31103515625, 1.56158447265625, 1.8121337890625, 2.06268310546875, 2.313232421875, 2.56378173828125, 2.8143310546875, 3.06488037109375, 3.3154296875, 3.56597900390625, 3.8165283203125, 4.06707763671875, 4.317626953125, 4.56817626953125, 4.8187255859375, 5.06927490234375, 5.31982421875, 5.57037353515625, 5.8209228515625, 6.07147216796875, 6.322021484375, 6.57257080078125, 6.8231201171875, 7.07366943359375, 7.32421875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 21.0, 18.0, 30.0, 70.0, 79.0, 124.0, 168.0, 314.0, 481.0, 875.0, 1448.0, 2767.0, 5332.0, 10873.0, 23439.0, 52961.0, 126169.0, 259901.0, 288427.0, 154468.0, 65543.0, 28413.0, 12910.0, 6367.0, 3180.0, 1742.0, 986.0, 580.0, 292.0, 205.0, 107.0, 80.0, 57.0, 41.0, 21.0, 20.0, 12.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.2734375, -12.8726806640625, -12.471923828125, -12.0711669921875, -11.67041015625, -11.2696533203125, -10.868896484375, -10.4681396484375, -10.0673828125, -9.6666259765625, -9.265869140625, -8.8651123046875, -8.46435546875, -8.0635986328125, -7.662841796875, -7.2620849609375, -6.861328125, -6.4605712890625, -6.059814453125, -5.6590576171875, -5.25830078125, -4.8575439453125, -4.456787109375, -4.0560302734375, -3.6552734375, -3.2545166015625, -2.853759765625, -2.4530029296875, -2.05224609375, -1.6514892578125, -1.250732421875, -0.8499755859375, -0.44921875, -0.0484619140625, 0.352294921875, 0.7530517578125, 1.15380859375, 1.5545654296875, 1.955322265625, 2.3560791015625, 2.7568359375, 3.1575927734375, 3.558349609375, 3.9591064453125, 4.35986328125, 4.7606201171875, 5.161376953125, 5.5621337890625, 5.962890625, 6.3636474609375, 6.764404296875, 7.1651611328125, 7.56591796875, 7.9666748046875, 8.367431640625, 8.7681884765625, 9.1689453125, 9.5697021484375, 9.970458984375, 10.3712158203125, 10.77197265625, 11.1727294921875, 11.573486328125, 11.9742431640625, 12.375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 6.0, 2.0, 4.0, 7.0, 15.0, 22.0, 16.0, 27.0, 27.0, 29.0, 36.0, 64.0, 66.0, 76.0, 82.0, 78.0, 76.0, 56.0, 50.0, 60.0, 48.0, 40.0, 21.0, 28.0, 15.0, 10.0, 13.0, 9.0, 7.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008873939514160156, -0.000857226550579071, -0.0008270591497421265, -0.0007968917489051819, -0.0007667243480682373, -0.0007365569472312927, -0.0007063895463943481, -0.0006762221455574036, -0.000646054744720459, -0.0006158873438835144, -0.0005857199430465698, -0.0005555525422096252, -0.0005253851413726807, -0.0004952177405357361, -0.0004650503396987915, -0.0004348829388618469, -0.00040471553802490234, -0.00037454813718795776, -0.0003443807363510132, -0.0003142133355140686, -0.000284045934677124, -0.00025387853384017944, -0.00022371113300323486, -0.00019354373216629028, -0.0001633763313293457, -0.00013320893049240112, -0.00010304152965545654, -7.287412881851196e-05, -4.270672798156738e-05, -1.2539327144622803e-05, 1.7628073692321777e-05, 4.779547452926636e-05, 7.796287536621094e-05, 0.00010813027620315552, 0.0001382976770401001, 0.00016846507787704468, 0.00019863247871398926, 0.00022879987955093384, 0.0002589672803878784, 0.000289134681224823, 0.0003193020820617676, 0.00034946948289871216, 0.00037963688373565674, 0.0004098042845726013, 0.0004399716854095459, 0.0004701390862464905, 0.0005003064870834351, 0.0005304738879203796, 0.0005606412887573242, 0.0005908086895942688, 0.0006209760904312134, 0.000651143491268158, 0.0006813108921051025, 0.0007114782929420471, 0.0007416456937789917, 0.0007718130946159363, 0.0008019804954528809, 0.0008321478962898254, 0.00086231529712677, 0.0008924826979637146, 0.0009226500988006592, 0.0009528174996376038, 0.0009829849004745483, 0.001013152301311493, 0.0010433197021484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 11.0, 21.0, 29.0, 31.0, 49.0, 64.0, 93.0, 157.0, 203.0, 308.0, 461.0, 723.0, 1099.0, 1772.0, 2910.0, 4844.0, 8104.0, 14898.0, 26945.0, 51107.0, 96142.0, 166448.0, 218329.0, 190878.0, 120271.0, 64869.0, 34377.0, 18188.0, 10097.0, 5695.0, 3413.0, 2167.0, 1336.0, 866.0, 543.0, 338.0, 220.0, 173.0, 123.0, 71.0, 47.0, 37.0, 22.0, 16.0, 25.0, 10.0, 11.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.15625, -8.8760986328125, -8.595947265625, -8.3157958984375, -8.03564453125, -7.7554931640625, -7.475341796875, -7.1951904296875, -6.9150390625, -6.6348876953125, -6.354736328125, -6.0745849609375, -5.79443359375, -5.5142822265625, -5.234130859375, -4.9539794921875, -4.673828125, -4.3936767578125, -4.113525390625, -3.8333740234375, -3.55322265625, -3.2730712890625, -2.992919921875, -2.7127685546875, -2.4326171875, -2.1524658203125, -1.872314453125, -1.5921630859375, -1.31201171875, -1.0318603515625, -0.751708984375, -0.4715576171875, -0.19140625, 0.0887451171875, 0.368896484375, 0.6490478515625, 0.92919921875, 1.2093505859375, 1.489501953125, 1.7696533203125, 2.0498046875, 2.3299560546875, 2.610107421875, 2.8902587890625, 3.17041015625, 3.4505615234375, 3.730712890625, 4.0108642578125, 4.291015625, 4.5711669921875, 4.851318359375, 5.1314697265625, 5.41162109375, 5.6917724609375, 5.971923828125, 6.2520751953125, 6.5322265625, 6.8123779296875, 7.092529296875, 7.3726806640625, 7.65283203125, 7.9329833984375, 8.213134765625, 8.4932861328125, 8.7734375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 7.0, 1.0, 2.0, 4.0, 5.0, 7.0, 9.0, 10.0, 11.0, 14.0, 20.0, 17.0, 25.0, 30.0, 46.0, 48.0, 50.0, 40.0, 56.0, 52.0, 55.0, 46.0, 56.0, 66.0, 56.0, 40.0, 38.0, 34.0, 26.0, 23.0, 22.0, 21.0, 16.0, 11.0, 12.0, 11.0, 2.0, 3.0, 4.0, 2.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.16796875, -3.080841064453125, -2.99371337890625, -2.906585693359375, -2.8194580078125, -2.732330322265625, -2.64520263671875, -2.558074951171875, -2.470947265625, -2.383819580078125, -2.29669189453125, -2.209564208984375, -2.1224365234375, -2.035308837890625, -1.94818115234375, -1.861053466796875, -1.77392578125, -1.686798095703125, -1.59967041015625, -1.512542724609375, -1.4254150390625, -1.338287353515625, -1.25115966796875, -1.164031982421875, -1.076904296875, -0.989776611328125, -0.90264892578125, -0.815521240234375, -0.7283935546875, -0.641265869140625, -0.55413818359375, -0.467010498046875, -0.3798828125, -0.292755126953125, -0.20562744140625, -0.118499755859375, -0.0313720703125, 0.055755615234375, 0.14288330078125, 0.230010986328125, 0.317138671875, 0.404266357421875, 0.49139404296875, 0.578521728515625, 0.6656494140625, 0.752777099609375, 0.83990478515625, 0.927032470703125, 1.01416015625, 1.101287841796875, 1.18841552734375, 1.275543212890625, 1.3626708984375, 1.449798583984375, 1.53692626953125, 1.624053955078125, 1.711181640625, 1.798309326171875, 1.88543701171875, 1.972564697265625, 2.0596923828125, 2.146820068359375, 2.23394775390625, 2.321075439453125, 2.408203125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 4.0, 10.0, 2.0, 5.0, 12.0, 12.0, 11.0, 21.0, 21.0, 28.0, 46.0, 50.0, 59.0, 56.0, 69.0, 81.0, 86.0, 70.0, 61.0, 60.0, 44.0, 41.0, 34.0, 25.0, 20.0, 16.0, 15.0, 11.0, 4.0, 7.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.780900955200195, -15.27371883392334, -14.766536712646484, -14.259353637695312, -13.752171516418457, -13.244989395141602, -12.73780632019043, -12.230624198913574, -11.723442077636719, -11.216259956359863, -10.709077835083008, -10.201894760131836, -9.69471263885498, -9.187530517578125, -8.680347442626953, -8.173165321350098, -7.665983200073242, -7.158801078796387, -6.651618480682373, -6.144435882568359, -5.637253761291504, -5.130071640014648, -4.622889041900635, -4.115706443786621, -3.6085243225097656, -3.101341962814331, -2.5941596031188965, -2.086977243423462, -1.5797948837280273, -1.0726125240325928, -0.5654301643371582, -0.05824780464172363, 0.4489326477050781, 0.9561150074005127, 1.4632973670959473, 1.9704797267913818, 2.4776620864868164, 2.984844446182251, 3.4920268058776855, 3.99920916557312, 4.506391525268555, 5.01357364654541, 5.520756244659424, 6.0279388427734375, 6.535120964050293, 7.042303085327148, 7.549485683441162, 8.056668281555176, 8.563850402832031, 9.071032524108887, 9.578214645385742, 10.085397720336914, 10.59257984161377, 11.099761962890625, 11.606945037841797, 12.114127159118652, 12.621309280395508, 13.128491401672363, 13.635673522949219, 14.14285659790039, 14.650038719177246, 15.157220840454102, 15.664403915405273, 16.171585083007812, 16.678768157958984]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 7.0, 6.0, 13.0, 12.0, 6.0, 12.0, 13.0, 12.0, 20.0, 15.0, 18.0, 29.0, 38.0, 30.0, 33.0, 33.0, 44.0, 39.0, 34.0, 27.0, 39.0, 33.0, 51.0, 38.0, 33.0, 39.0, 39.0, 29.0, 24.0, 28.0, 32.0, 21.0, 25.0, 13.0, 16.0, 15.0, 16.0, 13.0, 10.0, 8.0, 8.0, 11.0, 1.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0], "bins": [-12.379487991333008, -12.038076400756836, -11.696664810180664, -11.355253219604492, -11.01384162902832, -10.672430038452148, -10.331018447875977, -9.989607810974121, -9.64819622039795, -9.306784629821777, -8.965373039245605, -8.623961448669434, -8.282549858093262, -7.941138744354248, -7.599727153778076, -7.2583160400390625, -6.916903972625732, -6.5754923820495605, -6.234080791473389, -5.892669677734375, -5.551258087158203, -5.209846496582031, -4.868434906005859, -4.5270233154296875, -4.185611724853516, -3.8442001342773438, -3.502788782119751, -3.161377191543579, -2.8199658393859863, -2.4785542488098145, -2.1371426582336426, -1.7957313060760498, -1.454319953918457, -1.1129084825515747, -0.7714969515800476, -0.4300854206085205, -0.08867394924163818, 0.25273752212524414, 0.594149112701416, 0.9355604648590088, 1.2769720554351807, 1.618383526802063, 1.9597949981689453, 2.301206588745117, 2.642618179321289, 2.984029531478882, 3.3254411220550537, 3.6668524742126465, 4.008264064788818, 4.34967565536499, 4.691087245941162, 5.032498359680176, 5.373909950256348, 5.7153215408325195, 6.056733131408691, 6.398144721984863, 6.739556312561035, 7.080967903137207, 7.422379493713379, 7.763791084289551, 8.105202674865723, 8.446613311767578, 8.78802490234375, 9.129436492919922, 9.470848083496094]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 6.0, 18.0, 10.0, 17.0, 28.0, 42.0, 57.0, 72.0, 93.0, 168.0, 236.0, 375.0, 547.0, 855.0, 1248.0, 2090.0, 3493.0, 5964.0, 10889.0, 21800.0, 47722.0, 118593.0, 345364.0, 934261.0, 1380447.0, 830425.0, 296863.0, 105712.0, 42875.0, 19653.0, 10156.0, 5542.0, 3235.0, 1898.0, 1228.0, 746.0, 531.0, 291.0, 208.0, 161.0, 97.0, 80.0, 52.0, 38.0, 34.0, 24.0, 6.0, 12.0, 9.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.8359375, -13.395751953125, -12.95556640625, -12.515380859375, -12.0751953125, -11.635009765625, -11.19482421875, -10.754638671875, -10.314453125, -9.874267578125, -9.43408203125, -8.993896484375, -8.5537109375, -8.113525390625, -7.67333984375, -7.233154296875, -6.79296875, -6.352783203125, -5.91259765625, -5.472412109375, -5.0322265625, -4.592041015625, -4.15185546875, -3.711669921875, -3.271484375, -2.831298828125, -2.39111328125, -1.950927734375, -1.5107421875, -1.070556640625, -0.63037109375, -0.190185546875, 0.25, 0.690185546875, 1.13037109375, 1.570556640625, 2.0107421875, 2.450927734375, 2.89111328125, 3.331298828125, 3.771484375, 4.211669921875, 4.65185546875, 5.092041015625, 5.5322265625, 5.972412109375, 6.41259765625, 6.852783203125, 7.29296875, 7.733154296875, 8.17333984375, 8.613525390625, 9.0537109375, 9.493896484375, 9.93408203125, 10.374267578125, 10.814453125, 11.254638671875, 11.69482421875, 12.135009765625, 12.5751953125, 13.015380859375, 13.45556640625, 13.895751953125, 14.3359375]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 7.0, 1.0, 11.0, 9.0, 5.0, 14.0, 10.0, 10.0, 13.0, 22.0, 20.0, 20.0, 29.0, 38.0, 35.0, 26.0, 30.0, 28.0, 47.0, 34.0, 38.0, 27.0, 39.0, 39.0, 41.0, 26.0, 35.0, 30.0, 28.0, 26.0, 44.0, 23.0, 25.0, 22.0, 15.0, 24.0, 16.0, 15.0, 15.0, 13.0, 14.0, 6.0, 8.0, 6.0, 5.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.3046875, -7.0875244140625, -6.870361328125, -6.6531982421875, -6.43603515625, -6.2188720703125, -6.001708984375, -5.7845458984375, -5.5673828125, -5.3502197265625, -5.133056640625, -4.9158935546875, -4.69873046875, -4.4815673828125, -4.264404296875, -4.0472412109375, -3.830078125, -3.6129150390625, -3.395751953125, -3.1785888671875, -2.96142578125, -2.7442626953125, -2.527099609375, -2.3099365234375, -2.0927734375, -1.8756103515625, -1.658447265625, -1.4412841796875, -1.22412109375, -1.0069580078125, -0.789794921875, -0.5726318359375, -0.35546875, -0.1383056640625, 0.078857421875, 0.2960205078125, 0.51318359375, 0.7303466796875, 0.947509765625, 1.1646728515625, 1.3818359375, 1.5989990234375, 1.816162109375, 2.0333251953125, 2.25048828125, 2.4676513671875, 2.684814453125, 2.9019775390625, 3.119140625, 3.3363037109375, 3.553466796875, 3.7706298828125, 3.98779296875, 4.2049560546875, 4.422119140625, 4.6392822265625, 4.8564453125, 5.0736083984375, 5.290771484375, 5.5079345703125, 5.72509765625, 5.9422607421875, 6.159423828125, 6.3765869140625, 6.59375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 6.0, 21.0, 20.0, 17.0, 27.0, 51.0, 72.0, 98.0, 155.0, 217.0, 340.0, 513.0, 781.0, 1373.0, 2301.0, 4042.0, 7437.0, 15318.0, 35115.0, 94669.0, 301189.0, 1031369.0, 1675663.0, 701551.0, 201935.0, 66802.0, 26673.0, 12019.0, 6102.0, 3228.0, 1924.0, 1150.0, 740.0, 467.0, 295.0, 208.0, 129.0, 73.0, 58.0, 42.0, 28.0, 22.0, 17.0, 7.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.65625, -17.07421875, -16.4921875, -15.91015625, -15.328125, -14.74609375, -14.1640625, -13.58203125, -13.0, -12.41796875, -11.8359375, -11.25390625, -10.671875, -10.08984375, -9.5078125, -8.92578125, -8.34375, -7.76171875, -7.1796875, -6.59765625, -6.015625, -5.43359375, -4.8515625, -4.26953125, -3.6875, -3.10546875, -2.5234375, -1.94140625, -1.359375, -0.77734375, -0.1953125, 0.38671875, 0.96875, 1.55078125, 2.1328125, 2.71484375, 3.296875, 3.87890625, 4.4609375, 5.04296875, 5.625, 6.20703125, 6.7890625, 7.37109375, 7.953125, 8.53515625, 9.1171875, 9.69921875, 10.28125, 10.86328125, 11.4453125, 12.02734375, 12.609375, 13.19140625, 13.7734375, 14.35546875, 14.9375, 15.51953125, 16.1015625, 16.68359375, 17.265625, 17.84765625, 18.4296875, 19.01171875, 19.59375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 8.0, 9.0, 14.0, 11.0, 14.0, 27.0, 42.0, 37.0, 56.0, 83.0, 110.0, 125.0, 173.0, 197.0, 252.0, 283.0, 363.0, 330.0, 302.0, 302.0, 250.0, 218.0, 204.0, 155.0, 110.0, 89.0, 69.0, 54.0, 47.0, 30.0, 17.0, 23.0, 14.0, 10.0, 14.0, 6.0, 4.0, 7.0, 2.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.15625, -4.0205078125, -3.884765625, -3.7490234375, -3.61328125, -3.4775390625, -3.341796875, -3.2060546875, -3.0703125, -2.9345703125, -2.798828125, -2.6630859375, -2.52734375, -2.3916015625, -2.255859375, -2.1201171875, -1.984375, -1.8486328125, -1.712890625, -1.5771484375, -1.44140625, -1.3056640625, -1.169921875, -1.0341796875, -0.8984375, -0.7626953125, -0.626953125, -0.4912109375, -0.35546875, -0.2197265625, -0.083984375, 0.0517578125, 0.1875, 0.3232421875, 0.458984375, 0.5947265625, 0.73046875, 0.8662109375, 1.001953125, 1.1376953125, 1.2734375, 1.4091796875, 1.544921875, 1.6806640625, 1.81640625, 1.9521484375, 2.087890625, 2.2236328125, 2.359375, 2.4951171875, 2.630859375, 2.7666015625, 2.90234375, 3.0380859375, 3.173828125, 3.3095703125, 3.4453125, 3.5810546875, 3.716796875, 3.8525390625, 3.98828125, 4.1240234375, 4.259765625, 4.3955078125, 4.53125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 7.0, 7.0, 4.0, 7.0, 10.0, 8.0, 20.0, 15.0, 15.0, 34.0, 40.0, 41.0, 48.0, 75.0, 88.0, 63.0, 62.0, 72.0, 57.0, 63.0, 54.0, 49.0, 34.0, 19.0, 29.0, 17.0, 21.0, 8.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-16.066513061523438, -15.63431453704834, -15.202116012573242, -14.769916534423828, -14.33771800994873, -13.905519485473633, -13.473320007324219, -13.041121482849121, -12.608922958374023, -12.176724433898926, -11.744525909423828, -11.312326431274414, -10.880127906799316, -10.447929382324219, -10.015729904174805, -9.583531379699707, -9.15133285522461, -8.719134330749512, -8.286935806274414, -7.854736328125, -7.422537803649902, -6.990339279174805, -6.558140277862549, -6.125941276550293, -5.693742752075195, -5.261544227600098, -4.829345226287842, -4.397146224975586, -3.9649477005004883, -3.5327489376068115, -3.1005501747131348, -2.668351411819458, -2.236151695251465, -1.803952932357788, -1.3717541694641113, -0.9395554065704346, -0.5073566436767578, -0.07515788078308105, 0.3570408821105957, 0.7892396450042725, 1.2214384078979492, 1.653637170791626, 2.0858359336853027, 2.5180346965789795, 2.9502334594726562, 3.382432222366333, 3.8146309852600098, 4.246829986572266, 4.679028511047363, 5.111227035522461, 5.543426036834717, 5.975625038146973, 6.40782356262207, 6.840022087097168, 7.272221088409424, 7.70442008972168, 8.136618614196777, 8.568817138671875, 9.001016616821289, 9.433215141296387, 9.865413665771484, 10.297612190246582, 10.72981071472168, 11.162010192871094, 11.594208717346191]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 6.0, 10.0, 4.0, 7.0, 10.0, 12.0, 13.0, 16.0, 31.0, 20.0, 24.0, 21.0, 26.0, 38.0, 32.0, 37.0, 36.0, 38.0, 38.0, 37.0, 39.0, 33.0, 43.0, 37.0, 30.0, 30.0, 30.0, 38.0, 37.0, 28.0, 24.0, 22.0, 14.0, 22.0, 22.0, 20.0, 20.0, 4.0, 12.0, 5.0, 12.0, 5.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.12672233581543, -9.836066246032715, -9.54541015625, -9.254754066467285, -8.96409797668457, -8.673441886901855, -8.38278579711914, -8.092129707336426, -7.801473617553711, -7.510817527770996, -7.220161437988281, -6.929505348205566, -6.638849258422852, -6.348193168640137, -6.057537078857422, -5.766880989074707, -5.47622537612915, -5.1855692863464355, -4.894913196563721, -4.604257106781006, -4.313601016998291, -4.022944927215576, -3.7322890758514404, -3.4416329860687256, -3.1509768962860107, -2.860320806503296, -2.569664716720581, -2.2790088653564453, -1.988352656364441, -1.697696566581726, -1.4070405960083008, -1.116384506225586, -0.8257284164428711, -0.5350723266601562, -0.24441629648208618, 0.04623973369598389, 0.33689582347869873, 0.6275519132614136, 0.9182078838348389, 1.2088639736175537, 1.4995200634002686, 1.7901761531829834, 2.0808322429656982, 2.371488094329834, 2.662144184112549, 2.9528002738952637, 3.2434563636779785, 3.5341124534606934, 3.824768543243408, 4.115424633026123, 4.406080722808838, 4.696736812591553, 4.987392902374268, 5.278048992156982, 5.568704605102539, 5.859360694885254, 6.150016784667969, 6.440672874450684, 6.731328964233398, 7.021985054016113, 7.312641143798828, 7.603297233581543, 7.893953323364258, 8.184609413146973, 8.475265502929688]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 10.0, 13.0, 19.0, 14.0, 44.0, 45.0, 73.0, 116.0, 150.0, 217.0, 270.0, 423.0, 612.0, 1048.0, 1654.0, 2712.0, 4712.0, 8903.0, 18180.0, 39214.0, 90287.0, 203565.0, 311141.0, 200060.0, 88160.0, 38625.0, 17666.0, 8605.0, 4742.0, 2568.0, 1579.0, 1019.0, 647.0, 450.0, 312.0, 200.0, 144.0, 103.0, 75.0, 45.0, 43.0, 24.0, 21.0, 14.0, 11.0, 6.0, 3.0, 2.0, 3.0, 3.0], "bins": [-4.3359375, -4.21710205078125, -4.0982666015625, -3.97943115234375, -3.860595703125, -3.74176025390625, -3.6229248046875, -3.50408935546875, -3.38525390625, -3.26641845703125, -3.1475830078125, -3.02874755859375, -2.909912109375, -2.79107666015625, -2.6722412109375, -2.55340576171875, -2.4345703125, -2.31573486328125, -2.1968994140625, -2.07806396484375, -1.959228515625, -1.84039306640625, -1.7215576171875, -1.60272216796875, -1.48388671875, -1.36505126953125, -1.2462158203125, -1.12738037109375, -1.008544921875, -0.88970947265625, -0.7708740234375, -0.65203857421875, -0.533203125, -0.41436767578125, -0.2955322265625, -0.17669677734375, -0.057861328125, 0.06097412109375, 0.1798095703125, 0.29864501953125, 0.41748046875, 0.53631591796875, 0.6551513671875, 0.77398681640625, 0.892822265625, 1.01165771484375, 1.1304931640625, 1.24932861328125, 1.3681640625, 1.48699951171875, 1.6058349609375, 1.72467041015625, 1.843505859375, 1.96234130859375, 2.0811767578125, 2.20001220703125, 2.31884765625, 2.43768310546875, 2.5565185546875, 2.67535400390625, 2.794189453125, 2.91302490234375, 3.0318603515625, 3.15069580078125, 3.26953125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 8.0, 6.0, 6.0, 8.0, 6.0, 11.0, 15.0, 14.0, 21.0, 19.0, 15.0, 24.0, 37.0, 27.0, 26.0, 37.0, 45.0, 41.0, 33.0, 44.0, 40.0, 36.0, 31.0, 39.0, 43.0, 36.0, 43.0, 34.0, 36.0, 24.0, 30.0, 20.0, 22.0, 23.0, 17.0, 13.0, 17.0, 16.0, 5.0, 6.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-10.875, -10.56005859375, -10.2451171875, -9.93017578125, -9.615234375, -9.30029296875, -8.9853515625, -8.67041015625, -8.35546875, -8.04052734375, -7.7255859375, -7.41064453125, -7.095703125, -6.78076171875, -6.4658203125, -6.15087890625, -5.8359375, -5.52099609375, -5.2060546875, -4.89111328125, -4.576171875, -4.26123046875, -3.9462890625, -3.63134765625, -3.31640625, -3.00146484375, -2.6865234375, -2.37158203125, -2.056640625, -1.74169921875, -1.4267578125, -1.11181640625, -0.796875, -0.48193359375, -0.1669921875, 0.14794921875, 0.462890625, 0.77783203125, 1.0927734375, 1.40771484375, 1.72265625, 2.03759765625, 2.3525390625, 2.66748046875, 2.982421875, 3.29736328125, 3.6123046875, 3.92724609375, 4.2421875, 4.55712890625, 4.8720703125, 5.18701171875, 5.501953125, 5.81689453125, 6.1318359375, 6.44677734375, 6.76171875, 7.07666015625, 7.3916015625, 7.70654296875, 8.021484375, 8.33642578125, 8.6513671875, 8.96630859375, 9.28125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 15.0, 24.0, 26.0, 25.0, 36.0, 73.0, 123.0, 204.0, 302.0, 563.0, 1060.0, 2104.0, 4862.0, 13154.0, 54536.0, 918758.0, 34910.0, 10030.0, 3780.0, 1742.0, 932.0, 509.0, 278.0, 161.0, 107.0, 69.0, 47.0, 32.0, 27.0, 10.0, 17.0, 5.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.87451171875, -8.5380859375, -8.20166015625, -7.865234375, -7.52880859375, -7.1923828125, -6.85595703125, -6.51953125, -6.18310546875, -5.8466796875, -5.51025390625, -5.173828125, -4.83740234375, -4.5009765625, -4.16455078125, -3.828125, -3.49169921875, -3.1552734375, -2.81884765625, -2.482421875, -2.14599609375, -1.8095703125, -1.47314453125, -1.13671875, -0.80029296875, -0.4638671875, -0.12744140625, 0.208984375, 0.54541015625, 0.8818359375, 1.21826171875, 1.5546875, 1.89111328125, 2.2275390625, 2.56396484375, 2.900390625, 3.23681640625, 3.5732421875, 3.90966796875, 4.24609375, 4.58251953125, 4.9189453125, 5.25537109375, 5.591796875, 5.92822265625, 6.2646484375, 6.60107421875, 6.9375, 7.27392578125, 7.6103515625, 7.94677734375, 8.283203125, 8.61962890625, 8.9560546875, 9.29248046875, 9.62890625, 9.96533203125, 10.3017578125, 10.63818359375, 10.974609375, 11.31103515625, 11.6474609375, 11.98388671875, 12.3203125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 7.0, 7.0, 3.0, 10.0, 5.0, 18.0, 12.0, 15.0, 17.0, 18.0, 19.0, 25.0, 27.0, 48.0, 32.0, 45.0, 47.0, 38.0, 51.0, 44.0, 51.0, 48.0, 50.0, 40.0, 34.0, 44.0, 40.0, 31.0, 31.0, 26.0, 21.0, 21.0, 14.0, 19.0, 7.0, 14.0, 14.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.58685302734375, -8.3299560546875, -8.07305908203125, -7.816162109375, -7.55926513671875, -7.3023681640625, -7.04547119140625, -6.78857421875, -6.53167724609375, -6.2747802734375, -6.01788330078125, -5.760986328125, -5.50408935546875, -5.2471923828125, -4.99029541015625, -4.7333984375, -4.47650146484375, -4.2196044921875, -3.96270751953125, -3.705810546875, -3.44891357421875, -3.1920166015625, -2.93511962890625, -2.67822265625, -2.42132568359375, -2.1644287109375, -1.90753173828125, -1.650634765625, -1.39373779296875, -1.1368408203125, -0.87994384765625, -0.623046875, -0.36614990234375, -0.1092529296875, 0.14764404296875, 0.404541015625, 0.66143798828125, 0.9183349609375, 1.17523193359375, 1.43212890625, 1.68902587890625, 1.9459228515625, 2.20281982421875, 2.459716796875, 2.71661376953125, 2.9735107421875, 3.23040771484375, 3.4873046875, 3.74420166015625, 4.0010986328125, 4.25799560546875, 4.514892578125, 4.77178955078125, 5.0286865234375, 5.28558349609375, 5.54248046875, 5.79937744140625, 6.0562744140625, 6.31317138671875, 6.570068359375, 6.82696533203125, 7.0838623046875, 7.34075927734375, 7.59765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 8.0, 11.0, 14.0, 14.0, 24.0, 37.0, 57.0, 84.0, 110.0, 181.0, 260.0, 393.0, 636.0, 1040.0, 1646.0, 2665.0, 5066.0, 9547.0, 19970.0, 62850.0, 874084.0, 36882.0, 15130.0, 7784.0, 3936.0, 2373.0, 1329.0, 843.0, 508.0, 360.0, 241.0, 151.0, 85.0, 70.0, 52.0, 40.0, 15.0, 11.0, 9.0, 11.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.189453125, -2.1256866455078125, -2.061920166015625, -1.9981536865234375, -1.93438720703125, -1.8706207275390625, -1.806854248046875, -1.7430877685546875, -1.6793212890625, -1.6155548095703125, -1.551788330078125, -1.4880218505859375, -1.42425537109375, -1.3604888916015625, -1.296722412109375, -1.2329559326171875, -1.169189453125, -1.1054229736328125, -1.041656494140625, -0.9778900146484375, -0.91412353515625, -0.8503570556640625, -0.786590576171875, -0.7228240966796875, -0.6590576171875, -0.5952911376953125, -0.531524658203125, -0.4677581787109375, -0.40399169921875, -0.3402252197265625, -0.276458740234375, -0.2126922607421875, -0.14892578125, -0.0851593017578125, -0.021392822265625, 0.0423736572265625, 0.10614013671875, 0.1699066162109375, 0.233673095703125, 0.2974395751953125, 0.3612060546875, 0.4249725341796875, 0.488739013671875, 0.5525054931640625, 0.61627197265625, 0.6800384521484375, 0.743804931640625, 0.8075714111328125, 0.871337890625, 0.9351043701171875, 0.998870849609375, 1.0626373291015625, 1.12640380859375, 1.1901702880859375, 1.253936767578125, 1.3177032470703125, 1.3814697265625, 1.4452362060546875, 1.509002685546875, 1.5727691650390625, 1.63653564453125, 1.7003021240234375, 1.764068603515625, 1.8278350830078125, 1.8916015625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 12.0, 15.0, 15.0, 30.0, 22.0, 27.0, 47.0, 57.0, 66.0, 81.0, 78.0, 98.0, 105.0, 65.0, 57.0, 55.0, 29.0, 37.0, 23.0, 14.0, 13.0, 12.0, 8.0, 6.0, 7.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.00011229515075683594, -0.00010942574590444565, -0.00010655634105205536, -0.00010368693619966507, -0.00010081753134727478, -9.794812649488449e-05, -9.50787216424942e-05, -9.220931679010391e-05, -8.933991193771362e-05, -8.647050708532333e-05, -8.360110223293304e-05, -8.073169738054276e-05, -7.786229252815247e-05, -7.499288767576218e-05, -7.212348282337189e-05, -6.92540779709816e-05, -6.638467311859131e-05, -6.351526826620102e-05, -6.064586341381073e-05, -5.777645856142044e-05, -5.490705370903015e-05, -5.203764885663986e-05, -4.916824400424957e-05, -4.6298839151859283e-05, -4.3429434299468994e-05, -4.0560029447078705e-05, -3.7690624594688416e-05, -3.4821219742298126e-05, -3.195181488990784e-05, -2.9082410037517548e-05, -2.6213005185127258e-05, -2.334360033273697e-05, -2.047419548034668e-05, -1.760479062795639e-05, -1.4735385775566101e-05, -1.1865980923175812e-05, -8.996576070785522e-06, -6.127171218395233e-06, -3.257766366004944e-06, -3.8836151361465454e-07, 2.4810433387756348e-06, 5.350448191165924e-06, 8.219853043556213e-06, 1.1089257895946503e-05, 1.3958662748336792e-05, 1.682806760072708e-05, 1.969747245311737e-05, 2.256687730550766e-05, 2.543628215789795e-05, 2.830568701028824e-05, 3.117509186267853e-05, 3.404449671506882e-05, 3.6913901567459106e-05, 3.9783306419849396e-05, 4.2652711272239685e-05, 4.5522116124629974e-05, 4.8391520977020264e-05, 5.126092582941055e-05, 5.413033068180084e-05, 5.699973553419113e-05, 5.986914038658142e-05, 6.273854523897171e-05, 6.5607950091362e-05, 6.847735494375229e-05, 7.134675979614258e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 10.0, 32.0, 38.0, 48.0, 56.0, 90.0, 137.0, 187.0, 297.0, 430.0, 621.0, 1081.0, 1589.0, 2551.0, 4306.0, 7137.0, 11570.0, 19834.0, 35561.0, 63153.0, 115840.0, 203751.0, 238351.0, 150283.0, 82825.0, 45326.0, 25583.0, 14752.0, 8783.0, 5358.0, 3193.0, 2026.0, 1278.0, 829.0, 526.0, 349.0, 246.0, 143.0, 107.0, 72.0, 56.0, 39.0, 30.0, 19.0, 14.0, 9.0, 11.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.783203125, -0.7588958740234375, -0.734588623046875, -0.7102813720703125, -0.68597412109375, -0.6616668701171875, -0.637359619140625, -0.6130523681640625, -0.5887451171875, -0.5644378662109375, -0.540130615234375, -0.5158233642578125, -0.49151611328125, -0.4672088623046875, -0.442901611328125, -0.4185943603515625, -0.394287109375, -0.3699798583984375, -0.345672607421875, -0.3213653564453125, -0.29705810546875, -0.2727508544921875, -0.248443603515625, -0.2241363525390625, -0.1998291015625, -0.1755218505859375, -0.151214599609375, -0.1269073486328125, -0.10260009765625, -0.0782928466796875, -0.053985595703125, -0.0296783447265625, -0.00537109375, 0.0189361572265625, 0.043243408203125, 0.0675506591796875, 0.09185791015625, 0.1161651611328125, 0.140472412109375, 0.1647796630859375, 0.1890869140625, 0.2133941650390625, 0.237701416015625, 0.2620086669921875, 0.28631591796875, 0.3106231689453125, 0.334930419921875, 0.3592376708984375, 0.383544921875, 0.4078521728515625, 0.432159423828125, 0.4564666748046875, 0.48077392578125, 0.5050811767578125, 0.529388427734375, 0.5536956787109375, 0.5780029296875, 0.6023101806640625, 0.626617431640625, 0.6509246826171875, 0.67523193359375, 0.6995391845703125, 0.723846435546875, 0.7481536865234375, 0.7724609375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 17.0, 16.0, 17.0, 14.0, 19.0, 13.0, 30.0, 31.0, 24.0, 35.0, 43.0, 52.0, 60.0, 75.0, 74.0, 75.0, 63.0, 59.0, 48.0, 44.0, 33.0, 28.0, 30.0, 6.0, 22.0, 11.0, 12.0, 6.0, 6.0, 4.0, 5.0, 2.0, 2.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.386962890625, -0.37703895568847656, -0.3671150207519531, -0.3571910858154297, -0.34726715087890625, -0.3373432159423828, -0.3274192810058594, -0.31749534606933594, -0.3075714111328125, -0.29764747619628906, -0.2877235412597656, -0.2777996063232422, -0.26787567138671875, -0.2579517364501953, -0.24802780151367188, -0.23810386657714844, -0.228179931640625, -0.21825599670410156, -0.20833206176757812, -0.1984081268310547, -0.18848419189453125, -0.1785602569580078, -0.16863632202148438, -0.15871238708496094, -0.1487884521484375, -0.13886451721191406, -0.12894058227539062, -0.11901664733886719, -0.10909271240234375, -0.09916877746582031, -0.08924484252929688, -0.07932090759277344, -0.06939697265625, -0.05947303771972656, -0.049549102783203125, -0.03962516784667969, -0.02970123291015625, -0.019777297973632812, -0.009853363037109375, 7.05718994140625e-05, 0.0099945068359375, 0.019918441772460938, 0.029842376708984375, 0.03976631164550781, 0.04969024658203125, 0.05961418151855469, 0.06953811645507812, 0.07946205139160156, 0.089385986328125, 0.09930992126464844, 0.10923385620117188, 0.11915779113769531, 0.12908172607421875, 0.1390056610107422, 0.14892959594726562, 0.15885353088378906, 0.1687774658203125, 0.17870140075683594, 0.18862533569335938, 0.1985492706298828, 0.20847320556640625, 0.2183971405029297, 0.22832107543945312, 0.23824501037597656, 0.2481689453125]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 4.0, 6.0, 4.0, 11.0, 7.0, 16.0, 13.0, 16.0, 23.0, 36.0, 41.0, 47.0, 56.0, 79.0, 71.0, 61.0, 69.0, 63.0, 65.0, 56.0, 53.0, 39.0, 32.0, 24.0, 18.0, 21.0, 22.0, 10.0, 8.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-16.004314422607422, -15.583285331726074, -15.16225528717041, -14.741226196289062, -14.320196151733398, -13.89916706085205, -13.478137969970703, -13.057107925415039, -12.636078834533691, -12.215049743652344, -11.79401969909668, -11.372990608215332, -10.951961517333984, -10.53093147277832, -10.109902381896973, -9.688873291015625, -9.267843246459961, -8.846814155578613, -8.42578411102295, -8.004755020141602, -7.583725452423096, -7.16269588470459, -6.741666793823242, -6.320637226104736, -5.8996076583862305, -5.478578090667725, -5.057548522949219, -4.636519432067871, -4.215489864349365, -3.7944602966308594, -3.3734309673309326, -2.952401638031006, -2.5313720703125, -2.110342502593994, -1.6893131732940674, -1.268283724784851, -0.8472542762756348, -0.4262247085571289, -0.0051953792572021484, 0.4158339500427246, 0.8368635177612305, 1.2578929662704468, 1.678922414779663, 2.09995174407959, 2.5209813117980957, 2.9420108795166016, 3.3630402088165283, 3.784069538116455, 4.205099105834961, 4.626128673553467, 5.047158241271973, 5.46818733215332, 5.889216899871826, 6.310246467590332, 6.73127555847168, 7.1523051261901855, 7.573334693908691, 7.994364261627197, 8.415393829345703, 8.83642292022705, 9.257452011108398, 9.678482055664062, 10.09951114654541, 10.520540237426758, 10.941570281982422]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 4.0, 9.0, 6.0, 6.0, 9.0, 4.0, 16.0, 13.0, 21.0, 22.0, 29.0, 17.0, 26.0, 21.0, 40.0, 36.0, 30.0, 42.0, 39.0, 36.0, 34.0, 43.0, 35.0, 45.0, 32.0, 30.0, 37.0, 30.0, 40.0, 31.0, 30.0, 22.0, 19.0, 21.0, 21.0, 20.0, 21.0, 14.0, 9.0, 7.0, 6.0, 14.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-10.072715759277344, -9.782402038574219, -9.492088317871094, -9.201774597167969, -8.911460876464844, -8.621147155761719, -8.330833435058594, -8.040519714355469, -7.750205993652344, -7.459892272949219, -7.169578552246094, -6.879264831542969, -6.588951110839844, -6.298637390136719, -6.008323669433594, -5.718009948730469, -5.4276957511901855, -5.1373820304870605, -4.8470683097839355, -4.5567545890808105, -4.2664408683776855, -3.9761271476745605, -3.6858131885528564, -3.3954994678497314, -3.1051857471466064, -2.8148720264434814, -2.5245583057403564, -2.2342443466186523, -1.943930745124817, -1.653617024421692, -1.3633031845092773, -1.0729894638061523, -0.7826757431030273, -0.49236199259757996, -0.20204824209213257, 0.08826553821563721, 0.3785792589187622, 0.6688929796218872, 0.9592068195343018, 1.2495205402374268, 1.5398342609405518, 1.8301479816436768, 2.1204617023468018, 2.410775661468506, 2.701089382171631, 2.991403102874756, 3.281716823577881, 3.572030544281006, 3.862344264984131, 4.152657985687256, 4.442971706390381, 4.733285427093506, 5.023599147796631, 5.313912868499756, 5.604227066040039, 5.894540786743164, 6.184854507446289, 6.475168228149414, 6.765481948852539, 7.055795669555664, 7.346109390258789, 7.636423110961914, 7.926736831665039, 8.217050552368164, 8.507364273071289]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 4.0, 3.0, 13.0, 17.0, 19.0, 46.0, 58.0, 89.0, 168.0, 242.0, 385.0, 608.0, 904.0, 1310.0, 2139.0, 3544.0, 5476.0, 8959.0, 14602.0, 24465.0, 40214.0, 66458.0, 105616.0, 149499.0, 173452.0, 155192.0, 112068.0, 71506.0, 43724.0, 26478.0, 15744.0, 9540.0, 5889.0, 3682.0, 2274.0, 1525.0, 958.0, 611.0, 376.0, 255.0, 150.0, 107.0, 59.0, 48.0, 28.0, 21.0, 14.0, 12.0, 6.0, 1.0, 2.0, 3.0], "bins": [-8.890625, -8.64752197265625, -8.4044189453125, -8.16131591796875, -7.918212890625, -7.67510986328125, -7.4320068359375, -7.18890380859375, -6.94580078125, -6.70269775390625, -6.4595947265625, -6.21649169921875, -5.973388671875, -5.73028564453125, -5.4871826171875, -5.24407958984375, -5.0009765625, -4.75787353515625, -4.5147705078125, -4.27166748046875, -4.028564453125, -3.78546142578125, -3.5423583984375, -3.29925537109375, -3.05615234375, -2.81304931640625, -2.5699462890625, -2.32684326171875, -2.083740234375, -1.84063720703125, -1.5975341796875, -1.35443115234375, -1.111328125, -0.86822509765625, -0.6251220703125, -0.38201904296875, -0.138916015625, 0.10418701171875, 0.3472900390625, 0.59039306640625, 0.83349609375, 1.07659912109375, 1.3197021484375, 1.56280517578125, 1.805908203125, 2.04901123046875, 2.2921142578125, 2.53521728515625, 2.7783203125, 3.02142333984375, 3.2645263671875, 3.50762939453125, 3.750732421875, 3.99383544921875, 4.2369384765625, 4.48004150390625, 4.72314453125, 4.96624755859375, 5.2093505859375, 5.45245361328125, 5.695556640625, 5.93865966796875, 6.1817626953125, 6.42486572265625, 6.66796875]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 10.0, 3.0, 4.0, 6.0, 13.0, 11.0, 18.0, 27.0, 23.0, 21.0, 30.0, 28.0, 30.0, 38.0, 38.0, 29.0, 33.0, 31.0, 45.0, 47.0, 37.0, 43.0, 35.0, 33.0, 48.0, 29.0, 39.0, 31.0, 24.0, 30.0, 23.0, 16.0, 23.0, 25.0, 12.0, 8.0, 12.0, 8.0, 10.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0], "bins": [-10.6640625, -10.3746337890625, -10.085205078125, -9.7957763671875, -9.50634765625, -9.2169189453125, -8.927490234375, -8.6380615234375, -8.3486328125, -8.0592041015625, -7.769775390625, -7.4803466796875, -7.19091796875, -6.9014892578125, -6.612060546875, -6.3226318359375, -6.033203125, -5.7437744140625, -5.454345703125, -5.1649169921875, -4.87548828125, -4.5860595703125, -4.296630859375, -4.0072021484375, -3.7177734375, -3.4283447265625, -3.138916015625, -2.8494873046875, -2.56005859375, -2.2706298828125, -1.981201171875, -1.6917724609375, -1.40234375, -1.1129150390625, -0.823486328125, -0.5340576171875, -0.24462890625, 0.0447998046875, 0.334228515625, 0.6236572265625, 0.9130859375, 1.2025146484375, 1.491943359375, 1.7813720703125, 2.07080078125, 2.3602294921875, 2.649658203125, 2.9390869140625, 3.228515625, 3.5179443359375, 3.807373046875, 4.0968017578125, 4.38623046875, 4.6756591796875, 4.965087890625, 5.2545166015625, 5.5439453125, 5.8333740234375, 6.122802734375, 6.4122314453125, 6.70166015625, 6.9910888671875, 7.280517578125, 7.5699462890625, 7.859375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 10.0, 11.0, 24.0, 16.0, 32.0, 41.0, 61.0, 121.0, 177.0, 288.0, 436.0, 662.0, 1101.0, 1847.0, 3151.0, 5376.0, 9346.0, 16991.0, 30355.0, 54934.0, 94352.0, 147674.0, 188011.0, 178915.0, 129850.0, 80134.0, 46093.0, 25298.0, 14002.0, 7861.0, 4576.0, 2659.0, 1582.0, 956.0, 590.0, 360.0, 240.0, 151.0, 91.0, 61.0, 27.0, 35.0, 18.0, 11.0, 13.0, 12.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.3497314453125, -6.136962890625, -5.9241943359375, -5.71142578125, -5.4986572265625, -5.285888671875, -5.0731201171875, -4.8603515625, -4.6475830078125, -4.434814453125, -4.2220458984375, -4.00927734375, -3.7965087890625, -3.583740234375, -3.3709716796875, -3.158203125, -2.9454345703125, -2.732666015625, -2.5198974609375, -2.30712890625, -2.0943603515625, -1.881591796875, -1.6688232421875, -1.4560546875, -1.2432861328125, -1.030517578125, -0.8177490234375, -0.60498046875, -0.3922119140625, -0.179443359375, 0.0333251953125, 0.24609375, 0.4588623046875, 0.671630859375, 0.8843994140625, 1.09716796875, 1.3099365234375, 1.522705078125, 1.7354736328125, 1.9482421875, 2.1610107421875, 2.373779296875, 2.5865478515625, 2.79931640625, 3.0120849609375, 3.224853515625, 3.4376220703125, 3.650390625, 3.8631591796875, 4.075927734375, 4.2886962890625, 4.50146484375, 4.7142333984375, 4.927001953125, 5.1397705078125, 5.3525390625, 5.5653076171875, 5.778076171875, 5.9908447265625, 6.20361328125, 6.4163818359375, 6.629150390625, 6.8419189453125, 7.0546875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 6.0, 8.0, 4.0, 7.0, 16.0, 8.0, 12.0, 19.0, 27.0, 23.0, 40.0, 33.0, 33.0, 24.0, 44.0, 43.0, 45.0, 49.0, 35.0, 49.0, 50.0, 40.0, 45.0, 49.0, 27.0, 28.0, 35.0, 29.0, 17.0, 28.0, 31.0, 18.0, 20.0, 6.0, 9.0, 11.0, 11.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.65625, -5.4681396484375, -5.280029296875, -5.0919189453125, -4.90380859375, -4.7156982421875, -4.527587890625, -4.3394775390625, -4.1513671875, -3.9632568359375, -3.775146484375, -3.5870361328125, -3.39892578125, -3.2108154296875, -3.022705078125, -2.8345947265625, -2.646484375, -2.4583740234375, -2.270263671875, -2.0821533203125, -1.89404296875, -1.7059326171875, -1.517822265625, -1.3297119140625, -1.1416015625, -0.9534912109375, -0.765380859375, -0.5772705078125, -0.38916015625, -0.2010498046875, -0.012939453125, 0.1751708984375, 0.36328125, 0.5513916015625, 0.739501953125, 0.9276123046875, 1.11572265625, 1.3038330078125, 1.491943359375, 1.6800537109375, 1.8681640625, 2.0562744140625, 2.244384765625, 2.4324951171875, 2.62060546875, 2.8087158203125, 2.996826171875, 3.1849365234375, 3.373046875, 3.5611572265625, 3.749267578125, 3.9373779296875, 4.12548828125, 4.3135986328125, 4.501708984375, 4.6898193359375, 4.8779296875, 5.0660400390625, 5.254150390625, 5.4422607421875, 5.63037109375, 5.8184814453125, 6.006591796875, 6.1947021484375, 6.3828125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 18.0, 32.0, 44.0, 60.0, 98.0, 136.0, 234.0, 368.0, 649.0, 1099.0, 1994.0, 3631.0, 7327.0, 14096.0, 29433.0, 63175.0, 135720.0, 243809.0, 257010.0, 151426.0, 71817.0, 33261.0, 15818.0, 7902.0, 4139.0, 2179.0, 1226.0, 717.0, 427.0, 267.0, 146.0, 86.0, 62.0, 48.0, 32.0, 12.0, 14.0, 7.0, 6.0, 7.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.78515625, -6.54351806640625, -6.3018798828125, -6.06024169921875, -5.818603515625, -5.57696533203125, -5.3353271484375, -5.09368896484375, -4.85205078125, -4.61041259765625, -4.3687744140625, -4.12713623046875, -3.885498046875, -3.64385986328125, -3.4022216796875, -3.16058349609375, -2.9189453125, -2.67730712890625, -2.4356689453125, -2.19403076171875, -1.952392578125, -1.71075439453125, -1.4691162109375, -1.22747802734375, -0.98583984375, -0.74420166015625, -0.5025634765625, -0.26092529296875, -0.019287109375, 0.22235107421875, 0.4639892578125, 0.70562744140625, 0.947265625, 1.18890380859375, 1.4305419921875, 1.67218017578125, 1.913818359375, 2.15545654296875, 2.3970947265625, 2.63873291015625, 2.88037109375, 3.12200927734375, 3.3636474609375, 3.60528564453125, 3.846923828125, 4.08856201171875, 4.3302001953125, 4.57183837890625, 4.8134765625, 5.05511474609375, 5.2967529296875, 5.53839111328125, 5.780029296875, 6.02166748046875, 6.2633056640625, 6.50494384765625, 6.74658203125, 6.98822021484375, 7.2298583984375, 7.47149658203125, 7.713134765625, 7.95477294921875, 8.1964111328125, 8.43804931640625, 8.6796875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 7.0, 11.0, 10.0, 8.0, 11.0, 19.0, 29.0, 34.0, 38.0, 49.0, 69.0, 80.0, 63.0, 62.0, 85.0, 67.0, 67.0, 59.0, 50.0, 43.0, 35.0, 29.0, 21.0, 21.0, 11.0, 6.0, 10.0, 3.0, 2.0, 5.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006189346313476562, -0.000600174069404602, -0.0005814135074615479, -0.0005626529455184937, -0.0005438923835754395, -0.0005251318216323853, -0.0005063712596893311, -0.00048761069774627686, -0.00046885013580322266, -0.00045008957386016846, -0.00043132901191711426, -0.00041256844997406006, -0.00039380788803100586, -0.00037504732608795166, -0.00035628676414489746, -0.00033752620220184326, -0.00031876564025878906, -0.00030000507831573486, -0.00028124451637268066, -0.00026248395442962646, -0.00024372339248657227, -0.00022496283054351807, -0.00020620226860046387, -0.00018744170665740967, -0.00016868114471435547, -0.00014992058277130127, -0.00013116002082824707, -0.00011239945888519287, -9.363889694213867e-05, -7.487833499908447e-05, -5.6117773056030273e-05, -3.7357211112976074e-05, -1.8596649169921875e-05, 1.6391277313232422e-07, 1.8924474716186523e-05, 3.768503665924072e-05, 5.644559860229492e-05, 7.520616054534912e-05, 9.396672248840332e-05, 0.00011272728443145752, 0.00013148784637451172, 0.00015024840831756592, 0.00016900897026062012, 0.00018776953220367432, 0.00020653009414672852, 0.00022529065608978271, 0.00024405121803283691, 0.0002628117799758911, 0.0002815723419189453, 0.0003003329038619995, 0.0003190934658050537, 0.0003378540277481079, 0.0003566145896911621, 0.0003753751516342163, 0.0003941357135772705, 0.0004128962755203247, 0.0004316568374633789, 0.0004504173994064331, 0.0004691779613494873, 0.0004879385232925415, 0.0005066990852355957, 0.0005254596471786499, 0.0005442202091217041, 0.0005629807710647583, 0.0005817413330078125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 13.0, 6.0, 14.0, 28.0, 32.0, 47.0, 93.0, 125.0, 229.0, 352.0, 596.0, 1052.0, 1901.0, 3685.0, 7880.0, 17664.0, 43572.0, 112566.0, 250307.0, 309145.0, 177346.0, 70987.0, 27756.0, 11643.0, 5430.0, 2621.0, 1414.0, 764.0, 454.0, 292.0, 190.0, 124.0, 73.0, 52.0, 27.0, 24.0, 19.0, 14.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.25, -8.97998046875, -8.7099609375, -8.43994140625, -8.169921875, -7.89990234375, -7.6298828125, -7.35986328125, -7.08984375, -6.81982421875, -6.5498046875, -6.27978515625, -6.009765625, -5.73974609375, -5.4697265625, -5.19970703125, -4.9296875, -4.65966796875, -4.3896484375, -4.11962890625, -3.849609375, -3.57958984375, -3.3095703125, -3.03955078125, -2.76953125, -2.49951171875, -2.2294921875, -1.95947265625, -1.689453125, -1.41943359375, -1.1494140625, -0.87939453125, -0.609375, -0.33935546875, -0.0693359375, 0.20068359375, 0.470703125, 0.74072265625, 1.0107421875, 1.28076171875, 1.55078125, 1.82080078125, 2.0908203125, 2.36083984375, 2.630859375, 2.90087890625, 3.1708984375, 3.44091796875, 3.7109375, 3.98095703125, 4.2509765625, 4.52099609375, 4.791015625, 5.06103515625, 5.3310546875, 5.60107421875, 5.87109375, 6.14111328125, 6.4111328125, 6.68115234375, 6.951171875, 7.22119140625, 7.4912109375, 7.76123046875, 8.03125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 5.0, 9.0, 14.0, 13.0, 21.0, 23.0, 26.0, 29.0, 57.0, 53.0, 67.0, 77.0, 76.0, 81.0, 71.0, 60.0, 74.0, 57.0, 27.0, 27.0, 34.0, 19.0, 15.0, 11.0, 12.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.32421875, -3.2415313720703125, -3.158843994140625, -3.0761566162109375, -2.99346923828125, -2.9107818603515625, -2.828094482421875, -2.7454071044921875, -2.6627197265625, -2.5800323486328125, -2.497344970703125, -2.4146575927734375, -2.33197021484375, -2.2492828369140625, -2.166595458984375, -2.0839080810546875, -2.001220703125, -1.9185333251953125, -1.835845947265625, -1.7531585693359375, -1.67047119140625, -1.5877838134765625, -1.505096435546875, -1.4224090576171875, -1.3397216796875, -1.2570343017578125, -1.174346923828125, -1.0916595458984375, -1.00897216796875, -0.9262847900390625, -0.843597412109375, -0.7609100341796875, -0.67822265625, -0.5955352783203125, -0.512847900390625, -0.4301605224609375, -0.34747314453125, -0.2647857666015625, -0.182098388671875, -0.0994110107421875, -0.0167236328125, 0.0659637451171875, 0.148651123046875, 0.2313385009765625, 0.31402587890625, 0.3967132568359375, 0.479400634765625, 0.5620880126953125, 0.644775390625, 0.7274627685546875, 0.810150146484375, 0.8928375244140625, 0.97552490234375, 1.0582122802734375, 1.140899658203125, 1.2235870361328125, 1.3062744140625, 1.3889617919921875, 1.471649169921875, 1.5543365478515625, 1.63702392578125, 1.7197113037109375, 1.802398681640625, 1.8850860595703125, 1.9677734375]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 7.0, 8.0, 6.0, 4.0, 10.0, 19.0, 11.0, 14.0, 29.0, 32.0, 34.0, 45.0, 51.0, 58.0, 77.0, 70.0, 69.0, 64.0, 68.0, 59.0, 44.0, 37.0, 40.0, 29.0, 17.0, 23.0, 17.0, 16.0, 13.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.85523509979248, -13.458773612976074, -13.062311172485352, -12.665849685668945, -12.269388198852539, -11.872926712036133, -11.476465225219727, -11.080002784729004, -10.683541297912598, -10.287079811096191, -9.890617370605469, -9.494155883789062, -9.097694396972656, -8.70123291015625, -8.304771423339844, -7.908308982849121, -7.511847496032715, -7.115386009216309, -6.718924045562744, -6.32246208190918, -5.926000595092773, -5.529539108276367, -5.133077144622803, -4.736615180969238, -4.340153694152832, -3.9436919689178467, -3.5472302436828613, -3.150768518447876, -2.7543067932128906, -2.3578450679779053, -1.96138334274292, -1.5649216175079346, -1.1684589385986328, -0.7719972133636475, -0.3755354881286621, 0.020926237106323242, 0.4173879623413086, 0.813849687576294, 1.2103114128112793, 1.6067731380462646, 2.00323486328125, 2.3996965885162354, 2.7961583137512207, 3.192620038986206, 3.5890817642211914, 3.9855434894561768, 4.382005214691162, 4.778467178344727, 5.174928665161133, 5.571390151977539, 5.9678521156311035, 6.364314079284668, 6.760775566101074, 7.1572370529174805, 7.553699016571045, 7.950160980224609, 8.346622467041016, 8.743083953857422, 9.139545440673828, 9.53600788116455, 9.932469367980957, 10.328930854797363, 10.725393295288086, 11.121854782104492, 11.518316268920898]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 6.0, 2.0, 2.0, 5.0, 8.0, 7.0, 7.0, 11.0, 11.0, 13.0, 14.0, 22.0, 20.0, 16.0, 33.0, 30.0, 25.0, 36.0, 31.0, 25.0, 35.0, 38.0, 28.0, 42.0, 30.0, 37.0, 33.0, 38.0, 31.0, 42.0, 37.0, 38.0, 24.0, 33.0, 27.0, 21.0, 23.0, 18.0, 25.0, 10.0, 16.0, 8.0, 12.0, 8.0, 7.0, 4.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0], "bins": [-9.883431434631348, -9.607135772705078, -9.330839157104492, -9.054543495178223, -8.778246879577637, -8.501951217651367, -8.225654602050781, -7.949358940124512, -7.673062801361084, -7.396766662597656, -7.1204705238342285, -6.844174385070801, -6.567878723144531, -6.291582107543945, -6.015286445617676, -5.738990306854248, -5.46269416809082, -5.186398029327393, -4.910101890563965, -4.633805751800537, -4.357509613037109, -4.08121395111084, -3.804917812347412, -3.5286216735839844, -3.2523255348205566, -2.976029396057129, -2.699733257293701, -2.4234373569488525, -2.147141218185425, -1.870845079421997, -1.5945490598678589, -1.3182530403137207, -1.0419573783874512, -0.7656612992286682, -0.48936522006988525, -0.2130691409111023, 0.06322693824768066, 0.3395230770111084, 0.6158190965652466, 0.8921151161193848, 1.1684112548828125, 1.4447073936462402, 1.7210034132003784, 1.9972994327545166, 2.2735955715179443, 2.549891710281372, 2.8261876106262207, 3.1024837493896484, 3.378779888153076, 3.655076026916504, 3.9313721656799316, 4.207668304443359, 4.483963966369629, 4.760260581970215, 5.036556243896484, 5.312852382659912, 5.58914852142334, 5.865444660186768, 6.141740798950195, 6.418036937713623, 6.694333076477051, 6.97062873840332, 7.246924877166748, 7.523221015930176, 7.7995171546936035]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 9.0, 16.0, 26.0, 40.0, 37.0, 64.0, 94.0, 119.0, 174.0, 258.0, 402.0, 557.0, 798.0, 1277.0, 2043.0, 3303.0, 5820.0, 11242.0, 23751.0, 58877.0, 173961.0, 589065.0, 1438158.0, 1233062.0, 434579.0, 129696.0, 45350.0, 19050.0, 9501.0, 4896.0, 2748.0, 1788.0, 1137.0, 676.0, 552.0, 338.0, 238.0, 152.0, 117.0, 83.0, 70.0, 43.0, 32.0, 19.0, 17.0, 14.0, 17.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-13.5234375, -13.09912109375, -12.6748046875, -12.25048828125, -11.826171875, -11.40185546875, -10.9775390625, -10.55322265625, -10.12890625, -9.70458984375, -9.2802734375, -8.85595703125, -8.431640625, -8.00732421875, -7.5830078125, -7.15869140625, -6.734375, -6.31005859375, -5.8857421875, -5.46142578125, -5.037109375, -4.61279296875, -4.1884765625, -3.76416015625, -3.33984375, -2.91552734375, -2.4912109375, -2.06689453125, -1.642578125, -1.21826171875, -0.7939453125, -0.36962890625, 0.0546875, 0.47900390625, 0.9033203125, 1.32763671875, 1.751953125, 2.17626953125, 2.6005859375, 3.02490234375, 3.44921875, 3.87353515625, 4.2978515625, 4.72216796875, 5.146484375, 5.57080078125, 5.9951171875, 6.41943359375, 6.84375, 7.26806640625, 7.6923828125, 8.11669921875, 8.541015625, 8.96533203125, 9.3896484375, 9.81396484375, 10.23828125, 10.66259765625, 11.0869140625, 11.51123046875, 11.935546875, 12.35986328125, 12.7841796875, 13.20849609375, 13.6328125]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 2.0, 7.0, 6.0, 7.0, 8.0, 13.0, 7.0, 23.0, 21.0, 22.0, 27.0, 18.0, 30.0, 27.0, 31.0, 37.0, 30.0, 44.0, 43.0, 41.0, 38.0, 34.0, 30.0, 38.0, 36.0, 28.0, 31.0, 38.0, 36.0, 35.0, 26.0, 23.0, 21.0, 15.0, 23.0, 20.0, 13.0, 11.0, 6.0, 10.0, 7.0, 10.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-6.703125, -6.5133056640625, -6.323486328125, -6.1336669921875, -5.94384765625, -5.7540283203125, -5.564208984375, -5.3743896484375, -5.1845703125, -4.9947509765625, -4.804931640625, -4.6151123046875, -4.42529296875, -4.2354736328125, -4.045654296875, -3.8558349609375, -3.666015625, -3.4761962890625, -3.286376953125, -3.0965576171875, -2.90673828125, -2.7169189453125, -2.527099609375, -2.3372802734375, -2.1474609375, -1.9576416015625, -1.767822265625, -1.5780029296875, -1.38818359375, -1.1983642578125, -1.008544921875, -0.8187255859375, -0.62890625, -0.4390869140625, -0.249267578125, -0.0594482421875, 0.13037109375, 0.3201904296875, 0.510009765625, 0.6998291015625, 0.8896484375, 1.0794677734375, 1.269287109375, 1.4591064453125, 1.64892578125, 1.8387451171875, 2.028564453125, 2.2183837890625, 2.408203125, 2.5980224609375, 2.787841796875, 2.9776611328125, 3.16748046875, 3.3572998046875, 3.547119140625, 3.7369384765625, 3.9267578125, 4.1165771484375, 4.306396484375, 4.4962158203125, 4.68603515625, 4.8758544921875, 5.065673828125, 5.2554931640625, 5.4453125]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 2.0, 7.0, 10.0, 17.0, 20.0, 12.0, 24.0, 39.0, 53.0, 88.0, 109.0, 169.0, 226.0, 345.0, 531.0, 790.0, 1127.0, 1863.0, 3059.0, 5093.0, 9262.0, 17806.0, 39188.0, 99871.0, 315865.0, 1113535.0, 1681311.0, 610451.0, 175347.0, 61438.0, 25938.0, 12918.0, 6868.0, 4006.0, 2429.0, 1487.0, 959.0, 616.0, 440.0, 298.0, 191.0, 136.0, 95.0, 51.0, 63.0, 32.0, 26.0, 25.0, 16.0, 9.0, 8.0, 11.0, 3.0, 3.0, 1.0, 3.0, 2.0], "bins": [-16.65625, -16.1553955078125, -15.654541015625, -15.1536865234375, -14.65283203125, -14.1519775390625, -13.651123046875, -13.1502685546875, -12.6494140625, -12.1485595703125, -11.647705078125, -11.1468505859375, -10.64599609375, -10.1451416015625, -9.644287109375, -9.1434326171875, -8.642578125, -8.1417236328125, -7.640869140625, -7.1400146484375, -6.63916015625, -6.1383056640625, -5.637451171875, -5.1365966796875, -4.6357421875, -4.1348876953125, -3.634033203125, -3.1331787109375, -2.63232421875, -2.1314697265625, -1.630615234375, -1.1297607421875, -0.62890625, -0.1280517578125, 0.372802734375, 0.8736572265625, 1.37451171875, 1.8753662109375, 2.376220703125, 2.8770751953125, 3.3779296875, 3.8787841796875, 4.379638671875, 4.8804931640625, 5.38134765625, 5.8822021484375, 6.383056640625, 6.8839111328125, 7.384765625, 7.8856201171875, 8.386474609375, 8.8873291015625, 9.38818359375, 9.8890380859375, 10.389892578125, 10.8907470703125, 11.3916015625, 11.8924560546875, 12.393310546875, 12.8941650390625, 13.39501953125, 13.8958740234375, 14.396728515625, 14.8975830078125, 15.3984375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 9.0, 10.0, 11.0, 18.0, 13.0, 23.0, 24.0, 33.0, 48.0, 69.0, 91.0, 112.0, 163.0, 222.0, 227.0, 300.0, 353.0, 361.0, 379.0, 328.0, 305.0, 230.0, 170.0, 138.0, 90.0, 72.0, 56.0, 56.0, 38.0, 19.0, 18.0, 11.0, 18.0, 16.0, 8.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.26171875, -4.139190673828125, -4.01666259765625, -3.894134521484375, -3.7716064453125, -3.649078369140625, -3.52655029296875, -3.404022216796875, -3.281494140625, -3.158966064453125, -3.03643798828125, -2.913909912109375, -2.7913818359375, -2.668853759765625, -2.54632568359375, -2.423797607421875, -2.30126953125, -2.178741455078125, -2.05621337890625, -1.933685302734375, -1.8111572265625, -1.688629150390625, -1.56610107421875, -1.443572998046875, -1.321044921875, -1.198516845703125, -1.07598876953125, -0.953460693359375, -0.8309326171875, -0.708404541015625, -0.58587646484375, -0.463348388671875, -0.3408203125, -0.218292236328125, -0.09576416015625, 0.026763916015625, 0.1492919921875, 0.271820068359375, 0.39434814453125, 0.516876220703125, 0.639404296875, 0.761932373046875, 0.88446044921875, 1.006988525390625, 1.1295166015625, 1.252044677734375, 1.37457275390625, 1.497100830078125, 1.61962890625, 1.742156982421875, 1.86468505859375, 1.987213134765625, 2.1097412109375, 2.232269287109375, 2.35479736328125, 2.477325439453125, 2.599853515625, 2.722381591796875, 2.84490966796875, 2.967437744140625, 3.0899658203125, 3.212493896484375, 3.33502197265625, 3.457550048828125, 3.580078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 4.0, 3.0, 3.0, 6.0, 11.0, 13.0, 15.0, 25.0, 40.0, 33.0, 63.0, 49.0, 78.0, 91.0, 83.0, 77.0, 81.0, 72.0, 59.0, 40.0, 35.0, 22.0, 25.0, 14.0, 10.0, 11.0, 6.0, 6.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.674912452697754, -13.257781028747559, -12.840649604797363, -12.423518180847168, -12.006386756896973, -11.589255332946777, -11.172122955322266, -10.75499153137207, -10.337860107421875, -9.92072868347168, -9.503597259521484, -9.086465835571289, -8.669334411621094, -8.252202987670898, -7.835071086883545, -7.41793966293335, -7.0008087158203125, -6.583677291870117, -6.166545867919922, -5.749414443969727, -5.332283020019531, -4.915151596069336, -4.498019695281982, -4.080888271331787, -3.663756847381592, -3.2466254234313965, -2.829493999481201, -2.4123623371124268, -1.9952309131622314, -1.5780994892120361, -1.1609678268432617, -0.7438364028930664, -0.3267049789428711, 0.090426504611969, 0.5075579881668091, 0.924689531326294, 1.3418209552764893, 1.7589523792266846, 2.176084041595459, 2.5932154655456543, 3.0103468894958496, 3.427478313446045, 3.8446097373962402, 4.261741638183594, 4.678873062133789, 5.096004486083984, 5.51313591003418, 5.930267333984375, 6.34739875793457, 6.764530181884766, 7.181661605834961, 7.598793029785156, 8.015924453735352, 8.433055877685547, 8.850187301635742, 9.267318725585938, 9.684450149536133, 10.101581573486328, 10.518712997436523, 10.935844421386719, 11.352975845336914, 11.77010726928711, 12.187238693237305, 12.6043701171875, 13.021502494812012]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 7.0, 7.0, 13.0, 8.0, 11.0, 12.0, 13.0, 22.0, 17.0, 32.0, 26.0, 27.0, 36.0, 22.0, 31.0, 41.0, 37.0, 44.0, 33.0, 47.0, 50.0, 45.0, 36.0, 45.0, 33.0, 31.0, 48.0, 23.0, 37.0, 28.0, 27.0, 16.0, 12.0, 12.0, 12.0, 13.0, 6.0, 9.0, 11.0, 3.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.19663143157959, -8.93133544921875, -8.666040420532227, -8.400744438171387, -8.135449409484863, -7.870153427124023, -7.604857921600342, -7.33956241607666, -7.0742669105529785, -6.808971405029297, -6.543675899505615, -6.278380393981934, -6.013084411621094, -5.74778938293457, -5.4824934005737305, -5.217197895050049, -4.951902389526367, -4.6866068840026855, -4.421311378479004, -4.156015872955322, -3.8907201290130615, -3.62542462348938, -3.360128879547119, -3.0948333740234375, -2.829537868499756, -2.564242362976074, -2.2989468574523926, -2.033651113510132, -1.7683556079864502, -1.5030601024627686, -1.2377644777297974, -0.9724688529968262, -0.7071738243103027, -0.4418782591819763, -0.1765826940536499, 0.08871287107467651, 0.35400843620300293, 0.6193039417266846, 0.8845995664596558, 1.149895191192627, 1.4151906967163086, 1.6804862022399902, 1.9457818269729614, 2.2110774517059326, 2.4763729572296143, 2.741668462753296, 3.0069642066955566, 3.2722597122192383, 3.53755521774292, 3.8028507232666016, 4.068146228790283, 4.333441734313965, 4.598737716674805, 4.864032745361328, 5.129328727722168, 5.39462423324585, 5.659919738769531, 5.925215244293213, 6.1905107498168945, 6.455806255340576, 6.721101760864258, 6.986397743225098, 7.251693248748779, 7.516988754272461, 7.782284259796143]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 11.0, 4.0, 12.0, 22.0, 23.0, 37.0, 52.0, 83.0, 115.0, 198.0, 301.0, 446.0, 768.0, 1292.0, 2258.0, 3779.0, 7079.0, 12895.0, 23370.0, 44620.0, 83512.0, 154920.0, 236384.0, 210049.0, 123195.0, 66052.0, 35084.0, 18475.0, 10157.0, 5520.0, 3185.0, 1765.0, 1069.0, 693.0, 397.0, 252.0, 162.0, 112.0, 75.0, 41.0, 34.0, 12.0, 18.0, 12.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.5902099609375, -1.536865234375, -1.4835205078125, -1.43017578125, -1.3768310546875, -1.323486328125, -1.2701416015625, -1.216796875, -1.1634521484375, -1.110107421875, -1.0567626953125, -1.00341796875, -0.9500732421875, -0.896728515625, -0.8433837890625, -0.7900390625, -0.7366943359375, -0.683349609375, -0.6300048828125, -0.57666015625, -0.5233154296875, -0.469970703125, -0.4166259765625, -0.36328125, -0.3099365234375, -0.256591796875, -0.2032470703125, -0.14990234375, -0.0965576171875, -0.043212890625, 0.0101318359375, 0.0634765625, 0.1168212890625, 0.170166015625, 0.2235107421875, 0.27685546875, 0.3302001953125, 0.383544921875, 0.4368896484375, 0.490234375, 0.5435791015625, 0.596923828125, 0.6502685546875, 0.70361328125, 0.7569580078125, 0.810302734375, 0.8636474609375, 0.9169921875, 0.9703369140625, 1.023681640625, 1.0770263671875, 1.13037109375, 1.1837158203125, 1.237060546875, 1.2904052734375, 1.34375, 1.3970947265625, 1.450439453125, 1.5037841796875, 1.55712890625, 1.6104736328125, 1.663818359375, 1.7171630859375, 1.7705078125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 12.0, 9.0, 10.0, 9.0, 16.0, 18.0, 15.0, 14.0, 30.0, 20.0, 29.0, 34.0, 36.0, 39.0, 37.0, 44.0, 23.0, 39.0, 32.0, 40.0, 40.0, 36.0, 53.0, 35.0, 33.0, 35.0, 34.0, 36.0, 35.0, 34.0, 21.0, 16.0, 12.0, 12.0, 8.0, 11.0, 11.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-10.21875, -9.93572998046875, -9.6527099609375, -9.36968994140625, -9.086669921875, -8.80364990234375, -8.5206298828125, -8.23760986328125, -7.95458984375, -7.67156982421875, -7.3885498046875, -7.10552978515625, -6.822509765625, -6.53948974609375, -6.2564697265625, -5.97344970703125, -5.6904296875, -5.40740966796875, -5.1243896484375, -4.84136962890625, -4.558349609375, -4.27532958984375, -3.9923095703125, -3.70928955078125, -3.42626953125, -3.14324951171875, -2.8602294921875, -2.57720947265625, -2.294189453125, -2.01116943359375, -1.7281494140625, -1.44512939453125, -1.162109375, -0.87908935546875, -0.5960693359375, -0.31304931640625, -0.030029296875, 0.25299072265625, 0.5360107421875, 0.81903076171875, 1.10205078125, 1.38507080078125, 1.6680908203125, 1.95111083984375, 2.234130859375, 2.51715087890625, 2.8001708984375, 3.08319091796875, 3.3662109375, 3.64923095703125, 3.9322509765625, 4.21527099609375, 4.498291015625, 4.78131103515625, 5.0643310546875, 5.34735107421875, 5.63037109375, 5.91339111328125, 6.1964111328125, 6.47943115234375, 6.762451171875, 7.04547119140625, 7.3284912109375, 7.61151123046875, 7.89453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 11.0, 19.0, 14.0, 34.0, 50.0, 68.0, 69.0, 109.0, 171.0, 257.0, 370.0, 605.0, 973.0, 1729.0, 3237.0, 6576.0, 15103.0, 45482.0, 859346.0, 77984.0, 19350.0, 7994.0, 3767.0, 2011.0, 1155.0, 697.0, 456.0, 284.0, 190.0, 108.0, 94.0, 78.0, 43.0, 27.0, 19.0, 16.0, 15.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.2578125, -4.1273193359375, -3.996826171875, -3.8663330078125, -3.73583984375, -3.6053466796875, -3.474853515625, -3.3443603515625, -3.2138671875, -3.0833740234375, -2.952880859375, -2.8223876953125, -2.69189453125, -2.5614013671875, -2.430908203125, -2.3004150390625, -2.169921875, -2.0394287109375, -1.908935546875, -1.7784423828125, -1.64794921875, -1.5174560546875, -1.386962890625, -1.2564697265625, -1.1259765625, -0.9954833984375, -0.864990234375, -0.7344970703125, -0.60400390625, -0.4735107421875, -0.343017578125, -0.2125244140625, -0.08203125, 0.0484619140625, 0.178955078125, 0.3094482421875, 0.43994140625, 0.5704345703125, 0.700927734375, 0.8314208984375, 0.9619140625, 1.0924072265625, 1.222900390625, 1.3533935546875, 1.48388671875, 1.6143798828125, 1.744873046875, 1.8753662109375, 2.005859375, 2.1363525390625, 2.266845703125, 2.3973388671875, 2.52783203125, 2.6583251953125, 2.788818359375, 2.9193115234375, 3.0498046875, 3.1802978515625, 3.310791015625, 3.4412841796875, 3.57177734375, 3.7022705078125, 3.832763671875, 3.9632568359375, 4.09375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 0.0, 5.0, 6.0, 5.0, 8.0, 8.0, 8.0, 13.0, 20.0, 17.0, 20.0, 26.0, 30.0, 32.0, 32.0, 43.0, 42.0, 31.0, 40.0, 42.0, 45.0, 46.0, 40.0, 40.0, 42.0, 33.0, 46.0, 38.0, 34.0, 39.0, 23.0, 15.0, 30.0, 25.0, 18.0, 13.0, 9.0, 4.0, 7.0, 6.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.68359375, -6.48358154296875, -6.2835693359375, -6.08355712890625, -5.883544921875, -5.68353271484375, -5.4835205078125, -5.28350830078125, -5.08349609375, -4.88348388671875, -4.6834716796875, -4.48345947265625, -4.283447265625, -4.08343505859375, -3.8834228515625, -3.68341064453125, -3.4833984375, -3.28338623046875, -3.0833740234375, -2.88336181640625, -2.683349609375, -2.48333740234375, -2.2833251953125, -2.08331298828125, -1.88330078125, -1.68328857421875, -1.4832763671875, -1.28326416015625, -1.083251953125, -0.88323974609375, -0.6832275390625, -0.48321533203125, -0.283203125, -0.08319091796875, 0.1168212890625, 0.31683349609375, 0.516845703125, 0.71685791015625, 0.9168701171875, 1.11688232421875, 1.31689453125, 1.51690673828125, 1.7169189453125, 1.91693115234375, 2.116943359375, 2.31695556640625, 2.5169677734375, 2.71697998046875, 2.9169921875, 3.11700439453125, 3.3170166015625, 3.51702880859375, 3.717041015625, 3.91705322265625, 4.1170654296875, 4.31707763671875, 4.51708984375, 4.71710205078125, 4.9171142578125, 5.11712646484375, 5.317138671875, 5.51715087890625, 5.7171630859375, 5.91717529296875, 6.1171875]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 12.0, 11.0, 14.0, 15.0, 29.0, 37.0, 53.0, 62.0, 88.0, 153.0, 201.0, 342.0, 533.0, 803.0, 1387.0, 2482.0, 4626.0, 9681.0, 23191.0, 322396.0, 636109.0, 25043.0, 10145.0, 4860.0, 2447.0, 1421.0, 846.0, 539.0, 318.0, 207.0, 150.0, 99.0, 59.0, 73.0, 41.0, 16.0, 17.0, 19.0, 9.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.50390625, -1.4554443359375, -1.406982421875, -1.3585205078125, -1.31005859375, -1.2615966796875, -1.213134765625, -1.1646728515625, -1.1162109375, -1.0677490234375, -1.019287109375, -0.9708251953125, -0.92236328125, -0.8739013671875, -0.825439453125, -0.7769775390625, -0.728515625, -0.6800537109375, -0.631591796875, -0.5831298828125, -0.53466796875, -0.4862060546875, -0.437744140625, -0.3892822265625, -0.3408203125, -0.2923583984375, -0.243896484375, -0.1954345703125, -0.14697265625, -0.0985107421875, -0.050048828125, -0.0015869140625, 0.046875, 0.0953369140625, 0.143798828125, 0.1922607421875, 0.24072265625, 0.2891845703125, 0.337646484375, 0.3861083984375, 0.4345703125, 0.4830322265625, 0.531494140625, 0.5799560546875, 0.62841796875, 0.6768798828125, 0.725341796875, 0.7738037109375, 0.822265625, 0.8707275390625, 0.919189453125, 0.9676513671875, 1.01611328125, 1.0645751953125, 1.113037109375, 1.1614990234375, 1.2099609375, 1.2584228515625, 1.306884765625, 1.3553466796875, 1.40380859375, 1.4522705078125, 1.500732421875, 1.5491943359375, 1.59765625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 7.0, 12.0, 10.0, 12.0, 16.0, 23.0, 24.0, 27.0, 49.0, 59.0, 64.0, 91.0, 86.0, 95.0, 83.0, 75.0, 65.0, 54.0, 35.0, 29.0, 18.0, 12.0, 10.0, 4.0, 12.0, 5.0, 1.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.306171417236328e-05, -6.080605089664459e-05, -5.85503876209259e-05, -5.6294724345207214e-05, -5.4039061069488525e-05, -5.1783397793769836e-05, -4.952773451805115e-05, -4.727207124233246e-05, -4.501640796661377e-05, -4.276074469089508e-05, -4.050508141517639e-05, -3.82494181394577e-05, -3.5993754863739014e-05, -3.3738091588020325e-05, -3.1482428312301636e-05, -2.9226765036582947e-05, -2.6971101760864258e-05, -2.471543848514557e-05, -2.245977520942688e-05, -2.020411193370819e-05, -1.7948448657989502e-05, -1.5692785382270813e-05, -1.3437122106552124e-05, -1.1181458830833435e-05, -8.925795555114746e-06, -6.670132279396057e-06, -4.414469003677368e-06, -2.158805727958679e-06, 9.685754776000977e-08, 2.3525208234786987e-06, 4.608184099197388e-06, 6.863847374916077e-06, 9.119510650634766e-06, 1.1375173926353455e-05, 1.3630837202072144e-05, 1.5886500477790833e-05, 1.814216375350952e-05, 2.039782702922821e-05, 2.26534903049469e-05, 2.490915358066559e-05, 2.7164816856384277e-05, 2.9420480132102966e-05, 3.1676143407821655e-05, 3.3931806683540344e-05, 3.618746995925903e-05, 3.844313323497772e-05, 4.069879651069641e-05, 4.29544597864151e-05, 4.521012306213379e-05, 4.746578633785248e-05, 4.972144961357117e-05, 5.1977112889289856e-05, 5.4232776165008545e-05, 5.6488439440727234e-05, 5.874410271644592e-05, 6.099976599216461e-05, 6.32554292678833e-05, 6.551109254360199e-05, 6.776675581932068e-05, 7.002241909503937e-05, 7.227808237075806e-05, 7.453374564647675e-05, 7.678940892219543e-05, 7.904507219791412e-05, 8.130073547363281e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 13.0, 11.0, 9.0, 20.0, 28.0, 42.0, 56.0, 78.0, 121.0, 195.0, 285.0, 431.0, 595.0, 1004.0, 1554.0, 2627.0, 4331.0, 7568.0, 14587.0, 28920.0, 62222.0, 148977.0, 330887.0, 250561.0, 101816.0, 44241.0, 21141.0, 11014.0, 6045.0, 3434.0, 2056.0, 1324.0, 839.0, 494.0, 347.0, 203.0, 149.0, 101.0, 63.0, 50.0, 40.0, 24.0, 16.0, 15.0, 8.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58837890625, -0.5692672729492188, -0.5501556396484375, -0.5310440063476562, -0.511932373046875, -0.49282073974609375, -0.4737091064453125, -0.45459747314453125, -0.43548583984375, -0.41637420654296875, -0.3972625732421875, -0.37815093994140625, -0.359039306640625, -0.33992767333984375, -0.3208160400390625, -0.30170440673828125, -0.2825927734375, -0.26348114013671875, -0.2443695068359375, -0.22525787353515625, -0.206146240234375, -0.18703460693359375, -0.1679229736328125, -0.14881134033203125, -0.12969970703125, -0.11058807373046875, -0.0914764404296875, -0.07236480712890625, -0.053253173828125, -0.03414154052734375, -0.0150299072265625, 0.00408172607421875, 0.023193359375, 0.04230499267578125, 0.0614166259765625, 0.08052825927734375, 0.099639892578125, 0.11875152587890625, 0.1378631591796875, 0.15697479248046875, 0.17608642578125, 0.19519805908203125, 0.2143096923828125, 0.23342132568359375, 0.252532958984375, 0.27164459228515625, 0.2907562255859375, 0.30986785888671875, 0.3289794921875, 0.34809112548828125, 0.3672027587890625, 0.38631439208984375, 0.405426025390625, 0.42453765869140625, 0.4436492919921875, 0.46276092529296875, 0.48187255859375, 0.5009841918945312, 0.5200958251953125, 0.5392074584960938, 0.558319091796875, 0.5774307250976562, 0.5965423583984375, 0.6156539916992188, 0.634765625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 6.0, 8.0, 11.0, 15.0, 14.0, 20.0, 26.0, 29.0, 60.0, 60.0, 82.0, 99.0, 121.0, 89.0, 73.0, 52.0, 50.0, 44.0, 21.0, 19.0, 21.0, 11.0, 13.0, 7.0, 5.0, 7.0, 8.0, 2.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2042236328125, -0.1982898712158203, -0.19235610961914062, -0.18642234802246094, -0.18048858642578125, -0.17455482482910156, -0.16862106323242188, -0.1626873016357422, -0.1567535400390625, -0.1508197784423828, -0.14488601684570312, -0.13895225524902344, -0.13301849365234375, -0.12708473205566406, -0.12115097045898438, -0.11521720886230469, -0.109283447265625, -0.10334968566894531, -0.09741592407226562, -0.09148216247558594, -0.08554840087890625, -0.07961463928222656, -0.07368087768554688, -0.06774711608886719, -0.0618133544921875, -0.05587959289550781, -0.049945831298828125, -0.04401206970214844, -0.03807830810546875, -0.03214454650878906, -0.026210784912109375, -0.020277023315429688, -0.01434326171875, -0.008409500122070312, -0.002475738525390625, 0.0034580230712890625, 0.00939178466796875, 0.015325546264648438, 0.021259307861328125, 0.027193069458007812, 0.0331268310546875, 0.03906059265136719, 0.044994354248046875, 0.05092811584472656, 0.05686187744140625, 0.06279563903808594, 0.06872940063476562, 0.07466316223144531, 0.080596923828125, 0.08653068542480469, 0.09246444702148438, 0.09839820861816406, 0.10433197021484375, 0.11026573181152344, 0.11619949340820312, 0.12213325500488281, 0.1280670166015625, 0.1340007781982422, 0.13993453979492188, 0.14586830139160156, 0.15180206298828125, 0.15773582458496094, 0.16366958618164062, 0.1696033477783203, 0.175537109375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 8.0, 10.0, 13.0, 19.0, 35.0, 38.0, 49.0, 56.0, 63.0, 92.0, 83.0, 78.0, 83.0, 70.0, 67.0, 56.0, 39.0, 24.0, 20.0, 25.0, 9.0, 8.0, 11.0, 5.0, 8.0, 3.0, 3.0, 2.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.630773544311523, -13.208733558654785, -12.786693572998047, -12.364654541015625, -11.942614555358887, -11.520574569702148, -11.09853458404541, -10.676494598388672, -10.25445556640625, -9.832415580749512, -9.410375595092773, -8.988336563110352, -8.566296577453613, -8.144256591796875, -7.722216606140137, -7.300176620483398, -6.87813663482666, -6.456096649169922, -6.034057140350342, -5.6120171546936035, -5.189977645874023, -4.767937660217285, -4.345897674560547, -3.9238579273223877, -3.5018181800842285, -3.0797784328460693, -2.65773868560791, -2.235698699951172, -1.8136589527130127, -1.3916192054748535, -0.9695792198181152, -0.547539472579956, -0.12550067901611328, 0.2965391278266907, 0.7185789346694946, 1.1406188011169434, 1.5626585483551025, 1.9846982955932617, 2.40673828125, 2.828778028488159, 3.2508177757263184, 3.6728575229644775, 4.094897270202637, 4.516937255859375, 4.938977241516113, 5.361016750335693, 5.783056735992432, 6.205096244812012, 6.62713623046875, 7.049176216125488, 7.471215724945068, 7.893255710601807, 8.315295219421387, 8.737335205078125, 9.159375190734863, 9.581415176391602, 10.003454208374023, 10.425494194030762, 10.8475341796875, 11.269573211669922, 11.69161319732666, 12.113653182983398, 12.535693168640137, 12.957733154296875, 13.379773139953613]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 14.0, 7.0, 12.0, 10.0, 9.0, 23.0, 17.0, 32.0, 28.0, 25.0, 36.0, 19.0, 33.0, 38.0, 34.0, 44.0, 35.0, 48.0, 44.0, 44.0, 40.0, 37.0, 43.0, 34.0, 40.0, 30.0, 37.0, 29.0, 26.0, 17.0, 17.0, 10.0, 12.0, 13.0, 7.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.23351001739502, -8.968831062316895, -8.704153060913086, -8.439474105834961, -8.174795150756836, -7.910117149353027, -7.645438194274902, -7.3807597160339355, -7.116081237792969, -6.851402759552002, -6.586723804473877, -6.32204532623291, -6.057366847991943, -5.792688369750977, -5.528009414672852, -5.263330936431885, -4.99865198135376, -4.733973503112793, -4.469294548034668, -4.204616069793701, -3.9399375915527344, -3.6752588748931885, -3.4105801582336426, -3.145901679992676, -2.88122296333313, -2.616544246673584, -2.351865768432617, -2.0871870517730713, -1.822508454322815, -1.5578298568725586, -1.2931511402130127, -1.0284725427627563, -0.7637939453125, -0.49911531805992126, -0.23443669080734253, 0.030241966247558594, 0.29492056369781494, 0.5595991611480713, 0.8242778778076172, 1.0889564752578735, 1.3536350727081299, 1.6183136701583862, 1.8829922676086426, 2.1476709842681885, 2.4123497009277344, 2.677028179168701, 2.941706895828247, 3.206385612487793, 3.4710640907287598, 3.7357428073883057, 4.000421524047852, 4.265100002288818, 4.529778480529785, 4.79445743560791, 5.059135913848877, 5.323814392089844, 5.588493347167969, 5.8531718254089355, 6.1178507804870605, 6.382529258728027, 6.647207736968994, 6.911886215209961, 7.176565170288086, 7.441243648529053, 7.7059221267700195]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 3.0, 4.0, 7.0, 11.0, 9.0, 16.0, 31.0, 40.0, 49.0, 71.0, 98.0, 161.0, 212.0, 368.0, 550.0, 760.0, 1244.0, 1862.0, 3097.0, 5025.0, 8344.0, 14241.0, 24754.0, 42147.0, 71078.0, 112856.0, 155749.0, 174662.0, 153833.0, 109642.0, 68072.0, 40990.0, 23627.0, 13793.0, 7899.0, 4846.0, 2904.0, 1856.0, 1206.0, 775.0, 517.0, 355.0, 241.0, 157.0, 125.0, 71.0, 67.0, 41.0, 28.0, 18.0, 12.0, 10.0, 7.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.89453125, -5.7010498046875, -5.507568359375, -5.3140869140625, -5.12060546875, -4.9271240234375, -4.733642578125, -4.5401611328125, -4.3466796875, -4.1531982421875, -3.959716796875, -3.7662353515625, -3.57275390625, -3.3792724609375, -3.185791015625, -2.9923095703125, -2.798828125, -2.6053466796875, -2.411865234375, -2.2183837890625, -2.02490234375, -1.8314208984375, -1.637939453125, -1.4444580078125, -1.2509765625, -1.0574951171875, -0.864013671875, -0.6705322265625, -0.47705078125, -0.2835693359375, -0.090087890625, 0.1033935546875, 0.296875, 0.4903564453125, 0.683837890625, 0.8773193359375, 1.07080078125, 1.2642822265625, 1.457763671875, 1.6512451171875, 1.8447265625, 2.0382080078125, 2.231689453125, 2.4251708984375, 2.61865234375, 2.8121337890625, 3.005615234375, 3.1990966796875, 3.392578125, 3.5860595703125, 3.779541015625, 3.9730224609375, 4.16650390625, 4.3599853515625, 4.553466796875, 4.7469482421875, 4.9404296875, 5.1339111328125, 5.327392578125, 5.5208740234375, 5.71435546875, 5.9078369140625, 6.101318359375, 6.2947998046875, 6.48828125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 7.0, 5.0, 5.0, 7.0, 11.0, 8.0, 16.0, 10.0, 12.0, 19.0, 20.0, 31.0, 19.0, 36.0, 32.0, 31.0, 29.0, 37.0, 37.0, 41.0, 39.0, 41.0, 26.0, 39.0, 56.0, 47.0, 41.0, 38.0, 32.0, 25.0, 24.0, 31.0, 21.0, 17.0, 18.0, 15.0, 12.0, 14.0, 5.0, 6.0, 6.0, 10.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.223388671875, -7.96240234375, -7.701416015625, -7.4404296875, -7.179443359375, -6.91845703125, -6.657470703125, -6.396484375, -6.135498046875, -5.87451171875, -5.613525390625, -5.3525390625, -5.091552734375, -4.83056640625, -4.569580078125, -4.30859375, -4.047607421875, -3.78662109375, -3.525634765625, -3.2646484375, -3.003662109375, -2.74267578125, -2.481689453125, -2.220703125, -1.959716796875, -1.69873046875, -1.437744140625, -1.1767578125, -0.915771484375, -0.65478515625, -0.393798828125, -0.1328125, 0.128173828125, 0.38916015625, 0.650146484375, 0.9111328125, 1.172119140625, 1.43310546875, 1.694091796875, 1.955078125, 2.216064453125, 2.47705078125, 2.738037109375, 2.9990234375, 3.260009765625, 3.52099609375, 3.781982421875, 4.04296875, 4.303955078125, 4.56494140625, 4.825927734375, 5.0869140625, 5.347900390625, 5.60888671875, 5.869873046875, 6.130859375, 6.391845703125, 6.65283203125, 6.913818359375, 7.1748046875, 7.435791015625, 7.69677734375, 7.957763671875, 8.21875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 15.0, 19.0, 26.0, 42.0, 58.0, 99.0, 165.0, 250.0, 469.0, 799.0, 1299.0, 2265.0, 4176.0, 7602.0, 14643.0, 28025.0, 54474.0, 100309.0, 165524.0, 211517.0, 188939.0, 123180.0, 68261.0, 36096.0, 18560.0, 9680.0, 5132.0, 2961.0, 1656.0, 972.0, 550.0, 307.0, 174.0, 124.0, 69.0, 43.0, 37.0, 14.0, 10.0, 7.0, 1.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.46221923828125, -6.2369384765625, -6.01165771484375, -5.786376953125, -5.56109619140625, -5.3358154296875, -5.11053466796875, -4.88525390625, -4.65997314453125, -4.4346923828125, -4.20941162109375, -3.984130859375, -3.75885009765625, -3.5335693359375, -3.30828857421875, -3.0830078125, -2.85772705078125, -2.6324462890625, -2.40716552734375, -2.181884765625, -1.95660400390625, -1.7313232421875, -1.50604248046875, -1.28076171875, -1.05548095703125, -0.8302001953125, -0.60491943359375, -0.379638671875, -0.15435791015625, 0.0709228515625, 0.29620361328125, 0.521484375, 0.74676513671875, 0.9720458984375, 1.19732666015625, 1.422607421875, 1.64788818359375, 1.8731689453125, 2.09844970703125, 2.32373046875, 2.54901123046875, 2.7742919921875, 2.99957275390625, 3.224853515625, 3.45013427734375, 3.6754150390625, 3.90069580078125, 4.1259765625, 4.35125732421875, 4.5765380859375, 4.80181884765625, 5.027099609375, 5.25238037109375, 5.4776611328125, 5.70294189453125, 5.92822265625, 6.15350341796875, 6.3787841796875, 6.60406494140625, 6.829345703125, 7.05462646484375, 7.2799072265625, 7.50518798828125, 7.73046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 11.0, 8.0, 8.0, 17.0, 10.0, 19.0, 23.0, 22.0, 25.0, 28.0, 22.0, 33.0, 45.0, 47.0, 44.0, 36.0, 37.0, 36.0, 55.0, 38.0, 27.0, 41.0, 35.0, 48.0, 39.0, 33.0, 30.0, 25.0, 24.0, 20.0, 24.0, 16.0, 10.0, 15.0, 9.0, 9.0, 10.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3515625, -5.1917724609375, -5.031982421875, -4.8721923828125, -4.71240234375, -4.5526123046875, -4.392822265625, -4.2330322265625, -4.0732421875, -3.9134521484375, -3.753662109375, -3.5938720703125, -3.43408203125, -3.2742919921875, -3.114501953125, -2.9547119140625, -2.794921875, -2.6351318359375, -2.475341796875, -2.3155517578125, -2.15576171875, -1.9959716796875, -1.836181640625, -1.6763916015625, -1.5166015625, -1.3568115234375, -1.197021484375, -1.0372314453125, -0.87744140625, -0.7176513671875, -0.557861328125, -0.3980712890625, -0.23828125, -0.0784912109375, 0.081298828125, 0.2410888671875, 0.40087890625, 0.5606689453125, 0.720458984375, 0.8802490234375, 1.0400390625, 1.1998291015625, 1.359619140625, 1.5194091796875, 1.67919921875, 1.8389892578125, 1.998779296875, 2.1585693359375, 2.318359375, 2.4781494140625, 2.637939453125, 2.7977294921875, 2.95751953125, 3.1173095703125, 3.277099609375, 3.4368896484375, 3.5966796875, 3.7564697265625, 3.916259765625, 4.0760498046875, 4.23583984375, 4.3956298828125, 4.555419921875, 4.7152099609375, 4.875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 9.0, 12.0, 17.0, 32.0, 37.0, 46.0, 76.0, 114.0, 192.0, 265.0, 372.0, 629.0, 999.0, 1785.0, 3072.0, 5683.0, 11285.0, 22890.0, 49565.0, 107350.0, 214324.0, 274196.0, 185458.0, 89178.0, 40771.0, 19111.0, 9434.0, 4881.0, 2696.0, 1522.0, 988.0, 503.0, 346.0, 216.0, 140.0, 103.0, 79.0, 59.0, 31.0, 25.0, 15.0, 16.0, 11.0, 7.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.67059326171875, -4.4935302734375, -4.31646728515625, -4.139404296875, -3.96234130859375, -3.7852783203125, -3.60821533203125, -3.43115234375, -3.25408935546875, -3.0770263671875, -2.89996337890625, -2.722900390625, -2.54583740234375, -2.3687744140625, -2.19171142578125, -2.0146484375, -1.83758544921875, -1.6605224609375, -1.48345947265625, -1.306396484375, -1.12933349609375, -0.9522705078125, -0.77520751953125, -0.59814453125, -0.42108154296875, -0.2440185546875, -0.06695556640625, 0.110107421875, 0.28717041015625, 0.4642333984375, 0.64129638671875, 0.818359375, 0.99542236328125, 1.1724853515625, 1.34954833984375, 1.526611328125, 1.70367431640625, 1.8807373046875, 2.05780029296875, 2.23486328125, 2.41192626953125, 2.5889892578125, 2.76605224609375, 2.943115234375, 3.12017822265625, 3.2972412109375, 3.47430419921875, 3.6513671875, 3.82843017578125, 4.0054931640625, 4.18255615234375, 4.359619140625, 4.53668212890625, 4.7137451171875, 4.89080810546875, 5.06787109375, 5.24493408203125, 5.4219970703125, 5.59906005859375, 5.776123046875, 5.95318603515625, 6.1302490234375, 6.30731201171875, 6.484375]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 5.0, 4.0, 8.0, 14.0, 8.0, 17.0, 14.0, 17.0, 26.0, 23.0, 22.0, 31.0, 26.0, 32.0, 45.0, 46.0, 56.0, 52.0, 47.0, 55.0, 47.0, 40.0, 47.0, 47.0, 28.0, 24.0, 27.0, 33.0, 26.0, 21.0, 13.0, 17.0, 12.0, 8.0, 11.0, 9.0, 7.0, 5.0, 8.0, 5.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0002551078796386719, -0.0002466663718223572, -0.00023822486400604248, -0.00022978335618972778, -0.00022134184837341309, -0.0002129003405570984, -0.0002044588327407837, -0.000196017324924469, -0.0001875758171081543, -0.0001791343092918396, -0.0001706928014755249, -0.0001622512936592102, -0.0001538097858428955, -0.0001453682780265808, -0.0001369267702102661, -0.00012848526239395142, -0.00012004375457763672, -0.00011160224676132202, -0.00010316073894500732, -9.471923112869263e-05, -8.627772331237793e-05, -7.783621549606323e-05, -6.939470767974854e-05, -6.095319986343384e-05, -5.251169204711914e-05, -4.407018423080444e-05, -3.5628676414489746e-05, -2.718716859817505e-05, -1.874566078186035e-05, -1.0304152965545654e-05, -1.862645149230957e-06, 6.57886266708374e-06, 1.5020370483398438e-05, 2.3461878299713135e-05, 3.190338611602783e-05, 4.034489393234253e-05, 4.8786401748657227e-05, 5.7227909564971924e-05, 6.566941738128662e-05, 7.411092519760132e-05, 8.255243301391602e-05, 9.099394083023071e-05, 9.943544864654541e-05, 0.00010787695646286011, 0.0001163184642791748, 0.0001247599720954895, 0.0001332014799118042, 0.0001416429877281189, 0.0001500844955444336, 0.0001585260033607483, 0.000166967511177063, 0.00017540901899337769, 0.00018385052680969238, 0.00019229203462600708, 0.00020073354244232178, 0.00020917505025863647, 0.00021761655807495117, 0.00022605806589126587, 0.00023449957370758057, 0.00024294108152389526, 0.00025138258934020996, 0.00025982409715652466, 0.00026826560497283936, 0.00027670711278915405, 0.00028514862060546875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 12.0, 4.0, 12.0, 28.0, 37.0, 52.0, 60.0, 110.0, 159.0, 215.0, 327.0, 527.0, 812.0, 1214.0, 1998.0, 3265.0, 5327.0, 9287.0, 16223.0, 29274.0, 53170.0, 96868.0, 162058.0, 212075.0, 185707.0, 118999.0, 66464.0, 36132.0, 19918.0, 11305.0, 6429.0, 3911.0, 2463.0, 1480.0, 901.0, 590.0, 354.0, 242.0, 169.0, 107.0, 89.0, 41.0, 44.0, 20.0, 17.0, 15.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0], "bins": [-4.41015625, -4.27520751953125, -4.1402587890625, -4.00531005859375, -3.870361328125, -3.73541259765625, -3.6004638671875, -3.46551513671875, -3.33056640625, -3.19561767578125, -3.0606689453125, -2.92572021484375, -2.790771484375, -2.65582275390625, -2.5208740234375, -2.38592529296875, -2.2509765625, -2.11602783203125, -1.9810791015625, -1.84613037109375, -1.711181640625, -1.57623291015625, -1.4412841796875, -1.30633544921875, -1.17138671875, -1.03643798828125, -0.9014892578125, -0.76654052734375, -0.631591796875, -0.49664306640625, -0.3616943359375, -0.22674560546875, -0.091796875, 0.04315185546875, 0.1781005859375, 0.31304931640625, 0.447998046875, 0.58294677734375, 0.7178955078125, 0.85284423828125, 0.98779296875, 1.12274169921875, 1.2576904296875, 1.39263916015625, 1.527587890625, 1.66253662109375, 1.7974853515625, 1.93243408203125, 2.0673828125, 2.20233154296875, 2.3372802734375, 2.47222900390625, 2.607177734375, 2.74212646484375, 2.8770751953125, 3.01202392578125, 3.14697265625, 3.28192138671875, 3.4168701171875, 3.55181884765625, 3.686767578125, 3.82171630859375, 3.9566650390625, 4.09161376953125, 4.2265625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 2.0, 3.0, 6.0, 7.0, 10.0, 8.0, 10.0, 12.0, 13.0, 18.0, 20.0, 22.0, 32.0, 32.0, 33.0, 42.0, 56.0, 61.0, 58.0, 48.0, 65.0, 50.0, 49.0, 49.0, 45.0, 36.0, 36.0, 26.0, 22.0, 20.0, 16.0, 11.0, 12.0, 14.0, 13.0, 10.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.3740234375, -1.337493896484375, -1.30096435546875, -1.264434814453125, -1.2279052734375, -1.191375732421875, -1.15484619140625, -1.118316650390625, -1.081787109375, -1.045257568359375, -1.00872802734375, -0.972198486328125, -0.9356689453125, -0.899139404296875, -0.86260986328125, -0.826080322265625, -0.78955078125, -0.753021240234375, -0.71649169921875, -0.679962158203125, -0.6434326171875, -0.606903076171875, -0.57037353515625, -0.533843994140625, -0.497314453125, -0.460784912109375, -0.42425537109375, -0.387725830078125, -0.3511962890625, -0.314666748046875, -0.27813720703125, -0.241607666015625, -0.205078125, -0.168548583984375, -0.13201904296875, -0.095489501953125, -0.0589599609375, -0.022430419921875, 0.01409912109375, 0.050628662109375, 0.087158203125, 0.123687744140625, 0.16021728515625, 0.196746826171875, 0.2332763671875, 0.269805908203125, 0.30633544921875, 0.342864990234375, 0.37939453125, 0.415924072265625, 0.45245361328125, 0.488983154296875, 0.5255126953125, 0.562042236328125, 0.59857177734375, 0.635101318359375, 0.671630859375, 0.708160400390625, 0.74468994140625, 0.781219482421875, 0.8177490234375, 0.854278564453125, 0.89080810546875, 0.927337646484375, 0.9638671875]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 5.0, 19.0, 23.0, 27.0, 40.0, 60.0, 57.0, 80.0, 74.0, 87.0, 107.0, 74.0, 71.0, 54.0, 42.0, 44.0, 31.0, 17.0, 14.0, 10.0, 10.0, 5.0, 7.0, 6.0, 3.0, 6.0, 0.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.410272598266602, -11.983416557312012, -11.556561470031738, -11.129705429077148, -10.702850341796875, -10.275994300842285, -9.849138259887695, -9.422283172607422, -8.995427131652832, -8.568571090698242, -8.141716003417969, -7.714859962463379, -7.288004398345947, -6.861148834228516, -6.434293270111084, -6.007437705993652, -5.580582141876221, -5.153726577758789, -4.726871013641357, -4.300015449523926, -3.873159408569336, -3.4463038444519043, -3.0194482803344727, -2.592592477798462, -2.1657369136810303, -1.738881230354309, -1.312025547027588, -0.8851699829101562, -0.45831429958343506, -0.03145861625671387, 0.3953969478607178, 0.8222527503967285, 1.2491083145141602, 1.6759639978408813, 2.1028196811676025, 2.529675245285034, 2.956531047821045, 3.3833866119384766, 3.810242176055908, 4.23709774017334, 4.66395378112793, 5.090809345245361, 5.517664909362793, 5.944520950317383, 6.3713765144348145, 6.798232078552246, 7.225087642669678, 7.651943206787109, 8.078798294067383, 8.505654335021973, 8.932509422302246, 9.359365463256836, 9.78622055053711, 10.2130765914917, 10.639932632446289, 11.066787719726562, 11.493643760681152, 11.920499801635742, 12.347354888916016, 12.774210929870605, 13.201066017150879, 13.627922058105469, 14.054777145385742, 14.481633186340332, 14.908489227294922]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 7.0, 4.0, 2.0, 2.0, 6.0, 9.0, 8.0, 13.0, 14.0, 11.0, 15.0, 24.0, 34.0, 33.0, 28.0, 29.0, 28.0, 38.0, 35.0, 39.0, 52.0, 40.0, 45.0, 44.0, 43.0, 55.0, 41.0, 37.0, 24.0, 43.0, 31.0, 36.0, 21.0, 18.0, 16.0, 17.0, 11.0, 13.0, 5.0, 7.0, 6.0, 4.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.970541954040527, -8.701791763305664, -8.433040618896484, -8.164290428161621, -7.895540237426758, -7.626789569854736, -7.358038902282715, -7.089288711547852, -6.82053804397583, -6.551787376403809, -6.283037185668945, -6.014286518096924, -5.745535850524902, -5.476785659790039, -5.208034992218018, -4.939284324645996, -4.670534133911133, -4.401783466339111, -4.133033275604248, -3.8642826080322266, -3.595532178878784, -3.326781749725342, -3.0580310821533203, -2.789280652999878, -2.5205302238464355, -2.251779794692993, -1.9830292463302612, -1.7142786979675293, -1.445528268814087, -1.1767778396606445, -0.9080272912979126, -0.6392767429351807, -0.3705263137817383, -0.10177582502365112, 0.16697466373443604, 0.4357251524925232, 0.7044756412506104, 0.9732260704040527, 1.2419766187667847, 1.5107271671295166, 1.779477596282959, 2.0482280254364014, 2.3169784545898438, 2.5857291221618652, 2.8544795513153076, 3.12322998046875, 3.3919806480407715, 3.660731077194214, 3.9294815063476562, 4.198232173919678, 4.466982364654541, 4.7357330322265625, 5.004483222961426, 5.273233890533447, 5.541984558105469, 5.810734748840332, 6.0794854164123535, 6.348236083984375, 6.616986274719238, 6.88573694229126, 7.154487609863281, 7.4232378005981445, 7.691988468170166, 7.9607391357421875, 8.22948932647705]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 12.0, 11.0, 20.0, 26.0, 44.0, 81.0, 119.0, 150.0, 212.0, 292.0, 336.0, 500.0, 728.0, 1021.0, 1509.0, 2382.0, 3723.0, 6215.0, 10901.0, 21349.0, 48899.0, 140529.0, 498906.0, 1462024.0, 1340880.0, 434034.0, 125514.0, 45694.0, 20604.0, 10648.0, 6009.0, 3660.0, 2259.0, 1459.0, 1041.0, 703.0, 515.0, 386.0, 280.0, 164.0, 133.0, 88.0, 73.0, 40.0, 27.0, 17.0, 15.0, 13.0, 13.0, 3.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-12.7578125, -12.3455810546875, -11.933349609375, -11.5211181640625, -11.10888671875, -10.6966552734375, -10.284423828125, -9.8721923828125, -9.4599609375, -9.0477294921875, -8.635498046875, -8.2232666015625, -7.81103515625, -7.3988037109375, -6.986572265625, -6.5743408203125, -6.162109375, -5.7498779296875, -5.337646484375, -4.9254150390625, -4.51318359375, -4.1009521484375, -3.688720703125, -3.2764892578125, -2.8642578125, -2.4520263671875, -2.039794921875, -1.6275634765625, -1.21533203125, -0.8031005859375, -0.390869140625, 0.0213623046875, 0.43359375, 0.8458251953125, 1.258056640625, 1.6702880859375, 2.08251953125, 2.4947509765625, 2.906982421875, 3.3192138671875, 3.7314453125, 4.1436767578125, 4.555908203125, 4.9681396484375, 5.38037109375, 5.7926025390625, 6.204833984375, 6.6170654296875, 7.029296875, 7.4415283203125, 7.853759765625, 8.2659912109375, 8.67822265625, 9.0904541015625, 9.502685546875, 9.9149169921875, 10.3271484375, 10.7393798828125, 11.151611328125, 11.5638427734375, 11.97607421875, 12.3883056640625, 12.800537109375, 13.2127685546875, 13.625]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 8.0, 4.0, 6.0, 5.0, 8.0, 9.0, 12.0, 19.0, 16.0, 22.0, 32.0, 26.0, 29.0, 29.0, 29.0, 37.0, 40.0, 39.0, 44.0, 47.0, 50.0, 39.0, 44.0, 38.0, 36.0, 43.0, 34.0, 48.0, 24.0, 25.0, 22.0, 22.0, 18.0, 20.0, 15.0, 9.0, 5.0, 11.0, 3.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.82421875, -5.64447021484375, -5.4647216796875, -5.28497314453125, -5.105224609375, -4.92547607421875, -4.7457275390625, -4.56597900390625, -4.38623046875, -4.20648193359375, -4.0267333984375, -3.84698486328125, -3.667236328125, -3.48748779296875, -3.3077392578125, -3.12799072265625, -2.9482421875, -2.76849365234375, -2.5887451171875, -2.40899658203125, -2.229248046875, -2.04949951171875, -1.8697509765625, -1.69000244140625, -1.51025390625, -1.33050537109375, -1.1507568359375, -0.97100830078125, -0.791259765625, -0.61151123046875, -0.4317626953125, -0.25201416015625, -0.072265625, 0.10748291015625, 0.2872314453125, 0.46697998046875, 0.646728515625, 0.82647705078125, 1.0062255859375, 1.18597412109375, 1.36572265625, 1.54547119140625, 1.7252197265625, 1.90496826171875, 2.084716796875, 2.26446533203125, 2.4442138671875, 2.62396240234375, 2.8037109375, 2.98345947265625, 3.1632080078125, 3.34295654296875, 3.522705078125, 3.70245361328125, 3.8822021484375, 4.06195068359375, 4.24169921875, 4.42144775390625, 4.6011962890625, 4.78094482421875, 4.960693359375, 5.14044189453125, 5.3201904296875, 5.49993896484375, 5.6796875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 14.0, 15.0, 15.0, 23.0, 35.0, 39.0, 76.0, 113.0, 134.0, 189.0, 331.0, 505.0, 742.0, 1182.0, 1930.0, 3449.0, 6035.0, 11138.0, 22774.0, 52314.0, 150885.0, 562934.0, 1793609.0, 1143125.0, 286181.0, 86705.0, 34152.0, 15829.0, 8136.0, 4581.0, 2733.0, 1549.0, 999.0, 619.0, 395.0, 247.0, 184.0, 114.0, 78.0, 57.0, 29.0, 27.0, 24.0, 13.0, 9.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.7421875, -15.2303466796875, -14.718505859375, -14.2066650390625, -13.69482421875, -13.1829833984375, -12.671142578125, -12.1593017578125, -11.6474609375, -11.1356201171875, -10.623779296875, -10.1119384765625, -9.60009765625, -9.0882568359375, -8.576416015625, -8.0645751953125, -7.552734375, -7.0408935546875, -6.529052734375, -6.0172119140625, -5.50537109375, -4.9935302734375, -4.481689453125, -3.9698486328125, -3.4580078125, -2.9461669921875, -2.434326171875, -1.9224853515625, -1.41064453125, -0.8988037109375, -0.386962890625, 0.1248779296875, 0.63671875, 1.1485595703125, 1.660400390625, 2.1722412109375, 2.68408203125, 3.1959228515625, 3.707763671875, 4.2196044921875, 4.7314453125, 5.2432861328125, 5.755126953125, 6.2669677734375, 6.77880859375, 7.2906494140625, 7.802490234375, 8.3143310546875, 8.826171875, 9.3380126953125, 9.849853515625, 10.3616943359375, 10.87353515625, 11.3853759765625, 11.897216796875, 12.4090576171875, 12.9208984375, 13.4327392578125, 13.944580078125, 14.4564208984375, 14.96826171875, 15.4801025390625, 15.991943359375, 16.5037841796875, 17.015625]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 9.0, 10.0, 8.0, 16.0, 16.0, 14.0, 39.0, 47.0, 54.0, 80.0, 94.0, 140.0, 191.0, 247.0, 315.0, 329.0, 375.0, 378.0, 349.0, 295.0, 246.0, 195.0, 156.0, 116.0, 70.0, 77.0, 57.0, 28.0, 18.0, 21.0, 15.0, 12.0, 16.0, 8.0, 5.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.193359375, -3.075347900390625, -2.95733642578125, -2.839324951171875, -2.7213134765625, -2.603302001953125, -2.48529052734375, -2.367279052734375, -2.249267578125, -2.131256103515625, -2.01324462890625, -1.895233154296875, -1.7772216796875, -1.659210205078125, -1.54119873046875, -1.423187255859375, -1.30517578125, -1.187164306640625, -1.06915283203125, -0.951141357421875, -0.8331298828125, -0.715118408203125, -0.59710693359375, -0.479095458984375, -0.361083984375, -0.243072509765625, -0.12506103515625, -0.007049560546875, 0.1109619140625, 0.228973388671875, 0.34698486328125, 0.464996337890625, 0.5830078125, 0.701019287109375, 0.81903076171875, 0.937042236328125, 1.0550537109375, 1.173065185546875, 1.29107666015625, 1.409088134765625, 1.527099609375, 1.645111083984375, 1.76312255859375, 1.881134033203125, 1.9991455078125, 2.117156982421875, 2.23516845703125, 2.353179931640625, 2.47119140625, 2.589202880859375, 2.70721435546875, 2.825225830078125, 2.9432373046875, 3.061248779296875, 3.17926025390625, 3.297271728515625, 3.415283203125, 3.533294677734375, 3.65130615234375, 3.769317626953125, 3.8873291015625, 4.005340576171875, 4.12335205078125, 4.241363525390625, 4.359375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 1.0, 5.0, 4.0, 9.0, 8.0, 12.0, 16.0, 16.0, 22.0, 32.0, 40.0, 41.0, 55.0, 68.0, 83.0, 83.0, 81.0, 92.0, 67.0, 58.0, 42.0, 37.0, 28.0, 20.0, 16.0, 8.0, 12.0, 7.0, 9.0, 8.0, 2.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.338517189025879, -10.969694137573242, -10.600870132446289, -10.232047080993652, -9.863224029541016, -9.494400024414062, -9.125576972961426, -8.756753921508789, -8.387929916381836, -8.0191068649292, -7.650283336639404, -7.281459808349609, -6.912636756896973, -6.543813228607178, -6.174989700317383, -5.806166648864746, -5.437343597412109, -5.0685200691223145, -4.699697017669678, -4.330873489379883, -3.962050199508667, -3.593226909637451, -3.2244033813476562, -2.8555800914764404, -2.4867568016052246, -2.117933511734009, -1.7491101026535034, -1.380286693572998, -1.0114634037017822, -0.6426401138305664, -0.2738165855407715, 0.09500670433044434, 0.46382904052734375, 0.8326523900032043, 1.201475739479065, 1.5702991485595703, 1.9391224384307861, 2.307945728302002, 2.676769256591797, 3.0455925464630127, 3.4144158363342285, 3.7832391262054443, 4.15206241607666, 4.520885944366455, 4.88970947265625, 5.258532524108887, 5.627356052398682, 5.996179580688477, 6.365002632141113, 6.733826160430908, 7.102649211883545, 7.47147274017334, 7.840295791625977, 8.20911979675293, 8.577942848205566, 8.946765899658203, 9.315589904785156, 9.684412956237793, 10.053236961364746, 10.422060012817383, 10.79088306427002, 11.159706115722656, 11.52853012084961, 11.897353172302246, 12.266176223754883]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 3.0, 7.0, 9.0, 9.0, 12.0, 11.0, 17.0, 20.0, 29.0, 20.0, 29.0, 30.0, 38.0, 37.0, 46.0, 47.0, 43.0, 54.0, 45.0, 58.0, 52.0, 59.0, 51.0, 33.0, 34.0, 39.0, 33.0, 23.0, 21.0, 20.0, 16.0, 8.0, 8.0, 4.0, 6.0, 9.0, 6.0, 1.0, 8.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.338496208190918, -9.068501472473145, -8.798506736755371, -8.528511047363281, -8.258516311645508, -7.988521575927734, -7.718526840209961, -7.4485321044921875, -7.178536891937256, -6.908542156219482, -6.638546943664551, -6.368552207946777, -6.098557472229004, -5.828562259674072, -5.558567523956299, -5.288572311401367, -5.018577575683594, -4.74858283996582, -4.478587627410889, -4.208592891693115, -3.9385979175567627, -3.66860294342041, -3.3986082077026367, -3.128613233566284, -2.8586182594299316, -2.588623285293579, -2.3186283111572266, -2.048633575439453, -1.7786386013031006, -1.508643627166748, -1.238648772239685, -0.9686539173126221, -0.6986584663391113, -0.42866355180740356, -0.1586686372756958, 0.11132627725601196, 0.3813211917877197, 0.6513161659240723, 0.9213110208511353, 1.1913058757781982, 1.4613008499145508, 1.7312958240509033, 2.001290798187256, 2.2712855339050293, 2.541280508041382, 2.8112754821777344, 3.081270217895508, 3.3512651920318604, 3.621260166168213, 3.8912551403045654, 4.161250114440918, 4.431244850158691, 4.701239585876465, 4.9712347984313965, 5.24122953414917, 5.511224746704102, 5.781219482421875, 6.051214218139648, 6.32120943069458, 6.5912041664123535, 6.861199378967285, 7.131194114685059, 7.401188850402832, 7.6711835861206055, 7.941178798675537]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 12.0, 9.0, 24.0, 37.0, 33.0, 51.0, 92.0, 90.0, 156.0, 205.0, 314.0, 441.0, 613.0, 939.0, 1484.0, 2363.0, 3868.0, 6561.0, 11258.0, 20798.0, 39475.0, 79208.0, 159218.0, 262598.0, 219084.0, 116100.0, 56685.0, 29100.0, 15358.0, 8728.0, 4993.0, 3024.0, 1875.0, 1181.0, 762.0, 528.0, 390.0, 239.0, 194.0, 129.0, 99.0, 62.0, 43.0, 36.0, 27.0, 10.0, 14.0, 13.0, 9.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.359375, -1.3178863525390625, -1.276397705078125, -1.2349090576171875, -1.19342041015625, -1.1519317626953125, -1.110443115234375, -1.0689544677734375, -1.0274658203125, -0.9859771728515625, -0.944488525390625, -0.9029998779296875, -0.86151123046875, -0.8200225830078125, -0.778533935546875, -0.7370452880859375, -0.695556640625, -0.6540679931640625, -0.612579345703125, -0.5710906982421875, -0.52960205078125, -0.4881134033203125, -0.446624755859375, -0.4051361083984375, -0.3636474609375, -0.3221588134765625, -0.280670166015625, -0.2391815185546875, -0.19769287109375, -0.1562042236328125, -0.114715576171875, -0.0732269287109375, -0.03173828125, 0.0097503662109375, 0.051239013671875, 0.0927276611328125, 0.13421630859375, 0.1757049560546875, 0.217193603515625, 0.2586822509765625, 0.3001708984375, 0.3416595458984375, 0.383148193359375, 0.4246368408203125, 0.46612548828125, 0.5076141357421875, 0.549102783203125, 0.5905914306640625, 0.632080078125, 0.6735687255859375, 0.715057373046875, 0.7565460205078125, 0.79803466796875, 0.8395233154296875, 0.881011962890625, 0.9225006103515625, 0.9639892578125, 1.0054779052734375, 1.046966552734375, 1.0884552001953125, 1.12994384765625, 1.1714324951171875, 1.212921142578125, 1.2544097900390625, 1.2958984375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 7.0, 14.0, 11.0, 16.0, 20.0, 20.0, 20.0, 24.0, 25.0, 30.0, 37.0, 29.0, 58.0, 49.0, 49.0, 54.0, 46.0, 65.0, 57.0, 49.0, 34.0, 42.0, 39.0, 32.0, 24.0, 42.0, 22.0, 12.0, 11.0, 8.0, 10.0, 5.0, 3.0, 9.0, 8.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0], "bins": [-10.4609375, -10.171630859375, -9.88232421875, -9.593017578125, -9.3037109375, -9.014404296875, -8.72509765625, -8.435791015625, -8.146484375, -7.857177734375, -7.56787109375, -7.278564453125, -6.9892578125, -6.699951171875, -6.41064453125, -6.121337890625, -5.83203125, -5.542724609375, -5.25341796875, -4.964111328125, -4.6748046875, -4.385498046875, -4.09619140625, -3.806884765625, -3.517578125, -3.228271484375, -2.93896484375, -2.649658203125, -2.3603515625, -2.071044921875, -1.78173828125, -1.492431640625, -1.203125, -0.913818359375, -0.62451171875, -0.335205078125, -0.0458984375, 0.243408203125, 0.53271484375, 0.822021484375, 1.111328125, 1.400634765625, 1.68994140625, 1.979248046875, 2.2685546875, 2.557861328125, 2.84716796875, 3.136474609375, 3.42578125, 3.715087890625, 4.00439453125, 4.293701171875, 4.5830078125, 4.872314453125, 5.16162109375, 5.450927734375, 5.740234375, 6.029541015625, 6.31884765625, 6.608154296875, 6.8974609375, 7.186767578125, 7.47607421875, 7.765380859375, 8.0546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 7.0, 11.0, 14.0, 17.0, 20.0, 40.0, 60.0, 104.0, 146.0, 180.0, 299.0, 501.0, 790.0, 1301.0, 2558.0, 5363.0, 13102.0, 42689.0, 878591.0, 71698.0, 17203.0, 6778.0, 3016.0, 1627.0, 916.0, 535.0, 339.0, 203.0, 151.0, 80.0, 65.0, 50.0, 31.0, 22.0, 12.0, 5.0, 11.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.48046875, -4.36138916015625, -4.2423095703125, -4.12322998046875, -4.004150390625, -3.88507080078125, -3.7659912109375, -3.64691162109375, -3.52783203125, -3.40875244140625, -3.2896728515625, -3.17059326171875, -3.051513671875, -2.93243408203125, -2.8133544921875, -2.69427490234375, -2.5751953125, -2.45611572265625, -2.3370361328125, -2.21795654296875, -2.098876953125, -1.97979736328125, -1.8607177734375, -1.74163818359375, -1.62255859375, -1.50347900390625, -1.3843994140625, -1.26531982421875, -1.146240234375, -1.02716064453125, -0.9080810546875, -0.78900146484375, -0.669921875, -0.55084228515625, -0.4317626953125, -0.31268310546875, -0.193603515625, -0.07452392578125, 0.0445556640625, 0.16363525390625, 0.28271484375, 0.40179443359375, 0.5208740234375, 0.63995361328125, 0.759033203125, 0.87811279296875, 0.9971923828125, 1.11627197265625, 1.2353515625, 1.35443115234375, 1.4735107421875, 1.59259033203125, 1.711669921875, 1.83074951171875, 1.9498291015625, 2.06890869140625, 2.18798828125, 2.30706787109375, 2.4261474609375, 2.54522705078125, 2.664306640625, 2.78338623046875, 2.9024658203125, 3.02154541015625, 3.140625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 11.0, 11.0, 11.0, 18.0, 19.0, 9.0, 23.0, 25.0, 29.0, 32.0, 34.0, 36.0, 41.0, 33.0, 38.0, 39.0, 43.0, 33.0, 51.0, 48.0, 37.0, 37.0, 36.0, 35.0, 34.0, 34.0, 25.0, 22.0, 27.0, 19.0, 18.0, 13.0, 17.0, 13.0, 14.0, 6.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90234375, -4.7457275390625, -4.589111328125, -4.4324951171875, -4.27587890625, -4.1192626953125, -3.962646484375, -3.8060302734375, -3.6494140625, -3.4927978515625, -3.336181640625, -3.1795654296875, -3.02294921875, -2.8663330078125, -2.709716796875, -2.5531005859375, -2.396484375, -2.2398681640625, -2.083251953125, -1.9266357421875, -1.77001953125, -1.6134033203125, -1.456787109375, -1.3001708984375, -1.1435546875, -0.9869384765625, -0.830322265625, -0.6737060546875, -0.51708984375, -0.3604736328125, -0.203857421875, -0.0472412109375, 0.109375, 0.2659912109375, 0.422607421875, 0.5792236328125, 0.73583984375, 0.8924560546875, 1.049072265625, 1.2056884765625, 1.3623046875, 1.5189208984375, 1.675537109375, 1.8321533203125, 1.98876953125, 2.1453857421875, 2.302001953125, 2.4586181640625, 2.615234375, 2.7718505859375, 2.928466796875, 3.0850830078125, 3.24169921875, 3.3983154296875, 3.554931640625, 3.7115478515625, 3.8681640625, 4.0247802734375, 4.181396484375, 4.3380126953125, 4.49462890625, 4.6512451171875, 4.807861328125, 4.9644775390625, 5.12109375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 10.0, 14.0, 27.0, 34.0, 54.0, 82.0, 113.0, 166.0, 248.0, 384.0, 609.0, 1124.0, 2240.0, 4454.0, 9659.0, 27056.0, 874968.0, 94088.0, 18362.0, 7305.0, 3466.0, 1631.0, 979.0, 554.0, 330.0, 208.0, 117.0, 77.0, 56.0, 36.0, 16.0, 20.0, 17.0, 12.0, 12.0, 9.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1669921875, -1.12506103515625, -1.0831298828125, -1.04119873046875, -0.999267578125, -0.95733642578125, -0.9154052734375, -0.87347412109375, -0.83154296875, -0.78961181640625, -0.7476806640625, -0.70574951171875, -0.663818359375, -0.62188720703125, -0.5799560546875, -0.53802490234375, -0.49609375, -0.45416259765625, -0.4122314453125, -0.37030029296875, -0.328369140625, -0.28643798828125, -0.2445068359375, -0.20257568359375, -0.16064453125, -0.11871337890625, -0.0767822265625, -0.03485107421875, 0.007080078125, 0.04901123046875, 0.0909423828125, 0.13287353515625, 0.1748046875, 0.21673583984375, 0.2586669921875, 0.30059814453125, 0.342529296875, 0.38446044921875, 0.4263916015625, 0.46832275390625, 0.51025390625, 0.55218505859375, 0.5941162109375, 0.63604736328125, 0.677978515625, 0.71990966796875, 0.7618408203125, 0.80377197265625, 0.845703125, 0.88763427734375, 0.9295654296875, 0.97149658203125, 1.013427734375, 1.05535888671875, 1.0972900390625, 1.13922119140625, 1.18115234375, 1.22308349609375, 1.2650146484375, 1.30694580078125, 1.348876953125, 1.39080810546875, 1.4327392578125, 1.47467041015625, 1.5166015625]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 8.0, 7.0, 11.0, 18.0, 27.0, 24.0, 24.0, 34.0, 31.0, 43.0, 57.0, 50.0, 49.0, 60.0, 61.0, 74.0, 45.0, 54.0, 51.0, 45.0, 40.0, 33.0, 32.0, 24.0, 18.0, 12.0, 10.0, 7.0, 6.0, 5.0, 0.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9114227294921875e-05, -4.7594308853149414e-05, -4.607439041137695e-05, -4.455447196960449e-05, -4.303455352783203e-05, -4.151463508605957e-05, -3.999471664428711e-05, -3.847479820251465e-05, -3.695487976074219e-05, -3.5434961318969727e-05, -3.3915042877197266e-05, -3.2395124435424805e-05, -3.0875205993652344e-05, -2.9355287551879883e-05, -2.7835369110107422e-05, -2.631545066833496e-05, -2.47955322265625e-05, -2.327561378479004e-05, -2.1755695343017578e-05, -2.0235776901245117e-05, -1.8715858459472656e-05, -1.7195940017700195e-05, -1.5676021575927734e-05, -1.4156103134155273e-05, -1.2636184692382812e-05, -1.1116266250610352e-05, -9.59634780883789e-06, -8.07642936706543e-06, -6.556510925292969e-06, -5.036592483520508e-06, -3.516674041748047e-06, -1.996755599975586e-06, -4.76837158203125e-07, 1.043081283569336e-06, 2.562999725341797e-06, 4.082918167114258e-06, 5.602836608886719e-06, 7.12275505065918e-06, 8.64267349243164e-06, 1.0162591934204102e-05, 1.1682510375976562e-05, 1.3202428817749023e-05, 1.4722347259521484e-05, 1.6242265701293945e-05, 1.7762184143066406e-05, 1.9282102584838867e-05, 2.0802021026611328e-05, 2.232193946838379e-05, 2.384185791015625e-05, 2.536177635192871e-05, 2.6881694793701172e-05, 2.8401613235473633e-05, 2.9921531677246094e-05, 3.1441450119018555e-05, 3.2961368560791016e-05, 3.4481287002563477e-05, 3.600120544433594e-05, 3.75211238861084e-05, 3.904104232788086e-05, 4.056096076965332e-05, 4.208087921142578e-05, 4.360079765319824e-05, 4.51207160949707e-05, 4.6640634536743164e-05, 4.8160552978515625e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 13.0, 17.0, 32.0, 40.0, 52.0, 71.0, 87.0, 160.0, 184.0, 288.0, 409.0, 594.0, 992.0, 1557.0, 2391.0, 3665.0, 6321.0, 10728.0, 18661.0, 34454.0, 67708.0, 145515.0, 272531.0, 240388.0, 117620.0, 55580.0, 28599.0, 15749.0, 9211.0, 5417.0, 3394.0, 2089.0, 1366.0, 840.0, 595.0, 354.0, 271.0, 199.0, 105.0, 76.0, 73.0, 48.0, 26.0, 16.0, 19.0, 7.0, 13.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.311767578125, -0.3013267517089844, -0.29088592529296875, -0.2804450988769531, -0.2700042724609375, -0.2595634460449219, -0.24912261962890625, -0.23868179321289062, -0.228240966796875, -0.21780014038085938, -0.20735931396484375, -0.19691848754882812, -0.1864776611328125, -0.17603683471679688, -0.16559600830078125, -0.15515518188476562, -0.14471435546875, -0.13427352905273438, -0.12383270263671875, -0.11339187622070312, -0.1029510498046875, -0.09251022338867188, -0.08206939697265625, -0.07162857055664062, -0.061187744140625, -0.050746917724609375, -0.04030609130859375, -0.029865264892578125, -0.0194244384765625, -0.008983612060546875, 0.00145721435546875, 0.011898040771484375, 0.0223388671875, 0.032779693603515625, 0.04322052001953125, 0.053661346435546875, 0.0641021728515625, 0.07454299926757812, 0.08498382568359375, 0.09542465209960938, 0.105865478515625, 0.11630630493164062, 0.12674713134765625, 0.13718795776367188, 0.1476287841796875, 0.15806961059570312, 0.16851043701171875, 0.17895126342773438, 0.18939208984375, 0.19983291625976562, 0.21027374267578125, 0.22071456909179688, 0.2311553955078125, 0.24159622192382812, 0.25203704833984375, 0.2624778747558594, 0.272918701171875, 0.2833595275878906, 0.29380035400390625, 0.3042411804199219, 0.3146820068359375, 0.3251228332519531, 0.33556365966796875, 0.3460044860839844, 0.3564453125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 12.0, 20.0, 19.0, 26.0, 31.0, 26.0, 54.0, 48.0, 52.0, 80.0, 76.0, 78.0, 67.0, 78.0, 54.0, 57.0, 42.0, 35.0, 29.0, 27.0, 18.0, 9.0, 9.0, 9.0, 12.0, 4.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0986328125, -0.09576606750488281, -0.09289932250976562, -0.09003257751464844, -0.08716583251953125, -0.08429908752441406, -0.08143234252929688, -0.07856559753417969, -0.0756988525390625, -0.07283210754394531, -0.06996536254882812, -0.06709861755371094, -0.06423187255859375, -0.06136512756347656, -0.058498382568359375, -0.05563163757324219, -0.052764892578125, -0.04989814758300781, -0.047031402587890625, -0.04416465759277344, -0.04129791259765625, -0.03843116760253906, -0.035564422607421875, -0.03269767761230469, -0.0298309326171875, -0.026964187622070312, -0.024097442626953125, -0.021230697631835938, -0.01836395263671875, -0.015497207641601562, -0.012630462646484375, -0.009763717651367188, -0.00689697265625, -0.0040302276611328125, -0.001163482666015625, 0.0017032623291015625, 0.00457000732421875, 0.0074367523193359375, 0.010303497314453125, 0.013170242309570312, 0.0160369873046875, 0.018903732299804688, 0.021770477294921875, 0.024637222290039062, 0.02750396728515625, 0.030370712280273438, 0.033237457275390625, 0.03610420227050781, 0.038970947265625, 0.04183769226074219, 0.044704437255859375, 0.04757118225097656, 0.05043792724609375, 0.05330467224121094, 0.056171417236328125, 0.05903816223144531, 0.0619049072265625, 0.06477165222167969, 0.06763839721679688, 0.07050514221191406, 0.07337188720703125, 0.07623863220214844, 0.07910537719726562, 0.08197212219238281, 0.0848388671875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 7.0, 9.0, 9.0, 13.0, 15.0, 21.0, 23.0, 37.0, 39.0, 52.0, 55.0, 82.0, 86.0, 82.0, 94.0, 74.0, 60.0, 53.0, 35.0, 33.0, 24.0, 19.0, 12.0, 8.0, 11.0, 11.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15794563293457, -10.789390563964844, -10.420836448669434, -10.052281379699707, -9.68372631072998, -9.31517219543457, -8.946617126464844, -8.578062057495117, -8.209507942199707, -7.840953350067139, -7.472398281097412, -7.103843688964844, -6.735289096832275, -6.366734504699707, -5.9981794357299805, -5.629624843597412, -5.2610697746276855, -4.892515182495117, -4.523960113525391, -4.155405521392822, -3.786850929260254, -3.4182960987091064, -3.049741268157959, -2.6811866760253906, -2.312631845474243, -1.9440771341323853, -1.5755224227905273, -1.2069675922393799, -0.838412880897522, -0.46985816955566406, -0.1013033390045166, 0.26725125312805176, 0.6358060836791992, 1.0043607950210571, 1.372915506362915, 1.7414703369140625, 2.110024929046631, 2.4785797595977783, 2.847134590148926, 3.215689182281494, 3.5842440128326416, 3.952798843383789, 4.321353435516357, 4.689908027648926, 5.058463096618652, 5.427017688751221, 5.795572280883789, 6.164127349853516, 6.532681941986084, 6.901236534118652, 7.269791603088379, 7.638346195220947, 8.006900787353516, 8.375455856323242, 8.744010925292969, 9.112565040588379, 9.481120109558105, 9.849675178527832, 10.218229293823242, 10.586784362792969, 10.955339431762695, 11.323893547058105, 11.692448616027832, 12.061002731323242, 12.429557800292969]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 11.0, 13.0, 14.0, 20.0, 32.0, 21.0, 26.0, 32.0, 36.0, 35.0, 47.0, 52.0, 39.0, 49.0, 50.0, 58.0, 51.0, 61.0, 50.0, 34.0, 36.0, 39.0, 31.0, 24.0, 21.0, 21.0, 16.0, 8.0, 7.0, 5.0, 5.0, 8.0, 7.0, 1.0, 8.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2908353805542, -9.021008491516113, -8.751181602478027, -8.481354713439941, -8.211527824401855, -7.9417009353637695, -7.671874523162842, -7.402047634124756, -7.13222074508667, -6.862393856048584, -6.592566967010498, -6.322740077972412, -6.052913665771484, -5.783086776733398, -5.5132598876953125, -5.243432998657227, -4.973606109619141, -4.703779220581055, -4.433952331542969, -4.164125442504883, -3.894298791885376, -3.62447190284729, -3.354645252227783, -3.0848183631896973, -2.8149914741516113, -2.5451645851135254, -2.2753376960754395, -2.0055110454559326, -1.7356841564178467, -1.4658572673797607, -1.1960304975509644, -0.926203727722168, -0.6563777923583984, -0.3865509629249573, -0.11672413349151611, 0.15310269594192505, 0.4229295253753662, 0.6927564144134521, 0.9625831842422485, 1.232409954071045, 1.5022368431091309, 1.7720637321472168, 2.0418906211853027, 2.3117172718048096, 2.5815441608428955, 2.8513710498809814, 3.1211977005004883, 3.391024589538574, 3.66085147857666, 3.930678367614746, 4.200505256652832, 4.470332145690918, 4.740159034729004, 5.00998592376709, 5.279812335968018, 5.5496392250061035, 5.8194661140441895, 6.089293003082275, 6.359119892120361, 6.628946781158447, 6.898773193359375, 7.168600082397461, 7.438426971435547, 7.708253860473633, 7.978080749511719]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 10.0, 14.0, 11.0, 29.0, 37.0, 41.0, 74.0, 92.0, 123.0, 194.0, 266.0, 400.0, 610.0, 1069.0, 1604.0, 2619.0, 4395.0, 7773.0, 13964.0, 26563.0, 51779.0, 100296.0, 174994.0, 227476.0, 190716.0, 114142.0, 60544.0, 31071.0, 15980.0, 8760.0, 4988.0, 2936.0, 1729.0, 1111.0, 714.0, 433.0, 326.0, 209.0, 138.0, 98.0, 71.0, 37.0, 43.0, 25.0, 12.0, 11.0, 8.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.03515625, -6.79754638671875, -6.5599365234375, -6.32232666015625, -6.084716796875, -5.84710693359375, -5.6094970703125, -5.37188720703125, -5.13427734375, -4.89666748046875, -4.6590576171875, -4.42144775390625, -4.183837890625, -3.94622802734375, -3.7086181640625, -3.47100830078125, -3.2333984375, -2.99578857421875, -2.7581787109375, -2.52056884765625, -2.282958984375, -2.04534912109375, -1.8077392578125, -1.57012939453125, -1.33251953125, -1.09490966796875, -0.8572998046875, -0.61968994140625, -0.382080078125, -0.14447021484375, 0.0931396484375, 0.33074951171875, 0.568359375, 0.80596923828125, 1.0435791015625, 1.28118896484375, 1.518798828125, 1.75640869140625, 1.9940185546875, 2.23162841796875, 2.46923828125, 2.70684814453125, 2.9444580078125, 3.18206787109375, 3.419677734375, 3.65728759765625, 3.8948974609375, 4.13250732421875, 4.3701171875, 4.60772705078125, 4.8453369140625, 5.08294677734375, 5.320556640625, 5.55816650390625, 5.7957763671875, 6.03338623046875, 6.27099609375, 6.50860595703125, 6.7462158203125, 6.98382568359375, 7.221435546875, 7.45904541015625, 7.6966552734375, 7.93426513671875, 8.171875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 12.0, 15.0, 14.0, 14.0, 24.0, 18.0, 18.0, 24.0, 45.0, 26.0, 47.0, 54.0, 53.0, 59.0, 42.0, 39.0, 44.0, 66.0, 48.0, 50.0, 34.0, 38.0, 31.0, 26.0, 24.0, 19.0, 18.0, 13.0, 11.0, 7.0, 4.0, 12.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.21875, -9.93756103515625, -9.6563720703125, -9.37518310546875, -9.093994140625, -8.81280517578125, -8.5316162109375, -8.25042724609375, -7.96923828125, -7.68804931640625, -7.4068603515625, -7.12567138671875, -6.844482421875, -6.56329345703125, -6.2821044921875, -6.00091552734375, -5.7197265625, -5.43853759765625, -5.1573486328125, -4.87615966796875, -4.594970703125, -4.31378173828125, -4.0325927734375, -3.75140380859375, -3.47021484375, -3.18902587890625, -2.9078369140625, -2.62664794921875, -2.345458984375, -2.06427001953125, -1.7830810546875, -1.50189208984375, -1.220703125, -0.93951416015625, -0.6583251953125, -0.37713623046875, -0.095947265625, 0.18524169921875, 0.4664306640625, 0.74761962890625, 1.02880859375, 1.30999755859375, 1.5911865234375, 1.87237548828125, 2.153564453125, 2.43475341796875, 2.7159423828125, 2.99713134765625, 3.2783203125, 3.55950927734375, 3.8406982421875, 4.12188720703125, 4.403076171875, 4.68426513671875, 4.9654541015625, 5.24664306640625, 5.52783203125, 5.80902099609375, 6.0902099609375, 6.37139892578125, 6.652587890625, 6.93377685546875, 7.2149658203125, 7.49615478515625, 7.77734375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 8.0, 10.0, 17.0, 26.0, 40.0, 52.0, 106.0, 138.0, 238.0, 350.0, 629.0, 1078.0, 1980.0, 3556.0, 7354.0, 16342.0, 39052.0, 95980.0, 215599.0, 301191.0, 207093.0, 90893.0, 36387.0, 15520.0, 7073.0, 3513.0, 1797.0, 976.0, 579.0, 353.0, 217.0, 148.0, 86.0, 56.0, 32.0, 27.0, 19.0, 5.0, 11.0, 3.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.0870361328125, -8.767822265625, -8.4486083984375, -8.12939453125, -7.8101806640625, -7.490966796875, -7.1717529296875, -6.8525390625, -6.5333251953125, -6.214111328125, -5.8948974609375, -5.57568359375, -5.2564697265625, -4.937255859375, -4.6180419921875, -4.298828125, -3.9796142578125, -3.660400390625, -3.3411865234375, -3.02197265625, -2.7027587890625, -2.383544921875, -2.0643310546875, -1.7451171875, -1.4259033203125, -1.106689453125, -0.7874755859375, -0.46826171875, -0.1490478515625, 0.170166015625, 0.4893798828125, 0.80859375, 1.1278076171875, 1.447021484375, 1.7662353515625, 2.08544921875, 2.4046630859375, 2.723876953125, 3.0430908203125, 3.3623046875, 3.6815185546875, 4.000732421875, 4.3199462890625, 4.63916015625, 4.9583740234375, 5.277587890625, 5.5968017578125, 5.916015625, 6.2352294921875, 6.554443359375, 6.8736572265625, 7.19287109375, 7.5120849609375, 7.831298828125, 8.1505126953125, 8.4697265625, 8.7889404296875, 9.108154296875, 9.4273681640625, 9.74658203125, 10.0657958984375, 10.385009765625, 10.7042236328125, 11.0234375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 2.0, 6.0, 9.0, 4.0, 14.0, 11.0, 24.0, 26.0, 26.0, 30.0, 33.0, 35.0, 34.0, 37.0, 31.0, 43.0, 38.0, 48.0, 43.0, 45.0, 41.0, 30.0, 35.0, 32.0, 36.0, 33.0, 31.0, 36.0, 32.0, 21.0, 17.0, 21.0, 18.0, 16.0, 11.0, 13.0, 3.0, 11.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.54296875, -4.40008544921875, -4.2572021484375, -4.11431884765625, -3.971435546875, -3.82855224609375, -3.6856689453125, -3.54278564453125, -3.39990234375, -3.25701904296875, -3.1141357421875, -2.97125244140625, -2.828369140625, -2.68548583984375, -2.5426025390625, -2.39971923828125, -2.2568359375, -2.11395263671875, -1.9710693359375, -1.82818603515625, -1.685302734375, -1.54241943359375, -1.3995361328125, -1.25665283203125, -1.11376953125, -0.97088623046875, -0.8280029296875, -0.68511962890625, -0.542236328125, -0.39935302734375, -0.2564697265625, -0.11358642578125, 0.029296875, 0.17218017578125, 0.3150634765625, 0.45794677734375, 0.600830078125, 0.74371337890625, 0.8865966796875, 1.02947998046875, 1.17236328125, 1.31524658203125, 1.4581298828125, 1.60101318359375, 1.743896484375, 1.88677978515625, 2.0296630859375, 2.17254638671875, 2.3154296875, 2.45831298828125, 2.6011962890625, 2.74407958984375, 2.886962890625, 3.02984619140625, 3.1727294921875, 3.31561279296875, 3.45849609375, 3.60137939453125, 3.7442626953125, 3.88714599609375, 4.030029296875, 4.17291259765625, 4.3157958984375, 4.45867919921875, 4.6015625]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 6.0, 4.0, 10.0, 13.0, 23.0, 40.0, 38.0, 48.0, 87.0, 98.0, 147.0, 222.0, 324.0, 453.0, 709.0, 1000.0, 1583.0, 2489.0, 4145.0, 6623.0, 11822.0, 20498.0, 37747.0, 70592.0, 132038.0, 215126.0, 223388.0, 144765.0, 78144.0, 41308.0, 22598.0, 12846.0, 7341.0, 4317.0, 2730.0, 1799.0, 1128.0, 721.0, 481.0, 329.0, 221.0, 168.0, 123.0, 65.0, 52.0, 46.0, 28.0, 27.0, 12.0, 11.0, 8.0, 6.0, 9.0, 2.0, 4.0, 0.0, 2.0], "bins": [-4.375, -4.24273681640625, -4.1104736328125, -3.97821044921875, -3.845947265625, -3.71368408203125, -3.5814208984375, -3.44915771484375, -3.31689453125, -3.18463134765625, -3.0523681640625, -2.92010498046875, -2.787841796875, -2.65557861328125, -2.5233154296875, -2.39105224609375, -2.2587890625, -2.12652587890625, -1.9942626953125, -1.86199951171875, -1.729736328125, -1.59747314453125, -1.4652099609375, -1.33294677734375, -1.20068359375, -1.06842041015625, -0.9361572265625, -0.80389404296875, -0.671630859375, -0.53936767578125, -0.4071044921875, -0.27484130859375, -0.142578125, -0.01031494140625, 0.1219482421875, 0.25421142578125, 0.386474609375, 0.51873779296875, 0.6510009765625, 0.78326416015625, 0.91552734375, 1.04779052734375, 1.1800537109375, 1.31231689453125, 1.444580078125, 1.57684326171875, 1.7091064453125, 1.84136962890625, 1.9736328125, 2.10589599609375, 2.2381591796875, 2.37042236328125, 2.502685546875, 2.63494873046875, 2.7672119140625, 2.89947509765625, 3.03173828125, 3.16400146484375, 3.2962646484375, 3.42852783203125, 3.560791015625, 3.69305419921875, 3.8253173828125, 3.95758056640625, 4.08984375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 11.0, 7.0, 4.0, 14.0, 11.0, 26.0, 42.0, 49.0, 54.0, 71.0, 84.0, 89.0, 84.0, 77.0, 85.0, 43.0, 38.0, 45.0, 43.0, 21.0, 18.0, 13.0, 14.0, 8.0, 3.0, 4.0, 6.0, 2.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0003750324249267578, -0.0003622807562351227, -0.00034952908754348755, -0.0003367774188518524, -0.0003240257501602173, -0.00031127408146858215, -0.000298522412776947, -0.0002857707440853119, -0.00027301907539367676, -0.0002602674067020416, -0.0002475157380104065, -0.00023476406931877136, -0.00022201240062713623, -0.0002092607319355011, -0.00019650906324386597, -0.00018375739455223083, -0.0001710057258605957, -0.00015825405716896057, -0.00014550238847732544, -0.0001327507197856903, -0.00011999905109405518, -0.00010724738240242004, -9.449571371078491e-05, -8.174404501914978e-05, -6.899237632751465e-05, -5.6240707635879517e-05, -4.3489038944244385e-05, -3.073737025260925e-05, -1.798570156097412e-05, -5.234032869338989e-06, 7.517635822296143e-06, 2.0269304513931274e-05, 3.3020973205566406e-05, 4.577264189720154e-05, 5.852431058883667e-05, 7.12759792804718e-05, 8.402764797210693e-05, 9.677931666374207e-05, 0.0001095309853553772, 0.00012228265404701233, 0.00013503432273864746, 0.0001477859914302826, 0.00016053766012191772, 0.00017328932881355286, 0.000186040997505188, 0.00019879266619682312, 0.00021154433488845825, 0.00022429600358009338, 0.00023704767227172852, 0.00024979934096336365, 0.0002625510096549988, 0.0002753026783466339, 0.00028805434703826904, 0.0003008060157299042, 0.0003135576844215393, 0.00032630935311317444, 0.00033906102180480957, 0.0003518126904964447, 0.00036456435918807983, 0.00037731602787971497, 0.0003900676965713501, 0.00040281936526298523, 0.00041557103395462036, 0.0004283227026462555, 0.0004410743713378906]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 5.0, 12.0, 8.0, 19.0, 25.0, 27.0, 61.0, 86.0, 116.0, 169.0, 276.0, 419.0, 576.0, 969.0, 1473.0, 2372.0, 4008.0, 6767.0, 12399.0, 23820.0, 47794.0, 103403.0, 204266.0, 269701.0, 186599.0, 91455.0, 43085.0, 21159.0, 11308.0, 6393.0, 3656.0, 2281.0, 1334.0, 870.0, 567.0, 329.0, 269.0, 130.0, 110.0, 78.0, 49.0, 32.0, 23.0, 18.0, 9.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.8046875, -4.656494140625, -4.50830078125, -4.360107421875, -4.2119140625, -4.063720703125, -3.91552734375, -3.767333984375, -3.619140625, -3.470947265625, -3.32275390625, -3.174560546875, -3.0263671875, -2.878173828125, -2.72998046875, -2.581787109375, -2.43359375, -2.285400390625, -2.13720703125, -1.989013671875, -1.8408203125, -1.692626953125, -1.54443359375, -1.396240234375, -1.248046875, -1.099853515625, -0.95166015625, -0.803466796875, -0.6552734375, -0.507080078125, -0.35888671875, -0.210693359375, -0.0625, 0.085693359375, 0.23388671875, 0.382080078125, 0.5302734375, 0.678466796875, 0.82666015625, 0.974853515625, 1.123046875, 1.271240234375, 1.41943359375, 1.567626953125, 1.7158203125, 1.864013671875, 2.01220703125, 2.160400390625, 2.30859375, 2.456787109375, 2.60498046875, 2.753173828125, 2.9013671875, 3.049560546875, 3.19775390625, 3.345947265625, 3.494140625, 3.642333984375, 3.79052734375, 3.938720703125, 4.0869140625, 4.235107421875, 4.38330078125, 4.531494140625, 4.6796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 4.0, 9.0, 10.0, 15.0, 14.0, 18.0, 16.0, 33.0, 36.0, 37.0, 46.0, 67.0, 56.0, 81.0, 81.0, 75.0, 70.0, 74.0, 59.0, 45.0, 41.0, 16.0, 21.0, 13.0, 13.0, 5.0, 10.0, 10.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.220703125, -1.1765594482421875, -1.132415771484375, -1.0882720947265625, -1.04412841796875, -0.9999847412109375, -0.955841064453125, -0.9116973876953125, -0.8675537109375, -0.8234100341796875, -0.779266357421875, -0.7351226806640625, -0.69097900390625, -0.6468353271484375, -0.602691650390625, -0.5585479736328125, -0.514404296875, -0.4702606201171875, -0.426116943359375, -0.3819732666015625, -0.33782958984375, -0.2936859130859375, -0.249542236328125, -0.2053985595703125, -0.1612548828125, -0.1171112060546875, -0.072967529296875, -0.0288238525390625, 0.01531982421875, 0.0594635009765625, 0.103607177734375, 0.1477508544921875, 0.19189453125, 0.2360382080078125, 0.280181884765625, 0.3243255615234375, 0.36846923828125, 0.4126129150390625, 0.456756591796875, 0.5009002685546875, 0.5450439453125, 0.5891876220703125, 0.633331298828125, 0.6774749755859375, 0.72161865234375, 0.7657623291015625, 0.809906005859375, 0.8540496826171875, 0.898193359375, 0.9423370361328125, 0.986480712890625, 1.0306243896484375, 1.07476806640625, 1.1189117431640625, 1.163055419921875, 1.2071990966796875, 1.2513427734375, 1.2954864501953125, 1.339630126953125, 1.3837738037109375, 1.42791748046875, 1.4720611572265625, 1.516204833984375, 1.5603485107421875, 1.6044921875]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 0.0, 5.0, 5.0, 7.0, 8.0, 10.0, 9.0, 15.0, 23.0, 29.0, 38.0, 34.0, 50.0, 60.0, 58.0, 91.0, 93.0, 89.0, 86.0, 56.0, 51.0, 44.0, 34.0, 21.0, 19.0, 12.0, 10.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4403076171875, -10.073962211608887, -9.707616806030273, -9.341270446777344, -8.97492504119873, -8.608579635620117, -8.242233276367188, -7.875887870788574, -7.509542465209961, -7.143197059631348, -6.776851177215576, -6.410505294799805, -6.044159889221191, -5.677814483642578, -5.311468601226807, -4.945122718811035, -4.578777313232422, -4.212431907653809, -3.846086025238037, -3.4797403812408447, -3.1133947372436523, -2.74704909324646, -2.3807034492492676, -2.014357805252075, -1.6480121612548828, -1.2816665172576904, -0.915320873260498, -0.5489752292633057, -0.18262958526611328, 0.1837160587310791, 0.5500617027282715, 0.9164073467254639, 1.2827520370483398, 1.6490976810455322, 2.0154433250427246, 2.381788969039917, 2.7481346130371094, 3.1144802570343018, 3.480825901031494, 3.8471715450286865, 4.213517189025879, 4.579862594604492, 4.946208477020264, 5.312554359436035, 5.678899765014648, 6.045245170593262, 6.411591053009033, 6.777936935424805, 7.144282341003418, 7.510627746582031, 7.876973628997803, 8.243319511413574, 8.609664916992188, 8.9760103225708, 9.342355728149414, 9.708702087402344, 10.075047492980957, 10.44139289855957, 10.8077392578125, 11.174084663391113, 11.540430068969727, 11.90677547454834, 12.273120880126953, 12.639467239379883, 13.005812644958496]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 6.0, 9.0, 14.0, 15.0, 12.0, 18.0, 26.0, 23.0, 31.0, 23.0, 28.0, 42.0, 35.0, 45.0, 52.0, 53.0, 57.0, 53.0, 55.0, 49.0, 48.0, 50.0, 39.0, 34.0, 26.0, 34.0, 26.0, 21.0, 16.0, 14.0, 12.0, 1.0, 7.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.169230461120605, -7.8959503173828125, -7.6226701736450195, -7.349390029907227, -7.076109886169434, -6.802829742431641, -6.529550075531006, -6.256269931793213, -5.98298978805542, -5.709709644317627, -5.436429500579834, -5.163149356842041, -4.889869689941406, -4.616589546203613, -4.34330940246582, -4.070029258728027, -3.7967491149902344, -3.5234689712524414, -3.2501888275146484, -2.9769089221954346, -2.7036287784576416, -2.4303486347198486, -2.1570687294006348, -1.8837885856628418, -1.6105084419250488, -1.3372282981872559, -1.0639482736587524, -0.7906681895256042, -0.517388105392456, -0.24410796165466309, 0.029172062873840332, 0.30245208740234375, 0.5757331848144531, 0.8490132689476013, 1.1222933530807495, 1.395573377609253, 1.668853521347046, 1.9421336650848389, 2.2154135704040527, 2.4886937141418457, 2.7619738578796387, 3.0352540016174316, 3.3085341453552246, 3.5818140506744385, 3.8550941944122314, 4.128374099731445, 4.401654243469238, 4.674934387207031, 4.948214530944824, 5.221494674682617, 5.49477481842041, 5.768054962158203, 6.041335105895996, 6.314615249633789, 6.587894916534424, 6.861175060272217, 7.13445520401001, 7.407735347747803, 7.681015491485596, 7.954295635223389, 8.227575302124023, 8.500855445861816, 8.77413558959961, 9.047415733337402, 9.320695877075195]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 10.0, 14.0, 21.0, 21.0, 32.0, 41.0, 54.0, 94.0, 120.0, 160.0, 262.0, 371.0, 522.0, 814.0, 1232.0, 2106.0, 3430.0, 5887.0, 10871.0, 23679.0, 63583.0, 243641.0, 1159808.0, 1928714.0, 556476.0, 119503.0, 37475.0, 15595.0, 7811.0, 4401.0, 2617.0, 1635.0, 1034.0, 692.0, 460.0, 330.0, 232.0, 155.0, 108.0, 75.0, 56.0, 42.0, 27.0, 21.0, 16.0, 16.0, 6.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-15.5078125, -15.027099609375, -14.54638671875, -14.065673828125, -13.5849609375, -13.104248046875, -12.62353515625, -12.142822265625, -11.662109375, -11.181396484375, -10.70068359375, -10.219970703125, -9.7392578125, -9.258544921875, -8.77783203125, -8.297119140625, -7.81640625, -7.335693359375, -6.85498046875, -6.374267578125, -5.8935546875, -5.412841796875, -4.93212890625, -4.451416015625, -3.970703125, -3.489990234375, -3.00927734375, -2.528564453125, -2.0478515625, -1.567138671875, -1.08642578125, -0.605712890625, -0.125, 0.355712890625, 0.83642578125, 1.317138671875, 1.7978515625, 2.278564453125, 2.75927734375, 3.239990234375, 3.720703125, 4.201416015625, 4.68212890625, 5.162841796875, 5.6435546875, 6.124267578125, 6.60498046875, 7.085693359375, 7.56640625, 8.047119140625, 8.52783203125, 9.008544921875, 9.4892578125, 9.969970703125, 10.45068359375, 10.931396484375, 11.412109375, 11.892822265625, 12.37353515625, 12.854248046875, 13.3349609375, 13.815673828125, 14.29638671875, 14.777099609375, 15.2578125]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 13.0, 7.0, 14.0, 14.0, 19.0, 20.0, 23.0, 30.0, 28.0, 38.0, 40.0, 51.0, 65.0, 68.0, 45.0, 56.0, 75.0, 62.0, 55.0, 49.0, 42.0, 31.0, 34.0, 21.0, 34.0, 13.0, 8.0, 13.0, 8.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.08447265625, -5.8681640625, -5.65185546875, -5.435546875, -5.21923828125, -5.0029296875, -4.78662109375, -4.5703125, -4.35400390625, -4.1376953125, -3.92138671875, -3.705078125, -3.48876953125, -3.2724609375, -3.05615234375, -2.83984375, -2.62353515625, -2.4072265625, -2.19091796875, -1.974609375, -1.75830078125, -1.5419921875, -1.32568359375, -1.109375, -0.89306640625, -0.6767578125, -0.46044921875, -0.244140625, -0.02783203125, 0.1884765625, 0.40478515625, 0.62109375, 0.83740234375, 1.0537109375, 1.27001953125, 1.486328125, 1.70263671875, 1.9189453125, 2.13525390625, 2.3515625, 2.56787109375, 2.7841796875, 3.00048828125, 3.216796875, 3.43310546875, 3.6494140625, 3.86572265625, 4.08203125, 4.29833984375, 4.5146484375, 4.73095703125, 4.947265625, 5.16357421875, 5.3798828125, 5.59619140625, 5.8125, 6.02880859375, 6.2451171875, 6.46142578125, 6.677734375, 6.89404296875, 7.1103515625, 7.32666015625, 7.54296875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 3.0, 9.0, 19.0, 13.0, 17.0, 24.0, 39.0, 50.0, 84.0, 100.0, 134.0, 252.0, 303.0, 510.0, 735.0, 1147.0, 1921.0, 3219.0, 5492.0, 9775.0, 19376.0, 41910.0, 104599.0, 326941.0, 1211883.0, 1682002.0, 519172.0, 152951.0, 56763.0, 25128.0, 12452.0, 6767.0, 3933.0, 2343.0, 1455.0, 933.0, 589.0, 393.0, 255.0, 177.0, 101.0, 85.0, 57.0, 42.0, 40.0, 24.0, 13.0, 10.0, 11.0, 11.0, 4.0, 4.0, 4.0, 1.0, 4.0], "bins": [-15.8125, -15.349853515625, -14.88720703125, -14.424560546875, -13.9619140625, -13.499267578125, -13.03662109375, -12.573974609375, -12.111328125, -11.648681640625, -11.18603515625, -10.723388671875, -10.2607421875, -9.798095703125, -9.33544921875, -8.872802734375, -8.41015625, -7.947509765625, -7.48486328125, -7.022216796875, -6.5595703125, -6.096923828125, -5.63427734375, -5.171630859375, -4.708984375, -4.246337890625, -3.78369140625, -3.321044921875, -2.8583984375, -2.395751953125, -1.93310546875, -1.470458984375, -1.0078125, -0.545166015625, -0.08251953125, 0.380126953125, 0.8427734375, 1.305419921875, 1.76806640625, 2.230712890625, 2.693359375, 3.156005859375, 3.61865234375, 4.081298828125, 4.5439453125, 5.006591796875, 5.46923828125, 5.931884765625, 6.39453125, 6.857177734375, 7.31982421875, 7.782470703125, 8.2451171875, 8.707763671875, 9.17041015625, 9.633056640625, 10.095703125, 10.558349609375, 11.02099609375, 11.483642578125, 11.9462890625, 12.408935546875, 12.87158203125, 13.334228515625, 13.796875]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 10.0, 17.0, 18.0, 13.0, 31.0, 26.0, 32.0, 49.0, 48.0, 81.0, 128.0, 125.0, 217.0, 219.0, 235.0, 301.0, 331.0, 349.0, 323.0, 293.0, 235.0, 202.0, 162.0, 118.0, 103.0, 71.0, 73.0, 50.0, 49.0, 22.0, 29.0, 20.0, 13.0, 15.0, 10.0, 12.0, 10.0, 4.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9453125, -2.851226806640625, -2.75714111328125, -2.663055419921875, -2.5689697265625, -2.474884033203125, -2.38079833984375, -2.286712646484375, -2.192626953125, -2.098541259765625, -2.00445556640625, -1.910369873046875, -1.8162841796875, -1.722198486328125, -1.62811279296875, -1.534027099609375, -1.43994140625, -1.345855712890625, -1.25177001953125, -1.157684326171875, -1.0635986328125, -0.969512939453125, -0.87542724609375, -0.781341552734375, -0.687255859375, -0.593170166015625, -0.49908447265625, -0.404998779296875, -0.3109130859375, -0.216827392578125, -0.12274169921875, -0.028656005859375, 0.0654296875, 0.159515380859375, 0.25360107421875, 0.347686767578125, 0.4417724609375, 0.535858154296875, 0.62994384765625, 0.724029541015625, 0.818115234375, 0.912200927734375, 1.00628662109375, 1.100372314453125, 1.1944580078125, 1.288543701171875, 1.38262939453125, 1.476715087890625, 1.57080078125, 1.664886474609375, 1.75897216796875, 1.853057861328125, 1.9471435546875, 2.041229248046875, 2.13531494140625, 2.229400634765625, 2.323486328125, 2.417572021484375, 2.51165771484375, 2.605743408203125, 2.6998291015625, 2.793914794921875, 2.88800048828125, 2.982086181640625, 3.076171875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 10.0, 12.0, 6.0, 5.0, 16.0, 16.0, 18.0, 22.0, 34.0, 37.0, 54.0, 69.0, 69.0, 91.0, 93.0, 86.0, 75.0, 67.0, 43.0, 44.0, 30.0, 22.0, 13.0, 14.0, 9.0, 10.0, 7.0, 3.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.406476020812988, -9.044198036193848, -8.681920051574707, -8.319642066955566, -7.957364082336426, -7.595086097717285, -7.2328081130981445, -6.870530128479004, -6.508252143859863, -6.145974159240723, -5.783696174621582, -5.421418190002441, -5.059140205383301, -4.69686222076416, -4.3345842361450195, -3.972306251525879, -3.6100282669067383, -3.2477502822875977, -2.885472297668457, -2.5231943130493164, -2.160916328430176, -1.7986383438110352, -1.4363603591918945, -1.074082374572754, -0.7118043899536133, -0.34952640533447266, 0.012751579284667969, 0.3750295639038086, 0.7373075485229492, 1.0995855331420898, 1.4618635177612305, 1.824141502380371, 2.186420440673828, 2.5486984252929688, 2.9109764099121094, 3.27325439453125, 3.6355323791503906, 3.9978103637695312, 4.360088348388672, 4.7223663330078125, 5.084644317626953, 5.446922302246094, 5.809200286865234, 6.171478271484375, 6.533756256103516, 6.896034240722656, 7.258312225341797, 7.6205902099609375, 7.982868194580078, 8.345146179199219, 8.70742416381836, 9.0697021484375, 9.43198013305664, 9.794258117675781, 10.156536102294922, 10.518814086914062, 10.881092071533203, 11.243370056152344, 11.605648040771484, 11.967926025390625, 12.330204010009766, 12.692481994628906, 13.054759979248047, 13.417037963867188, 13.779315948486328]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 8.0, 20.0, 14.0, 19.0, 27.0, 20.0, 23.0, 18.0, 28.0, 28.0, 27.0, 42.0, 42.0, 51.0, 38.0, 52.0, 44.0, 56.0, 56.0, 38.0, 48.0, 38.0, 40.0, 38.0, 26.0, 29.0, 16.0, 16.0, 21.0, 16.0, 9.0, 13.0, 6.0, 7.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3856658935546875, -7.149116039276123, -6.912566184997559, -6.676016807556152, -6.439466953277588, -6.202917098999023, -5.966367244720459, -5.7298173904418945, -5.49326753616333, -5.256717681884766, -5.020167827606201, -4.783617973327637, -4.5470685958862305, -4.310518741607666, -4.073968887329102, -3.837419033050537, -3.6008694171905518, -3.3643195629119873, -3.127769947052002, -2.8912200927734375, -2.654670238494873, -2.4181203842163086, -2.1815707683563232, -1.9450209140777588, -1.7084711790084839, -1.471921443939209, -1.2353715896606445, -0.9988218545913696, -0.76227205991745, -0.5257222652435303, -0.28917253017425537, -0.05262267589569092, 0.18392705917358398, 0.42047685384750366, 0.6570266485214233, 0.8935763835906982, 1.1301262378692627, 1.3666759729385376, 1.6032257080078125, 1.839775562286377, 2.0763254165649414, 2.312875270843506, 2.549424886703491, 2.7859747409820557, 3.02252459526062, 3.2590742111206055, 3.49562406539917, 3.7321739196777344, 3.9687235355377197, 4.205273151397705, 4.4418230056762695, 4.678372859954834, 4.914922714233398, 5.151472568511963, 5.388022422790527, 5.624571800231934, 5.861121654510498, 6.0976715087890625, 6.334221363067627, 6.570771217346191, 6.807320594787598, 7.043870449066162, 7.280420303344727, 7.516970157623291, 7.7535200119018555]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 4.0, 11.0, 10.0, 18.0, 27.0, 38.0, 39.0, 58.0, 99.0, 132.0, 187.0, 285.0, 394.0, 607.0, 908.0, 1331.0, 2128.0, 3333.0, 5019.0, 8148.0, 13186.0, 21955.0, 37451.0, 65452.0, 114441.0, 185501.0, 214867.0, 154100.0, 89968.0, 51465.0, 30362.0, 17523.0, 10628.0, 6658.0, 4238.0, 2678.0, 1748.0, 1129.0, 779.0, 504.0, 345.0, 260.0, 162.0, 115.0, 77.0, 56.0, 37.0, 28.0, 24.0, 8.0, 13.0, 11.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0], "bins": [-0.82275390625, -0.797271728515625, -0.77178955078125, -0.746307373046875, -0.7208251953125, -0.695343017578125, -0.66986083984375, -0.644378662109375, -0.618896484375, -0.593414306640625, -0.56793212890625, -0.542449951171875, -0.5169677734375, -0.491485595703125, -0.46600341796875, -0.440521240234375, -0.4150390625, -0.389556884765625, -0.36407470703125, -0.338592529296875, -0.3131103515625, -0.287628173828125, -0.26214599609375, -0.236663818359375, -0.211181640625, -0.185699462890625, -0.16021728515625, -0.134735107421875, -0.1092529296875, -0.083770751953125, -0.05828857421875, -0.032806396484375, -0.00732421875, 0.018157958984375, 0.04364013671875, 0.069122314453125, 0.0946044921875, 0.120086669921875, 0.14556884765625, 0.171051025390625, 0.196533203125, 0.222015380859375, 0.24749755859375, 0.272979736328125, 0.2984619140625, 0.323944091796875, 0.34942626953125, 0.374908447265625, 0.400390625, 0.425872802734375, 0.45135498046875, 0.476837158203125, 0.5023193359375, 0.527801513671875, 0.55328369140625, 0.578765869140625, 0.604248046875, 0.629730224609375, 0.65521240234375, 0.680694580078125, 0.7061767578125, 0.731658935546875, 0.75714111328125, 0.782623291015625, 0.80810546875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 14.0, 16.0, 21.0, 21.0, 20.0, 18.0, 32.0, 20.0, 37.0, 35.0, 39.0, 42.0, 37.0, 57.0, 52.0, 49.0, 55.0, 49.0, 53.0, 50.0, 48.0, 33.0, 36.0, 24.0, 18.0, 18.0, 18.0, 14.0, 7.0, 10.0, 10.0, 11.0, 3.0, 8.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.4915771484375, -8.217529296875, -7.9434814453125, -7.66943359375, -7.3953857421875, -7.121337890625, -6.8472900390625, -6.5732421875, -6.2991943359375, -6.025146484375, -5.7510986328125, -5.47705078125, -5.2030029296875, -4.928955078125, -4.6549072265625, -4.380859375, -4.1068115234375, -3.832763671875, -3.5587158203125, -3.28466796875, -3.0106201171875, -2.736572265625, -2.4625244140625, -2.1884765625, -1.9144287109375, -1.640380859375, -1.3663330078125, -1.09228515625, -0.8182373046875, -0.544189453125, -0.2701416015625, 0.00390625, 0.2779541015625, 0.552001953125, 0.8260498046875, 1.10009765625, 1.3741455078125, 1.648193359375, 1.9222412109375, 2.1962890625, 2.4703369140625, 2.744384765625, 3.0184326171875, 3.29248046875, 3.5665283203125, 3.840576171875, 4.1146240234375, 4.388671875, 4.6627197265625, 4.936767578125, 5.2108154296875, 5.48486328125, 5.7589111328125, 6.032958984375, 6.3070068359375, 6.5810546875, 6.8551025390625, 7.129150390625, 7.4031982421875, 7.67724609375, 7.9512939453125, 8.225341796875, 8.4993896484375, 8.7734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 9.0, 9.0, 10.0, 24.0, 32.0, 44.0, 57.0, 61.0, 90.0, 133.0, 194.0, 319.0, 454.0, 742.0, 1261.0, 2164.0, 4074.0, 8697.0, 21303.0, 103699.0, 833595.0, 42850.0, 14763.0, 6358.0, 3160.0, 1659.0, 936.0, 595.0, 388.0, 260.0, 178.0, 116.0, 88.0, 53.0, 51.0, 39.0, 28.0, 25.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.859375, -2.77349853515625, -2.6876220703125, -2.60174560546875, -2.515869140625, -2.42999267578125, -2.3441162109375, -2.25823974609375, -2.17236328125, -2.08648681640625, -2.0006103515625, -1.91473388671875, -1.828857421875, -1.74298095703125, -1.6571044921875, -1.57122802734375, -1.4853515625, -1.39947509765625, -1.3135986328125, -1.22772216796875, -1.141845703125, -1.05596923828125, -0.9700927734375, -0.88421630859375, -0.79833984375, -0.71246337890625, -0.6265869140625, -0.54071044921875, -0.454833984375, -0.36895751953125, -0.2830810546875, -0.19720458984375, -0.111328125, -0.02545166015625, 0.0604248046875, 0.14630126953125, 0.232177734375, 0.31805419921875, 0.4039306640625, 0.48980712890625, 0.57568359375, 0.66156005859375, 0.7474365234375, 0.83331298828125, 0.919189453125, 1.00506591796875, 1.0909423828125, 1.17681884765625, 1.2626953125, 1.34857177734375, 1.4344482421875, 1.52032470703125, 1.606201171875, 1.69207763671875, 1.7779541015625, 1.86383056640625, 1.94970703125, 2.03558349609375, 2.1214599609375, 2.20733642578125, 2.293212890625, 2.37908935546875, 2.4649658203125, 2.55084228515625, 2.63671875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 11.0, 8.0, 9.0, 16.0, 16.0, 16.0, 24.0, 15.0, 27.0, 26.0, 27.0, 40.0, 24.0, 38.0, 38.0, 60.0, 49.0, 54.0, 40.0, 49.0, 36.0, 49.0, 40.0, 41.0, 39.0, 35.0, 20.0, 34.0, 25.0, 19.0, 10.0, 7.0, 14.0, 10.0, 10.0, 6.0, 8.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.65625, -5.49835205078125, -5.3404541015625, -5.18255615234375, -5.024658203125, -4.86676025390625, -4.7088623046875, -4.55096435546875, -4.39306640625, -4.23516845703125, -4.0772705078125, -3.91937255859375, -3.761474609375, -3.60357666015625, -3.4456787109375, -3.28778076171875, -3.1298828125, -2.97198486328125, -2.8140869140625, -2.65618896484375, -2.498291015625, -2.34039306640625, -2.1824951171875, -2.02459716796875, -1.86669921875, -1.70880126953125, -1.5509033203125, -1.39300537109375, -1.235107421875, -1.07720947265625, -0.9193115234375, -0.76141357421875, -0.603515625, -0.44561767578125, -0.2877197265625, -0.12982177734375, 0.028076171875, 0.18597412109375, 0.3438720703125, 0.50177001953125, 0.65966796875, 0.81756591796875, 0.9754638671875, 1.13336181640625, 1.291259765625, 1.44915771484375, 1.6070556640625, 1.76495361328125, 1.9228515625, 2.08074951171875, 2.2386474609375, 2.39654541015625, 2.554443359375, 2.71234130859375, 2.8702392578125, 3.02813720703125, 3.18603515625, 3.34393310546875, 3.5018310546875, 3.65972900390625, 3.817626953125, 3.97552490234375, 4.1334228515625, 4.29132080078125, 4.44921875]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 7.0, 5.0, 10.0, 21.0, 29.0, 31.0, 34.0, 70.0, 112.0, 129.0, 185.0, 341.0, 538.0, 1039.0, 1870.0, 3832.0, 8554.0, 23764.0, 797469.0, 175834.0, 19850.0, 7507.0, 3295.0, 1697.0, 906.0, 513.0, 335.0, 171.0, 127.0, 91.0, 46.0, 25.0, 35.0, 19.0, 11.0, 10.0, 11.0, 12.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7666015625, -0.737030029296875, -0.70745849609375, -0.677886962890625, -0.6483154296875, -0.618743896484375, -0.58917236328125, -0.559600830078125, -0.530029296875, -0.500457763671875, -0.47088623046875, -0.441314697265625, -0.4117431640625, -0.382171630859375, -0.35260009765625, -0.323028564453125, -0.29345703125, -0.263885498046875, -0.23431396484375, -0.204742431640625, -0.1751708984375, -0.145599365234375, -0.11602783203125, -0.086456298828125, -0.056884765625, -0.027313232421875, 0.00225830078125, 0.031829833984375, 0.0614013671875, 0.090972900390625, 0.12054443359375, 0.150115966796875, 0.1796875, 0.209259033203125, 0.23883056640625, 0.268402099609375, 0.2979736328125, 0.327545166015625, 0.35711669921875, 0.386688232421875, 0.416259765625, 0.445831298828125, 0.47540283203125, 0.504974365234375, 0.5345458984375, 0.564117431640625, 0.59368896484375, 0.623260498046875, 0.65283203125, 0.682403564453125, 0.71197509765625, 0.741546630859375, 0.7711181640625, 0.800689697265625, 0.83026123046875, 0.859832763671875, 0.889404296875, 0.918975830078125, 0.94854736328125, 0.978118896484375, 1.0076904296875, 1.037261962890625, 1.06683349609375, 1.096405029296875, 1.1259765625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 5.0, 12.0, 8.0, 9.0, 11.0, 9.0, 8.0, 19.0, 12.0, 26.0, 20.0, 26.0, 22.0, 19.0, 22.0, 30.0, 35.0, 32.0, 31.0, 47.0, 38.0, 40.0, 41.0, 45.0, 57.0, 35.0, 34.0, 41.0, 33.0, 31.0, 30.0, 28.0, 29.0, 18.0, 17.0, 8.0, 15.0, 11.0, 9.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0], "bins": [-3.844499588012695e-05, -3.745127469301224e-05, -3.645755350589752e-05, -3.5463832318782806e-05, -3.447011113166809e-05, -3.3476389944553375e-05, -3.248266875743866e-05, -3.1488947570323944e-05, -3.049522638320923e-05, -2.9501505196094513e-05, -2.8507784008979797e-05, -2.7514062821865082e-05, -2.6520341634750366e-05, -2.552662044763565e-05, -2.4532899260520935e-05, -2.353917807340622e-05, -2.2545456886291504e-05, -2.155173569917679e-05, -2.0558014512062073e-05, -1.9564293324947357e-05, -1.857057213783264e-05, -1.7576850950717926e-05, -1.658312976360321e-05, -1.5589408576488495e-05, -1.459568738937378e-05, -1.3601966202259064e-05, -1.2608245015144348e-05, -1.1614523828029633e-05, -1.0620802640914917e-05, -9.627081453800201e-06, -8.633360266685486e-06, -7.63963907957077e-06, -6.645917892456055e-06, -5.652196705341339e-06, -4.6584755182266235e-06, -3.664754331111908e-06, -2.6710331439971924e-06, -1.6773119568824768e-06, -6.835907697677612e-07, 3.1013041734695435e-07, 1.30385160446167e-06, 2.2975727915763855e-06, 3.291293978691101e-06, 4.285015165805817e-06, 5.278736352920532e-06, 6.272457540035248e-06, 7.266178727149963e-06, 8.259899914264679e-06, 9.253621101379395e-06, 1.024734228849411e-05, 1.1241063475608826e-05, 1.2234784662723541e-05, 1.3228505849838257e-05, 1.4222227036952972e-05, 1.5215948224067688e-05, 1.6209669411182404e-05, 1.720339059829712e-05, 1.8197111785411835e-05, 1.919083297252655e-05, 2.0184554159641266e-05, 2.117827534675598e-05, 2.2171996533870697e-05, 2.3165717720985413e-05, 2.4159438908100128e-05, 2.5153160095214844e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 13.0, 14.0, 20.0, 43.0, 44.0, 81.0, 88.0, 135.0, 228.0, 384.0, 598.0, 1007.0, 1732.0, 3224.0, 6335.0, 13171.0, 30248.0, 78118.0, 216410.0, 380818.0, 193215.0, 70238.0, 27397.0, 11919.0, 5918.0, 3010.0, 1617.0, 954.0, 579.0, 336.0, 213.0, 132.0, 96.0, 65.0, 48.0, 29.0, 18.0, 12.0, 11.0, 15.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.384521484375, -0.3736724853515625, -0.362823486328125, -0.3519744873046875, -0.34112548828125, -0.3302764892578125, -0.319427490234375, -0.3085784912109375, -0.2977294921875, -0.2868804931640625, -0.276031494140625, -0.2651824951171875, -0.25433349609375, -0.2434844970703125, -0.232635498046875, -0.2217864990234375, -0.2109375, -0.2000885009765625, -0.189239501953125, -0.1783905029296875, -0.16754150390625, -0.1566925048828125, -0.145843505859375, -0.1349945068359375, -0.1241455078125, -0.1132965087890625, -0.102447509765625, -0.0915985107421875, -0.08074951171875, -0.0699005126953125, -0.059051513671875, -0.0482025146484375, -0.037353515625, -0.0265045166015625, -0.015655517578125, -0.0048065185546875, 0.00604248046875, 0.0168914794921875, 0.027740478515625, 0.0385894775390625, 0.0494384765625, 0.0602874755859375, 0.071136474609375, 0.0819854736328125, 0.09283447265625, 0.1036834716796875, 0.114532470703125, 0.1253814697265625, 0.13623046875, 0.1470794677734375, 0.157928466796875, 0.1687774658203125, 0.17962646484375, 0.1904754638671875, 0.201324462890625, 0.2121734619140625, 0.2230224609375, 0.2338714599609375, 0.244720458984375, 0.2555694580078125, 0.26641845703125, 0.2772674560546875, 0.288116455078125, 0.2989654541015625, 0.309814453125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 6.0, 4.0, 7.0, 2.0, 11.0, 8.0, 8.0, 13.0, 20.0, 27.0, 26.0, 36.0, 60.0, 42.0, 55.0, 71.0, 67.0, 76.0, 83.0, 64.0, 71.0, 53.0, 38.0, 33.0, 31.0, 23.0, 13.0, 10.0, 12.0, 9.0, 4.0, 6.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08221435546875, -0.08006572723388672, -0.07791709899902344, -0.07576847076416016, -0.07361984252929688, -0.0714712142944336, -0.06932258605957031, -0.06717395782470703, -0.06502532958984375, -0.06287670135498047, -0.06072807312011719, -0.058579444885253906, -0.056430816650390625, -0.054282188415527344, -0.05213356018066406, -0.04998493194580078, -0.0478363037109375, -0.04568767547607422, -0.04353904724121094, -0.041390419006347656, -0.039241790771484375, -0.037093162536621094, -0.03494453430175781, -0.03279590606689453, -0.03064727783203125, -0.02849864959716797, -0.026350021362304688, -0.024201393127441406, -0.022052764892578125, -0.019904136657714844, -0.017755508422851562, -0.015606880187988281, -0.013458251953125, -0.011309623718261719, -0.009160995483398438, -0.007012367248535156, -0.004863739013671875, -0.0027151107788085938, -0.0005664825439453125, 0.0015821456909179688, 0.00373077392578125, 0.005879402160644531, 0.008028030395507812, 0.010176658630371094, 0.012325286865234375, 0.014473915100097656, 0.016622543334960938, 0.01877117156982422, 0.0209197998046875, 0.02306842803955078, 0.025217056274414062, 0.027365684509277344, 0.029514312744140625, 0.031662940979003906, 0.03381156921386719, 0.03596019744873047, 0.03810882568359375, 0.04025745391845703, 0.04240608215332031, 0.044554710388183594, 0.046703338623046875, 0.048851966857910156, 0.05100059509277344, 0.05314922332763672, 0.0552978515625]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 6.0, 10.0, 12.0, 5.0, 5.0, 18.0, 16.0, 15.0, 23.0, 36.0, 30.0, 58.0, 69.0, 64.0, 87.0, 91.0, 90.0, 75.0, 70.0, 44.0, 42.0, 31.0, 23.0, 12.0, 17.0, 8.0, 8.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.22718620300293, -8.87287712097168, -8.51856803894043, -8.16425895690918, -7.80994987487793, -7.45564079284668, -7.10133171081543, -6.74702262878418, -6.39271354675293, -6.03840446472168, -5.68409538269043, -5.32978630065918, -4.97547721862793, -4.62116813659668, -4.26685905456543, -3.9125497341156006, -3.5582404136657715, -3.2039313316345215, -2.8496222496032715, -2.4953131675720215, -2.1410040855407715, -1.786694884300232, -1.4323856830596924, -1.0780766010284424, -0.7237675189971924, -0.36945840716362, -0.015149295330047607, 0.33915984630584717, 0.6934689283370972, 1.0477780103683472, 1.4020872116088867, 1.7563962936401367, 2.1107053756713867, 2.4650144577026367, 2.8193235397338867, 3.1736326217651367, 3.5279417037963867, 3.8822507858276367, 4.236559867858887, 4.590868949890137, 4.945178031921387, 5.299487113952637, 5.653796195983887, 6.008105278015137, 6.362414360046387, 6.716723442077637, 7.071032524108887, 7.425341606140137, 7.779651165008545, 8.133960723876953, 8.488269805908203, 8.842578887939453, 9.196887969970703, 9.551197052001953, 9.905506134033203, 10.259815216064453, 10.614124298095703, 10.968433380126953, 11.322742462158203, 11.677051544189453, 12.031360626220703, 12.385669708251953, 12.739978790283203, 13.094287872314453, 13.448596954345703]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 0.0, 8.0, 7.0, 18.0, 14.0, 22.0, 21.0, 24.0, 21.0, 17.0, 31.0, 26.0, 30.0, 37.0, 43.0, 52.0, 38.0, 50.0, 42.0, 59.0, 51.0, 42.0, 47.0, 46.0, 37.0, 40.0, 22.0, 31.0, 19.0, 13.0, 20.0, 17.0, 8.0, 15.0, 7.0, 7.0, 2.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.396720886230469, -7.160707950592041, -6.924694538116455, -6.688681602478027, -6.452668190002441, -6.216655254364014, -5.980642318725586, -5.74462890625, -5.508615970611572, -5.2726030349731445, -5.036589622497559, -4.800576686859131, -4.564563751220703, -4.328550338745117, -4.0925374031066895, -3.8565242290496826, -3.620511054992676, -3.384497880935669, -3.148484706878662, -2.9124717712402344, -2.6764585971832275, -2.4404454231262207, -2.204432487487793, -1.9684193134307861, -1.7324061393737793, -1.4963929653167725, -1.2603799104690552, -1.024366855621338, -0.788353681564331, -0.5523405075073242, -0.31632745265960693, -0.08031439781188965, 0.1556987762451172, 0.39171189069747925, 0.6277250051498413, 0.8637381196022034, 1.0997512340545654, 1.3357644081115723, 1.5717774629592896, 1.8077905178070068, 2.0438036918640137, 2.2798168659210205, 2.5158300399780273, 2.751842975616455, 2.987856149673462, 3.2238693237304688, 3.4598822593688965, 3.6958954334259033, 3.93190860748291, 4.167921543121338, 4.403934955596924, 4.639947891235352, 4.8759613037109375, 5.111974239349365, 5.347987174987793, 5.584000587463379, 5.820013523101807, 6.056026458740234, 6.29203987121582, 6.528052806854248, 6.764065742492676, 7.000079154968262, 7.2360920906066895, 7.472105026245117, 7.708118438720703]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 4.0, 4.0, 11.0, 15.0, 24.0, 35.0, 39.0, 79.0, 93.0, 153.0, 221.0, 290.0, 517.0, 754.0, 1226.0, 1988.0, 3521.0, 6057.0, 11231.0, 21499.0, 42916.0, 86420.0, 162521.0, 231918.0, 212181.0, 129254.0, 65542.0, 32923.0, 16348.0, 8641.0, 4776.0, 2776.0, 1655.0, 1060.0, 597.0, 416.0, 268.0, 161.0, 126.0, 83.0, 44.0, 40.0, 33.0, 30.0, 15.0, 15.0, 10.0, 5.0, 6.0, 2.0, 6.0, 0.0, 0.0, 2.0], "bins": [-7.35546875, -7.13787841796875, -6.9202880859375, -6.70269775390625, -6.485107421875, -6.26751708984375, -6.0499267578125, -5.83233642578125, -5.61474609375, -5.39715576171875, -5.1795654296875, -4.96197509765625, -4.744384765625, -4.52679443359375, -4.3092041015625, -4.09161376953125, -3.8740234375, -3.65643310546875, -3.4388427734375, -3.22125244140625, -3.003662109375, -2.78607177734375, -2.5684814453125, -2.35089111328125, -2.13330078125, -1.91571044921875, -1.6981201171875, -1.48052978515625, -1.262939453125, -1.04534912109375, -0.8277587890625, -0.61016845703125, -0.392578125, -0.17498779296875, 0.0426025390625, 0.26019287109375, 0.477783203125, 0.69537353515625, 0.9129638671875, 1.13055419921875, 1.34814453125, 1.56573486328125, 1.7833251953125, 2.00091552734375, 2.218505859375, 2.43609619140625, 2.6536865234375, 2.87127685546875, 3.0888671875, 3.30645751953125, 3.5240478515625, 3.74163818359375, 3.959228515625, 4.17681884765625, 4.3944091796875, 4.61199951171875, 4.82958984375, 5.04718017578125, 5.2647705078125, 5.48236083984375, 5.699951171875, 5.91754150390625, 6.1351318359375, 6.35272216796875, 6.5703125]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 15.0, 19.0, 17.0, 16.0, 21.0, 20.0, 18.0, 34.0, 29.0, 36.0, 36.0, 42.0, 44.0, 55.0, 62.0, 49.0, 51.0, 56.0, 43.0, 39.0, 49.0, 42.0, 35.0, 21.0, 24.0, 19.0, 23.0, 10.0, 15.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.74688720703125, -8.4859619140625, -8.22503662109375, -7.964111328125, -7.70318603515625, -7.4422607421875, -7.18133544921875, -6.92041015625, -6.65948486328125, -6.3985595703125, -6.13763427734375, -5.876708984375, -5.61578369140625, -5.3548583984375, -5.09393310546875, -4.8330078125, -4.57208251953125, -4.3111572265625, -4.05023193359375, -3.789306640625, -3.52838134765625, -3.2674560546875, -3.00653076171875, -2.74560546875, -2.48468017578125, -2.2237548828125, -1.96282958984375, -1.701904296875, -1.44097900390625, -1.1800537109375, -0.91912841796875, -0.658203125, -0.39727783203125, -0.1363525390625, 0.12457275390625, 0.385498046875, 0.64642333984375, 0.9073486328125, 1.16827392578125, 1.42919921875, 1.69012451171875, 1.9510498046875, 2.21197509765625, 2.472900390625, 2.73382568359375, 2.9947509765625, 3.25567626953125, 3.5166015625, 3.77752685546875, 4.0384521484375, 4.29937744140625, 4.560302734375, 4.82122802734375, 5.0821533203125, 5.34307861328125, 5.60400390625, 5.86492919921875, 6.1258544921875, 6.38677978515625, 6.647705078125, 6.90863037109375, 7.1695556640625, 7.43048095703125, 7.69140625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 7.0, 14.0, 24.0, 22.0, 39.0, 52.0, 67.0, 98.0, 137.0, 189.0, 319.0, 433.0, 723.0, 1104.0, 1855.0, 3143.0, 5579.0, 10724.0, 21090.0, 43069.0, 90118.0, 169519.0, 240446.0, 210976.0, 124145.0, 61741.0, 29964.0, 14752.0, 7597.0, 4231.0, 2419.0, 1373.0, 855.0, 566.0, 335.0, 247.0, 156.0, 122.0, 96.0, 72.0, 44.0, 32.0, 12.0, 10.0, 12.0, 7.0, 6.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.203125, -6.9761962890625, -6.749267578125, -6.5223388671875, -6.29541015625, -6.0684814453125, -5.841552734375, -5.6146240234375, -5.3876953125, -5.1607666015625, -4.933837890625, -4.7069091796875, -4.47998046875, -4.2530517578125, -4.026123046875, -3.7991943359375, -3.572265625, -3.3453369140625, -3.118408203125, -2.8914794921875, -2.66455078125, -2.4376220703125, -2.210693359375, -1.9837646484375, -1.7568359375, -1.5299072265625, -1.302978515625, -1.0760498046875, -0.84912109375, -0.6221923828125, -0.395263671875, -0.1683349609375, 0.05859375, 0.2855224609375, 0.512451171875, 0.7393798828125, 0.96630859375, 1.1932373046875, 1.420166015625, 1.6470947265625, 1.8740234375, 2.1009521484375, 2.327880859375, 2.5548095703125, 2.78173828125, 3.0086669921875, 3.235595703125, 3.4625244140625, 3.689453125, 3.9163818359375, 4.143310546875, 4.3702392578125, 4.59716796875, 4.8240966796875, 5.051025390625, 5.2779541015625, 5.5048828125, 5.7318115234375, 5.958740234375, 6.1856689453125, 6.41259765625, 6.6395263671875, 6.866455078125, 7.0933837890625, 7.3203125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 9.0, 6.0, 7.0, 15.0, 18.0, 14.0, 19.0, 21.0, 31.0, 19.0, 27.0, 25.0, 38.0, 44.0, 38.0, 36.0, 40.0, 38.0, 47.0, 43.0, 40.0, 39.0, 33.0, 39.0, 46.0, 25.0, 30.0, 26.0, 29.0, 24.0, 13.0, 23.0, 17.0, 9.0, 19.0, 16.0, 8.0, 2.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.958984375, -3.835906982421875, -3.71282958984375, -3.589752197265625, -3.4666748046875, -3.343597412109375, -3.22052001953125, -3.097442626953125, -2.974365234375, -2.851287841796875, -2.72821044921875, -2.605133056640625, -2.4820556640625, -2.358978271484375, -2.23590087890625, -2.112823486328125, -1.98974609375, -1.866668701171875, -1.74359130859375, -1.620513916015625, -1.4974365234375, -1.374359130859375, -1.25128173828125, -1.128204345703125, -1.005126953125, -0.882049560546875, -0.75897216796875, -0.635894775390625, -0.5128173828125, -0.389739990234375, -0.26666259765625, -0.143585205078125, -0.0205078125, 0.102569580078125, 0.22564697265625, 0.348724365234375, 0.4718017578125, 0.594879150390625, 0.71795654296875, 0.841033935546875, 0.964111328125, 1.087188720703125, 1.21026611328125, 1.333343505859375, 1.4564208984375, 1.579498291015625, 1.70257568359375, 1.825653076171875, 1.94873046875, 2.071807861328125, 2.19488525390625, 2.317962646484375, 2.4410400390625, 2.564117431640625, 2.68719482421875, 2.810272216796875, 2.933349609375, 3.056427001953125, 3.17950439453125, 3.302581787109375, 3.4256591796875, 3.548736572265625, 3.67181396484375, 3.794891357421875, 3.91796875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 9.0, 7.0, 8.0, 10.0, 12.0, 14.0, 18.0, 28.0, 54.0, 65.0, 70.0, 119.0, 134.0, 244.0, 305.0, 423.0, 607.0, 937.0, 1467.0, 2395.0, 4021.0, 7246.0, 13278.0, 25164.0, 50702.0, 103535.0, 192175.0, 251968.0, 188657.0, 100533.0, 48881.0, 24467.0, 13236.0, 7008.0, 3935.0, 2400.0, 1472.0, 889.0, 649.0, 431.0, 277.0, 179.0, 146.0, 105.0, 73.0, 54.0, 45.0, 28.0, 26.0, 20.0, 9.0, 14.0, 5.0, 8.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.8359375, -3.71783447265625, -3.5997314453125, -3.48162841796875, -3.363525390625, -3.24542236328125, -3.1273193359375, -3.00921630859375, -2.89111328125, -2.77301025390625, -2.6549072265625, -2.53680419921875, -2.418701171875, -2.30059814453125, -2.1824951171875, -2.06439208984375, -1.9462890625, -1.82818603515625, -1.7100830078125, -1.59197998046875, -1.473876953125, -1.35577392578125, -1.2376708984375, -1.11956787109375, -1.00146484375, -0.88336181640625, -0.7652587890625, -0.64715576171875, -0.529052734375, -0.41094970703125, -0.2928466796875, -0.17474365234375, -0.056640625, 0.06146240234375, 0.1795654296875, 0.29766845703125, 0.415771484375, 0.53387451171875, 0.6519775390625, 0.77008056640625, 0.88818359375, 1.00628662109375, 1.1243896484375, 1.24249267578125, 1.360595703125, 1.47869873046875, 1.5968017578125, 1.71490478515625, 1.8330078125, 1.95111083984375, 2.0692138671875, 2.18731689453125, 2.305419921875, 2.42352294921875, 2.5416259765625, 2.65972900390625, 2.77783203125, 2.89593505859375, 3.0140380859375, 3.13214111328125, 3.250244140625, 3.36834716796875, 3.4864501953125, 3.60455322265625, 3.72265625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 8.0, 3.0, 8.0, 14.0, 16.0, 24.0, 21.0, 37.0, 47.0, 39.0, 64.0, 49.0, 56.0, 70.0, 66.0, 61.0, 74.0, 54.0, 51.0, 38.0, 32.0, 33.0, 28.0, 25.0, 9.0, 17.0, 9.0, 6.0, 6.0, 6.0, 5.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00026988983154296875, -0.0002610832452774048, -0.0002522766590118408, -0.00024347007274627686, -0.0002346634864807129, -0.00022585690021514893, -0.00021705031394958496, -0.000208243727684021, -0.00019943714141845703, -0.00019063055515289307, -0.0001818239688873291, -0.00017301738262176514, -0.00016421079635620117, -0.0001554042100906372, -0.00014659762382507324, -0.00013779103755950928, -0.0001289844512939453, -0.00012017786502838135, -0.00011137127876281738, -0.00010256469249725342, -9.375810623168945e-05, -8.495151996612549e-05, -7.614493370056152e-05, -6.733834743499756e-05, -5.8531761169433594e-05, -4.972517490386963e-05, -4.0918588638305664e-05, -3.21120023727417e-05, -2.3305416107177734e-05, -1.449882984161377e-05, -5.692243576049805e-06, 3.11434268951416e-06, 1.1920928955078125e-05, 2.072751522064209e-05, 2.9534101486206055e-05, 3.834068775177002e-05, 4.7147274017333984e-05, 5.595386028289795e-05, 6.476044654846191e-05, 7.356703281402588e-05, 8.237361907958984e-05, 9.118020534515381e-05, 9.998679161071777e-05, 0.00010879337787628174, 0.0001175999641418457, 0.00012640655040740967, 0.00013521313667297363, 0.0001440197229385376, 0.00015282630920410156, 0.00016163289546966553, 0.0001704394817352295, 0.00017924606800079346, 0.00018805265426635742, 0.0001968592405319214, 0.00020566582679748535, 0.00021447241306304932, 0.00022327899932861328, 0.00023208558559417725, 0.0002408921718597412, 0.0002496987581253052, 0.00025850534439086914, 0.0002673119306564331, 0.00027611851692199707, 0.00028492510318756104, 0.000293731689453125]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 5.0, 13.0, 12.0, 15.0, 21.0, 39.0, 40.0, 81.0, 105.0, 147.0, 241.0, 340.0, 567.0, 896.0, 1501.0, 2455.0, 4360.0, 7657.0, 13950.0, 26583.0, 50954.0, 98074.0, 171549.0, 227284.0, 192922.0, 117011.0, 61828.0, 31471.0, 16602.0, 9173.0, 5060.0, 3022.0, 1681.0, 1034.0, 661.0, 410.0, 257.0, 161.0, 113.0, 65.0, 61.0, 40.0, 25.0, 17.0, 14.0, 16.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.328125, -3.226165771484375, -3.12420654296875, -3.022247314453125, -2.9202880859375, -2.818328857421875, -2.71636962890625, -2.614410400390625, -2.512451171875, -2.410491943359375, -2.30853271484375, -2.206573486328125, -2.1046142578125, -2.002655029296875, -1.90069580078125, -1.798736572265625, -1.69677734375, -1.594818115234375, -1.49285888671875, -1.390899658203125, -1.2889404296875, -1.186981201171875, -1.08502197265625, -0.983062744140625, -0.881103515625, -0.779144287109375, -0.67718505859375, -0.575225830078125, -0.4732666015625, -0.371307373046875, -0.26934814453125, -0.167388916015625, -0.0654296875, 0.036529541015625, 0.13848876953125, 0.240447998046875, 0.3424072265625, 0.444366455078125, 0.54632568359375, 0.648284912109375, 0.750244140625, 0.852203369140625, 0.95416259765625, 1.056121826171875, 1.1580810546875, 1.260040283203125, 1.36199951171875, 1.463958740234375, 1.56591796875, 1.667877197265625, 1.76983642578125, 1.871795654296875, 1.9737548828125, 2.075714111328125, 2.17767333984375, 2.279632568359375, 2.381591796875, 2.483551025390625, 2.58551025390625, 2.687469482421875, 2.7894287109375, 2.891387939453125, 2.99334716796875, 3.095306396484375, 3.197265625]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 8.0, 8.0, 11.0, 6.0, 15.0, 24.0, 22.0, 12.0, 19.0, 33.0, 41.0, 36.0, 42.0, 52.0, 56.0, 40.0, 48.0, 46.0, 48.0, 62.0, 45.0, 44.0, 40.0, 28.0, 27.0, 23.0, 21.0, 19.0, 25.0, 9.0, 24.0, 4.0, 8.0, 18.0, 5.0, 6.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.84912109375, -0.8260726928710938, -0.8030242919921875, -0.7799758911132812, -0.756927490234375, -0.7338790893554688, -0.7108306884765625, -0.6877822875976562, -0.66473388671875, -0.6416854858398438, -0.6186370849609375, -0.5955886840820312, -0.572540283203125, -0.5494918823242188, -0.5264434814453125, -0.5033950805664062, -0.4803466796875, -0.45729827880859375, -0.4342498779296875, -0.41120147705078125, -0.388153076171875, -0.36510467529296875, -0.3420562744140625, -0.31900787353515625, -0.29595947265625, -0.27291107177734375, -0.2498626708984375, -0.22681427001953125, -0.203765869140625, -0.18071746826171875, -0.1576690673828125, -0.13462066650390625, -0.111572265625, -0.08852386474609375, -0.0654754638671875, -0.04242706298828125, -0.019378662109375, 0.00366973876953125, 0.0267181396484375, 0.04976654052734375, 0.07281494140625, 0.09586334228515625, 0.1189117431640625, 0.14196014404296875, 0.165008544921875, 0.18805694580078125, 0.2111053466796875, 0.23415374755859375, 0.2572021484375, 0.28025054931640625, 0.3032989501953125, 0.32634735107421875, 0.349395751953125, 0.37244415283203125, 0.3954925537109375, 0.41854095458984375, 0.44158935546875, 0.46463775634765625, 0.4876861572265625, 0.5107345581054688, 0.533782958984375, 0.5568313598632812, 0.5798797607421875, 0.6029281616210938, 0.6259765625]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 5.0, 10.0, 8.0, 14.0, 11.0, 12.0, 17.0, 22.0, 25.0, 26.0, 31.0, 42.0, 52.0, 63.0, 79.0, 97.0, 73.0, 77.0, 56.0, 58.0, 50.0, 47.0, 24.0, 20.0, 20.0, 11.0, 8.0, 9.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.244050025939941, -9.918441772460938, -9.592832565307617, -9.267223358154297, -8.941615104675293, -8.616006851196289, -8.290397644042969, -7.964788913726807, -7.6391801834106445, -7.313571453094482, -6.98796272277832, -6.662353992462158, -6.336745262145996, -6.011136531829834, -5.685527801513672, -5.35991907119751, -5.034310340881348, -4.7087016105651855, -4.383092880249023, -4.057484149932861, -3.731875419616699, -3.406266689300537, -3.080657958984375, -2.755049228668213, -2.429440498352051, -2.1038317680358887, -1.7782230377197266, -1.4526143074035645, -1.1270055770874023, -0.8013968467712402, -0.4757881164550781, -0.15017938613891602, 0.1754302978515625, 0.5010390281677246, 0.8266477584838867, 1.1522564888000488, 1.477865219116211, 1.803473949432373, 2.129082679748535, 2.4546914100646973, 2.7803001403808594, 3.1059088706970215, 3.4315176010131836, 3.7571263313293457, 4.082735061645508, 4.40834379196167, 4.733952522277832, 5.059561252593994, 5.385169982910156, 5.710778713226318, 6.0363874435424805, 6.361996173858643, 6.687604904174805, 7.013213634490967, 7.338822364807129, 7.664431095123291, 7.990039825439453, 8.315649032592773, 8.641257286071777, 8.966865539550781, 9.292474746704102, 9.618083953857422, 9.943692207336426, 10.26930046081543, 10.59490966796875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 5.0, 10.0, 8.0, 11.0, 17.0, 12.0, 20.0, 36.0, 27.0, 24.0, 25.0, 37.0, 44.0, 43.0, 38.0, 62.0, 42.0, 55.0, 54.0, 52.0, 42.0, 40.0, 46.0, 35.0, 35.0, 32.0, 36.0, 25.0, 15.0, 13.0, 21.0, 7.0, 8.0, 5.0, 5.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.624178409576416, -7.379016876220703, -7.133855819702148, -6.8886942863464355, -6.643532752990723, -6.398371696472168, -6.153210163116455, -5.908048629760742, -5.6628875732421875, -5.417726039886475, -5.17256498336792, -4.927403450012207, -4.682242393493652, -4.4370808601379395, -4.191919326782227, -3.9467580318450928, -3.701596736907959, -3.456435441970825, -3.2112741470336914, -2.9661126136779785, -2.7209513187408447, -2.475790023803711, -2.230628490447998, -1.9854671955108643, -1.7403059005737305, -1.4951446056365967, -1.2499831914901733, -1.00482177734375, -0.7596604824066162, -0.5144991874694824, -0.2693377733230591, -0.024176359176635742, 0.22098541259765625, 0.4661467671394348, 0.7113081216812134, 0.9564694762229919, 1.2016308307647705, 1.4467921257019043, 1.6919535398483276, 1.937114953994751, 2.1822762489318848, 2.4274375438690186, 2.6725988388061523, 2.9177603721618652, 3.162921667098999, 3.408082962036133, 3.6532444953918457, 3.8984057903289795, 4.143567085266113, 4.388728618621826, 4.633889675140381, 4.879051208496094, 5.124212265014648, 5.369373798370361, 5.614535331726074, 5.859696388244629, 6.104857921600342, 6.350019454956055, 6.595180511474609, 6.840342044830322, 7.085503578186035, 7.33066463470459, 7.575826168060303, 7.820987701416016, 8.06614875793457]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 9.0, 5.0, 17.0, 36.0, 24.0, 28.0, 60.0, 87.0, 125.0, 222.0, 303.0, 433.0, 804.0, 1331.0, 2242.0, 3982.0, 7708.0, 16928.0, 46930.0, 187407.0, 1043840.0, 2119863.0, 586146.0, 114751.0, 33722.0, 13098.0, 6248.0, 3170.0, 1779.0, 1097.0, 641.0, 416.0, 256.0, 172.0, 118.0, 87.0, 67.0, 39.0, 26.0, 18.0, 17.0, 9.0, 5.0, 7.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.203125, -14.684814453125, -14.16650390625, -13.648193359375, -13.1298828125, -12.611572265625, -12.09326171875, -11.574951171875, -11.056640625, -10.538330078125, -10.02001953125, -9.501708984375, -8.9833984375, -8.465087890625, -7.94677734375, -7.428466796875, -6.91015625, -6.391845703125, -5.87353515625, -5.355224609375, -4.8369140625, -4.318603515625, -3.80029296875, -3.281982421875, -2.763671875, -2.245361328125, -1.72705078125, -1.208740234375, -0.6904296875, -0.172119140625, 0.34619140625, 0.864501953125, 1.3828125, 1.901123046875, 2.41943359375, 2.937744140625, 3.4560546875, 3.974365234375, 4.49267578125, 5.010986328125, 5.529296875, 6.047607421875, 6.56591796875, 7.084228515625, 7.6025390625, 8.120849609375, 8.63916015625, 9.157470703125, 9.67578125, 10.194091796875, 10.71240234375, 11.230712890625, 11.7490234375, 12.267333984375, 12.78564453125, 13.303955078125, 13.822265625, 14.340576171875, 14.85888671875, 15.377197265625, 15.8955078125, 16.413818359375, 16.93212890625, 17.450439453125, 17.96875]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 8.0, 11.0, 8.0, 11.0, 14.0, 21.0, 22.0, 23.0, 27.0, 32.0, 32.0, 26.0, 42.0, 53.0, 49.0, 41.0, 48.0, 43.0, 63.0, 42.0, 48.0, 50.0, 49.0, 34.0, 33.0, 29.0, 29.0, 27.0, 20.0, 16.0, 12.0, 6.0, 8.0, 7.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.37109375, -6.1834716796875, -5.995849609375, -5.8082275390625, -5.62060546875, -5.4329833984375, -5.245361328125, -5.0577392578125, -4.8701171875, -4.6824951171875, -4.494873046875, -4.3072509765625, -4.11962890625, -3.9320068359375, -3.744384765625, -3.5567626953125, -3.369140625, -3.1815185546875, -2.993896484375, -2.8062744140625, -2.61865234375, -2.4310302734375, -2.243408203125, -2.0557861328125, -1.8681640625, -1.6805419921875, -1.492919921875, -1.3052978515625, -1.11767578125, -0.9300537109375, -0.742431640625, -0.5548095703125, -0.3671875, -0.1795654296875, 0.008056640625, 0.1956787109375, 0.38330078125, 0.5709228515625, 0.758544921875, 0.9461669921875, 1.1337890625, 1.3214111328125, 1.509033203125, 1.6966552734375, 1.88427734375, 2.0718994140625, 2.259521484375, 2.4471435546875, 2.634765625, 2.8223876953125, 3.010009765625, 3.1976318359375, 3.38525390625, 3.5728759765625, 3.760498046875, 3.9481201171875, 4.1357421875, 4.3233642578125, 4.510986328125, 4.6986083984375, 4.88623046875, 5.0738525390625, 5.261474609375, 5.4490966796875, 5.63671875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 12.0, 16.0, 18.0, 20.0, 53.0, 94.0, 107.0, 182.0, 336.0, 504.0, 1038.0, 2036.0, 4009.0, 9447.0, 23279.0, 76056.0, 372641.0, 2255136.0, 1196285.0, 179119.0, 45125.0, 15694.0, 6526.0, 3107.0, 1482.0, 819.0, 419.0, 256.0, 155.0, 109.0, 69.0, 45.0, 30.0, 14.0, 12.0, 9.0, 4.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.5, -20.8017578125, -20.103515625, -19.4052734375, -18.70703125, -18.0087890625, -17.310546875, -16.6123046875, -15.9140625, -15.2158203125, -14.517578125, -13.8193359375, -13.12109375, -12.4228515625, -11.724609375, -11.0263671875, -10.328125, -9.6298828125, -8.931640625, -8.2333984375, -7.53515625, -6.8369140625, -6.138671875, -5.4404296875, -4.7421875, -4.0439453125, -3.345703125, -2.6474609375, -1.94921875, -1.2509765625, -0.552734375, 0.1455078125, 0.84375, 1.5419921875, 2.240234375, 2.9384765625, 3.63671875, 4.3349609375, 5.033203125, 5.7314453125, 6.4296875, 7.1279296875, 7.826171875, 8.5244140625, 9.22265625, 9.9208984375, 10.619140625, 11.3173828125, 12.015625, 12.7138671875, 13.412109375, 14.1103515625, 14.80859375, 15.5068359375, 16.205078125, 16.9033203125, 17.6015625, 18.2998046875, 18.998046875, 19.6962890625, 20.39453125, 21.0927734375, 21.791015625, 22.4892578125, 23.1875]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 12.0, 12.0, 27.0, 19.0, 33.0, 58.0, 65.0, 106.0, 144.0, 195.0, 296.0, 388.0, 423.0, 470.0, 401.0, 373.0, 283.0, 205.0, 149.0, 112.0, 69.0, 57.0, 48.0, 23.0, 19.0, 11.0, 18.0, 8.0, 9.0, 3.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.07421875, -3.948760986328125, -3.82330322265625, -3.697845458984375, -3.5723876953125, -3.446929931640625, -3.32147216796875, -3.196014404296875, -3.070556640625, -2.945098876953125, -2.81964111328125, -2.694183349609375, -2.5687255859375, -2.443267822265625, -2.31781005859375, -2.192352294921875, -2.06689453125, -1.941436767578125, -1.81597900390625, -1.690521240234375, -1.5650634765625, -1.439605712890625, -1.31414794921875, -1.188690185546875, -1.063232421875, -0.937774658203125, -0.81231689453125, -0.686859130859375, -0.5614013671875, -0.435943603515625, -0.31048583984375, -0.185028076171875, -0.0595703125, 0.065887451171875, 0.19134521484375, 0.316802978515625, 0.4422607421875, 0.567718505859375, 0.69317626953125, 0.818634033203125, 0.944091796875, 1.069549560546875, 1.19500732421875, 1.320465087890625, 1.4459228515625, 1.571380615234375, 1.69683837890625, 1.822296142578125, 1.94775390625, 2.073211669921875, 2.19866943359375, 2.324127197265625, 2.4495849609375, 2.575042724609375, 2.70050048828125, 2.825958251953125, 2.951416015625, 3.076873779296875, 3.20233154296875, 3.327789306640625, 3.4532470703125, 3.578704833984375, 3.70416259765625, 3.829620361328125, 3.955078125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 4.0, 6.0, 4.0, 4.0, 8.0, 8.0, 12.0, 20.0, 22.0, 36.0, 42.0, 44.0, 85.0, 96.0, 98.0, 119.0, 98.0, 71.0, 63.0, 44.0, 38.0, 19.0, 15.0, 13.0, 10.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.524490356445312, -15.080896377563477, -14.637303352355957, -14.193710327148438, -13.750116348266602, -13.306522369384766, -12.862929344177246, -12.419336318969727, -11.97574234008789, -11.532148361206055, -11.088555335998535, -10.644962310791016, -10.20136833190918, -9.757774353027344, -9.314181327819824, -8.870588302612305, -8.426994323730469, -7.983400821685791, -7.539807319641113, -7.0962138175964355, -6.652620315551758, -6.20902681350708, -5.765433311462402, -5.321839809417725, -4.878246307373047, -4.434652805328369, -3.9910593032836914, -3.5474658012390137, -3.103872299194336, -2.660278797149658, -2.2166852951049805, -1.7730917930603027, -1.329498291015625, -0.8859047889709473, -0.44231128692626953, 0.0012822151184082031, 0.44487571716308594, 0.8884692192077637, 1.3320627212524414, 1.7756562232971191, 2.219249725341797, 2.6628432273864746, 3.1064367294311523, 3.55003023147583, 3.993623733520508, 4.4372172355651855, 4.880810737609863, 5.324404239654541, 5.767997741699219, 6.2115912437438965, 6.655184745788574, 7.098778247833252, 7.54237174987793, 7.985965251922607, 8.429558753967285, 8.873151779174805, 9.31674575805664, 9.760339736938477, 10.203932762145996, 10.647525787353516, 11.091119766235352, 11.534713745117188, 11.978306770324707, 12.421899795532227, 12.865493774414062]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 1.0, 4.0, 0.0, 3.0, 7.0, 5.0, 10.0, 21.0, 14.0, 11.0, 18.0, 14.0, 36.0, 25.0, 28.0, 30.0, 35.0, 39.0, 43.0, 42.0, 39.0, 48.0, 55.0, 50.0, 41.0, 47.0, 33.0, 44.0, 38.0, 38.0, 32.0, 30.0, 20.0, 21.0, 20.0, 9.0, 16.0, 6.0, 8.0, 6.0, 6.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.328248023986816, -7.099712371826172, -6.8711771965026855, -6.642641544342041, -6.4141058921813965, -6.18557071685791, -5.957035064697266, -5.728499412536621, -5.499963760375977, -5.271428108215332, -5.042892932891846, -4.814357280731201, -4.585821628570557, -4.35728645324707, -4.128750801086426, -3.9002151489257812, -3.671679735183716, -3.4431443214416504, -3.214608669281006, -2.9860732555389404, -2.757537603378296, -2.5290021896362305, -2.300466537475586, -2.0719311237335205, -1.8433955907821655, -1.6148600578308105, -1.3863245248794556, -1.1577889919281006, -0.9292535185813904, -0.7007180452346802, -0.4721825122833252, -0.24364697933197021, -0.015111446380615234, 0.21342407166957855, 0.44195958971977234, 0.6704950928688049, 0.8990306258201599, 1.1275660991668701, 1.356101632118225, 1.58463716506958, 1.813172698020935, 2.04170823097229, 2.2702436447143555, 2.498779296875, 2.7273147106170654, 2.955850124359131, 3.1843857765197754, 3.41292142868042, 3.6414568424224854, 3.869992256164551, 4.098527908325195, 4.32706356048584, 4.555598735809326, 4.784134387969971, 5.012670040130615, 5.241205215454102, 5.469740867614746, 5.698276519775391, 5.926811695098877, 6.1553473472595215, 6.383882999420166, 6.612418174743652, 6.840953826904297, 7.069489479064941, 7.298025131225586]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 6.0, 6.0, 12.0, 10.0, 13.0, 25.0, 34.0, 43.0, 44.0, 61.0, 89.0, 129.0, 167.0, 213.0, 296.0, 454.0, 660.0, 1130.0, 2275.0, 6037.0, 22700.0, 129660.0, 659307.0, 182451.0, 29145.0, 7345.0, 2534.0, 1249.0, 740.0, 468.0, 318.0, 231.0, 172.0, 153.0, 97.0, 59.0, 42.0, 35.0, 38.0, 32.0, 22.0, 10.0, 12.0, 11.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.8359375, -3.71820068359375, -3.6004638671875, -3.48272705078125, -3.364990234375, -3.24725341796875, -3.1295166015625, -3.01177978515625, -2.89404296875, -2.77630615234375, -2.6585693359375, -2.54083251953125, -2.423095703125, -2.30535888671875, -2.1876220703125, -2.06988525390625, -1.9521484375, -1.83441162109375, -1.7166748046875, -1.59893798828125, -1.481201171875, -1.36346435546875, -1.2457275390625, -1.12799072265625, -1.01025390625, -0.89251708984375, -0.7747802734375, -0.65704345703125, -0.539306640625, -0.42156982421875, -0.3038330078125, -0.18609619140625, -0.068359375, 0.04937744140625, 0.1671142578125, 0.28485107421875, 0.402587890625, 0.52032470703125, 0.6380615234375, 0.75579833984375, 0.87353515625, 0.99127197265625, 1.1090087890625, 1.22674560546875, 1.344482421875, 1.46221923828125, 1.5799560546875, 1.69769287109375, 1.8154296875, 1.93316650390625, 2.0509033203125, 2.16864013671875, 2.286376953125, 2.40411376953125, 2.5218505859375, 2.63958740234375, 2.75732421875, 2.87506103515625, 2.9927978515625, 3.11053466796875, 3.228271484375, 3.34600830078125, 3.4637451171875, 3.58148193359375, 3.69921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 4.0, 7.0, 1.0, 8.0, 8.0, 5.0, 10.0, 9.0, 13.0, 11.0, 18.0, 29.0, 25.0, 34.0, 32.0, 36.0, 31.0, 45.0, 52.0, 43.0, 53.0, 44.0, 63.0, 40.0, 46.0, 52.0, 33.0, 41.0, 38.0, 36.0, 22.0, 19.0, 16.0, 23.0, 11.0, 10.0, 11.0, 6.0, 9.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.8125, -8.5548095703125, -8.297119140625, -8.0394287109375, -7.78173828125, -7.5240478515625, -7.266357421875, -7.0086669921875, -6.7509765625, -6.4932861328125, -6.235595703125, -5.9779052734375, -5.72021484375, -5.4625244140625, -5.204833984375, -4.9471435546875, -4.689453125, -4.4317626953125, -4.174072265625, -3.9163818359375, -3.65869140625, -3.4010009765625, -3.143310546875, -2.8856201171875, -2.6279296875, -2.3702392578125, -2.112548828125, -1.8548583984375, -1.59716796875, -1.3394775390625, -1.081787109375, -0.8240966796875, -0.56640625, -0.3087158203125, -0.051025390625, 0.2066650390625, 0.46435546875, 0.7220458984375, 0.979736328125, 1.2374267578125, 1.4951171875, 1.7528076171875, 2.010498046875, 2.2681884765625, 2.52587890625, 2.7835693359375, 3.041259765625, 3.2989501953125, 3.556640625, 3.8143310546875, 4.072021484375, 4.3297119140625, 4.58740234375, 4.8450927734375, 5.102783203125, 5.3604736328125, 5.6181640625, 5.8758544921875, 6.133544921875, 6.3912353515625, 6.64892578125, 6.9066162109375, 7.164306640625, 7.4219970703125, 7.6796875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 7.0, 8.0, 15.0, 11.0, 11.0, 20.0, 27.0, 42.0, 40.0, 51.0, 69.0, 95.0, 154.0, 223.0, 380.0, 768.0, 1901.0, 5934.0, 31601.0, 956031.0, 40049.0, 6880.0, 2185.0, 820.0, 432.0, 228.0, 151.0, 93.0, 77.0, 59.0, 37.0, 27.0, 28.0, 22.0, 18.0, 15.0, 9.0, 7.0, 5.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.984375, -6.76983642578125, -6.5552978515625, -6.34075927734375, -6.126220703125, -5.91168212890625, -5.6971435546875, -5.48260498046875, -5.26806640625, -5.05352783203125, -4.8389892578125, -4.62445068359375, -4.409912109375, -4.19537353515625, -3.9808349609375, -3.76629638671875, -3.5517578125, -3.33721923828125, -3.1226806640625, -2.90814208984375, -2.693603515625, -2.47906494140625, -2.2645263671875, -2.04998779296875, -1.83544921875, -1.62091064453125, -1.4063720703125, -1.19183349609375, -0.977294921875, -0.76275634765625, -0.5482177734375, -0.33367919921875, -0.119140625, 0.09539794921875, 0.3099365234375, 0.52447509765625, 0.739013671875, 0.95355224609375, 1.1680908203125, 1.38262939453125, 1.59716796875, 1.81170654296875, 2.0262451171875, 2.24078369140625, 2.455322265625, 2.66986083984375, 2.8843994140625, 3.09893798828125, 3.3134765625, 3.52801513671875, 3.7425537109375, 3.95709228515625, 4.171630859375, 4.38616943359375, 4.6007080078125, 4.81524658203125, 5.02978515625, 5.24432373046875, 5.4588623046875, 5.67340087890625, 5.887939453125, 6.10247802734375, 6.3170166015625, 6.53155517578125, 6.74609375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 5.0, 12.0, 8.0, 10.0, 14.0, 15.0, 12.0, 24.0, 23.0, 29.0, 35.0, 31.0, 28.0, 44.0, 34.0, 37.0, 34.0, 39.0, 35.0, 43.0, 32.0, 35.0, 39.0, 32.0, 25.0, 38.0, 33.0, 25.0, 26.0, 33.0, 26.0, 21.0, 21.0, 14.0, 18.0, 10.0, 10.0, 8.0, 13.0, 8.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.14453125, -4.015380859375, -3.88623046875, -3.757080078125, -3.6279296875, -3.498779296875, -3.36962890625, -3.240478515625, -3.111328125, -2.982177734375, -2.85302734375, -2.723876953125, -2.5947265625, -2.465576171875, -2.33642578125, -2.207275390625, -2.078125, -1.948974609375, -1.81982421875, -1.690673828125, -1.5615234375, -1.432373046875, -1.30322265625, -1.174072265625, -1.044921875, -0.915771484375, -0.78662109375, -0.657470703125, -0.5283203125, -0.399169921875, -0.27001953125, -0.140869140625, -0.01171875, 0.117431640625, 0.24658203125, 0.375732421875, 0.5048828125, 0.634033203125, 0.76318359375, 0.892333984375, 1.021484375, 1.150634765625, 1.27978515625, 1.408935546875, 1.5380859375, 1.667236328125, 1.79638671875, 1.925537109375, 2.0546875, 2.183837890625, 2.31298828125, 2.442138671875, 2.5712890625, 2.700439453125, 2.82958984375, 2.958740234375, 3.087890625, 3.217041015625, 3.34619140625, 3.475341796875, 3.6044921875, 3.733642578125, 3.86279296875, 3.991943359375, 4.12109375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 12.0, 6.0, 14.0, 9.0, 14.0, 22.0, 25.0, 39.0, 51.0, 50.0, 72.0, 82.0, 94.0, 123.0, 141.0, 185.0, 232.0, 270.0, 382.0, 536.0, 907.0, 1803.0, 4888.0, 17783.0, 925233.0, 77694.0, 10411.0, 3232.0, 1403.0, 726.0, 448.0, 352.0, 230.0, 199.0, 177.0, 117.0, 117.0, 106.0, 68.0, 61.0, 36.0, 39.0, 40.0, 29.0, 17.0, 14.0, 14.0, 9.0, 11.0, 12.0, 5.0, 3.0, 6.0, 5.0, 1.0], "bins": [-1.904296875, -1.847991943359375, -1.79168701171875, -1.735382080078125, -1.6790771484375, -1.622772216796875, -1.56646728515625, -1.510162353515625, -1.453857421875, -1.397552490234375, -1.34124755859375, -1.284942626953125, -1.2286376953125, -1.172332763671875, -1.11602783203125, -1.059722900390625, -1.00341796875, -0.947113037109375, -0.89080810546875, -0.834503173828125, -0.7781982421875, -0.721893310546875, -0.66558837890625, -0.609283447265625, -0.552978515625, -0.496673583984375, -0.44036865234375, -0.384063720703125, -0.3277587890625, -0.271453857421875, -0.21514892578125, -0.158843994140625, -0.1025390625, -0.046234130859375, 0.01007080078125, 0.066375732421875, 0.1226806640625, 0.178985595703125, 0.23529052734375, 0.291595458984375, 0.347900390625, 0.404205322265625, 0.46051025390625, 0.516815185546875, 0.5731201171875, 0.629425048828125, 0.68572998046875, 0.742034912109375, 0.79833984375, 0.854644775390625, 0.91094970703125, 0.967254638671875, 1.0235595703125, 1.079864501953125, 1.13616943359375, 1.192474365234375, 1.248779296875, 1.305084228515625, 1.36138916015625, 1.417694091796875, 1.4739990234375, 1.530303955078125, 1.58660888671875, 1.642913818359375, 1.69921875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 14.0, 32.0, 70.0, 162.0, 237.0, 248.0, 153.0, 53.0, 15.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00028896331787109375, -0.000281529501080513, -0.00027409568428993225, -0.0002666618674993515, -0.00025922805070877075, -0.00025179423391819, -0.00024436041712760925, -0.0002369266003370285, -0.00022949278354644775, -0.000222058966755867, -0.00021462514996528625, -0.0002071913331747055, -0.00019975751638412476, -0.000192323699593544, -0.00018488988280296326, -0.0001774560660123825, -0.00017002224922180176, -0.000162588432431221, -0.00015515461564064026, -0.0001477207988500595, -0.00014028698205947876, -0.000132853165268898, -0.00012541934847831726, -0.00011798553168773651, -0.00011055171489715576, -0.00010311789810657501, -9.568408131599426e-05, -8.825026452541351e-05, -8.081644773483276e-05, -7.338263094425201e-05, -6.594881415367126e-05, -5.8514997363090515e-05, -5.1081180572509766e-05, -4.3647363781929016e-05, -3.6213546991348267e-05, -2.8779730200767517e-05, -2.1345913410186768e-05, -1.3912096619606018e-05, -6.4782798290252686e-06, 9.55536961555481e-07, 8.38935375213623e-06, 1.582317054271698e-05, 2.325698733329773e-05, 3.069080412387848e-05, 3.812462091445923e-05, 4.555843770503998e-05, 5.299225449562073e-05, 6.042607128620148e-05, 6.785988807678223e-05, 7.529370486736298e-05, 8.272752165794373e-05, 9.016133844852448e-05, 9.759515523910522e-05, 0.00010502897202968597, 0.00011246278882026672, 0.00011989660561084747, 0.00012733042240142822, 0.00013476423919200897, 0.00014219805598258972, 0.00014963187277317047, 0.00015706568956375122, 0.00016449950635433197, 0.00017193332314491272, 0.00017936713993549347, 0.00018680095672607422]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 9.0, 10.0, 16.0, 21.0, 37.0, 50.0, 67.0, 87.0, 134.0, 206.0, 265.0, 382.0, 576.0, 879.0, 1387.0, 2353.0, 4105.0, 8286.0, 18731.0, 51712.0, 192581.0, 505879.0, 176171.0, 48585.0, 17703.0, 7841.0, 4075.0, 2334.0, 1390.0, 877.0, 564.0, 376.0, 254.0, 171.0, 120.0, 92.0, 55.0, 53.0, 33.0, 22.0, 16.0, 8.0, 12.0, 9.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4931640625, -0.4774932861328125, -0.461822509765625, -0.4461517333984375, -0.43048095703125, -0.4148101806640625, -0.399139404296875, -0.3834686279296875, -0.3677978515625, -0.3521270751953125, -0.336456298828125, -0.3207855224609375, -0.30511474609375, -0.2894439697265625, -0.273773193359375, -0.2581024169921875, -0.242431640625, -0.2267608642578125, -0.211090087890625, -0.1954193115234375, -0.17974853515625, -0.1640777587890625, -0.148406982421875, -0.1327362060546875, -0.1170654296875, -0.1013946533203125, -0.085723876953125, -0.0700531005859375, -0.05438232421875, -0.0387115478515625, -0.023040771484375, -0.0073699951171875, 0.00830078125, 0.0239715576171875, 0.039642333984375, 0.0553131103515625, 0.07098388671875, 0.0866546630859375, 0.102325439453125, 0.1179962158203125, 0.1336669921875, 0.1493377685546875, 0.165008544921875, 0.1806793212890625, 0.19635009765625, 0.2120208740234375, 0.227691650390625, 0.2433624267578125, 0.259033203125, 0.2747039794921875, 0.290374755859375, 0.3060455322265625, 0.32171630859375, 0.3373870849609375, 0.353057861328125, 0.3687286376953125, 0.3843994140625, 0.4000701904296875, 0.415740966796875, 0.4314117431640625, 0.44708251953125, 0.4627532958984375, 0.478424072265625, 0.4940948486328125, 0.509765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 2.0, 3.0, 7.0, 9.0, 15.0, 21.0, 28.0, 29.0, 54.0, 72.0, 96.0, 140.0, 127.0, 108.0, 85.0, 73.0, 34.0, 20.0, 26.0, 14.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1180419921875, -0.11439990997314453, -0.11075782775878906, -0.1071157455444336, -0.10347366333007812, -0.09983158111572266, -0.09618949890136719, -0.09254741668701172, -0.08890533447265625, -0.08526325225830078, -0.08162117004394531, -0.07797908782958984, -0.07433700561523438, -0.0706949234008789, -0.06705284118652344, -0.06341075897216797, -0.0597686767578125, -0.05612659454345703, -0.05248451232910156, -0.048842430114746094, -0.045200347900390625, -0.041558265686035156, -0.03791618347167969, -0.03427410125732422, -0.03063201904296875, -0.02698993682861328, -0.023347854614257812, -0.019705772399902344, -0.016063690185546875, -0.012421607971191406, -0.008779525756835938, -0.005137443542480469, -0.001495361328125, 0.0021467208862304688, 0.0057888031005859375, 0.009430885314941406, 0.013072967529296875, 0.016715049743652344, 0.020357131958007812, 0.02399921417236328, 0.02764129638671875, 0.03128337860107422, 0.03492546081542969, 0.038567543029785156, 0.042209625244140625, 0.045851707458496094, 0.04949378967285156, 0.05313587188720703, 0.0567779541015625, 0.06042003631591797, 0.06406211853027344, 0.0677042007446289, 0.07134628295898438, 0.07498836517333984, 0.07863044738769531, 0.08227252960205078, 0.08591461181640625, 0.08955669403076172, 0.09319877624511719, 0.09684085845947266, 0.10048294067382812, 0.1041250228881836, 0.10776710510253906, 0.11140918731689453, 0.11505126953125]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 6.0, 5.0, 3.0, 10.0, 10.0, 15.0, 19.0, 24.0, 47.0, 35.0, 73.0, 87.0, 105.0, 113.0, 113.0, 69.0, 81.0, 43.0, 43.0, 27.0, 17.0, 12.0, 11.0, 8.0, 8.0, 5.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.723735809326172, -15.279806137084961, -14.83587646484375, -14.391946792602539, -13.948017120361328, -13.504087448120117, -13.060157775878906, -12.616228103637695, -12.172298431396484, -11.728368759155273, -11.284439086914062, -10.840509414672852, -10.39657974243164, -9.95265007019043, -9.508720397949219, -9.064790725708008, -8.62086009979248, -8.17693042755127, -7.733000755310059, -7.289071083068848, -6.845141410827637, -6.401211738586426, -5.957281589508057, -5.513351917266846, -5.069422245025635, -4.625492572784424, -4.181562900543213, -3.737632989883423, -3.293703317642212, -2.849773645401001, -2.405843734741211, -1.9619140625, -1.5179834365844727, -1.0740537643432617, -0.6301239728927612, -0.18619418144226074, 0.2577354907989502, 0.7016651630401611, 1.1455950736999512, 1.589524745941162, 2.033454418182373, 2.477384090423584, 2.921313762664795, 3.365243673324585, 3.809173345565796, 4.253103256225586, 4.697032928466797, 5.140962600708008, 5.584892272949219, 6.02882194519043, 6.472751617431641, 6.916681289672852, 7.3606109619140625, 7.804540634155273, 8.248470306396484, 8.692399978637695, 9.136329650878906, 9.580259323120117, 10.024188995361328, 10.468118667602539, 10.91204833984375, 11.355978012084961, 11.799907684326172, 12.243837356567383, 12.68776798248291]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 8.0, 5.0, 10.0, 21.0, 15.0, 11.0, 14.0, 16.0, 33.0, 29.0, 26.0, 29.0, 31.0, 45.0, 40.0, 41.0, 41.0, 48.0, 50.0, 55.0, 42.0, 44.0, 38.0, 41.0, 38.0, 39.0, 33.0, 31.0, 20.0, 21.0, 21.0, 8.0, 15.0, 9.0, 6.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.372095108032227, -7.1438751220703125, -6.915655612945557, -6.687435626983643, -6.459216117858887, -6.230996131896973, -6.002776145935059, -5.774556636810303, -5.546336650848389, -5.318116664886475, -5.089897155761719, -4.861677169799805, -4.633457660675049, -4.405237674713135, -4.177018165588379, -3.948798179626465, -3.72057843208313, -3.492358684539795, -3.26413893699646, -3.035919189453125, -2.807699203491211, -2.579479455947876, -2.351259708404541, -2.123039722442627, -1.8948200941085815, -1.6666003465652466, -1.438380479812622, -1.210160732269287, -0.9819409251213074, -0.7537211179733276, -0.5255013704299927, -0.29728150367736816, -0.0690617561340332, 0.15915803611278534, 0.3873778283596039, 0.6155976057052612, 0.843817412853241, 1.0720372200012207, 1.3002569675445557, 1.5284768342971802, 1.7566965818405151, 1.98491632938385, 2.2131361961364746, 2.4413559436798096, 2.6695756912231445, 2.8977956771850586, 3.1260151863098145, 3.3542351722717285, 3.5824549198150635, 3.8106746673583984, 4.0388946533203125, 4.267114162445068, 4.495334148406982, 4.723553657531738, 4.951773643493652, 5.179993629455566, 5.408213138580322, 5.636433124542236, 5.864652633666992, 6.092872619628906, 6.321092128753662, 6.549312114715576, 6.777531623840332, 7.005751609802246, 7.23397159576416]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 12.0, 25.0, 21.0, 40.0, 65.0, 67.0, 105.0, 154.0, 199.0, 335.0, 528.0, 799.0, 1281.0, 2106.0, 3333.0, 5644.0, 10288.0, 19172.0, 37284.0, 72711.0, 136567.0, 213316.0, 222590.0, 150121.0, 81055.0, 41458.0, 21377.0, 11584.0, 6392.0, 3748.0, 2236.0, 1357.0, 862.0, 557.0, 338.0, 256.0, 162.0, 131.0, 77.0, 63.0, 35.0, 17.0, 26.0, 16.0, 5.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.59765625, -6.39202880859375, -6.1864013671875, -5.98077392578125, -5.775146484375, -5.56951904296875, -5.3638916015625, -5.15826416015625, -4.95263671875, -4.74700927734375, -4.5413818359375, -4.33575439453125, -4.130126953125, -3.92449951171875, -3.7188720703125, -3.51324462890625, -3.3076171875, -3.10198974609375, -2.8963623046875, -2.69073486328125, -2.485107421875, -2.27947998046875, -2.0738525390625, -1.86822509765625, -1.66259765625, -1.45697021484375, -1.2513427734375, -1.04571533203125, -0.840087890625, -0.63446044921875, -0.4288330078125, -0.22320556640625, -0.017578125, 0.18804931640625, 0.3936767578125, 0.59930419921875, 0.804931640625, 1.01055908203125, 1.2161865234375, 1.42181396484375, 1.62744140625, 1.83306884765625, 2.0386962890625, 2.24432373046875, 2.449951171875, 2.65557861328125, 2.8612060546875, 3.06683349609375, 3.2724609375, 3.47808837890625, 3.6837158203125, 3.88934326171875, 4.094970703125, 4.30059814453125, 4.5062255859375, 4.71185302734375, 4.91748046875, 5.12310791015625, 5.3287353515625, 5.53436279296875, 5.739990234375, 5.94561767578125, 6.1512451171875, 6.35687255859375, 6.5625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 15.0, 9.0, 20.0, 8.0, 19.0, 22.0, 29.0, 17.0, 33.0, 34.0, 41.0, 42.0, 45.0, 37.0, 54.0, 51.0, 52.0, 50.0, 41.0, 51.0, 37.0, 45.0, 37.0, 35.0, 36.0, 28.0, 13.0, 18.0, 19.0, 11.0, 9.0, 4.0, 7.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.75390625, -7.49566650390625, -7.2374267578125, -6.97918701171875, -6.720947265625, -6.46270751953125, -6.2044677734375, -5.94622802734375, -5.68798828125, -5.42974853515625, -5.1715087890625, -4.91326904296875, -4.655029296875, -4.39678955078125, -4.1385498046875, -3.88031005859375, -3.6220703125, -3.36383056640625, -3.1055908203125, -2.84735107421875, -2.589111328125, -2.33087158203125, -2.0726318359375, -1.81439208984375, -1.55615234375, -1.29791259765625, -1.0396728515625, -0.78143310546875, -0.523193359375, -0.26495361328125, -0.0067138671875, 0.25152587890625, 0.509765625, 0.76800537109375, 1.0262451171875, 1.28448486328125, 1.542724609375, 1.80096435546875, 2.0592041015625, 2.31744384765625, 2.57568359375, 2.83392333984375, 3.0921630859375, 3.35040283203125, 3.608642578125, 3.86688232421875, 4.1251220703125, 4.38336181640625, 4.6416015625, 4.89984130859375, 5.1580810546875, 5.41632080078125, 5.674560546875, 5.93280029296875, 6.1910400390625, 6.44927978515625, 6.70751953125, 6.96575927734375, 7.2239990234375, 7.48223876953125, 7.740478515625, 7.99871826171875, 8.2569580078125, 8.51519775390625, 8.7734375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 10.0, 16.0, 23.0, 24.0, 45.0, 61.0, 91.0, 121.0, 190.0, 243.0, 385.0, 604.0, 924.0, 1412.0, 2172.0, 3467.0, 5590.0, 9080.0, 15469.0, 26514.0, 46574.0, 79818.0, 130867.0, 183142.0, 188546.0, 141381.0, 87727.0, 50978.0, 29229.0, 17082.0, 10221.0, 6088.0, 3718.0, 2272.0, 1494.0, 965.0, 639.0, 439.0, 279.0, 192.0, 144.0, 91.0, 58.0, 39.0, 35.0, 23.0, 20.0, 10.0, 11.0, 11.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -4.992431640625, -4.82080078125, -4.649169921875, -4.4775390625, -4.305908203125, -4.13427734375, -3.962646484375, -3.791015625, -3.619384765625, -3.44775390625, -3.276123046875, -3.1044921875, -2.932861328125, -2.76123046875, -2.589599609375, -2.41796875, -2.246337890625, -2.07470703125, -1.903076171875, -1.7314453125, -1.559814453125, -1.38818359375, -1.216552734375, -1.044921875, -0.873291015625, -0.70166015625, -0.530029296875, -0.3583984375, -0.186767578125, -0.01513671875, 0.156494140625, 0.328125, 0.499755859375, 0.67138671875, 0.843017578125, 1.0146484375, 1.186279296875, 1.35791015625, 1.529541015625, 1.701171875, 1.872802734375, 2.04443359375, 2.216064453125, 2.3876953125, 2.559326171875, 2.73095703125, 2.902587890625, 3.07421875, 3.245849609375, 3.41748046875, 3.589111328125, 3.7607421875, 3.932373046875, 4.10400390625, 4.275634765625, 4.447265625, 4.618896484375, 4.79052734375, 4.962158203125, 5.1337890625, 5.305419921875, 5.47705078125, 5.648681640625, 5.8203125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 9.0, 13.0, 12.0, 14.0, 20.0, 8.0, 22.0, 27.0, 25.0, 22.0, 29.0, 32.0, 26.0, 38.0, 29.0, 41.0, 31.0, 40.0, 37.0, 29.0, 44.0, 41.0, 30.0, 34.0, 36.0, 29.0, 29.0, 26.0, 20.0, 26.0, 29.0, 18.0, 24.0, 17.0, 14.0, 11.0, 10.0, 10.0, 6.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.64453125, -3.53057861328125, -3.4166259765625, -3.30267333984375, -3.188720703125, -3.07476806640625, -2.9608154296875, -2.84686279296875, -2.73291015625, -2.61895751953125, -2.5050048828125, -2.39105224609375, -2.277099609375, -2.16314697265625, -2.0491943359375, -1.93524169921875, -1.8212890625, -1.70733642578125, -1.5933837890625, -1.47943115234375, -1.365478515625, -1.25152587890625, -1.1375732421875, -1.02362060546875, -0.90966796875, -0.79571533203125, -0.6817626953125, -0.56781005859375, -0.453857421875, -0.33990478515625, -0.2259521484375, -0.11199951171875, 0.001953125, 0.11590576171875, 0.2298583984375, 0.34381103515625, 0.457763671875, 0.57171630859375, 0.6856689453125, 0.79962158203125, 0.91357421875, 1.02752685546875, 1.1414794921875, 1.25543212890625, 1.369384765625, 1.48333740234375, 1.5972900390625, 1.71124267578125, 1.8251953125, 1.93914794921875, 2.0531005859375, 2.16705322265625, 2.281005859375, 2.39495849609375, 2.5089111328125, 2.62286376953125, 2.73681640625, 2.85076904296875, 2.9647216796875, 3.07867431640625, 3.192626953125, 3.30657958984375, 3.4205322265625, 3.53448486328125, 3.6484375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 14.0, 17.0, 25.0, 35.0, 51.0, 75.0, 129.0, 188.0, 241.0, 417.0, 643.0, 1110.0, 1837.0, 3401.0, 6470.0, 14414.0, 37482.0, 113377.0, 327656.0, 344992.0, 125102.0, 40035.0, 15419.0, 6915.0, 3428.0, 1946.0, 1099.0, 726.0, 440.0, 283.0, 193.0, 121.0, 105.0, 48.0, 32.0, 29.0, 16.0, 13.0, 4.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.7109375, -6.5194091796875, -6.327880859375, -6.1363525390625, -5.94482421875, -5.7532958984375, -5.561767578125, -5.3702392578125, -5.1787109375, -4.9871826171875, -4.795654296875, -4.6041259765625, -4.41259765625, -4.2210693359375, -4.029541015625, -3.8380126953125, -3.646484375, -3.4549560546875, -3.263427734375, -3.0718994140625, -2.88037109375, -2.6888427734375, -2.497314453125, -2.3057861328125, -2.1142578125, -1.9227294921875, -1.731201171875, -1.5396728515625, -1.34814453125, -1.1566162109375, -0.965087890625, -0.7735595703125, -0.58203125, -0.3905029296875, -0.198974609375, -0.0074462890625, 0.18408203125, 0.3756103515625, 0.567138671875, 0.7586669921875, 0.9501953125, 1.1417236328125, 1.333251953125, 1.5247802734375, 1.71630859375, 1.9078369140625, 2.099365234375, 2.2908935546875, 2.482421875, 2.6739501953125, 2.865478515625, 3.0570068359375, 3.24853515625, 3.4400634765625, 3.631591796875, 3.8231201171875, 4.0146484375, 4.2061767578125, 4.397705078125, 4.5892333984375, 4.78076171875, 4.9722900390625, 5.163818359375, 5.3553466796875, 5.546875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 8.0, 12.0, 15.0, 27.0, 31.0, 59.0, 107.0, 123.0, 146.0, 141.0, 100.0, 91.0, 53.0, 34.0, 12.0, 11.0, 11.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004782676696777344, -0.00046218186616897583, -0.0004460960626602173, -0.00043001025915145874, -0.0004139244556427002, -0.00039783865213394165, -0.0003817528486251831, -0.00036566704511642456, -0.000349581241607666, -0.00033349543809890747, -0.0003174096345901489, -0.0003013238310813904, -0.00028523802757263184, -0.0002691522240638733, -0.00025306642055511475, -0.0002369806170463562, -0.00022089481353759766, -0.0002048090100288391, -0.00018872320652008057, -0.00017263740301132202, -0.00015655159950256348, -0.00014046579599380493, -0.0001243799924850464, -0.00010829418897628784, -9.22083854675293e-05, -7.612258195877075e-05, -6.003677845001221e-05, -4.395097494125366e-05, -2.7865171432495117e-05, -1.1779367923736572e-05, 4.306435585021973e-06, 2.0392239093780518e-05, 3.647804260253906e-05, 5.256384611129761e-05, 6.864964962005615e-05, 8.47354531288147e-05, 0.00010082125663757324, 0.00011690706014633179, 0.00013299286365509033, 0.00014907866716384888, 0.00016516447067260742, 0.00018125027418136597, 0.0001973360776901245, 0.00021342188119888306, 0.0002295076847076416, 0.00024559348821640015, 0.0002616792917251587, 0.00027776509523391724, 0.0002938508987426758, 0.0003099367022514343, 0.00032602250576019287, 0.0003421083092689514, 0.00035819411277770996, 0.0003742799162864685, 0.00039036571979522705, 0.0004064515233039856, 0.00042253732681274414, 0.0004386231303215027, 0.00045470893383026123, 0.0004707947373390198, 0.0004868805408477783, 0.0005029663443565369, 0.0005190521478652954, 0.000535137951374054, 0.0005512237548828125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 13.0, 6.0, 8.0, 8.0, 11.0, 20.0, 37.0, 40.0, 76.0, 78.0, 153.0, 190.0, 258.0, 431.0, 679.0, 1074.0, 1812.0, 3010.0, 5406.0, 10124.0, 20566.0, 46319.0, 113520.0, 250403.0, 302398.0, 164421.0, 68224.0, 28962.0, 13567.0, 7000.0, 3754.0, 2240.0, 1313.0, 824.0, 536.0, 341.0, 209.0, 166.0, 88.0, 80.0, 57.0, 32.0, 28.0, 21.0, 11.0, 12.0, 6.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-4.390625, -4.25433349609375, -4.1180419921875, -3.98175048828125, -3.845458984375, -3.70916748046875, -3.5728759765625, -3.43658447265625, -3.30029296875, -3.16400146484375, -3.0277099609375, -2.89141845703125, -2.755126953125, -2.61883544921875, -2.4825439453125, -2.34625244140625, -2.2099609375, -2.07366943359375, -1.9373779296875, -1.80108642578125, -1.664794921875, -1.52850341796875, -1.3922119140625, -1.25592041015625, -1.11962890625, -0.98333740234375, -0.8470458984375, -0.71075439453125, -0.574462890625, -0.43817138671875, -0.3018798828125, -0.16558837890625, -0.029296875, 0.10699462890625, 0.2432861328125, 0.37957763671875, 0.515869140625, 0.65216064453125, 0.7884521484375, 0.92474365234375, 1.06103515625, 1.19732666015625, 1.3336181640625, 1.46990966796875, 1.606201171875, 1.74249267578125, 1.8787841796875, 2.01507568359375, 2.1513671875, 2.28765869140625, 2.4239501953125, 2.56024169921875, 2.696533203125, 2.83282470703125, 2.9691162109375, 3.10540771484375, 3.24169921875, 3.37799072265625, 3.5142822265625, 3.65057373046875, 3.786865234375, 3.92315673828125, 4.0594482421875, 4.19573974609375, 4.33203125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 4.0, 7.0, 14.0, 20.0, 22.0, 16.0, 38.0, 27.0, 52.0, 66.0, 67.0, 83.0, 79.0, 98.0, 71.0, 78.0, 68.0, 52.0, 31.0, 27.0, 14.0, 14.0, 12.0, 12.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.998046875, -0.96197509765625, -0.9259033203125, -0.88983154296875, -0.853759765625, -0.81768798828125, -0.7816162109375, -0.74554443359375, -0.70947265625, -0.67340087890625, -0.6373291015625, -0.60125732421875, -0.565185546875, -0.52911376953125, -0.4930419921875, -0.45697021484375, -0.4208984375, -0.38482666015625, -0.3487548828125, -0.31268310546875, -0.276611328125, -0.24053955078125, -0.2044677734375, -0.16839599609375, -0.13232421875, -0.09625244140625, -0.0601806640625, -0.02410888671875, 0.011962890625, 0.04803466796875, 0.0841064453125, 0.12017822265625, 0.15625, 0.19232177734375, 0.2283935546875, 0.26446533203125, 0.300537109375, 0.33660888671875, 0.3726806640625, 0.40875244140625, 0.44482421875, 0.48089599609375, 0.5169677734375, 0.55303955078125, 0.589111328125, 0.62518310546875, 0.6612548828125, 0.69732666015625, 0.7333984375, 0.76947021484375, 0.8055419921875, 0.84161376953125, 0.877685546875, 0.91375732421875, 0.9498291015625, 0.98590087890625, 1.02197265625, 1.05804443359375, 1.0941162109375, 1.13018798828125, 1.166259765625, 1.20233154296875, 1.2384033203125, 1.27447509765625, 1.310546875]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 4.0, 10.0, 10.0, 20.0, 26.0, 36.0, 51.0, 64.0, 87.0, 98.0, 116.0, 113.0, 97.0, 58.0, 62.0, 45.0, 19.0, 19.0, 21.0, 8.0, 5.0, 8.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.716197967529297, -16.259613037109375, -15.80302906036377, -15.346445083618164, -14.889861106872559, -14.433277130126953, -13.976692199707031, -13.520108222961426, -13.06352424621582, -12.606940269470215, -12.150355339050293, -11.693771362304688, -11.237187385559082, -10.780603408813477, -10.324018478393555, -9.86743450164795, -9.410849571228027, -8.954265594482422, -8.4976806640625, -8.041096687316895, -7.584512710571289, -7.127928256988525, -6.671343803405762, -6.214759826660156, -5.758175373077393, -5.301590919494629, -4.845006942749023, -4.38842248916626, -3.931838274002075, -3.4752540588378906, -3.018669605255127, -2.5620853900909424, -2.1055002212524414, -1.6489160060882568, -1.1923316717147827, -0.7357473373413086, -0.279163122177124, 0.17742109298706055, 0.6340055465698242, 1.0905897617340088, 1.5471739768981934, 2.003758192062378, 2.4603424072265625, 2.916926860809326, 3.3735110759735107, 3.8300952911376953, 4.286679744720459, 4.743264198303223, 5.199848175048828, 5.656432628631592, 6.113016605377197, 6.569601058959961, 7.026185035705566, 7.48276948928833, 7.939353942871094, 8.3959379196167, 8.852521896362305, 9.30910587310791, 9.765690803527832, 10.222274780273438, 10.678858757019043, 11.135442733764648, 11.59202766418457, 12.048611640930176, 12.505196571350098]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 9.0, 15.0, 9.0, 20.0, 22.0, 23.0, 19.0, 23.0, 20.0, 30.0, 39.0, 38.0, 37.0, 55.0, 46.0, 41.0, 37.0, 50.0, 48.0, 44.0, 33.0, 45.0, 49.0, 36.0, 37.0, 32.0, 23.0, 19.0, 22.0, 15.0, 14.0, 11.0, 7.0, 6.0, 5.0, 5.0, 0.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.558339595794678, -7.334778308868408, -7.111217021942139, -6.887655735015869, -6.6640944480896, -6.44053316116333, -6.216971397399902, -5.993410110473633, -5.769848823547363, -5.546287536621094, -5.322726249694824, -5.099164962768555, -4.875603675842285, -4.652042388916016, -4.428481101989746, -4.204919815063477, -3.981358528137207, -3.7577972412109375, -3.534235954284668, -3.3106746673583984, -3.087113380432129, -2.8635520935058594, -2.6399905681610107, -2.416429281234741, -2.1928679943084717, -1.9693067073822021, -1.7457454204559326, -1.5221840143203735, -1.298622727394104, -1.0750614404678345, -0.8515000343322754, -0.6279387474060059, -0.4043769836425781, -0.1808156669139862, 0.04274564981460571, 0.26630699634552, 0.48986828327178955, 0.7134295701980591, 0.9369909763336182, 1.1605522632598877, 1.3841135501861572, 1.6076748371124268, 1.8312361240386963, 2.054797649383545, 2.2783589363098145, 2.501920223236084, 2.7254815101623535, 2.949042797088623, 3.1726040840148926, 3.396165370941162, 3.6197266578674316, 3.843287944793701, 4.066849231719971, 4.29041051864624, 4.513972282409668, 4.7375335693359375, 4.961094856262207, 5.184656143188477, 5.408217430114746, 5.631778717041016, 5.855340003967285, 6.078901290893555, 6.302462577819824, 6.526023864746094, 6.749585151672363]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 18.0, 20.0, 24.0, 39.0, 48.0, 81.0, 113.0, 216.0, 255.0, 422.0, 672.0, 1055.0, 1738.0, 3101.0, 5732.0, 11539.0, 28600.0, 99232.0, 533054.0, 2180336.0, 1074211.0, 176822.0, 43689.0, 15892.0, 7518.0, 3858.0, 2169.0, 1357.0, 804.0, 552.0, 348.0, 251.0, 151.0, 98.0, 69.0, 57.0, 46.0, 21.0, 16.0, 8.0, 16.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.09375, -15.5517578125, -15.009765625, -14.4677734375, -13.92578125, -13.3837890625, -12.841796875, -12.2998046875, -11.7578125, -11.2158203125, -10.673828125, -10.1318359375, -9.58984375, -9.0478515625, -8.505859375, -7.9638671875, -7.421875, -6.8798828125, -6.337890625, -5.7958984375, -5.25390625, -4.7119140625, -4.169921875, -3.6279296875, -3.0859375, -2.5439453125, -2.001953125, -1.4599609375, -0.91796875, -0.3759765625, 0.166015625, 0.7080078125, 1.25, 1.7919921875, 2.333984375, 2.8759765625, 3.41796875, 3.9599609375, 4.501953125, 5.0439453125, 5.5859375, 6.1279296875, 6.669921875, 7.2119140625, 7.75390625, 8.2958984375, 8.837890625, 9.3798828125, 9.921875, 10.4638671875, 11.005859375, 11.5478515625, 12.08984375, 12.6318359375, 13.173828125, 13.7158203125, 14.2578125, 14.7998046875, 15.341796875, 15.8837890625, 16.42578125, 16.9677734375, 17.509765625, 18.0517578125, 18.59375]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 10.0, 2.0, 8.0, 7.0, 9.0, 17.0, 23.0, 16.0, 22.0, 27.0, 36.0, 39.0, 33.0, 44.0, 40.0, 49.0, 60.0, 46.0, 54.0, 52.0, 43.0, 64.0, 53.0, 40.0, 42.0, 27.0, 30.0, 18.0, 29.0, 16.0, 11.0, 9.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.46875, -6.273193359375, -6.07763671875, -5.882080078125, -5.6865234375, -5.490966796875, -5.29541015625, -5.099853515625, -4.904296875, -4.708740234375, -4.51318359375, -4.317626953125, -4.1220703125, -3.926513671875, -3.73095703125, -3.535400390625, -3.33984375, -3.144287109375, -2.94873046875, -2.753173828125, -2.5576171875, -2.362060546875, -2.16650390625, -1.970947265625, -1.775390625, -1.579833984375, -1.38427734375, -1.188720703125, -0.9931640625, -0.797607421875, -0.60205078125, -0.406494140625, -0.2109375, -0.015380859375, 0.18017578125, 0.375732421875, 0.5712890625, 0.766845703125, 0.96240234375, 1.157958984375, 1.353515625, 1.549072265625, 1.74462890625, 1.940185546875, 2.1357421875, 2.331298828125, 2.52685546875, 2.722412109375, 2.91796875, 3.113525390625, 3.30908203125, 3.504638671875, 3.7001953125, 3.895751953125, 4.09130859375, 4.286865234375, 4.482421875, 4.677978515625, 4.87353515625, 5.069091796875, 5.2646484375, 5.460205078125, 5.65576171875, 5.851318359375, 6.046875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 3.0, 4.0, 6.0, 10.0, 12.0, 12.0, 22.0, 35.0, 50.0, 54.0, 88.0, 157.0, 198.0, 296.0, 486.0, 728.0, 1208.0, 1967.0, 3401.0, 5981.0, 11733.0, 25246.0, 60729.0, 183764.0, 765050.0, 2068584.0, 767619.0, 184329.0, 60517.0, 25112.0, 11995.0, 6141.0, 3413.0, 1872.0, 1229.0, 765.0, 510.0, 267.0, 200.0, 156.0, 106.0, 69.0, 46.0, 25.0, 30.0, 14.0, 18.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0], "bins": [-17.4375, -16.9169921875, -16.396484375, -15.8759765625, -15.35546875, -14.8349609375, -14.314453125, -13.7939453125, -13.2734375, -12.7529296875, -12.232421875, -11.7119140625, -11.19140625, -10.6708984375, -10.150390625, -9.6298828125, -9.109375, -8.5888671875, -8.068359375, -7.5478515625, -7.02734375, -6.5068359375, -5.986328125, -5.4658203125, -4.9453125, -4.4248046875, -3.904296875, -3.3837890625, -2.86328125, -2.3427734375, -1.822265625, -1.3017578125, -0.78125, -0.2607421875, 0.259765625, 0.7802734375, 1.30078125, 1.8212890625, 2.341796875, 2.8623046875, 3.3828125, 3.9033203125, 4.423828125, 4.9443359375, 5.46484375, 5.9853515625, 6.505859375, 7.0263671875, 7.546875, 8.0673828125, 8.587890625, 9.1083984375, 9.62890625, 10.1494140625, 10.669921875, 11.1904296875, 11.7109375, 12.2314453125, 12.751953125, 13.2724609375, 13.79296875, 14.3134765625, 14.833984375, 15.3544921875, 15.875]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 7.0, 9.0, 10.0, 23.0, 34.0, 37.0, 32.0, 53.0, 84.0, 110.0, 130.0, 169.0, 194.0, 278.0, 340.0, 397.0, 370.0, 361.0, 278.0, 232.0, 210.0, 167.0, 105.0, 83.0, 71.0, 53.0, 41.0, 38.0, 35.0, 10.0, 23.0, 13.0, 9.0, 9.0, 8.0, 6.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.990234375, -2.89190673828125, -2.7935791015625, -2.69525146484375, -2.596923828125, -2.49859619140625, -2.4002685546875, -2.30194091796875, -2.20361328125, -2.10528564453125, -2.0069580078125, -1.90863037109375, -1.810302734375, -1.71197509765625, -1.6136474609375, -1.51531982421875, -1.4169921875, -1.31866455078125, -1.2203369140625, -1.12200927734375, -1.023681640625, -0.92535400390625, -0.8270263671875, -0.72869873046875, -0.63037109375, -0.53204345703125, -0.4337158203125, -0.33538818359375, -0.237060546875, -0.13873291015625, -0.0404052734375, 0.05792236328125, 0.15625, 0.25457763671875, 0.3529052734375, 0.45123291015625, 0.549560546875, 0.64788818359375, 0.7462158203125, 0.84454345703125, 0.94287109375, 1.04119873046875, 1.1395263671875, 1.23785400390625, 1.336181640625, 1.43450927734375, 1.5328369140625, 1.63116455078125, 1.7294921875, 1.82781982421875, 1.9261474609375, 2.02447509765625, 2.122802734375, 2.22113037109375, 2.3194580078125, 2.41778564453125, 2.51611328125, 2.61444091796875, 2.7127685546875, 2.81109619140625, 2.909423828125, 3.00775146484375, 3.1060791015625, 3.20440673828125, 3.302734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 14.0, 11.0, 19.0, 19.0, 31.0, 31.0, 48.0, 73.0, 78.0, 94.0, 124.0, 85.0, 81.0, 71.0, 46.0, 39.0, 29.0, 25.0, 28.0, 14.0, 11.0, 9.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.885161399841309, -14.453387260437012, -14.021614074707031, -13.589839935302734, -13.158066749572754, -12.726292610168457, -12.294519424438477, -11.86274528503418, -11.4309720993042, -10.999197959899902, -10.567424774169922, -10.135650634765625, -9.703877449035645, -9.272103309631348, -8.840330123901367, -8.40855598449707, -7.976782321929932, -7.545008659362793, -7.113234996795654, -6.681461334228516, -6.249687671661377, -5.817914009094238, -5.386139869689941, -4.954366683959961, -4.522592544555664, -4.090818881988525, -3.6590452194213867, -3.227271556854248, -2.7954978942871094, -2.3637239933013916, -1.931950330734253, -1.5001766681671143, -1.0684032440185547, -0.636629581451416, -0.20485585927963257, 0.22691786289215088, 0.6586915254592896, 1.0904653072357178, 1.5222389698028564, 1.9540126323699951, 2.385786294937134, 2.8175599575042725, 3.249333620071411, 3.681107521057129, 4.112881183624268, 4.544654846191406, 4.976428508758545, 5.408202171325684, 5.839975833892822, 6.271749496459961, 6.7035231590271, 7.135296821594238, 7.567070484161377, 7.998844146728516, 8.430618286132812, 8.862391471862793, 9.29416561126709, 9.725939750671387, 10.157712936401367, 10.589487075805664, 11.021260261535645, 11.453034400939941, 11.884807586669922, 12.316581726074219, 12.7483549118042]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 8.0, 13.0, 12.0, 18.0, 21.0, 18.0, 34.0, 38.0, 32.0, 35.0, 43.0, 38.0, 50.0, 42.0, 42.0, 49.0, 47.0, 42.0, 46.0, 44.0, 43.0, 31.0, 43.0, 41.0, 29.0, 22.0, 24.0, 20.0, 17.0, 7.0, 9.0, 4.0, 10.0, 4.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.40715217590332, -8.174091339111328, -7.941031455993652, -7.707971096038818, -7.474910736083984, -7.24185037612915, -7.008790016174316, -6.775729179382324, -6.542669296264648, -6.3096089363098145, -6.0765485763549805, -5.8434882164001465, -5.6104278564453125, -5.3773674964904785, -5.1443071365356445, -4.911246299743652, -4.678185939788818, -4.445125579833984, -4.21206521987915, -3.9790048599243164, -3.7459444999694824, -3.5128841400146484, -3.2798235416412354, -3.0467631816864014, -2.8137028217315674, -2.5806424617767334, -2.3475821018218994, -2.1145215034484863, -1.881461262702942, -1.648400902748108, -1.4153404235839844, -1.1822800636291504, -0.9492201805114746, -0.7161598205566406, -0.48309940099716187, -0.2500389814376831, -0.01697862148284912, 0.21608173847198486, 0.4491422176361084, 0.6822025775909424, 0.9152629375457764, 1.1483232975006104, 1.3813836574554443, 1.6144441366195679, 1.8475044965744019, 2.0805649757385254, 2.3136253356933594, 2.5466856956481934, 2.7797460556030273, 3.0128064155578613, 3.2458667755126953, 3.4789271354675293, 3.7119874954223633, 3.9450478553771973, 4.178108215332031, 4.411169052124023, 4.644228935241699, 4.877289295196533, 5.110349655151367, 5.343410015106201, 5.576470375061035, 5.809530735015869, 6.042591094970703, 6.275651931762695, 6.508712291717529]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 9.0, 12.0, 17.0, 21.0, 35.0, 65.0, 89.0, 134.0, 262.0, 449.0, 782.0, 1449.0, 2667.0, 5342.0, 10535.0, 22702.0, 50738.0, 123854.0, 300544.0, 304875.0, 125525.0, 52576.0, 23123.0, 11149.0, 5399.0, 2744.0, 1476.0, 836.0, 441.0, 241.0, 173.0, 88.0, 70.0, 36.0, 24.0, 17.0, 14.0, 9.0, 10.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.3544921875, -1.314666748046875, -1.27484130859375, -1.235015869140625, -1.1951904296875, -1.155364990234375, -1.11553955078125, -1.075714111328125, -1.035888671875, -0.996063232421875, -0.95623779296875, -0.916412353515625, -0.8765869140625, -0.836761474609375, -0.79693603515625, -0.757110595703125, -0.71728515625, -0.677459716796875, -0.63763427734375, -0.597808837890625, -0.5579833984375, -0.518157958984375, -0.47833251953125, -0.438507080078125, -0.398681640625, -0.358856201171875, -0.31903076171875, -0.279205322265625, -0.2393798828125, -0.199554443359375, -0.15972900390625, -0.119903564453125, -0.080078125, -0.040252685546875, -0.00042724609375, 0.039398193359375, 0.0792236328125, 0.119049072265625, 0.15887451171875, 0.198699951171875, 0.238525390625, 0.278350830078125, 0.31817626953125, 0.358001708984375, 0.3978271484375, 0.437652587890625, 0.47747802734375, 0.517303466796875, 0.55712890625, 0.596954345703125, 0.63677978515625, 0.676605224609375, 0.7164306640625, 0.756256103515625, 0.79608154296875, 0.835906982421875, 0.875732421875, 0.915557861328125, 0.95538330078125, 0.995208740234375, 1.0350341796875, 1.074859619140625, 1.11468505859375, 1.154510498046875, 1.1943359375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 4.0, 5.0, 9.0, 11.0, 8.0, 16.0, 15.0, 18.0, 17.0, 23.0, 31.0, 23.0, 23.0, 34.0, 39.0, 45.0, 42.0, 39.0, 47.0, 41.0, 54.0, 43.0, 39.0, 38.0, 36.0, 49.0, 41.0, 28.0, 26.0, 30.0, 23.0, 25.0, 14.0, 12.0, 10.0, 8.0, 11.0, 5.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.47265625, -7.23370361328125, -6.9947509765625, -6.75579833984375, -6.516845703125, -6.27789306640625, -6.0389404296875, -5.79998779296875, -5.56103515625, -5.32208251953125, -5.0831298828125, -4.84417724609375, -4.605224609375, -4.36627197265625, -4.1273193359375, -3.88836669921875, -3.6494140625, -3.41046142578125, -3.1715087890625, -2.93255615234375, -2.693603515625, -2.45465087890625, -2.2156982421875, -1.97674560546875, -1.73779296875, -1.49884033203125, -1.2598876953125, -1.02093505859375, -0.781982421875, -0.54302978515625, -0.3040771484375, -0.06512451171875, 0.173828125, 0.41278076171875, 0.6517333984375, 0.89068603515625, 1.129638671875, 1.36859130859375, 1.6075439453125, 1.84649658203125, 2.08544921875, 2.32440185546875, 2.5633544921875, 2.80230712890625, 3.041259765625, 3.28021240234375, 3.5191650390625, 3.75811767578125, 3.9970703125, 4.23602294921875, 4.4749755859375, 4.71392822265625, 4.952880859375, 5.19183349609375, 5.4307861328125, 5.66973876953125, 5.90869140625, 6.14764404296875, 6.3865966796875, 6.62554931640625, 6.864501953125, 7.10345458984375, 7.3424072265625, 7.58135986328125, 7.8203125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 21.0, 19.0, 16.0, 36.0, 46.0, 62.0, 75.0, 104.0, 138.0, 174.0, 262.0, 329.0, 536.0, 763.0, 1156.0, 1824.0, 3012.0, 5174.0, 9631.0, 20055.0, 72109.0, 824879.0, 65906.0, 19304.0, 9486.0, 5196.0, 2843.0, 1704.0, 1068.0, 741.0, 514.0, 353.0, 250.0, 185.0, 141.0, 97.0, 79.0, 61.0, 42.0, 32.0, 23.0, 21.0, 17.0, 8.0, 6.0, 10.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-2.11328125, -2.0482177734375, -1.983154296875, -1.9180908203125, -1.85302734375, -1.7879638671875, -1.722900390625, -1.6578369140625, -1.5927734375, -1.5277099609375, -1.462646484375, -1.3975830078125, -1.33251953125, -1.2674560546875, -1.202392578125, -1.1373291015625, -1.072265625, -1.0072021484375, -0.942138671875, -0.8770751953125, -0.81201171875, -0.7469482421875, -0.681884765625, -0.6168212890625, -0.5517578125, -0.4866943359375, -0.421630859375, -0.3565673828125, -0.29150390625, -0.2264404296875, -0.161376953125, -0.0963134765625, -0.03125, 0.0338134765625, 0.098876953125, 0.1639404296875, 0.22900390625, 0.2940673828125, 0.359130859375, 0.4241943359375, 0.4892578125, 0.5543212890625, 0.619384765625, 0.6844482421875, 0.74951171875, 0.8145751953125, 0.879638671875, 0.9447021484375, 1.009765625, 1.0748291015625, 1.139892578125, 1.2049560546875, 1.27001953125, 1.3350830078125, 1.400146484375, 1.4652099609375, 1.5302734375, 1.5953369140625, 1.660400390625, 1.7254638671875, 1.79052734375, 1.8555908203125, 1.920654296875, 1.9857177734375, 2.05078125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 9.0, 12.0, 6.0, 6.0, 12.0, 23.0, 21.0, 11.0, 21.0, 22.0, 24.0, 19.0, 23.0, 32.0, 38.0, 39.0, 22.0, 32.0, 41.0, 46.0, 36.0, 36.0, 43.0, 29.0, 28.0, 33.0, 41.0, 32.0, 33.0, 29.0, 25.0, 20.0, 21.0, 18.0, 18.0, 9.0, 24.0, 14.0, 10.0, 12.0, 6.0, 3.0, 5.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0], "bins": [-3.916015625, -3.794586181640625, -3.67315673828125, -3.551727294921875, -3.4302978515625, -3.308868408203125, -3.18743896484375, -3.066009521484375, -2.944580078125, -2.823150634765625, -2.70172119140625, -2.580291748046875, -2.4588623046875, -2.337432861328125, -2.21600341796875, -2.094573974609375, -1.97314453125, -1.851715087890625, -1.73028564453125, -1.608856201171875, -1.4874267578125, -1.365997314453125, -1.24456787109375, -1.123138427734375, -1.001708984375, -0.880279541015625, -0.75885009765625, -0.637420654296875, -0.5159912109375, -0.394561767578125, -0.27313232421875, -0.151702880859375, -0.0302734375, 0.091156005859375, 0.21258544921875, 0.334014892578125, 0.4554443359375, 0.576873779296875, 0.69830322265625, 0.819732666015625, 0.941162109375, 1.062591552734375, 1.18402099609375, 1.305450439453125, 1.4268798828125, 1.548309326171875, 1.66973876953125, 1.791168212890625, 1.91259765625, 2.034027099609375, 2.15545654296875, 2.276885986328125, 2.3983154296875, 2.519744873046875, 2.64117431640625, 2.762603759765625, 2.884033203125, 3.005462646484375, 3.12689208984375, 3.248321533203125, 3.3697509765625, 3.491180419921875, 3.61260986328125, 3.734039306640625, 3.85546875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 4.0, 8.0, 19.0, 33.0, 33.0, 44.0, 57.0, 71.0, 106.0, 139.0, 170.0, 272.0, 411.0, 607.0, 967.0, 1524.0, 2477.0, 4509.0, 9048.0, 21981.0, 192541.0, 764719.0, 25840.0, 10400.0, 5069.0, 2846.0, 1607.0, 992.0, 600.0, 418.0, 300.0, 196.0, 152.0, 97.0, 71.0, 65.0, 33.0, 22.0, 19.0, 22.0, 11.0, 11.0, 7.0, 5.0, 6.0, 2.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.716796875, -0.69512939453125, -0.6734619140625, -0.65179443359375, -0.630126953125, -0.60845947265625, -0.5867919921875, -0.56512451171875, -0.54345703125, -0.52178955078125, -0.5001220703125, -0.47845458984375, -0.456787109375, -0.43511962890625, -0.4134521484375, -0.39178466796875, -0.3701171875, -0.34844970703125, -0.3267822265625, -0.30511474609375, -0.283447265625, -0.26177978515625, -0.2401123046875, -0.21844482421875, -0.19677734375, -0.17510986328125, -0.1534423828125, -0.13177490234375, -0.110107421875, -0.08843994140625, -0.0667724609375, -0.04510498046875, -0.0234375, -0.00177001953125, 0.0198974609375, 0.04156494140625, 0.063232421875, 0.08489990234375, 0.1065673828125, 0.12823486328125, 0.14990234375, 0.17156982421875, 0.1932373046875, 0.21490478515625, 0.236572265625, 0.25823974609375, 0.2799072265625, 0.30157470703125, 0.3232421875, 0.34490966796875, 0.3665771484375, 0.38824462890625, 0.409912109375, 0.43157958984375, 0.4532470703125, 0.47491455078125, 0.49658203125, 0.51824951171875, 0.5399169921875, 0.56158447265625, 0.583251953125, 0.60491943359375, 0.6265869140625, 0.64825439453125, 0.669921875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 10.0, 13.0, 14.0, 20.0, 22.0, 23.0, 28.0, 37.0, 33.0, 32.0, 37.0, 40.0, 53.0, 42.0, 46.0, 62.0, 46.0, 61.0, 40.0, 50.0, 42.0, 36.0, 28.0, 30.0, 24.0, 17.0, 22.0, 18.0, 18.0, 9.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.279613494873047e-05, -4.151090979576111e-05, -4.022568464279175e-05, -3.894045948982239e-05, -3.765523433685303e-05, -3.637000918388367e-05, -3.508478403091431e-05, -3.3799558877944946e-05, -3.2514333724975586e-05, -3.1229108572006226e-05, -2.9943883419036865e-05, -2.8658658266067505e-05, -2.7373433113098145e-05, -2.6088207960128784e-05, -2.4802982807159424e-05, -2.3517757654190063e-05, -2.2232532501220703e-05, -2.0947307348251343e-05, -1.9662082195281982e-05, -1.8376857042312622e-05, -1.7091631889343262e-05, -1.58064067363739e-05, -1.4521181583404541e-05, -1.323595643043518e-05, -1.195073127746582e-05, -1.066550612449646e-05, -9.3802809715271e-06, -8.09505581855774e-06, -6.809830665588379e-06, -5.5246055126190186e-06, -4.239380359649658e-06, -2.954155206680298e-06, -1.6689300537109375e-06, -3.8370490074157715e-07, 9.015202522277832e-07, 2.1867454051971436e-06, 3.471970558166504e-06, 4.757195711135864e-06, 6.042420864105225e-06, 7.327646017074585e-06, 8.612871170043945e-06, 9.898096323013306e-06, 1.1183321475982666e-05, 1.2468546628952026e-05, 1.3753771781921387e-05, 1.5038996934890747e-05, 1.6324222087860107e-05, 1.7609447240829468e-05, 1.8894672393798828e-05, 2.017989754676819e-05, 2.146512269973755e-05, 2.275034785270691e-05, 2.403557300567627e-05, 2.532079815864563e-05, 2.660602331161499e-05, 2.789124846458435e-05, 2.917647361755371e-05, 3.046169877052307e-05, 3.174692392349243e-05, 3.303214907646179e-05, 3.431737422943115e-05, 3.560259938240051e-05, 3.688782453536987e-05, 3.8173049688339233e-05, 3.9458274841308594e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 8.0, 7.0, 11.0, 16.0, 22.0, 26.0, 40.0, 59.0, 77.0, 140.0, 232.0, 373.0, 619.0, 1189.0, 2367.0, 5194.0, 12381.0, 34583.0, 110308.0, 368411.0, 353045.0, 104926.0, 32720.0, 11769.0, 4918.0, 2359.0, 1097.0, 658.0, 380.0, 204.0, 146.0, 74.0, 59.0, 47.0, 33.0, 20.0, 15.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.340087890625, -0.32874298095703125, -0.3173980712890625, -0.30605316162109375, -0.294708251953125, -0.28336334228515625, -0.2720184326171875, -0.26067352294921875, -0.24932861328125, -0.23798370361328125, -0.2266387939453125, -0.21529388427734375, -0.203948974609375, -0.19260406494140625, -0.1812591552734375, -0.16991424560546875, -0.1585693359375, -0.14722442626953125, -0.1358795166015625, -0.12453460693359375, -0.113189697265625, -0.10184478759765625, -0.0904998779296875, -0.07915496826171875, -0.06781005859375, -0.05646514892578125, -0.0451202392578125, -0.03377532958984375, -0.022430419921875, -0.01108551025390625, 0.0002593994140625, 0.01160430908203125, 0.02294921875, 0.03429412841796875, 0.0456390380859375, 0.05698394775390625, 0.068328857421875, 0.07967376708984375, 0.0910186767578125, 0.10236358642578125, 0.11370849609375, 0.12505340576171875, 0.1363983154296875, 0.14774322509765625, 0.159088134765625, 0.17043304443359375, 0.1817779541015625, 0.19312286376953125, 0.2044677734375, 0.21581268310546875, 0.2271575927734375, 0.23850250244140625, 0.249847412109375, 0.26119232177734375, 0.2725372314453125, 0.28388214111328125, 0.29522705078125, 0.30657196044921875, 0.3179168701171875, 0.32926177978515625, 0.340606689453125, 0.35195159912109375, 0.3632965087890625, 0.37464141845703125, 0.385986328125]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 10.0, 9.0, 6.0, 20.0, 20.0, 14.0, 32.0, 28.0, 44.0, 44.0, 41.0, 56.0, 67.0, 59.0, 61.0, 67.0, 52.0, 49.0, 46.0, 58.0, 45.0, 21.0, 34.0, 31.0, 17.0, 19.0, 6.0, 14.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.051025390625, -0.049411773681640625, -0.04779815673828125, -0.046184539794921875, -0.0445709228515625, -0.042957305908203125, -0.04134368896484375, -0.039730072021484375, -0.038116455078125, -0.036502838134765625, -0.03488922119140625, -0.033275604248046875, -0.0316619873046875, -0.030048370361328125, -0.02843475341796875, -0.026821136474609375, -0.02520751953125, -0.023593902587890625, -0.02198028564453125, -0.020366668701171875, -0.0187530517578125, -0.017139434814453125, -0.01552581787109375, -0.013912200927734375, -0.012298583984375, -0.010684967041015625, -0.00907135009765625, -0.007457733154296875, -0.0058441162109375, -0.004230499267578125, -0.00261688232421875, -0.001003265380859375, 0.0006103515625, 0.002223968505859375, 0.00383758544921875, 0.005451202392578125, 0.0070648193359375, 0.008678436279296875, 0.01029205322265625, 0.011905670166015625, 0.013519287109375, 0.015132904052734375, 0.01674652099609375, 0.018360137939453125, 0.0199737548828125, 0.021587371826171875, 0.02320098876953125, 0.024814605712890625, 0.02642822265625, 0.028041839599609375, 0.02965545654296875, 0.031269073486328125, 0.0328826904296875, 0.034496307373046875, 0.03610992431640625, 0.037723541259765625, 0.039337158203125, 0.040950775146484375, 0.04256439208984375, 0.044178009033203125, 0.0457916259765625, 0.047405242919921875, 0.04901885986328125, 0.050632476806640625, 0.05224609375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 13.0, 18.0, 25.0, 25.0, 41.0, 55.0, 79.0, 86.0, 109.0, 108.0, 88.0, 77.0, 60.0, 50.0, 26.0, 33.0, 17.0, 24.0, 17.0, 7.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.745636940002441, -14.31353759765625, -13.881438255310059, -13.449338912963867, -13.017240524291992, -12.5851411819458, -12.15304183959961, -11.720942497253418, -11.288843154907227, -10.856743812561035, -10.424644470214844, -9.992546081542969, -9.560446739196777, -9.128347396850586, -8.696248054504395, -8.264148712158203, -7.832050323486328, -7.399950981140137, -6.9678521156311035, -6.535752773284912, -6.103653907775879, -5.6715545654296875, -5.239455223083496, -4.807355880737305, -4.3752570152282715, -3.943157911300659, -3.511058807373047, -3.0789594650268555, -2.646860361099243, -2.214761257171631, -1.7826619148254395, -1.3505628108978271, -0.9184637069702148, -0.48636454343795776, -0.054265379905700684, 0.37783384323120117, 0.8099329471588135, 1.2420320510864258, 1.6741313934326172, 2.1062304973602295, 2.538329601287842, 2.970428705215454, 3.4025278091430664, 3.834627151489258, 4.266726493835449, 4.698825359344482, 5.130924701690674, 5.563023567199707, 5.995122909545898, 6.42722225189209, 6.859321117401123, 7.2914204597473145, 7.723519325256348, 8.155618667602539, 8.58771800994873, 9.019817352294922, 9.451915740966797, 9.884015083312988, 10.31611442565918, 10.748212814331055, 11.180312156677246, 11.612411499023438, 12.044510841369629, 12.47661018371582, 12.908709526062012]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 7.0, 14.0, 11.0, 20.0, 16.0, 20.0, 32.0, 40.0, 32.0, 33.0, 40.0, 40.0, 53.0, 42.0, 41.0, 49.0, 44.0, 43.0, 45.0, 48.0, 44.0, 31.0, 44.0, 36.0, 33.0, 24.0, 20.0, 22.0, 15.0, 10.0, 10.0, 2.0, 11.0, 5.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.325665473937988, -8.093708038330078, -7.861751556396484, -7.629794120788574, -7.397837162017822, -7.16588020324707, -6.933923244476318, -6.701966285705566, -6.470008850097656, -6.238051891326904, -6.006094932556152, -5.774137496948242, -5.54218053817749, -5.310223579406738, -5.078266620635986, -4.846309661865234, -4.614352703094482, -4.3823957443237305, -4.1504387855529785, -3.9184815883636475, -3.6865243911743164, -3.4545674324035645, -3.2226104736328125, -2.9906535148620605, -2.7586963176727295, -2.5267393589019775, -2.2947821617126465, -2.0628252029418945, -1.830868124961853, -1.5989110469818115, -1.3669540882110596, -1.134997010231018, -0.9030404090881348, -0.6710833311080933, -0.43912631273269653, -0.2071692943572998, 0.0247877836227417, 0.2567448616027832, 0.48870182037353516, 0.7206588983535767, 0.9526159763336182, 1.1845730543136597, 1.4165301322937012, 1.6484870910644531, 1.8804441690444946, 2.112401247024536, 2.344358205795288, 2.576315402984619, 2.808272361755371, 3.040229320526123, 3.272186517715454, 3.504143476486206, 3.736100673675537, 3.968057632446289, 4.200014591217041, 4.431971549987793, 4.663928985595703, 4.895885944366455, 5.127842903137207, 5.359800338745117, 5.591757297515869, 5.823714256286621, 6.055671215057373, 6.287628173828125, 6.519585132598877]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 11.0, 12.0, 13.0, 18.0, 37.0, 43.0, 59.0, 93.0, 130.0, 174.0, 249.0, 344.0, 486.0, 705.0, 1079.0, 1791.0, 2829.0, 4620.0, 8195.0, 15523.0, 32489.0, 76388.0, 187318.0, 320497.0, 221687.0, 93304.0, 39150.0, 17888.0, 9287.0, 5173.0, 3155.0, 1936.0, 1266.0, 790.0, 535.0, 369.0, 249.0, 182.0, 131.0, 102.0, 66.0, 48.0, 35.0, 19.0, 22.0, 12.0, 7.0, 12.0, 8.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0], "bins": [-10.890625, -10.556640625, -10.22265625, -9.888671875, -9.5546875, -9.220703125, -8.88671875, -8.552734375, -8.21875, -7.884765625, -7.55078125, -7.216796875, -6.8828125, -6.548828125, -6.21484375, -5.880859375, -5.546875, -5.212890625, -4.87890625, -4.544921875, -4.2109375, -3.876953125, -3.54296875, -3.208984375, -2.875, -2.541015625, -2.20703125, -1.873046875, -1.5390625, -1.205078125, -0.87109375, -0.537109375, -0.203125, 0.130859375, 0.46484375, 0.798828125, 1.1328125, 1.466796875, 1.80078125, 2.134765625, 2.46875, 2.802734375, 3.13671875, 3.470703125, 3.8046875, 4.138671875, 4.47265625, 4.806640625, 5.140625, 5.474609375, 5.80859375, 6.142578125, 6.4765625, 6.810546875, 7.14453125, 7.478515625, 7.8125, 8.146484375, 8.48046875, 8.814453125, 9.1484375, 9.482421875, 9.81640625, 10.150390625, 10.484375]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 2.0, 11.0, 7.0, 11.0, 22.0, 17.0, 34.0, 35.0, 23.0, 37.0, 35.0, 40.0, 42.0, 51.0, 46.0, 46.0, 43.0, 44.0, 58.0, 63.0, 39.0, 40.0, 38.0, 32.0, 27.0, 29.0, 24.0, 22.0, 16.0, 8.0, 10.0, 9.0, 8.0, 10.0, 6.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.7109375, -9.4437255859375, -9.176513671875, -8.9093017578125, -8.64208984375, -8.3748779296875, -8.107666015625, -7.8404541015625, -7.5732421875, -7.3060302734375, -7.038818359375, -6.7716064453125, -6.50439453125, -6.2371826171875, -5.969970703125, -5.7027587890625, -5.435546875, -5.1683349609375, -4.901123046875, -4.6339111328125, -4.36669921875, -4.0994873046875, -3.832275390625, -3.5650634765625, -3.2978515625, -3.0306396484375, -2.763427734375, -2.4962158203125, -2.22900390625, -1.9617919921875, -1.694580078125, -1.4273681640625, -1.16015625, -0.8929443359375, -0.625732421875, -0.3585205078125, -0.09130859375, 0.1759033203125, 0.443115234375, 0.7103271484375, 0.9775390625, 1.2447509765625, 1.511962890625, 1.7791748046875, 2.04638671875, 2.3135986328125, 2.580810546875, 2.8480224609375, 3.115234375, 3.3824462890625, 3.649658203125, 3.9168701171875, 4.18408203125, 4.4512939453125, 4.718505859375, 4.9857177734375, 5.2529296875, 5.5201416015625, 5.787353515625, 6.0545654296875, 6.32177734375, 6.5889892578125, 6.856201171875, 7.1234130859375, 7.390625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 11.0, 16.0, 19.0, 31.0, 43.0, 74.0, 121.0, 168.0, 281.0, 445.0, 835.0, 1505.0, 3123.0, 7440.0, 19859.0, 62991.0, 212211.0, 421067.0, 217995.0, 65301.0, 20568.0, 7557.0, 3258.0, 1525.0, 854.0, 445.0, 284.0, 171.0, 135.0, 58.0, 49.0, 35.0, 20.0, 15.0, 8.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.859375, -13.43310546875, -13.0068359375, -12.58056640625, -12.154296875, -11.72802734375, -11.3017578125, -10.87548828125, -10.44921875, -10.02294921875, -9.5966796875, -9.17041015625, -8.744140625, -8.31787109375, -7.8916015625, -7.46533203125, -7.0390625, -6.61279296875, -6.1865234375, -5.76025390625, -5.333984375, -4.90771484375, -4.4814453125, -4.05517578125, -3.62890625, -3.20263671875, -2.7763671875, -2.35009765625, -1.923828125, -1.49755859375, -1.0712890625, -0.64501953125, -0.21875, 0.20751953125, 0.6337890625, 1.06005859375, 1.486328125, 1.91259765625, 2.3388671875, 2.76513671875, 3.19140625, 3.61767578125, 4.0439453125, 4.47021484375, 4.896484375, 5.32275390625, 5.7490234375, 6.17529296875, 6.6015625, 7.02783203125, 7.4541015625, 7.88037109375, 8.306640625, 8.73291015625, 9.1591796875, 9.58544921875, 10.01171875, 10.43798828125, 10.8642578125, 11.29052734375, 11.716796875, 12.14306640625, 12.5693359375, 12.99560546875, 13.421875]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 7.0, 6.0, 15.0, 10.0, 9.0, 14.0, 14.0, 12.0, 18.0, 10.0, 23.0, 28.0, 31.0, 30.0, 35.0, 31.0, 43.0, 44.0, 35.0, 44.0, 39.0, 49.0, 46.0, 32.0, 31.0, 33.0, 41.0, 29.0, 32.0, 31.0, 24.0, 22.0, 21.0, 18.0, 15.0, 17.0, 13.0, 8.0, 10.0, 7.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.666015625, -3.547119140625, -3.42822265625, -3.309326171875, -3.1904296875, -3.071533203125, -2.95263671875, -2.833740234375, -2.71484375, -2.595947265625, -2.47705078125, -2.358154296875, -2.2392578125, -2.120361328125, -2.00146484375, -1.882568359375, -1.763671875, -1.644775390625, -1.52587890625, -1.406982421875, -1.2880859375, -1.169189453125, -1.05029296875, -0.931396484375, -0.8125, -0.693603515625, -0.57470703125, -0.455810546875, -0.3369140625, -0.218017578125, -0.09912109375, 0.019775390625, 0.138671875, 0.257568359375, 0.37646484375, 0.495361328125, 0.6142578125, 0.733154296875, 0.85205078125, 0.970947265625, 1.08984375, 1.208740234375, 1.32763671875, 1.446533203125, 1.5654296875, 1.684326171875, 1.80322265625, 1.922119140625, 2.041015625, 2.159912109375, 2.27880859375, 2.397705078125, 2.5166015625, 2.635498046875, 2.75439453125, 2.873291015625, 2.9921875, 3.111083984375, 3.22998046875, 3.348876953125, 3.4677734375, 3.586669921875, 3.70556640625, 3.824462890625, 3.943359375]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 6.0, 5.0, 8.0, 16.0, 24.0, 34.0, 44.0, 83.0, 69.0, 119.0, 176.0, 241.0, 377.0, 552.0, 765.0, 1153.0, 1792.0, 2863.0, 4721.0, 8035.0, 14586.0, 27247.0, 54770.0, 112554.0, 209446.0, 254533.0, 173232.0, 87623.0, 42858.0, 21237.0, 11627.0, 6469.0, 3968.0, 2453.0, 1576.0, 1047.0, 691.0, 456.0, 336.0, 217.0, 171.0, 117.0, 74.0, 52.0, 38.0, 30.0, 19.0, 17.0, 10.0, 6.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0], "bins": [-4.08203125, -3.95953369140625, -3.8370361328125, -3.71453857421875, -3.592041015625, -3.46954345703125, -3.3470458984375, -3.22454833984375, -3.10205078125, -2.97955322265625, -2.8570556640625, -2.73455810546875, -2.612060546875, -2.48956298828125, -2.3670654296875, -2.24456787109375, -2.1220703125, -1.99957275390625, -1.8770751953125, -1.75457763671875, -1.632080078125, -1.50958251953125, -1.3870849609375, -1.26458740234375, -1.14208984375, -1.01959228515625, -0.8970947265625, -0.77459716796875, -0.652099609375, -0.52960205078125, -0.4071044921875, -0.28460693359375, -0.162109375, -0.03961181640625, 0.0828857421875, 0.20538330078125, 0.327880859375, 0.45037841796875, 0.5728759765625, 0.69537353515625, 0.81787109375, 0.94036865234375, 1.0628662109375, 1.18536376953125, 1.307861328125, 1.43035888671875, 1.5528564453125, 1.67535400390625, 1.7978515625, 1.92034912109375, 2.0428466796875, 2.16534423828125, 2.287841796875, 2.41033935546875, 2.5328369140625, 2.65533447265625, 2.77783203125, 2.90032958984375, 3.0228271484375, 3.14532470703125, 3.267822265625, 3.39031982421875, 3.5128173828125, 3.63531494140625, 3.7578125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 18.0, 25.0, 60.0, 97.0, 125.0, 151.0, 137.0, 113.0, 92.0, 61.0, 33.0, 18.0, 13.0, 13.0, 6.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006403923034667969, -0.000621497631072998, -0.0006026029586791992, -0.0005837082862854004, -0.0005648136138916016, -0.0005459189414978027, -0.0005270242691040039, -0.0005081295967102051, -0.0004892349243164062, -0.0004703402519226074, -0.0004514455795288086, -0.00043255090713500977, -0.00041365623474121094, -0.0003947615623474121, -0.0003758668899536133, -0.00035697221755981445, -0.0003380775451660156, -0.0003191828727722168, -0.00030028820037841797, -0.00028139352798461914, -0.0002624988555908203, -0.00024360418319702148, -0.00022470951080322266, -0.00020581483840942383, -0.000186920166015625, -0.00016802549362182617, -0.00014913082122802734, -0.00013023614883422852, -0.00011134147644042969, -9.244680404663086e-05, -7.355213165283203e-05, -5.46574592590332e-05, -3.5762786865234375e-05, -1.6868114471435547e-05, 2.0265579223632812e-06, 2.092123031616211e-05, 3.981590270996094e-05, 5.8710575103759766e-05, 7.76052474975586e-05, 9.649991989135742e-05, 0.00011539459228515625, 0.00013428926467895508, 0.0001531839370727539, 0.00017207860946655273, 0.00019097328186035156, 0.0002098679542541504, 0.00022876262664794922, 0.00024765729904174805, 0.0002665519714355469, 0.0002854466438293457, 0.00030434131622314453, 0.00032323598861694336, 0.0003421306610107422, 0.000361025333404541, 0.00037992000579833984, 0.00039881467819213867, 0.0004177093505859375, 0.00043660402297973633, 0.00045549869537353516, 0.000474393367767334, 0.0004932880401611328, 0.0005121827125549316, 0.0005310773849487305, 0.0005499720573425293, 0.0005688667297363281]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 9.0, 10.0, 21.0, 19.0, 22.0, 34.0, 52.0, 60.0, 90.0, 133.0, 202.0, 280.0, 401.0, 590.0, 998.0, 1515.0, 2575.0, 4063.0, 7183.0, 13832.0, 27186.0, 58195.0, 124692.0, 228224.0, 258139.0, 163074.0, 79315.0, 36703.0, 18283.0, 9246.0, 5082.0, 2969.0, 1814.0, 1181.0, 741.0, 534.0, 310.0, 232.0, 162.0, 121.0, 71.0, 60.0, 33.0, 28.0, 25.0, 10.0, 10.0, 10.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.619140625, -3.499298095703125, -3.37945556640625, -3.259613037109375, -3.1397705078125, -3.019927978515625, -2.90008544921875, -2.780242919921875, -2.660400390625, -2.540557861328125, -2.42071533203125, -2.300872802734375, -2.1810302734375, -2.061187744140625, -1.94134521484375, -1.821502685546875, -1.70166015625, -1.581817626953125, -1.46197509765625, -1.342132568359375, -1.2222900390625, -1.102447509765625, -0.98260498046875, -0.862762451171875, -0.742919921875, -0.623077392578125, -0.50323486328125, -0.383392333984375, -0.2635498046875, -0.143707275390625, -0.02386474609375, 0.095977783203125, 0.2158203125, 0.335662841796875, 0.45550537109375, 0.575347900390625, 0.6951904296875, 0.815032958984375, 0.93487548828125, 1.054718017578125, 1.174560546875, 1.294403076171875, 1.41424560546875, 1.534088134765625, 1.6539306640625, 1.773773193359375, 1.89361572265625, 2.013458251953125, 2.13330078125, 2.253143310546875, 2.37298583984375, 2.492828369140625, 2.6126708984375, 2.732513427734375, 2.85235595703125, 2.972198486328125, 3.092041015625, 3.211883544921875, 3.33172607421875, 3.451568603515625, 3.5714111328125, 3.691253662109375, 3.81109619140625, 3.930938720703125, 4.05078125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 10.0, 8.0, 7.0, 11.0, 12.0, 21.0, 21.0, 39.0, 43.0, 55.0, 55.0, 65.0, 58.0, 72.0, 53.0, 46.0, 60.0, 47.0, 47.0, 52.0, 33.0, 32.0, 30.0, 18.0, 11.0, 6.0, 16.0, 6.0, 11.0, 3.0, 5.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.892578125, -0.8660430908203125, -0.839508056640625, -0.8129730224609375, -0.78643798828125, -0.7599029541015625, -0.733367919921875, -0.7068328857421875, -0.6802978515625, -0.6537628173828125, -0.627227783203125, -0.6006927490234375, -0.57415771484375, -0.5476226806640625, -0.521087646484375, -0.4945526123046875, -0.468017578125, -0.4414825439453125, -0.414947509765625, -0.3884124755859375, -0.36187744140625, -0.3353424072265625, -0.308807373046875, -0.2822723388671875, -0.2557373046875, -0.2292022705078125, -0.202667236328125, -0.1761322021484375, -0.14959716796875, -0.1230621337890625, -0.096527099609375, -0.0699920654296875, -0.04345703125, -0.0169219970703125, 0.009613037109375, 0.0361480712890625, 0.06268310546875, 0.0892181396484375, 0.115753173828125, 0.1422882080078125, 0.1688232421875, 0.1953582763671875, 0.221893310546875, 0.2484283447265625, 0.27496337890625, 0.3014984130859375, 0.328033447265625, 0.3545684814453125, 0.381103515625, 0.4076385498046875, 0.434173583984375, 0.4607086181640625, 0.48724365234375, 0.5137786865234375, 0.540313720703125, 0.5668487548828125, 0.5933837890625, 0.6199188232421875, 0.646453857421875, 0.6729888916015625, 0.69952392578125, 0.7260589599609375, 0.752593994140625, 0.7791290283203125, 0.8056640625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 1.0, 8.0, 5.0, 2.0, 4.0, 10.0, 23.0, 33.0, 23.0, 30.0, 56.0, 73.0, 104.0, 104.0, 122.0, 103.0, 68.0, 60.0, 41.0, 39.0, 30.0, 19.0, 10.0, 11.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0596923828125, -14.606082916259766, -14.152473449707031, -13.698863983154297, -13.245255470275879, -12.791646003723145, -12.33803653717041, -11.884427070617676, -11.430818557739258, -10.977209091186523, -10.523599624633789, -10.069990158081055, -9.616381645202637, -9.162772178649902, -8.709162712097168, -8.255553245544434, -7.801943778991699, -7.348334312438965, -6.894725322723389, -6.441115856170654, -5.987506866455078, -5.533897399902344, -5.080287933349609, -4.626678466796875, -4.173069477081299, -3.7194602489471436, -3.2658510208129883, -2.812241554260254, -2.3586323261260986, -1.9050230979919434, -1.451413631439209, -0.9978044033050537, -0.5441951751708984, -0.09058588743209839, 0.36302340030670166, 0.8166327476501465, 1.2702419757843018, 1.723851203918457, 2.1774606704711914, 2.6310698986053467, 3.084679126739502, 3.5382883548736572, 3.9918975830078125, 4.445507049560547, 4.899116516113281, 5.352725505828857, 5.806334972381592, 6.259943962097168, 6.713553428649902, 7.167162895202637, 7.620771884918213, 8.074380874633789, 8.527990341186523, 8.981599807739258, 9.435209274291992, 9.888818740844727, 10.342428207397461, 10.796037673950195, 11.24964714050293, 11.703256607055664, 12.156865119934082, 12.610474586486816, 13.06408405303955, 13.517693519592285, 13.971302032470703]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 6.0, 4.0, 9.0, 11.0, 9.0, 16.0, 16.0, 22.0, 24.0, 31.0, 25.0, 30.0, 34.0, 34.0, 43.0, 39.0, 53.0, 40.0, 48.0, 41.0, 36.0, 35.0, 33.0, 43.0, 40.0, 29.0, 36.0, 35.0, 31.0, 23.0, 25.0, 18.0, 16.0, 13.0, 15.0, 7.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-7.766757488250732, -7.558078289031982, -7.349399089813232, -7.140720367431641, -6.932041168212891, -6.723361968994141, -6.514682769775391, -6.306003570556641, -6.097324848175049, -5.888645648956299, -5.679966449737549, -5.471287727355957, -5.262608528137207, -5.053929328918457, -4.845250129699707, -4.636570930480957, -4.427891731262207, -4.219212532043457, -4.010533332824707, -3.801854372024536, -3.5931754112243652, -3.3844962120056152, -3.1758170127868652, -2.9671380519866943, -2.7584590911865234, -2.5497798919677734, -2.3411009311676025, -2.1324217319488525, -1.9237427711486816, -1.7150635719299316, -1.5063844919204712, -1.2977054119110107, -1.0890264511108398, -0.8803473711013794, -0.671668291091919, -0.4629891514778137, -0.25431007146835327, -0.04563093185424805, 0.1630481481552124, 0.37172722816467285, 0.5804063081741333, 0.7890853881835938, 0.9977644681930542, 1.2064435482025146, 1.4151227474212646, 1.623801827430725, 1.8324809074401855, 2.0411601066589355, 2.2498390674591064, 2.4585182666778564, 2.6671972274780273, 2.8758764266967773, 3.0845553874969482, 3.2932345867156982, 3.501913547515869, 3.710592746734619, 3.919271945953369, 4.127951145172119, 4.336630344390869, 4.545309066772461, 4.753988265991211, 4.962667465209961, 5.171346664428711, 5.380025863647461, 5.588704586029053]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 6.0, 6.0, 13.0, 6.0, 20.0, 23.0, 36.0, 46.0, 65.0, 96.0, 123.0, 179.0, 227.0, 365.0, 515.0, 765.0, 1156.0, 1690.0, 2719.0, 4479.0, 7405.0, 14669.0, 31737.0, 87031.0, 326137.0, 1389123.0, 1697974.0, 443591.0, 109376.0, 36987.0, 16171.0, 8260.0, 4679.0, 2924.0, 1826.0, 1224.0, 809.0, 542.0, 384.0, 248.0, 177.0, 135.0, 79.0, 72.0, 63.0, 34.0, 22.0, 18.0, 16.0, 9.0, 12.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.5625, -13.096435546875, -12.63037109375, -12.164306640625, -11.6982421875, -11.232177734375, -10.76611328125, -10.300048828125, -9.833984375, -9.367919921875, -8.90185546875, -8.435791015625, -7.9697265625, -7.503662109375, -7.03759765625, -6.571533203125, -6.10546875, -5.639404296875, -5.17333984375, -4.707275390625, -4.2412109375, -3.775146484375, -3.30908203125, -2.843017578125, -2.376953125, -1.910888671875, -1.44482421875, -0.978759765625, -0.5126953125, -0.046630859375, 0.41943359375, 0.885498046875, 1.3515625, 1.817626953125, 2.28369140625, 2.749755859375, 3.2158203125, 3.681884765625, 4.14794921875, 4.614013671875, 5.080078125, 5.546142578125, 6.01220703125, 6.478271484375, 6.9443359375, 7.410400390625, 7.87646484375, 8.342529296875, 8.80859375, 9.274658203125, 9.74072265625, 10.206787109375, 10.6728515625, 11.138916015625, 11.60498046875, 12.071044921875, 12.537109375, 13.003173828125, 13.46923828125, 13.935302734375, 14.4013671875, 14.867431640625, 15.33349609375, 15.799560546875, 16.265625]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 7.0, 6.0, 8.0, 11.0, 13.0, 20.0, 24.0, 23.0, 22.0, 36.0, 27.0, 28.0, 42.0, 38.0, 36.0, 46.0, 45.0, 46.0, 54.0, 42.0, 39.0, 46.0, 41.0, 42.0, 35.0, 32.0, 26.0, 24.0, 26.0, 17.0, 28.0, 15.0, 15.0, 6.0, 6.0, 9.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.12109375, -5.95159912109375, -5.7821044921875, -5.61260986328125, -5.443115234375, -5.27362060546875, -5.1041259765625, -4.93463134765625, -4.76513671875, -4.59564208984375, -4.4261474609375, -4.25665283203125, -4.087158203125, -3.91766357421875, -3.7481689453125, -3.57867431640625, -3.4091796875, -3.23968505859375, -3.0701904296875, -2.90069580078125, -2.731201171875, -2.56170654296875, -2.3922119140625, -2.22271728515625, -2.05322265625, -1.88372802734375, -1.7142333984375, -1.54473876953125, -1.375244140625, -1.20574951171875, -1.0362548828125, -0.86676025390625, -0.697265625, -0.52777099609375, -0.3582763671875, -0.18878173828125, -0.019287109375, 0.15020751953125, 0.3197021484375, 0.48919677734375, 0.65869140625, 0.82818603515625, 0.9976806640625, 1.16717529296875, 1.336669921875, 1.50616455078125, 1.6756591796875, 1.84515380859375, 2.0146484375, 2.18414306640625, 2.3536376953125, 2.52313232421875, 2.692626953125, 2.86212158203125, 3.0316162109375, 3.20111083984375, 3.37060546875, 3.54010009765625, 3.7095947265625, 3.87908935546875, 4.048583984375, 4.21807861328125, 4.3875732421875, 4.55706787109375, 4.7265625]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 5.0, 8.0, 11.0, 22.0, 16.0, 51.0, 58.0, 118.0, 159.0, 262.0, 473.0, 765.0, 1324.0, 2533.0, 4874.0, 10472.0, 23648.0, 63134.0, 219345.0, 1197450.0, 2089978.0, 415911.0, 100583.0, 34599.0, 14408.0, 6675.0, 3294.0, 1684.0, 949.0, 602.0, 299.0, 191.0, 142.0, 82.0, 60.0, 31.0, 28.0, 11.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-21.9375, -21.296142578125, -20.65478515625, -20.013427734375, -19.3720703125, -18.730712890625, -18.08935546875, -17.447998046875, -16.806640625, -16.165283203125, -15.52392578125, -14.882568359375, -14.2412109375, -13.599853515625, -12.95849609375, -12.317138671875, -11.67578125, -11.034423828125, -10.39306640625, -9.751708984375, -9.1103515625, -8.468994140625, -7.82763671875, -7.186279296875, -6.544921875, -5.903564453125, -5.26220703125, -4.620849609375, -3.9794921875, -3.338134765625, -2.69677734375, -2.055419921875, -1.4140625, -0.772705078125, -0.13134765625, 0.510009765625, 1.1513671875, 1.792724609375, 2.43408203125, 3.075439453125, 3.716796875, 4.358154296875, 4.99951171875, 5.640869140625, 6.2822265625, 6.923583984375, 7.56494140625, 8.206298828125, 8.84765625, 9.489013671875, 10.13037109375, 10.771728515625, 11.4130859375, 12.054443359375, 12.69580078125, 13.337158203125, 13.978515625, 14.619873046875, 15.26123046875, 15.902587890625, 16.5439453125, 17.185302734375, 17.82666015625, 18.468017578125, 19.109375]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 0.0, 2.0, 6.0, 11.0, 9.0, 10.0, 11.0, 16.0, 18.0, 32.0, 42.0, 52.0, 70.0, 88.0, 125.0, 183.0, 232.0, 354.0, 437.0, 418.0, 437.0, 376.0, 283.0, 225.0, 161.0, 118.0, 80.0, 65.0, 51.0, 40.0, 19.0, 38.0, 21.0, 17.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.583984375, -3.464019775390625, -3.34405517578125, -3.224090576171875, -3.1041259765625, -2.984161376953125, -2.86419677734375, -2.744232177734375, -2.624267578125, -2.504302978515625, -2.38433837890625, -2.264373779296875, -2.1444091796875, -2.024444580078125, -1.90447998046875, -1.784515380859375, -1.66455078125, -1.544586181640625, -1.42462158203125, -1.304656982421875, -1.1846923828125, -1.064727783203125, -0.94476318359375, -0.824798583984375, -0.704833984375, -0.584869384765625, -0.46490478515625, -0.344940185546875, -0.2249755859375, -0.105010986328125, 0.01495361328125, 0.134918212890625, 0.2548828125, 0.374847412109375, 0.49481201171875, 0.614776611328125, 0.7347412109375, 0.854705810546875, 0.97467041015625, 1.094635009765625, 1.214599609375, 1.334564208984375, 1.45452880859375, 1.574493408203125, 1.6944580078125, 1.814422607421875, 1.93438720703125, 2.054351806640625, 2.17431640625, 2.294281005859375, 2.41424560546875, 2.534210205078125, 2.6541748046875, 2.774139404296875, 2.89410400390625, 3.014068603515625, 3.134033203125, 3.253997802734375, 3.37396240234375, 3.493927001953125, 3.6138916015625, 3.733856201171875, 3.85382080078125, 3.973785400390625, 4.09375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 6.0, 11.0, 19.0, 32.0, 26.0, 45.0, 70.0, 93.0, 120.0, 121.0, 111.0, 90.0, 64.0, 54.0, 35.0, 24.0, 16.0, 14.0, 7.0, 8.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.796002388000488, -13.276734352111816, -12.757466316223145, -12.238198280334473, -11.7189302444458, -11.199662208557129, -10.68039321899414, -10.161125183105469, -9.641857147216797, -9.122589111328125, -8.603321075439453, -8.084053039550781, -7.564785003662109, -7.0455169677734375, -6.526248455047607, -6.0069804191589355, -5.487712860107422, -4.96844482421875, -4.449176788330078, -3.929908514022827, -3.4106404781341553, -2.8913724422454834, -2.3721041679382324, -1.8528361320495605, -1.3335680961608887, -0.814300000667572, -0.29503190517425537, 0.22423624992370605, 0.7435042858123779, 1.2627723217010498, 1.7820405960083008, 2.3013086318969727, 2.820577621459961, 3.339845657348633, 3.8591136932373047, 4.378381729125977, 4.897649765014648, 5.41691780090332, 5.93618631362915, 6.455454349517822, 6.974722385406494, 7.493990421295166, 8.013258934020996, 8.532526969909668, 9.05179500579834, 9.571063041687012, 10.090331077575684, 10.609599113464355, 11.128867149353027, 11.6481351852417, 12.167403221130371, 12.686671257019043, 13.205939292907715, 13.725207328796387, 14.244476318359375, 14.763744354248047, 15.283012390136719, 15.80228042602539, 16.321548461914062, 16.840816497802734, 17.360084533691406, 17.879352569580078, 18.39862060546875, 18.917888641357422, 19.437156677246094]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 11.0, 10.0, 19.0, 22.0, 12.0, 13.0, 21.0, 36.0, 30.0, 32.0, 28.0, 47.0, 28.0, 48.0, 31.0, 50.0, 48.0, 53.0, 37.0, 47.0, 43.0, 41.0, 24.0, 36.0, 29.0, 38.0, 28.0, 22.0, 17.0, 13.0, 15.0, 13.0, 12.0, 9.0, 2.0, 3.0, 5.0, 6.0, 1.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-7.760763645172119, -7.5436296463012695, -7.32649564743042, -7.10936164855957, -6.892228126525879, -6.675093650817871, -6.45796012878418, -6.24082612991333, -6.0236921310424805, -5.806558132171631, -5.589424133300781, -5.372290134429932, -5.155156135559082, -4.938022613525391, -4.720888614654541, -4.503754615783691, -4.286620616912842, -4.069486618041992, -3.8523526191711426, -3.635218858718872, -3.4180848598480225, -3.200950860977173, -2.9838171005249023, -2.7666831016540527, -2.549549102783203, -2.3324151039123535, -2.115281105041504, -1.8981473445892334, -1.6810133457183838, -1.4638793468475342, -1.2467454671859741, -1.029611587524414, -0.8124771118164062, -0.5953431725502014, -0.3782092332839966, -0.16107529401779175, 0.056058645248413086, 0.2731926441192627, 0.49032652378082275, 0.7074604034423828, 0.9245944023132324, 1.141728401184082, 1.358862280845642, 1.5759961605072021, 1.7931301593780518, 2.0102641582489014, 2.227397918701172, 2.4445319175720215, 2.661665916442871, 2.8787999153137207, 3.0959339141845703, 3.313067674636841, 3.5302016735076904, 3.74733567237854, 3.9644694328308105, 4.18160343170166, 4.39873743057251, 4.615871429443359, 4.833005428314209, 5.050139427185059, 5.26727294921875, 5.484407424926758, 5.701540946960449, 5.918674945831299, 6.135808944702148]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 7.0, 7.0, 7.0, 15.0, 10.0, 38.0, 48.0, 60.0, 100.0, 118.0, 202.0, 289.0, 440.0, 603.0, 1138.0, 1773.0, 2917.0, 4869.0, 8993.0, 16840.0, 34116.0, 73883.0, 174594.0, 330399.0, 217618.0, 92867.0, 41410.0, 20082.0, 10508.0, 5796.0, 3289.0, 2059.0, 1240.0, 725.0, 470.0, 311.0, 235.0, 149.0, 103.0, 70.0, 46.0, 29.0, 16.0, 15.0, 16.0, 6.0, 8.0, 8.0, 1.0, 3.0, 5.0, 2.0, 3.0], "bins": [-1.0859375, -1.0545806884765625, -1.023223876953125, -0.9918670654296875, -0.96051025390625, -0.9291534423828125, -0.897796630859375, -0.8664398193359375, -0.8350830078125, -0.8037261962890625, -0.772369384765625, -0.7410125732421875, -0.70965576171875, -0.6782989501953125, -0.646942138671875, -0.6155853271484375, -0.584228515625, -0.5528717041015625, -0.521514892578125, -0.4901580810546875, -0.45880126953125, -0.4274444580078125, -0.396087646484375, -0.3647308349609375, -0.3333740234375, -0.3020172119140625, -0.270660400390625, -0.2393035888671875, -0.20794677734375, -0.1765899658203125, -0.145233154296875, -0.1138763427734375, -0.08251953125, -0.0511627197265625, -0.019805908203125, 0.0115509033203125, 0.04290771484375, 0.0742645263671875, 0.105621337890625, 0.1369781494140625, 0.1683349609375, 0.1996917724609375, 0.231048583984375, 0.2624053955078125, 0.29376220703125, 0.3251190185546875, 0.356475830078125, 0.3878326416015625, 0.419189453125, 0.4505462646484375, 0.481903076171875, 0.5132598876953125, 0.54461669921875, 0.5759735107421875, 0.607330322265625, 0.6386871337890625, 0.6700439453125, 0.7014007568359375, 0.732757568359375, 0.7641143798828125, 0.79547119140625, 0.8268280029296875, 0.858184814453125, 0.8895416259765625, 0.9208984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 6.0, 13.0, 17.0, 15.0, 14.0, 18.0, 19.0, 18.0, 27.0, 24.0, 22.0, 45.0, 29.0, 62.0, 40.0, 44.0, 52.0, 50.0, 58.0, 47.0, 37.0, 38.0, 44.0, 27.0, 34.0, 31.0, 31.0, 25.0, 16.0, 15.0, 17.0, 15.0, 12.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.5390625, -8.29241943359375, -8.0457763671875, -7.79913330078125, -7.552490234375, -7.30584716796875, -7.0592041015625, -6.81256103515625, -6.56591796875, -6.31927490234375, -6.0726318359375, -5.82598876953125, -5.579345703125, -5.33270263671875, -5.0860595703125, -4.83941650390625, -4.5927734375, -4.34613037109375, -4.0994873046875, -3.85284423828125, -3.606201171875, -3.35955810546875, -3.1129150390625, -2.86627197265625, -2.61962890625, -2.37298583984375, -2.1263427734375, -1.87969970703125, -1.633056640625, -1.38641357421875, -1.1397705078125, -0.89312744140625, -0.646484375, -0.39984130859375, -0.1531982421875, 0.09344482421875, 0.340087890625, 0.58673095703125, 0.8333740234375, 1.08001708984375, 1.32666015625, 1.57330322265625, 1.8199462890625, 2.06658935546875, 2.313232421875, 2.55987548828125, 2.8065185546875, 3.05316162109375, 3.2998046875, 3.54644775390625, 3.7930908203125, 4.03973388671875, 4.286376953125, 4.53302001953125, 4.7796630859375, 5.02630615234375, 5.27294921875, 5.51959228515625, 5.7662353515625, 6.01287841796875, 6.259521484375, 6.50616455078125, 6.7528076171875, 6.99945068359375, 7.24609375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 10.0, 9.0, 10.0, 31.0, 21.0, 34.0, 46.0, 65.0, 79.0, 117.0, 132.0, 188.0, 291.0, 468.0, 716.0, 1079.0, 1749.0, 3067.0, 5759.0, 12481.0, 33318.0, 702333.0, 238465.0, 25217.0, 10602.0, 4992.0, 2744.0, 1510.0, 945.0, 646.0, 401.0, 286.0, 182.0, 149.0, 110.0, 66.0, 52.0, 42.0, 41.0, 19.0, 11.0, 14.0, 7.0, 9.0, 9.0, 4.0, 3.0, 5.0, 1.0, 2.0, 4.0, 4.0], "bins": [-2.470703125, -2.397796630859375, -2.32489013671875, -2.251983642578125, -2.1790771484375, -2.106170654296875, -2.03326416015625, -1.960357666015625, -1.887451171875, -1.814544677734375, -1.74163818359375, -1.668731689453125, -1.5958251953125, -1.522918701171875, -1.45001220703125, -1.377105712890625, -1.30419921875, -1.231292724609375, -1.15838623046875, -1.085479736328125, -1.0125732421875, -0.939666748046875, -0.86676025390625, -0.793853759765625, -0.720947265625, -0.648040771484375, -0.57513427734375, -0.502227783203125, -0.4293212890625, -0.356414794921875, -0.28350830078125, -0.210601806640625, -0.1376953125, -0.064788818359375, 0.00811767578125, 0.081024169921875, 0.1539306640625, 0.226837158203125, 0.29974365234375, 0.372650146484375, 0.445556640625, 0.518463134765625, 0.59136962890625, 0.664276123046875, 0.7371826171875, 0.810089111328125, 0.88299560546875, 0.955902099609375, 1.02880859375, 1.101715087890625, 1.17462158203125, 1.247528076171875, 1.3204345703125, 1.393341064453125, 1.46624755859375, 1.539154052734375, 1.612060546875, 1.684967041015625, 1.75787353515625, 1.830780029296875, 1.9036865234375, 1.976593017578125, 2.04949951171875, 2.122406005859375, 2.1953125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 7.0, 8.0, 9.0, 5.0, 15.0, 13.0, 12.0, 17.0, 20.0, 19.0, 24.0, 40.0, 16.0, 34.0, 29.0, 33.0, 49.0, 41.0, 36.0, 46.0, 39.0, 48.0, 44.0, 44.0, 33.0, 38.0, 44.0, 29.0, 27.0, 25.0, 36.0, 13.0, 20.0, 21.0, 15.0, 9.0, 7.0, 7.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -4.14813232421875, -4.0111083984375, -3.87408447265625, -3.737060546875, -3.60003662109375, -3.4630126953125, -3.32598876953125, -3.18896484375, -3.05194091796875, -2.9149169921875, -2.77789306640625, -2.640869140625, -2.50384521484375, -2.3668212890625, -2.22979736328125, -2.0927734375, -1.95574951171875, -1.8187255859375, -1.68170166015625, -1.544677734375, -1.40765380859375, -1.2706298828125, -1.13360595703125, -0.99658203125, -0.85955810546875, -0.7225341796875, -0.58551025390625, -0.448486328125, -0.31146240234375, -0.1744384765625, -0.03741455078125, 0.099609375, 0.23663330078125, 0.3736572265625, 0.51068115234375, 0.647705078125, 0.78472900390625, 0.9217529296875, 1.05877685546875, 1.19580078125, 1.33282470703125, 1.4698486328125, 1.60687255859375, 1.743896484375, 1.88092041015625, 2.0179443359375, 2.15496826171875, 2.2919921875, 2.42901611328125, 2.5660400390625, 2.70306396484375, 2.840087890625, 2.97711181640625, 3.1141357421875, 3.25115966796875, 3.38818359375, 3.52520751953125, 3.6622314453125, 3.79925537109375, 3.936279296875, 4.07330322265625, 4.2103271484375, 4.34735107421875, 4.484375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 8.0, 8.0, 6.0, 7.0, 10.0, 16.0, 21.0, 28.0, 34.0, 57.0, 95.0, 129.0, 202.0, 263.0, 422.0, 730.0, 1124.0, 2059.0, 4082.0, 8443.0, 20241.0, 94523.0, 863017.0, 29720.0, 11428.0, 5229.0, 2698.0, 1524.0, 822.0, 538.0, 351.0, 174.0, 139.0, 110.0, 85.0, 54.0, 33.0, 25.0, 20.0, 10.0, 17.0, 8.0, 9.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.53271484375, -0.5156326293945312, -0.4985504150390625, -0.48146820068359375, -0.464385986328125, -0.44730377197265625, -0.4302215576171875, -0.41313934326171875, -0.39605712890625, -0.37897491455078125, -0.3618927001953125, -0.34481048583984375, -0.327728271484375, -0.31064605712890625, -0.2935638427734375, -0.27648162841796875, -0.2593994140625, -0.24231719970703125, -0.2252349853515625, -0.20815277099609375, -0.191070556640625, -0.17398834228515625, -0.1569061279296875, -0.13982391357421875, -0.12274169921875, -0.10565948486328125, -0.0885772705078125, -0.07149505615234375, -0.054412841796875, -0.03733062744140625, -0.0202484130859375, -0.00316619873046875, 0.013916015625, 0.03099822998046875, 0.0480804443359375, 0.06516265869140625, 0.082244873046875, 0.09932708740234375, 0.1164093017578125, 0.13349151611328125, 0.15057373046875, 0.16765594482421875, 0.1847381591796875, 0.20182037353515625, 0.218902587890625, 0.23598480224609375, 0.2530670166015625, 0.27014923095703125, 0.2872314453125, 0.30431365966796875, 0.3213958740234375, 0.33847808837890625, 0.355560302734375, 0.37264251708984375, 0.3897247314453125, 0.40680694580078125, 0.42388916015625, 0.44097137451171875, 0.4580535888671875, 0.47513580322265625, 0.492218017578125, 0.5093002319335938, 0.5263824462890625, 0.5434646606445312, 0.560546875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 12.0, 13.0, 15.0, 16.0, 21.0, 24.0, 20.0, 22.0, 28.0, 24.0, 29.0, 31.0, 40.0, 46.0, 39.0, 31.0, 44.0, 45.0, 56.0, 43.0, 39.0, 48.0, 46.0, 33.0, 36.0, 34.0, 22.0, 25.0, 8.0, 13.0, 11.0, 11.0, 9.0, 12.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1828880310058594e-05, -3.07401642203331e-05, -2.9651448130607605e-05, -2.856273204088211e-05, -2.7474015951156616e-05, -2.6385299861431122e-05, -2.5296583771705627e-05, -2.4207867681980133e-05, -2.311915159225464e-05, -2.2030435502529144e-05, -2.094171941280365e-05, -1.9853003323078156e-05, -1.876428723335266e-05, -1.7675571143627167e-05, -1.6586855053901672e-05, -1.5498138964176178e-05, -1.4409422874450684e-05, -1.332070678472519e-05, -1.2231990694999695e-05, -1.11432746052742e-05, -1.0054558515548706e-05, -8.965842425823212e-06, -7.877126336097717e-06, -6.788410246372223e-06, -5.6996941566467285e-06, -4.610978066921234e-06, -3.5222619771957397e-06, -2.4335458874702454e-06, -1.344829797744751e-06, -2.561137080192566e-07, 8.326023817062378e-07, 1.921318471431732e-06, 3.0100345611572266e-06, 4.098750650882721e-06, 5.187466740608215e-06, 6.27618283033371e-06, 7.364898920059204e-06, 8.453615009784698e-06, 9.542331099510193e-06, 1.0631047189235687e-05, 1.1719763278961182e-05, 1.2808479368686676e-05, 1.389719545841217e-05, 1.4985911548137665e-05, 1.607462763786316e-05, 1.7163343727588654e-05, 1.8252059817314148e-05, 1.9340775907039642e-05, 2.0429491996765137e-05, 2.151820808649063e-05, 2.2606924176216125e-05, 2.369564026594162e-05, 2.4784356355667114e-05, 2.587307244539261e-05, 2.6961788535118103e-05, 2.8050504624843597e-05, 2.9139220714569092e-05, 3.0227936804294586e-05, 3.131665289402008e-05, 3.2405368983745575e-05, 3.349408507347107e-05, 3.4582801163196564e-05, 3.567151725292206e-05, 3.676023334264755e-05, 3.784894943237305e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 4.0, 9.0, 6.0, 15.0, 11.0, 18.0, 26.0, 47.0, 78.0, 111.0, 174.0, 294.0, 419.0, 683.0, 1305.0, 2192.0, 4186.0, 8186.0, 16742.0, 36558.0, 86146.0, 213394.0, 347007.0, 189980.0, 76686.0, 32767.0, 15036.0, 7617.0, 3815.0, 2060.0, 1208.0, 675.0, 384.0, 238.0, 177.0, 105.0, 55.0, 51.0, 31.0, 18.0, 16.0, 13.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2099609375, -0.2030620574951172, -0.19616317749023438, -0.18926429748535156, -0.18236541748046875, -0.17546653747558594, -0.16856765747070312, -0.1616687774658203, -0.1547698974609375, -0.1478710174560547, -0.14097213745117188, -0.13407325744628906, -0.12717437744140625, -0.12027549743652344, -0.11337661743164062, -0.10647773742675781, -0.099578857421875, -0.09267997741699219, -0.08578109741210938, -0.07888221740722656, -0.07198333740234375, -0.06508445739746094, -0.058185577392578125, -0.05128669738769531, -0.0443878173828125, -0.03748893737792969, -0.030590057373046875, -0.023691177368164062, -0.01679229736328125, -0.009893417358398438, -0.002994537353515625, 0.0039043426513671875, 0.01080322265625, 0.017702102661132812, 0.024600982666015625, 0.03149986267089844, 0.03839874267578125, 0.04529762268066406, 0.052196502685546875, 0.05909538269042969, 0.0659942626953125, 0.07289314270019531, 0.07979202270507812, 0.08669090270996094, 0.09358978271484375, 0.10048866271972656, 0.10738754272460938, 0.11428642272949219, 0.121185302734375, 0.1280841827392578, 0.13498306274414062, 0.14188194274902344, 0.14878082275390625, 0.15567970275878906, 0.16257858276367188, 0.1694774627685547, 0.1763763427734375, 0.1832752227783203, 0.19017410278320312, 0.19707298278808594, 0.20397186279296875, 0.21087074279785156, 0.21776962280273438, 0.2246685028076172, 0.2315673828125]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 10.0, 10.0, 9.0, 14.0, 11.0, 22.0, 23.0, 36.0, 32.0, 35.0, 61.0, 67.0, 63.0, 84.0, 76.0, 57.0, 60.0, 53.0, 44.0, 45.0, 21.0, 29.0, 24.0, 26.0, 14.0, 9.0, 18.0, 13.0, 4.0, 4.0, 4.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03948974609375, -0.03798055648803711, -0.03647136688232422, -0.03496217727661133, -0.03345298767089844, -0.03194379806518555, -0.030434608459472656, -0.028925418853759766, -0.027416229248046875, -0.025907039642333984, -0.024397850036621094, -0.022888660430908203, -0.021379470825195312, -0.019870281219482422, -0.01836109161376953, -0.01685190200805664, -0.01534271240234375, -0.01383352279663086, -0.012324333190917969, -0.010815143585205078, -0.009305953979492188, -0.007796764373779297, -0.006287574768066406, -0.004778385162353516, -0.003269195556640625, -0.0017600059509277344, -0.00025081634521484375, 0.0012583732604980469, 0.0027675628662109375, 0.004276752471923828, 0.005785942077636719, 0.007295131683349609, 0.0088043212890625, 0.01031351089477539, 0.011822700500488281, 0.013331890106201172, 0.014841079711914062, 0.016350269317626953, 0.017859458923339844, 0.019368648529052734, 0.020877838134765625, 0.022387027740478516, 0.023896217346191406, 0.025405406951904297, 0.026914596557617188, 0.028423786163330078, 0.02993297576904297, 0.03144216537475586, 0.03295135498046875, 0.03446054458618164, 0.03596973419189453, 0.03747892379760742, 0.03898811340332031, 0.0404973030090332, 0.042006492614746094, 0.043515682220458984, 0.045024871826171875, 0.046534061431884766, 0.048043251037597656, 0.04955244064331055, 0.05106163024902344, 0.05257081985473633, 0.05408000946044922, 0.05558919906616211, 0.057098388671875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 7.0, 5.0, 10.0, 17.0, 32.0, 25.0, 36.0, 71.0, 87.0, 120.0, 118.0, 113.0, 101.0, 66.0, 57.0, 36.0, 28.0, 15.0, 15.0, 7.0, 8.0, 5.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.036131858825684, -13.51191520690918, -12.987699508666992, -12.463482856750488, -11.9392671585083, -11.415050506591797, -10.89083480834961, -10.366618156433105, -9.842401504516602, -9.318184852600098, -8.79396915435791, -8.269752502441406, -7.745536804199219, -7.221320152282715, -6.697103977203369, -6.172887802124023, -5.648672103881836, -5.12445592880249, -4.6002397537231445, -4.076023101806641, -3.551807165145874, -3.0275909900665283, -2.5033745765686035, -1.9791584014892578, -1.454942226409912, -0.9307259917259216, -0.40650975704193115, 0.1177065372467041, 0.6419227123260498, 1.1661388874053955, 1.6903553009033203, 2.214571475982666, 2.738788604736328, 3.263004779815674, 3.7872209548950195, 4.311437606811523, 4.835653305053711, 5.359869956970215, 5.8840861320495605, 6.408302307128906, 6.932518482208252, 7.456734657287598, 7.980950832366943, 8.505167007446289, 9.029383659362793, 9.55359935760498, 10.077816009521484, 10.602031707763672, 11.126248359680176, 11.65046501159668, 12.174680709838867, 12.698897361755371, 13.223113059997559, 13.747329711914062, 14.27154541015625, 14.795762062072754, 15.319978713989258, 15.844195365905762, 16.368412017822266, 16.892627716064453, 17.41684341430664, 17.941059112548828, 18.46527671813965, 18.989492416381836, 19.513708114624023]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 14.0, 16.0, 22.0, 13.0, 11.0, 21.0, 33.0, 32.0, 28.0, 34.0, 45.0, 30.0, 45.0, 31.0, 49.0, 49.0, 55.0, 38.0, 48.0, 40.0, 38.0, 29.0, 37.0, 26.0, 40.0, 26.0, 25.0, 17.0, 13.0, 15.0, 12.0, 13.0, 10.0, 2.0, 3.0, 5.0, 7.0, 0.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-7.7791266441345215, -7.562592029571533, -7.346057415008545, -7.129523277282715, -6.912988662719727, -6.696454048156738, -6.47991943359375, -6.263384819030762, -6.046850204467773, -5.830315589904785, -5.613780975341797, -5.397246360778809, -5.1807122230529785, -4.96417760848999, -4.747642993927002, -4.531108379364014, -4.314574241638184, -4.098039627075195, -3.881505250930786, -3.664970636367798, -3.4484360218048096, -3.2319016456604004, -3.015367031097412, -2.798832416534424, -2.5822978019714355, -2.3657631874084473, -2.149228811264038, -1.9326941967010498, -1.7161595821380615, -1.4996250867843628, -1.283090591430664, -1.0665559768676758, -0.8500213623046875, -0.633486807346344, -0.4169522821903229, -0.20041775703430176, 0.016116797924041748, 0.23265135288238525, 0.449185848236084, 0.6657204627990723, 0.882254958152771, 1.0987894535064697, 1.315324068069458, 1.5318585634231567, 1.7483930587768555, 1.9649276733398438, 2.181462287902832, 2.3979969024658203, 2.6145312786102295, 2.8310658931732178, 3.047600269317627, 3.2641348838806152, 3.4806694984436035, 3.697204113006592, 3.913738489151001, 4.13027286529541, 4.346807479858398, 4.563342094421387, 4.779876708984375, 4.996411323547363, 5.212945461273193, 5.429480075836182, 5.64601469039917, 5.862549304962158, 6.0790839195251465]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 8.0, 24.0, 14.0, 38.0, 54.0, 102.0, 129.0, 249.0, 359.0, 575.0, 977.0, 1677.0, 2816.0, 4968.0, 8993.0, 17244.0, 34900.0, 74908.0, 164358.0, 275460.0, 234078.0, 118225.0, 53572.0, 25291.0, 13079.0, 7020.0, 3892.0, 2236.0, 1230.0, 788.0, 469.0, 296.0, 200.0, 118.0, 78.0, 43.0, 31.0, 18.0, 9.0, 11.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.7027587890625, -8.428955078125, -8.1551513671875, -7.88134765625, -7.6075439453125, -7.333740234375, -7.0599365234375, -6.7861328125, -6.5123291015625, -6.238525390625, -5.9647216796875, -5.69091796875, -5.4171142578125, -5.143310546875, -4.8695068359375, -4.595703125, -4.3218994140625, -4.048095703125, -3.7742919921875, -3.50048828125, -3.2266845703125, -2.952880859375, -2.6790771484375, -2.4052734375, -2.1314697265625, -1.857666015625, -1.5838623046875, -1.31005859375, -1.0362548828125, -0.762451171875, -0.4886474609375, -0.21484375, 0.0589599609375, 0.332763671875, 0.6065673828125, 0.88037109375, 1.1541748046875, 1.427978515625, 1.7017822265625, 1.9755859375, 2.2493896484375, 2.523193359375, 2.7969970703125, 3.07080078125, 3.3446044921875, 3.618408203125, 3.8922119140625, 4.166015625, 4.4398193359375, 4.713623046875, 4.9874267578125, 5.26123046875, 5.5350341796875, 5.808837890625, 6.0826416015625, 6.3564453125, 6.6302490234375, 6.904052734375, 7.1778564453125, 7.45166015625, 7.7254638671875, 7.999267578125, 8.2730712890625, 8.546875]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 9.0, 11.0, 15.0, 13.0, 15.0, 19.0, 17.0, 33.0, 32.0, 28.0, 26.0, 42.0, 42.0, 46.0, 44.0, 55.0, 44.0, 45.0, 45.0, 50.0, 41.0, 43.0, 35.0, 30.0, 28.0, 32.0, 26.0, 25.0, 14.0, 17.0, 11.0, 15.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 6.0, 5.0, 0.0, 0.0, 1.0, 4.0, 1.0], "bins": [-8.7890625, -8.546875, -8.3046875, -8.0625, -7.8203125, -7.578125, -7.3359375, -7.09375, -6.8515625, -6.609375, -6.3671875, -6.125, -5.8828125, -5.640625, -5.3984375, -5.15625, -4.9140625, -4.671875, -4.4296875, -4.1875, -3.9453125, -3.703125, -3.4609375, -3.21875, -2.9765625, -2.734375, -2.4921875, -2.25, -2.0078125, -1.765625, -1.5234375, -1.28125, -1.0390625, -0.796875, -0.5546875, -0.3125, -0.0703125, 0.171875, 0.4140625, 0.65625, 0.8984375, 1.140625, 1.3828125, 1.625, 1.8671875, 2.109375, 2.3515625, 2.59375, 2.8359375, 3.078125, 3.3203125, 3.5625, 3.8046875, 4.046875, 4.2890625, 4.53125, 4.7734375, 5.015625, 5.2578125, 5.5, 5.7421875, 5.984375, 6.2265625, 6.46875, 6.7109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 13.0, 12.0, 26.0, 26.0, 61.0, 70.0, 124.0, 135.0, 218.0, 317.0, 460.0, 710.0, 1032.0, 1716.0, 2682.0, 4497.0, 7609.0, 13156.0, 23771.0, 43526.0, 79899.0, 140307.0, 202126.0, 202378.0, 141484.0, 81061.0, 44002.0, 24204.0, 13124.0, 7623.0, 4510.0, 2762.0, 1621.0, 1083.0, 736.0, 474.0, 324.0, 209.0, 137.0, 109.0, 74.0, 43.0, 33.0, 19.0, 15.0, 13.0, 5.0, 10.0, 3.0, 4.0, 0.0, 3.0, 2.0], "bins": [-6.87890625, -6.6766357421875, -6.474365234375, -6.2720947265625, -6.06982421875, -5.8675537109375, -5.665283203125, -5.4630126953125, -5.2607421875, -5.0584716796875, -4.856201171875, -4.6539306640625, -4.45166015625, -4.2493896484375, -4.047119140625, -3.8448486328125, -3.642578125, -3.4403076171875, -3.238037109375, -3.0357666015625, -2.83349609375, -2.6312255859375, -2.428955078125, -2.2266845703125, -2.0244140625, -1.8221435546875, -1.619873046875, -1.4176025390625, -1.21533203125, -1.0130615234375, -0.810791015625, -0.6085205078125, -0.40625, -0.2039794921875, -0.001708984375, 0.2005615234375, 0.40283203125, 0.6051025390625, 0.807373046875, 1.0096435546875, 1.2119140625, 1.4141845703125, 1.616455078125, 1.8187255859375, 2.02099609375, 2.2232666015625, 2.425537109375, 2.6278076171875, 2.830078125, 3.0323486328125, 3.234619140625, 3.4368896484375, 3.63916015625, 3.8414306640625, 4.043701171875, 4.2459716796875, 4.4482421875, 4.6505126953125, 4.852783203125, 5.0550537109375, 5.25732421875, 5.4595947265625, 5.661865234375, 5.8641357421875, 6.06640625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 3.0, 6.0, 5.0, 10.0, 10.0, 15.0, 9.0, 10.0, 15.0, 15.0, 16.0, 24.0, 38.0, 23.0, 24.0, 32.0, 27.0, 42.0, 39.0, 32.0, 45.0, 41.0, 44.0, 33.0, 43.0, 31.0, 37.0, 37.0, 28.0, 35.0, 26.0, 33.0, 23.0, 22.0, 23.0, 19.0, 20.0, 16.0, 9.0, 7.0, 6.0, 5.0, 7.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.923828125, -3.80865478515625, -3.6934814453125, -3.57830810546875, -3.463134765625, -3.34796142578125, -3.2327880859375, -3.11761474609375, -3.00244140625, -2.88726806640625, -2.7720947265625, -2.65692138671875, -2.541748046875, -2.42657470703125, -2.3114013671875, -2.19622802734375, -2.0810546875, -1.96588134765625, -1.8507080078125, -1.73553466796875, -1.620361328125, -1.50518798828125, -1.3900146484375, -1.27484130859375, -1.15966796875, -1.04449462890625, -0.9293212890625, -0.81414794921875, -0.698974609375, -0.58380126953125, -0.4686279296875, -0.35345458984375, -0.23828125, -0.12310791015625, -0.0079345703125, 0.10723876953125, 0.222412109375, 0.33758544921875, 0.4527587890625, 0.56793212890625, 0.68310546875, 0.79827880859375, 0.9134521484375, 1.02862548828125, 1.143798828125, 1.25897216796875, 1.3741455078125, 1.48931884765625, 1.6044921875, 1.71966552734375, 1.8348388671875, 1.95001220703125, 2.065185546875, 2.18035888671875, 2.2955322265625, 2.41070556640625, 2.52587890625, 2.64105224609375, 2.7562255859375, 2.87139892578125, 2.986572265625, 3.10174560546875, 3.2169189453125, 3.33209228515625, 3.447265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 10.0, 16.0, 30.0, 26.0, 45.0, 64.0, 72.0, 122.0, 191.0, 265.0, 442.0, 683.0, 1100.0, 1835.0, 3108.0, 5347.0, 10266.0, 21167.0, 48617.0, 117628.0, 256137.0, 298145.0, 159284.0, 66017.0, 28442.0, 13425.0, 6617.0, 3709.0, 2124.0, 1250.0, 874.0, 491.0, 315.0, 226.0, 149.0, 93.0, 70.0, 48.0, 30.0, 25.0, 17.0, 12.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.50689697265625, -4.3575439453125, -4.20819091796875, -4.058837890625, -3.90948486328125, -3.7601318359375, -3.61077880859375, -3.46142578125, -3.31207275390625, -3.1627197265625, -3.01336669921875, -2.864013671875, -2.71466064453125, -2.5653076171875, -2.41595458984375, -2.2666015625, -2.11724853515625, -1.9678955078125, -1.81854248046875, -1.669189453125, -1.51983642578125, -1.3704833984375, -1.22113037109375, -1.07177734375, -0.92242431640625, -0.7730712890625, -0.62371826171875, -0.474365234375, -0.32501220703125, -0.1756591796875, -0.02630615234375, 0.123046875, 0.27239990234375, 0.4217529296875, 0.57110595703125, 0.720458984375, 0.86981201171875, 1.0191650390625, 1.16851806640625, 1.31787109375, 1.46722412109375, 1.6165771484375, 1.76593017578125, 1.915283203125, 2.06463623046875, 2.2139892578125, 2.36334228515625, 2.5126953125, 2.66204833984375, 2.8114013671875, 2.96075439453125, 3.110107421875, 3.25946044921875, 3.4088134765625, 3.55816650390625, 3.70751953125, 3.85687255859375, 4.0062255859375, 4.15557861328125, 4.304931640625, 4.45428466796875, 4.6036376953125, 4.75299072265625, 4.90234375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 9.0, 13.0, 18.0, 22.0, 25.0, 28.0, 43.0, 67.0, 88.0, 94.0, 99.0, 88.0, 88.0, 75.0, 69.0, 46.0, 38.0, 16.0, 15.0, 14.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00033664703369140625, -0.00032534822821617126, -0.0003140494227409363, -0.0003027506172657013, -0.0002914518117904663, -0.0002801530063152313, -0.00026885420083999634, -0.00025755539536476135, -0.00024625658988952637, -0.00023495778441429138, -0.0002236589789390564, -0.0002123601734638214, -0.00020106136798858643, -0.00018976256251335144, -0.00017846375703811646, -0.00016716495156288147, -0.00015586614608764648, -0.0001445673406124115, -0.00013326853513717651, -0.00012196972966194153, -0.00011067092418670654, -9.937211871147156e-05, -8.807331323623657e-05, -7.677450776100159e-05, -6.54757022857666e-05, -5.4176896810531616e-05, -4.287809133529663e-05, -3.1579285860061646e-05, -2.028048038482666e-05, -8.981674909591675e-06, 2.3171305656433105e-06, 1.3615936040878296e-05, 2.491474151611328e-05, 3.6213546991348267e-05, 4.751235246658325e-05, 5.881115794181824e-05, 7.010996341705322e-05, 8.140876889228821e-05, 9.27075743675232e-05, 0.00010400637984275818, 0.00011530518531799316, 0.00012660399079322815, 0.00013790279626846313, 0.00014920160174369812, 0.0001605004072189331, 0.0001717992126941681, 0.00018309801816940308, 0.00019439682364463806, 0.00020569562911987305, 0.00021699443459510803, 0.00022829324007034302, 0.000239592045545578, 0.000250890851020813, 0.000262189656496048, 0.00027348846197128296, 0.00028478726744651794, 0.00029608607292175293, 0.0003073848783969879, 0.0003186836838722229, 0.0003299824893474579, 0.00034128129482269287, 0.00035258010029792786, 0.00036387890577316284, 0.00037517771124839783, 0.0003864765167236328]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 7.0, 2.0, 5.0, 7.0, 6.0, 8.0, 14.0, 19.0, 24.0, 26.0, 42.0, 46.0, 73.0, 101.0, 162.0, 214.0, 269.0, 480.0, 683.0, 1084.0, 1864.0, 3663.0, 7763.0, 18543.0, 50485.0, 146764.0, 329736.0, 295418.0, 119958.0, 41154.0, 15459.0, 6594.0, 3053.0, 1769.0, 1036.0, 645.0, 419.0, 276.0, 197.0, 148.0, 96.0, 67.0, 44.0, 24.0, 33.0, 20.0, 13.0, 14.0, 9.0, 9.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.78125, -4.62652587890625, -4.4718017578125, -4.31707763671875, -4.162353515625, -4.00762939453125, -3.8529052734375, -3.69818115234375, -3.54345703125, -3.38873291015625, -3.2340087890625, -3.07928466796875, -2.924560546875, -2.76983642578125, -2.6151123046875, -2.46038818359375, -2.3056640625, -2.15093994140625, -1.9962158203125, -1.84149169921875, -1.686767578125, -1.53204345703125, -1.3773193359375, -1.22259521484375, -1.06787109375, -0.91314697265625, -0.7584228515625, -0.60369873046875, -0.448974609375, -0.29425048828125, -0.1395263671875, 0.01519775390625, 0.169921875, 0.32464599609375, 0.4793701171875, 0.63409423828125, 0.788818359375, 0.94354248046875, 1.0982666015625, 1.25299072265625, 1.40771484375, 1.56243896484375, 1.7171630859375, 1.87188720703125, 2.026611328125, 2.18133544921875, 2.3360595703125, 2.49078369140625, 2.6455078125, 2.80023193359375, 2.9549560546875, 3.10968017578125, 3.264404296875, 3.41912841796875, 3.5738525390625, 3.72857666015625, 3.88330078125, 4.03802490234375, 4.1927490234375, 4.34747314453125, 4.502197265625, 4.65692138671875, 4.8116455078125, 4.96636962890625, 5.12109375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 12.0, 11.0, 18.0, 26.0, 22.0, 36.0, 31.0, 60.0, 60.0, 86.0, 97.0, 77.0, 86.0, 78.0, 80.0, 51.0, 40.0, 25.0, 22.0, 32.0, 13.0, 6.0, 5.0, 7.0, 6.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.951171875, -0.914886474609375, -0.87860107421875, -0.842315673828125, -0.8060302734375, -0.769744873046875, -0.73345947265625, -0.697174072265625, -0.660888671875, -0.624603271484375, -0.58831787109375, -0.552032470703125, -0.5157470703125, -0.479461669921875, -0.44317626953125, -0.406890869140625, -0.37060546875, -0.334320068359375, -0.29803466796875, -0.261749267578125, -0.2254638671875, -0.189178466796875, -0.15289306640625, -0.116607666015625, -0.080322265625, -0.044036865234375, -0.00775146484375, 0.028533935546875, 0.0648193359375, 0.101104736328125, 0.13739013671875, 0.173675537109375, 0.2099609375, 0.246246337890625, 0.28253173828125, 0.318817138671875, 0.3551025390625, 0.391387939453125, 0.42767333984375, 0.463958740234375, 0.500244140625, 0.536529541015625, 0.57281494140625, 0.609100341796875, 0.6453857421875, 0.681671142578125, 0.71795654296875, 0.754241943359375, 0.79052734375, 0.826812744140625, 0.86309814453125, 0.899383544921875, 0.9356689453125, 0.971954345703125, 1.00823974609375, 1.044525146484375, 1.080810546875, 1.117095947265625, 1.15338134765625, 1.189666748046875, 1.2259521484375, 1.262237548828125, 1.29852294921875, 1.334808349609375, 1.37109375]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 6.0, 9.0, 26.0, 15.0, 26.0, 42.0, 55.0, 67.0, 103.0, 112.0, 113.0, 111.0, 88.0, 61.0, 43.0, 28.0, 22.0, 14.0, 15.0, 10.0, 6.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.388750076293945, -12.879076957702637, -12.369403839111328, -11.859731674194336, -11.350058555603027, -10.840385437011719, -10.33071231842041, -9.821039199829102, -9.31136703491211, -8.8016939163208, -8.292020797729492, -7.782348155975342, -7.272675514221191, -6.763002395629883, -6.253329277038574, -5.743656158447266, -5.233983039855957, -4.724309921264648, -4.214637279510498, -3.7049641609191895, -3.19529128074646, -2.6856184005737305, -2.175945281982422, -1.6662724018096924, -1.156599521636963, -0.6469265818595886, -0.13725364208221436, 0.3724193572998047, 0.8820922374725342, 1.3917651176452637, 1.9014382362365723, 2.4111111164093018, 2.9207839965820312, 3.4304568767547607, 3.9401297569274902, 4.449802875518799, 4.959475517272949, 5.469148635864258, 5.978821754455566, 6.488494873046875, 6.998167514801025, 7.507840633392334, 8.017513275146484, 8.527186393737793, 9.036859512329102, 9.546531677246094, 10.056205749511719, 10.565877914428711, 11.07555103302002, 11.585224151611328, 12.094897270202637, 12.604570388793945, 13.114242553710938, 13.623915672302246, 14.133588790893555, 14.643261909484863, 15.152935028076172, 15.66260814666748, 16.17228126525879, 16.68195343017578, 17.191627502441406, 17.7012996673584, 18.21097183227539, 18.720645904541016, 19.230318069458008]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 2.0, 7.0, 11.0, 8.0, 11.0, 14.0, 19.0, 19.0, 17.0, 18.0, 29.0, 36.0, 38.0, 33.0, 33.0, 43.0, 45.0, 44.0, 43.0, 46.0, 40.0, 43.0, 46.0, 50.0, 49.0, 32.0, 36.0, 35.0, 27.0, 25.0, 11.0, 19.0, 16.0, 12.0, 10.0, 3.0, 7.0, 10.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.123149871826172, -7.899446964263916, -7.675743579864502, -7.452040672302246, -7.22833776473999, -7.004634857177734, -6.78093147277832, -6.5572285652160645, -6.333525657653809, -6.109822750091553, -5.886119365692139, -5.662416458129883, -5.438713550567627, -5.215010643005371, -4.991307258605957, -4.767604351043701, -4.543900966644287, -4.320198059082031, -4.096494674682617, -3.8727917671203613, -3.6490888595581055, -3.4253857135772705, -3.2016825675964355, -2.9779796600341797, -2.7542765140533447, -2.5305733680725098, -2.306870460510254, -2.083167314529419, -1.8594642877578735, -1.6357612609863281, -1.4120581150054932, -1.1883550882339478, -0.9646525382995605, -0.7409495115280151, -0.517246425151825, -0.29354333877563477, -0.06984031200408936, 0.15386271476745605, 0.377565860748291, 0.6012688875198364, 0.8249719142913818, 1.0486749410629272, 1.2723779678344727, 1.4960811138153076, 1.719784140586853, 1.9434871673583984, 2.1671903133392334, 2.3908934593200684, 2.614596366882324, 2.838299512863159, 3.062002420425415, 3.28570556640625, 3.509408473968506, 3.733111619949341, 3.956814765930176, 4.180517673492432, 4.4042205810546875, 4.627923488616943, 4.851626873016357, 5.075329780578613, 5.299032688140869, 5.522735595703125, 5.746438980102539, 5.970141887664795, 6.193845272064209]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 13.0, 10.0, 9.0, 25.0, 24.0, 33.0, 61.0, 69.0, 111.0, 154.0, 227.0, 323.0, 439.0, 645.0, 997.0, 1617.0, 2471.0, 4359.0, 7779.0, 15518.0, 38643.0, 130626.0, 602032.0, 1957508.0, 1102367.0, 222985.0, 59458.0, 22028.0, 10128.0, 5292.0, 3073.0, 1926.0, 1166.0, 731.0, 482.0, 324.0, 195.0, 131.0, 93.0, 69.0, 43.0, 28.0, 24.0, 12.0, 13.0, 8.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.09375, -16.58642578125, -16.0791015625, -15.57177734375, -15.064453125, -14.55712890625, -14.0498046875, -13.54248046875, -13.03515625, -12.52783203125, -12.0205078125, -11.51318359375, -11.005859375, -10.49853515625, -9.9912109375, -9.48388671875, -8.9765625, -8.46923828125, -7.9619140625, -7.45458984375, -6.947265625, -6.43994140625, -5.9326171875, -5.42529296875, -4.91796875, -4.41064453125, -3.9033203125, -3.39599609375, -2.888671875, -2.38134765625, -1.8740234375, -1.36669921875, -0.859375, -0.35205078125, 0.1552734375, 0.66259765625, 1.169921875, 1.67724609375, 2.1845703125, 2.69189453125, 3.19921875, 3.70654296875, 4.2138671875, 4.72119140625, 5.228515625, 5.73583984375, 6.2431640625, 6.75048828125, 7.2578125, 7.76513671875, 8.2724609375, 8.77978515625, 9.287109375, 9.79443359375, 10.3017578125, 10.80908203125, 11.31640625, 11.82373046875, 12.3310546875, 12.83837890625, 13.345703125, 13.85302734375, 14.3603515625, 14.86767578125, 15.375]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 4.0, 6.0, 17.0, 7.0, 13.0, 12.0, 13.0, 15.0, 22.0, 27.0, 25.0, 25.0, 34.0, 33.0, 40.0, 34.0, 44.0, 49.0, 43.0, 46.0, 45.0, 36.0, 41.0, 38.0, 47.0, 37.0, 32.0, 29.0, 35.0, 21.0, 15.0, 19.0, 19.0, 16.0, 12.0, 11.0, 5.0, 6.0, 7.0, 2.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0], "bins": [-6.80859375, -6.6280517578125, -6.447509765625, -6.2669677734375, -6.08642578125, -5.9058837890625, -5.725341796875, -5.5447998046875, -5.3642578125, -5.1837158203125, -5.003173828125, -4.8226318359375, -4.64208984375, -4.4615478515625, -4.281005859375, -4.1004638671875, -3.919921875, -3.7393798828125, -3.558837890625, -3.3782958984375, -3.19775390625, -3.0172119140625, -2.836669921875, -2.6561279296875, -2.4755859375, -2.2950439453125, -2.114501953125, -1.9339599609375, -1.75341796875, -1.5728759765625, -1.392333984375, -1.2117919921875, -1.03125, -0.8507080078125, -0.670166015625, -0.4896240234375, -0.30908203125, -0.1285400390625, 0.052001953125, 0.2325439453125, 0.4130859375, 0.5936279296875, 0.774169921875, 0.9547119140625, 1.13525390625, 1.3157958984375, 1.496337890625, 1.6768798828125, 1.857421875, 2.0379638671875, 2.218505859375, 2.3990478515625, 2.57958984375, 2.7601318359375, 2.940673828125, 3.1212158203125, 3.3017578125, 3.4822998046875, 3.662841796875, 3.8433837890625, 4.02392578125, 4.2044677734375, 4.385009765625, 4.5655517578125, 4.74609375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 5.0, 5.0, 13.0, 20.0, 34.0, 42.0, 97.0, 145.0, 233.0, 348.0, 552.0, 980.0, 1766.0, 3117.0, 5976.0, 11532.0, 24634.0, 59703.0, 183925.0, 854560.0, 2182491.0, 624132.0, 146570.0, 49937.0, 21304.0, 10316.0, 5199.0, 2850.0, 1525.0, 893.0, 510.0, 329.0, 202.0, 148.0, 65.0, 41.0, 26.0, 19.0, 16.0, 3.0, 8.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.9501953125, -16.353515625, -15.7568359375, -15.16015625, -14.5634765625, -13.966796875, -13.3701171875, -12.7734375, -12.1767578125, -11.580078125, -10.9833984375, -10.38671875, -9.7900390625, -9.193359375, -8.5966796875, -8.0, -7.4033203125, -6.806640625, -6.2099609375, -5.61328125, -5.0166015625, -4.419921875, -3.8232421875, -3.2265625, -2.6298828125, -2.033203125, -1.4365234375, -0.83984375, -0.2431640625, 0.353515625, 0.9501953125, 1.546875, 2.1435546875, 2.740234375, 3.3369140625, 3.93359375, 4.5302734375, 5.126953125, 5.7236328125, 6.3203125, 6.9169921875, 7.513671875, 8.1103515625, 8.70703125, 9.3037109375, 9.900390625, 10.4970703125, 11.09375, 11.6904296875, 12.287109375, 12.8837890625, 13.48046875, 14.0771484375, 14.673828125, 15.2705078125, 15.8671875, 16.4638671875, 17.060546875, 17.6572265625, 18.25390625, 18.8505859375, 19.447265625, 20.0439453125, 20.640625]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 4.0, 12.0, 7.0, 7.0, 17.0, 13.0, 15.0, 24.0, 38.0, 36.0, 46.0, 72.0, 71.0, 114.0, 148.0, 168.0, 267.0, 321.0, 372.0, 382.0, 391.0, 316.0, 288.0, 213.0, 158.0, 124.0, 91.0, 78.0, 49.0, 62.0, 31.0, 32.0, 21.0, 26.0, 11.0, 6.0, 5.0, 11.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.109375, -3.001190185546875, -2.89300537109375, -2.784820556640625, -2.6766357421875, -2.568450927734375, -2.46026611328125, -2.352081298828125, -2.243896484375, -2.135711669921875, -2.02752685546875, -1.919342041015625, -1.8111572265625, -1.702972412109375, -1.59478759765625, -1.486602783203125, -1.37841796875, -1.270233154296875, -1.16204833984375, -1.053863525390625, -0.9456787109375, -0.837493896484375, -0.72930908203125, -0.621124267578125, -0.512939453125, -0.404754638671875, -0.29656982421875, -0.188385009765625, -0.0802001953125, 0.027984619140625, 0.13616943359375, 0.244354248046875, 0.3525390625, 0.460723876953125, 0.56890869140625, 0.677093505859375, 0.7852783203125, 0.893463134765625, 1.00164794921875, 1.109832763671875, 1.218017578125, 1.326202392578125, 1.43438720703125, 1.542572021484375, 1.6507568359375, 1.758941650390625, 1.86712646484375, 1.975311279296875, 2.08349609375, 2.191680908203125, 2.29986572265625, 2.408050537109375, 2.5162353515625, 2.624420166015625, 2.73260498046875, 2.840789794921875, 2.948974609375, 3.057159423828125, 3.16534423828125, 3.273529052734375, 3.3817138671875, 3.489898681640625, 3.59808349609375, 3.706268310546875, 3.814453125]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 9.0, 16.0, 32.0, 29.0, 32.0, 60.0, 86.0, 111.0, 125.0, 130.0, 95.0, 71.0, 53.0, 49.0, 28.0, 20.0, 21.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.301207542419434, -14.709336280822754, -14.11746597290039, -13.525594711303711, -12.933723449707031, -12.341852188110352, -11.749980926513672, -11.158110618591309, -10.566239356994629, -9.97436809539795, -9.382497787475586, -8.790626525878906, -8.198755264282227, -7.606884002685547, -7.015013217926025, -6.423142433166504, -5.831271171569824, -5.2393999099731445, -4.647529125213623, -4.055658340454102, -3.463787078857422, -2.8719160556793213, -2.2800450325012207, -1.6881742477416992, -1.0963029861450195, -0.504431962966919, 0.08743906021118164, 0.6793100833892822, 1.2711811065673828, 1.8630521297454834, 2.454923152923584, 3.0467939376831055, 3.6386642456054688, 4.230535507202148, 4.82240629196167, 5.414277076721191, 6.006148338317871, 6.598019599914551, 7.189890384674072, 7.781761169433594, 8.373632431030273, 8.965503692626953, 9.557374954223633, 10.149245262145996, 10.741116523742676, 11.332987785339355, 11.924858093261719, 12.516729354858398, 13.108600616455078, 13.700471878051758, 14.292343139648438, 14.8842134475708, 15.47608470916748, 16.067955017089844, 16.659826278686523, 17.251697540283203, 17.843568801879883, 18.435440063476562, 19.027311325073242, 19.619182586669922, 20.21105194091797, 20.80292320251465, 21.394794464111328, 21.986665725708008, 22.578536987304688]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 4.0, 6.0, 5.0, 8.0, 7.0, 15.0, 13.0, 12.0, 22.0, 22.0, 20.0, 28.0, 29.0, 22.0, 40.0, 41.0, 40.0, 47.0, 45.0, 43.0, 53.0, 37.0, 40.0, 44.0, 43.0, 33.0, 51.0, 32.0, 30.0, 25.0, 19.0, 18.0, 16.0, 13.0, 16.0, 13.0, 8.0, 9.0, 6.0, 7.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.755499362945557, -7.531396865844727, -7.307294845581055, -7.083192348480225, -6.8590898513793945, -6.634987831115723, -6.410885334014893, -6.1867828369140625, -5.962680816650391, -5.7385783195495605, -5.514476299285889, -5.290373802185059, -5.066271781921387, -4.842169284820557, -4.618066787719727, -4.393964767456055, -4.169862270355225, -3.9457600116729736, -3.7216577529907227, -3.4975552558898926, -3.2734529972076416, -3.0493507385253906, -2.8252482414245605, -2.6011459827423096, -2.3770437240600586, -2.1529414653778076, -1.928839087486267, -1.7047367095947266, -1.4806344509124756, -1.2565321922302246, -1.032429814338684, -0.8083274364471436, -0.5842256546020508, -0.36012333631515503, -0.13602101802825928, 0.08808130025863647, 0.3121836185455322, 0.5362858772277832, 0.7603882551193237, 0.9844906330108643, 1.2085928916931152, 1.4326951503753662, 1.6567975282669067, 1.8808999061584473, 2.1050021648406982, 2.329104423522949, 2.5532069206237793, 2.7773091793060303, 3.0014114379882812, 3.2255136966705322, 3.449615955352783, 3.6737184524536133, 3.8978207111358643, 4.121922969818115, 4.346025466918945, 4.570127487182617, 4.794229984283447, 5.018332481384277, 5.242434501647949, 5.466536998748779, 5.690639495849609, 5.914741516113281, 6.138844013214111, 6.362946510314941, 6.587048530578613]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 13.0, 9.0, 19.0, 23.0, 35.0, 39.0, 72.0, 79.0, 117.0, 181.0, 218.0, 352.0, 547.0, 902.0, 1487.0, 2603.0, 5133.0, 10977.0, 25284.0, 69286.0, 239545.0, 455077.0, 151770.0, 47893.0, 18707.0, 8427.0, 4036.0, 2250.0, 1207.0, 763.0, 425.0, 287.0, 215.0, 155.0, 104.0, 83.0, 67.0, 44.0, 29.0, 19.0, 15.0, 11.0, 8.0, 4.0, 3.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.763671875, -1.71075439453125, -1.6578369140625, -1.60491943359375, -1.552001953125, -1.49908447265625, -1.4461669921875, -1.39324951171875, -1.34033203125, -1.28741455078125, -1.2344970703125, -1.18157958984375, -1.128662109375, -1.07574462890625, -1.0228271484375, -0.96990966796875, -0.9169921875, -0.86407470703125, -0.8111572265625, -0.75823974609375, -0.705322265625, -0.65240478515625, -0.5994873046875, -0.54656982421875, -0.49365234375, -0.44073486328125, -0.3878173828125, -0.33489990234375, -0.281982421875, -0.22906494140625, -0.1761474609375, -0.12322998046875, -0.0703125, -0.01739501953125, 0.0355224609375, 0.08843994140625, 0.141357421875, 0.19427490234375, 0.2471923828125, 0.30010986328125, 0.35302734375, 0.40594482421875, 0.4588623046875, 0.51177978515625, 0.564697265625, 0.61761474609375, 0.6705322265625, 0.72344970703125, 0.7763671875, 0.82928466796875, 0.8822021484375, 0.93511962890625, 0.988037109375, 1.04095458984375, 1.0938720703125, 1.14678955078125, 1.19970703125, 1.25262451171875, 1.3055419921875, 1.35845947265625, 1.411376953125, 1.46429443359375, 1.5172119140625, 1.57012939453125, 1.623046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 6.0, 8.0, 17.0, 9.0, 21.0, 16.0, 28.0, 31.0, 24.0, 35.0, 34.0, 36.0, 37.0, 48.0, 51.0, 58.0, 40.0, 46.0, 44.0, 47.0, 46.0, 40.0, 32.0, 41.0, 28.0, 17.0, 25.0, 19.0, 16.0, 11.0, 11.0, 16.0, 14.0, 7.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.625, -8.36956787109375, -8.1141357421875, -7.85870361328125, -7.603271484375, -7.34783935546875, -7.0924072265625, -6.83697509765625, -6.58154296875, -6.32611083984375, -6.0706787109375, -5.81524658203125, -5.559814453125, -5.30438232421875, -5.0489501953125, -4.79351806640625, -4.5380859375, -4.28265380859375, -4.0272216796875, -3.77178955078125, -3.516357421875, -3.26092529296875, -3.0054931640625, -2.75006103515625, -2.49462890625, -2.23919677734375, -1.9837646484375, -1.72833251953125, -1.472900390625, -1.21746826171875, -0.9620361328125, -0.70660400390625, -0.451171875, -0.19573974609375, 0.0596923828125, 0.31512451171875, 0.570556640625, 0.82598876953125, 1.0814208984375, 1.33685302734375, 1.59228515625, 1.84771728515625, 2.1031494140625, 2.35858154296875, 2.614013671875, 2.86944580078125, 3.1248779296875, 3.38031005859375, 3.6357421875, 3.89117431640625, 4.1466064453125, 4.40203857421875, 4.657470703125, 4.91290283203125, 5.1683349609375, 5.42376708984375, 5.67919921875, 5.93463134765625, 6.1900634765625, 6.44549560546875, 6.700927734375, 6.95635986328125, 7.2117919921875, 7.46722412109375, 7.72265625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 4.0, 13.0, 8.0, 23.0, 30.0, 45.0, 60.0, 125.0, 237.0, 364.0, 644.0, 1369.0, 3125.0, 9558.0, 44485.0, 934759.0, 39171.0, 8687.0, 3070.0, 1300.0, 652.0, 306.0, 185.0, 114.0, 87.0, 38.0, 25.0, 22.0, 7.0, 9.0, 5.0, 5.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3359375, -5.176513671875, -5.01708984375, -4.857666015625, -4.6982421875, -4.538818359375, -4.37939453125, -4.219970703125, -4.060546875, -3.901123046875, -3.74169921875, -3.582275390625, -3.4228515625, -3.263427734375, -3.10400390625, -2.944580078125, -2.78515625, -2.625732421875, -2.46630859375, -2.306884765625, -2.1474609375, -1.988037109375, -1.82861328125, -1.669189453125, -1.509765625, -1.350341796875, -1.19091796875, -1.031494140625, -0.8720703125, -0.712646484375, -0.55322265625, -0.393798828125, -0.234375, -0.074951171875, 0.08447265625, 0.243896484375, 0.4033203125, 0.562744140625, 0.72216796875, 0.881591796875, 1.041015625, 1.200439453125, 1.35986328125, 1.519287109375, 1.6787109375, 1.838134765625, 1.99755859375, 2.156982421875, 2.31640625, 2.475830078125, 2.63525390625, 2.794677734375, 2.9541015625, 3.113525390625, 3.27294921875, 3.432373046875, 3.591796875, 3.751220703125, 3.91064453125, 4.070068359375, 4.2294921875, 4.388916015625, 4.54833984375, 4.707763671875, 4.8671875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 5.0, 8.0, 11.0, 5.0, 16.0, 18.0, 21.0, 22.0, 24.0, 38.0, 31.0, 27.0, 36.0, 33.0, 40.0, 47.0, 48.0, 38.0, 47.0, 47.0, 48.0, 45.0, 48.0, 28.0, 34.0, 40.0, 25.0, 21.0, 18.0, 21.0, 25.0, 14.0, 11.0, 11.0, 7.0, 7.0, 12.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.375, -5.22418212890625, -5.0733642578125, -4.92254638671875, -4.771728515625, -4.62091064453125, -4.4700927734375, -4.31927490234375, -4.16845703125, -4.01763916015625, -3.8668212890625, -3.71600341796875, -3.565185546875, -3.41436767578125, -3.2635498046875, -3.11273193359375, -2.9619140625, -2.81109619140625, -2.6602783203125, -2.50946044921875, -2.358642578125, -2.20782470703125, -2.0570068359375, -1.90618896484375, -1.75537109375, -1.60455322265625, -1.4537353515625, -1.30291748046875, -1.152099609375, -1.00128173828125, -0.8504638671875, -0.69964599609375, -0.548828125, -0.39801025390625, -0.2471923828125, -0.09637451171875, 0.054443359375, 0.20526123046875, 0.3560791015625, 0.50689697265625, 0.65771484375, 0.80853271484375, 0.9593505859375, 1.11016845703125, 1.260986328125, 1.41180419921875, 1.5626220703125, 1.71343994140625, 1.8642578125, 2.01507568359375, 2.1658935546875, 2.31671142578125, 2.467529296875, 2.61834716796875, 2.7691650390625, 2.91998291015625, 3.07080078125, 3.22161865234375, 3.3724365234375, 3.52325439453125, 3.674072265625, 3.82489013671875, 3.9757080078125, 4.12652587890625, 4.27734375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 9.0, 6.0, 16.0, 6.0, 11.0, 22.0, 29.0, 34.0, 47.0, 61.0, 79.0, 94.0, 128.0, 154.0, 205.0, 276.0, 434.0, 642.0, 1131.0, 2339.0, 6426.0, 28006.0, 955081.0, 39058.0, 7730.0, 2699.0, 1362.0, 750.0, 434.0, 296.0, 278.0, 148.0, 140.0, 88.0, 83.0, 56.0, 32.0, 41.0, 23.0, 31.0, 11.0, 16.0, 15.0, 7.0, 5.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.376953125, -1.3303985595703125, -1.283843994140625, -1.2372894287109375, -1.19073486328125, -1.1441802978515625, -1.097625732421875, -1.0510711669921875, -1.0045166015625, -0.9579620361328125, -0.911407470703125, -0.8648529052734375, -0.81829833984375, -0.7717437744140625, -0.725189208984375, -0.6786346435546875, -0.632080078125, -0.5855255126953125, -0.538970947265625, -0.4924163818359375, -0.44586181640625, -0.3993072509765625, -0.352752685546875, -0.3061981201171875, -0.2596435546875, -0.2130889892578125, -0.166534423828125, -0.1199798583984375, -0.07342529296875, -0.0268707275390625, 0.019683837890625, 0.0662384033203125, 0.11279296875, 0.1593475341796875, 0.205902099609375, 0.2524566650390625, 0.29901123046875, 0.3455657958984375, 0.392120361328125, 0.4386749267578125, 0.4852294921875, 0.5317840576171875, 0.578338623046875, 0.6248931884765625, 0.67144775390625, 0.7180023193359375, 0.764556884765625, 0.8111114501953125, 0.857666015625, 0.9042205810546875, 0.950775146484375, 0.9973297119140625, 1.04388427734375, 1.0904388427734375, 1.136993408203125, 1.1835479736328125, 1.2301025390625, 1.2766571044921875, 1.323211669921875, 1.3697662353515625, 1.41632080078125, 1.4628753662109375, 1.509429931640625, 1.5559844970703125, 1.6025390625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 13.0, 17.0, 12.0, 15.0, 7.0, 22.0, 20.0, 30.0, 31.0, 37.0, 29.0, 35.0, 51.0, 57.0, 52.0, 53.0, 51.0, 46.0, 42.0, 45.0, 36.0, 28.0, 39.0, 25.0, 31.0, 27.0, 24.0, 19.0, 14.0, 12.0, 12.0, 12.0, 7.0, 9.0, 2.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.7147274017333984e-05, -4.5632943511009216e-05, -4.411861300468445e-05, -4.260428249835968e-05, -4.108995199203491e-05, -3.9575621485710144e-05, -3.8061290979385376e-05, -3.654696047306061e-05, -3.503262996673584e-05, -3.351829946041107e-05, -3.2003968954086304e-05, -3.0489638447761536e-05, -2.8975307941436768e-05, -2.7460977435112e-05, -2.594664692878723e-05, -2.4432316422462463e-05, -2.2917985916137695e-05, -2.1403655409812927e-05, -1.988932490348816e-05, -1.837499439716339e-05, -1.6860663890838623e-05, -1.5346333384513855e-05, -1.3832002878189087e-05, -1.2317672371864319e-05, -1.080334186553955e-05, -9.289011359214783e-06, -7.774680852890015e-06, -6.260350346565247e-06, -4.7460198402404785e-06, -3.2316893339157104e-06, -1.7173588275909424e-06, -2.0302832126617432e-07, 1.3113021850585938e-06, 2.825632691383362e-06, 4.33996319770813e-06, 5.854293704032898e-06, 7.368624210357666e-06, 8.882954716682434e-06, 1.0397285223007202e-05, 1.191161572933197e-05, 1.3425946235656738e-05, 1.4940276741981506e-05, 1.6454607248306274e-05, 1.7968937754631042e-05, 1.948326826095581e-05, 2.099759876728058e-05, 2.2511929273605347e-05, 2.4026259779930115e-05, 2.5540590286254883e-05, 2.705492079257965e-05, 2.856925129890442e-05, 3.0083581805229187e-05, 3.1597912311553955e-05, 3.311224281787872e-05, 3.462657332420349e-05, 3.614090383052826e-05, 3.765523433685303e-05, 3.9169564843177795e-05, 4.0683895349502563e-05, 4.219822585582733e-05, 4.37125563621521e-05, 4.522688686847687e-05, 4.6741217374801636e-05, 4.8255547881126404e-05, 4.976987838745117e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 4.0, 7.0, 17.0, 23.0, 42.0, 42.0, 59.0, 85.0, 116.0, 189.0, 318.0, 418.0, 700.0, 1062.0, 1803.0, 3177.0, 6024.0, 12422.0, 28523.0, 77100.0, 244691.0, 418387.0, 158726.0, 53026.0, 20701.0, 9426.0, 4776.0, 2515.0, 1484.0, 899.0, 560.0, 423.0, 266.0, 173.0, 106.0, 73.0, 57.0, 36.0, 24.0, 27.0, 13.0, 4.0, 6.0, 6.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.37939453125, -0.36865234375, -0.35791015625, -0.34716796875, -0.33642578125, -0.32568359375, -0.31494140625, -0.30419921875, -0.29345703125, -0.28271484375, -0.27197265625, -0.26123046875, -0.25048828125, -0.23974609375, -0.22900390625, -0.21826171875, -0.20751953125, -0.19677734375, -0.18603515625, -0.17529296875, -0.16455078125, -0.15380859375, -0.14306640625, -0.13232421875, -0.12158203125, -0.11083984375, -0.10009765625, -0.08935546875, -0.07861328125, -0.06787109375, -0.05712890625, -0.04638671875, -0.03564453125, -0.02490234375, -0.01416015625, -0.00341796875, 0.00732421875, 0.01806640625, 0.02880859375, 0.03955078125, 0.05029296875, 0.06103515625, 0.07177734375, 0.08251953125, 0.09326171875, 0.10400390625, 0.11474609375, 0.12548828125, 0.13623046875, 0.14697265625, 0.15771484375, 0.16845703125, 0.17919921875, 0.18994140625, 0.20068359375, 0.21142578125, 0.22216796875, 0.23291015625, 0.24365234375, 0.25439453125, 0.26513671875, 0.27587890625, 0.28662109375, 0.29736328125, 0.30810546875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 26.0, 23.0, 29.0, 40.0, 49.0, 54.0, 65.0, 72.0, 97.0, 90.0, 75.0, 71.0, 58.0, 48.0, 44.0, 35.0, 20.0, 23.0, 5.0, 6.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.08021306991577148, -0.07796764373779297, -0.07572221755981445, -0.07347679138183594, -0.07123136520385742, -0.0689859390258789, -0.06674051284790039, -0.06449508666992188, -0.06224966049194336, -0.060004234313964844, -0.05775880813598633, -0.05551338195800781, -0.0532679557800293, -0.05102252960205078, -0.048777103424072266, -0.04653167724609375, -0.044286251068115234, -0.04204082489013672, -0.0397953987121582, -0.03754997253417969, -0.03530454635620117, -0.033059120178222656, -0.03081369400024414, -0.028568267822265625, -0.02632284164428711, -0.024077415466308594, -0.021831989288330078, -0.019586563110351562, -0.017341136932373047, -0.015095710754394531, -0.012850284576416016, -0.0106048583984375, -0.008359432220458984, -0.006114006042480469, -0.003868579864501953, -0.0016231536865234375, 0.0006222724914550781, 0.0028676986694335938, 0.005113124847412109, 0.007358551025390625, 0.00960397720336914, 0.011849403381347656, 0.014094829559326172, 0.016340255737304688, 0.018585681915283203, 0.02083110809326172, 0.023076534271240234, 0.02532196044921875, 0.027567386627197266, 0.02981281280517578, 0.0320582389831543, 0.03430366516113281, 0.03654909133911133, 0.038794517517089844, 0.04103994369506836, 0.043285369873046875, 0.04553079605102539, 0.047776222229003906, 0.05002164840698242, 0.05226707458496094, 0.05451250076293945, 0.05675792694091797, 0.059003353118896484, 0.061248779296875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 7.0, 10.0, 17.0, 34.0, 34.0, 36.0, 69.0, 95.0, 110.0, 131.0, 121.0, 88.0, 66.0, 52.0, 37.0, 33.0, 20.0, 16.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.186877250671387, -14.593441009521484, -14.000004768371582, -13.40656852722168, -12.813132286071777, -12.219696044921875, -11.626259803771973, -11.03282356262207, -10.439387321472168, -9.845951080322266, -9.252514839172363, -8.659078598022461, -8.065642356872559, -7.472206115722656, -6.878769874572754, -6.285333633422852, -5.691897392272949, -5.098461151123047, -4.5050249099731445, -3.911588668823242, -3.31815242767334, -2.7247161865234375, -2.131279945373535, -1.5378437042236328, -0.9444074630737305, -0.3509712219238281, 0.24246501922607422, 0.8359012603759766, 1.429337501525879, 2.0227737426757812, 2.6162099838256836, 3.209646224975586, 3.8030834197998047, 4.396519660949707, 4.989955902099609, 5.583392143249512, 6.176828384399414, 6.770264625549316, 7.363700866699219, 7.957137107849121, 8.550573348999023, 9.144009590148926, 9.737445831298828, 10.33088207244873, 10.924318313598633, 11.517754554748535, 12.111190795898438, 12.70462703704834, 13.298063278198242, 13.891499519348145, 14.484935760498047, 15.07837200164795, 15.671808242797852, 16.265243530273438, 16.858680725097656, 17.452117919921875, 18.04555320739746, 18.638988494873047, 19.232425689697266, 19.825862884521484, 20.41929817199707, 21.012733459472656, 21.606170654296875, 22.199607849121094, 22.79304313659668]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 6.0, 9.0, 6.0, 15.0, 12.0, 13.0, 21.0, 22.0, 21.0, 28.0, 28.0, 25.0, 36.0, 43.0, 44.0, 46.0, 44.0, 41.0, 53.0, 41.0, 40.0, 40.0, 43.0, 34.0, 49.0, 37.0, 25.0, 24.0, 21.0, 15.0, 18.0, 13.0, 17.0, 13.0, 9.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-7.695289611816406, -7.47208309173584, -7.248876571655273, -7.025670051574707, -6.802463054656982, -6.579256534576416, -6.35605001449585, -6.132843494415283, -5.909636497497559, -5.686429977416992, -5.463223457336426, -5.240016937255859, -5.016809940338135, -4.793603420257568, -4.570396900177002, -4.3471903800964355, -4.123983860015869, -3.9007773399353027, -3.6775705814361572, -3.454364061355591, -3.2311573028564453, -3.007950782775879, -2.7847442626953125, -2.561537742614746, -2.3383309841156006, -2.115124464035034, -1.8919177055358887, -1.6687111854553223, -1.4455045461654663, -1.2222979068756104, -0.999091386795044, -0.775884747505188, -0.552678108215332, -0.32947149872779846, -0.10626488924026489, 0.11694169044494629, 0.34014832973480225, 0.5633549690246582, 0.7865614891052246, 1.0097681283950806, 1.2329747676849365, 1.4561814069747925, 1.6793880462646484, 1.9025945663452148, 2.1258010864257812, 2.3490078449249268, 2.572214365005493, 2.7954211235046387, 3.018627643585205, 3.2418341636657715, 3.465040922164917, 3.6882474422454834, 3.911454200744629, 4.134660720825195, 4.357867240905762, 4.581073760986328, 4.8042802810668945, 5.027486801147461, 5.250693321228027, 5.473899841308594, 5.697106838226318, 5.920313358306885, 6.143519878387451, 6.366726398468018, 6.589933395385742]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 10.0, 6.0, 7.0, 8.0, 15.0, 24.0, 30.0, 60.0, 76.0, 123.0, 151.0, 202.0, 380.0, 503.0, 722.0, 1093.0, 1794.0, 2574.0, 3975.0, 6662.0, 10802.0, 18394.0, 31904.0, 58570.0, 110696.0, 193133.0, 232529.0, 166895.0, 91296.0, 48347.0, 26731.0, 15521.0, 9234.0, 5645.0, 3599.0, 2315.0, 1449.0, 950.0, 668.0, 479.0, 290.0, 232.0, 150.0, 106.0, 67.0, 41.0, 32.0, 29.0, 9.0, 6.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-7.34765625, -7.10552978515625, -6.8634033203125, -6.62127685546875, -6.379150390625, -6.13702392578125, -5.8948974609375, -5.65277099609375, -5.41064453125, -5.16851806640625, -4.9263916015625, -4.68426513671875, -4.442138671875, -4.20001220703125, -3.9578857421875, -3.71575927734375, -3.4736328125, -3.23150634765625, -2.9893798828125, -2.74725341796875, -2.505126953125, -2.26300048828125, -2.0208740234375, -1.77874755859375, -1.53662109375, -1.29449462890625, -1.0523681640625, -0.81024169921875, -0.568115234375, -0.32598876953125, -0.0838623046875, 0.15826416015625, 0.400390625, 0.64251708984375, 0.8846435546875, 1.12677001953125, 1.368896484375, 1.61102294921875, 1.8531494140625, 2.09527587890625, 2.33740234375, 2.57952880859375, 2.8216552734375, 3.06378173828125, 3.305908203125, 3.54803466796875, 3.7901611328125, 4.03228759765625, 4.2744140625, 4.51654052734375, 4.7586669921875, 5.00079345703125, 5.242919921875, 5.48504638671875, 5.7271728515625, 5.96929931640625, 6.21142578125, 6.45355224609375, 6.6956787109375, 6.93780517578125, 7.179931640625, 7.42205810546875, 7.6641845703125, 7.90631103515625, 8.1484375]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 9.0, 8.0, 9.0, 8.0, 12.0, 11.0, 8.0, 30.0, 18.0, 31.0, 19.0, 40.0, 35.0, 35.0, 46.0, 50.0, 48.0, 49.0, 48.0, 54.0, 44.0, 38.0, 49.0, 32.0, 46.0, 29.0, 30.0, 25.0, 17.0, 21.0, 13.0, 14.0, 17.0, 10.0, 9.0, 9.0, 5.0, 3.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.3125, -8.0587158203125, -7.804931640625, -7.5511474609375, -7.29736328125, -7.0435791015625, -6.789794921875, -6.5360107421875, -6.2822265625, -6.0284423828125, -5.774658203125, -5.5208740234375, -5.26708984375, -5.0133056640625, -4.759521484375, -4.5057373046875, -4.251953125, -3.9981689453125, -3.744384765625, -3.4906005859375, -3.23681640625, -2.9830322265625, -2.729248046875, -2.4754638671875, -2.2216796875, -1.9678955078125, -1.714111328125, -1.4603271484375, -1.20654296875, -0.9527587890625, -0.698974609375, -0.4451904296875, -0.19140625, 0.0623779296875, 0.316162109375, 0.5699462890625, 0.82373046875, 1.0775146484375, 1.331298828125, 1.5850830078125, 1.8388671875, 2.0926513671875, 2.346435546875, 2.6002197265625, 2.85400390625, 3.1077880859375, 3.361572265625, 3.6153564453125, 3.869140625, 4.1229248046875, 4.376708984375, 4.6304931640625, 4.88427734375, 5.1380615234375, 5.391845703125, 5.6456298828125, 5.8994140625, 6.1531982421875, 6.406982421875, 6.6607666015625, 6.91455078125, 7.1683349609375, 7.422119140625, 7.6759033203125, 7.9296875]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 9.0, 22.0, 26.0, 50.0, 75.0, 120.0, 193.0, 329.0, 604.0, 988.0, 2028.0, 3839.0, 7584.0, 15958.0, 35973.0, 85225.0, 201217.0, 320440.0, 212683.0, 90079.0, 37447.0, 17046.0, 8080.0, 3907.0, 2026.0, 1109.0, 593.0, 356.0, 201.0, 132.0, 64.0, 43.0, 31.0, 20.0, 15.0, 10.0, 5.0, 5.0, 7.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890625, -10.533935546875, -10.17724609375, -9.820556640625, -9.4638671875, -9.107177734375, -8.75048828125, -8.393798828125, -8.037109375, -7.680419921875, -7.32373046875, -6.967041015625, -6.6103515625, -6.253662109375, -5.89697265625, -5.540283203125, -5.18359375, -4.826904296875, -4.47021484375, -4.113525390625, -3.7568359375, -3.400146484375, -3.04345703125, -2.686767578125, -2.330078125, -1.973388671875, -1.61669921875, -1.260009765625, -0.9033203125, -0.546630859375, -0.18994140625, 0.166748046875, 0.5234375, 0.880126953125, 1.23681640625, 1.593505859375, 1.9501953125, 2.306884765625, 2.66357421875, 3.020263671875, 3.376953125, 3.733642578125, 4.09033203125, 4.447021484375, 4.8037109375, 5.160400390625, 5.51708984375, 5.873779296875, 6.23046875, 6.587158203125, 6.94384765625, 7.300537109375, 7.6572265625, 8.013916015625, 8.37060546875, 8.727294921875, 9.083984375, 9.440673828125, 9.79736328125, 10.154052734375, 10.5107421875, 10.867431640625, 11.22412109375, 11.580810546875, 11.9375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 9.0, 9.0, 8.0, 11.0, 9.0, 16.0, 19.0, 24.0, 25.0, 25.0, 27.0, 34.0, 31.0, 30.0, 26.0, 35.0, 34.0, 39.0, 46.0, 32.0, 39.0, 40.0, 39.0, 44.0, 44.0, 26.0, 32.0, 30.0, 29.0, 17.0, 27.0, 20.0, 17.0, 14.0, 13.0, 13.0, 12.0, 10.0, 4.0, 6.0, 4.0, 4.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-4.3125, -4.184295654296875, -4.05609130859375, -3.927886962890625, -3.7996826171875, -3.671478271484375, -3.54327392578125, -3.415069580078125, -3.286865234375, -3.158660888671875, -3.03045654296875, -2.902252197265625, -2.7740478515625, -2.645843505859375, -2.51763916015625, -2.389434814453125, -2.26123046875, -2.133026123046875, -2.00482177734375, -1.876617431640625, -1.7484130859375, -1.620208740234375, -1.49200439453125, -1.363800048828125, -1.235595703125, -1.107391357421875, -0.97918701171875, -0.850982666015625, -0.7227783203125, -0.594573974609375, -0.46636962890625, -0.338165283203125, -0.2099609375, -0.081756591796875, 0.04644775390625, 0.174652099609375, 0.3028564453125, 0.431060791015625, 0.55926513671875, 0.687469482421875, 0.815673828125, 0.943878173828125, 1.07208251953125, 1.200286865234375, 1.3284912109375, 1.456695556640625, 1.58489990234375, 1.713104248046875, 1.84130859375, 1.969512939453125, 2.09771728515625, 2.225921630859375, 2.3541259765625, 2.482330322265625, 2.61053466796875, 2.738739013671875, 2.866943359375, 2.995147705078125, 3.12335205078125, 3.251556396484375, 3.3797607421875, 3.507965087890625, 3.63616943359375, 3.764373779296875, 3.892578125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 4.0, 5.0, 2.0, 3.0, 5.0, 11.0, 16.0, 17.0, 26.0, 30.0, 51.0, 84.0, 113.0, 165.0, 211.0, 345.0, 474.0, 714.0, 1096.0, 1724.0, 2456.0, 3944.0, 6456.0, 11139.0, 19245.0, 34851.0, 67069.0, 130703.0, 224536.0, 234675.0, 143332.0, 74177.0, 38850.0, 20968.0, 11908.0, 7257.0, 4217.0, 2601.0, 1703.0, 1099.0, 723.0, 478.0, 304.0, 238.0, 160.0, 96.0, 80.0, 56.0, 48.0, 31.0, 22.0, 12.0, 7.0, 11.0, 6.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0], "bins": [-4.29296875, -4.15911865234375, -4.0252685546875, -3.89141845703125, -3.757568359375, -3.62371826171875, -3.4898681640625, -3.35601806640625, -3.22216796875, -3.08831787109375, -2.9544677734375, -2.82061767578125, -2.686767578125, -2.55291748046875, -2.4190673828125, -2.28521728515625, -2.1513671875, -2.01751708984375, -1.8836669921875, -1.74981689453125, -1.615966796875, -1.48211669921875, -1.3482666015625, -1.21441650390625, -1.08056640625, -0.94671630859375, -0.8128662109375, -0.67901611328125, -0.545166015625, -0.41131591796875, -0.2774658203125, -0.14361572265625, -0.009765625, 0.12408447265625, 0.2579345703125, 0.39178466796875, 0.525634765625, 0.65948486328125, 0.7933349609375, 0.92718505859375, 1.06103515625, 1.19488525390625, 1.3287353515625, 1.46258544921875, 1.596435546875, 1.73028564453125, 1.8641357421875, 1.99798583984375, 2.1318359375, 2.26568603515625, 2.3995361328125, 2.53338623046875, 2.667236328125, 2.80108642578125, 2.9349365234375, 3.06878662109375, 3.20263671875, 3.33648681640625, 3.4703369140625, 3.60418701171875, 3.738037109375, 3.87188720703125, 4.0057373046875, 4.13958740234375, 4.2734375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 8.0, 11.0, 7.0, 14.0, 15.0, 18.0, 11.0, 34.0, 40.0, 45.0, 75.0, 91.0, 88.0, 93.0, 85.0, 98.0, 66.0, 38.0, 42.0, 29.0, 17.0, 20.0, 12.0, 5.0, 5.0, 3.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003952980041503906, -0.0003823600709438324, -0.00036942213773727417, -0.00035648420453071594, -0.0003435462713241577, -0.0003306083381175995, -0.00031767040491104126, -0.00030473247170448303, -0.0002917945384979248, -0.0002788566052913666, -0.00026591867208480835, -0.0002529807388782501, -0.0002400428056716919, -0.00022710487246513367, -0.00021416693925857544, -0.0002012290060520172, -0.00018829107284545898, -0.00017535313963890076, -0.00016241520643234253, -0.0001494772732257843, -0.00013653934001922607, -0.00012360140681266785, -0.00011066347360610962, -9.772554039955139e-05, -8.478760719299316e-05, -7.184967398643494e-05, -5.891174077987671e-05, -4.597380757331848e-05, -3.3035874366760254e-05, -2.0097941160202026e-05, -7.160007953643799e-06, 5.777925252914429e-06, 1.8715858459472656e-05, 3.1653791666030884e-05, 4.459172487258911e-05, 5.752965807914734e-05, 7.046759128570557e-05, 8.34055244922638e-05, 9.634345769882202e-05, 0.00010928139090538025, 0.00012221932411193848, 0.0001351572573184967, 0.00014809519052505493, 0.00016103312373161316, 0.0001739710569381714, 0.00018690899014472961, 0.00019984692335128784, 0.00021278485655784607, 0.0002257227897644043, 0.00023866072297096252, 0.00025159865617752075, 0.000264536589384079, 0.0002774745225906372, 0.00029041245579719543, 0.00030335038900375366, 0.0003162883222103119, 0.0003292262554168701, 0.00034216418862342834, 0.00035510212182998657, 0.0003680400550365448, 0.00038097798824310303, 0.00039391592144966125, 0.0004068538546562195, 0.0004197917878627777, 0.00043272972106933594]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 5.0, 8.0, 9.0, 17.0, 28.0, 44.0, 71.0, 98.0, 150.0, 223.0, 357.0, 573.0, 906.0, 1552.0, 2530.0, 4752.0, 8468.0, 16540.0, 33628.0, 72863.0, 159625.0, 271150.0, 239826.0, 123562.0, 55799.0, 26386.0, 13190.0, 6911.0, 3799.0, 2128.0, 1270.0, 766.0, 447.0, 335.0, 183.0, 123.0, 82.0, 49.0, 48.0, 20.0, 13.0, 15.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.267822265625, -4.12939453125, -3.990966796875, -3.8525390625, -3.714111328125, -3.57568359375, -3.437255859375, -3.298828125, -3.160400390625, -3.02197265625, -2.883544921875, -2.7451171875, -2.606689453125, -2.46826171875, -2.329833984375, -2.19140625, -2.052978515625, -1.91455078125, -1.776123046875, -1.6376953125, -1.499267578125, -1.36083984375, -1.222412109375, -1.083984375, -0.945556640625, -0.80712890625, -0.668701171875, -0.5302734375, -0.391845703125, -0.25341796875, -0.114990234375, 0.0234375, 0.161865234375, 0.30029296875, 0.438720703125, 0.5771484375, 0.715576171875, 0.85400390625, 0.992431640625, 1.130859375, 1.269287109375, 1.40771484375, 1.546142578125, 1.6845703125, 1.822998046875, 1.96142578125, 2.099853515625, 2.23828125, 2.376708984375, 2.51513671875, 2.653564453125, 2.7919921875, 2.930419921875, 3.06884765625, 3.207275390625, 3.345703125, 3.484130859375, 3.62255859375, 3.760986328125, 3.8994140625, 4.037841796875, 4.17626953125, 4.314697265625, 4.453125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 11.0, 16.0, 16.0, 26.0, 32.0, 34.0, 42.0, 46.0, 43.0, 51.0, 54.0, 62.0, 41.0, 63.0, 60.0, 43.0, 45.0, 42.0, 42.0, 29.0, 34.0, 23.0, 19.0, 17.0, 9.0, 15.0, 12.0, 8.0, 9.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9111328125, -0.8812713623046875, -0.851409912109375, -0.8215484619140625, -0.79168701171875, -0.7618255615234375, -0.731964111328125, -0.7021026611328125, -0.6722412109375, -0.6423797607421875, -0.612518310546875, -0.5826568603515625, -0.55279541015625, -0.5229339599609375, -0.493072509765625, -0.4632110595703125, -0.433349609375, -0.4034881591796875, -0.373626708984375, -0.3437652587890625, -0.31390380859375, -0.2840423583984375, -0.254180908203125, -0.2243194580078125, -0.1944580078125, -0.1645965576171875, -0.134735107421875, -0.1048736572265625, -0.07501220703125, -0.0451507568359375, -0.015289306640625, 0.0145721435546875, 0.04443359375, 0.0742950439453125, 0.104156494140625, 0.1340179443359375, 0.16387939453125, 0.1937408447265625, 0.223602294921875, 0.2534637451171875, 0.2833251953125, 0.3131866455078125, 0.343048095703125, 0.3729095458984375, 0.40277099609375, 0.4326324462890625, 0.462493896484375, 0.4923553466796875, 0.522216796875, 0.5520782470703125, 0.581939697265625, 0.6118011474609375, 0.64166259765625, 0.6715240478515625, 0.701385498046875, 0.7312469482421875, 0.7611083984375, 0.7909698486328125, 0.820831298828125, 0.8506927490234375, 0.88055419921875, 0.9104156494140625, 0.940277099609375, 0.9701385498046875, 1.0]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 16.0, 11.0, 35.0, 30.0, 52.0, 66.0, 92.0, 111.0, 114.0, 107.0, 87.0, 56.0, 54.0, 39.0, 30.0, 30.0, 16.0, 11.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.589505195617676, -13.058735847473145, -12.527966499328613, -11.997196197509766, -11.466426849365234, -10.935657501220703, -10.404888153076172, -9.87411880493164, -9.34334945678711, -8.812580108642578, -8.281810760498047, -7.751040935516357, -7.220271110534668, -6.689501762390137, -6.1587324142456055, -5.627963066101074, -5.097192764282227, -4.566423416137695, -4.035653591156006, -3.5048842430114746, -2.9741146564483643, -2.443345069885254, -1.9125757217407227, -1.3818061351776123, -0.851036548614502, -0.3202670216560364, 0.2105025053024292, 0.74127197265625, 1.2720415592193604, 1.8028111457824707, 2.333580493927002, 2.8643500804901123, 3.395120620727539, 3.9258902072906494, 4.45665979385376, 4.987429141998291, 5.5181989669799805, 6.048968315124512, 6.579737663269043, 7.110507011413574, 7.641276836395264, 8.172046661376953, 8.702816009521484, 9.233585357666016, 9.764354705810547, 10.295124053955078, 10.82589340209961, 11.356663703918457, 11.887433052062988, 12.41820240020752, 12.94897174835205, 13.479742050170898, 14.01051139831543, 14.541280746459961, 15.072050094604492, 15.602819442749023, 16.133588790893555, 16.664358139038086, 17.195127487182617, 17.72589683532715, 18.25666618347168, 18.787437438964844, 19.318206787109375, 19.848976135253906, 20.379745483398438]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 4.0, 5.0, 8.0, 9.0, 14.0, 15.0, 13.0, 12.0, 15.0, 24.0, 22.0, 20.0, 18.0, 36.0, 38.0, 51.0, 37.0, 38.0, 51.0, 42.0, 50.0, 50.0, 39.0, 43.0, 43.0, 48.0, 38.0, 27.0, 36.0, 30.0, 21.0, 19.0, 13.0, 8.0, 11.0, 4.0, 13.0, 11.0, 8.0, 6.0, 3.0, 6.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.085474491119385, -6.859209060668945, -6.632943630218506, -6.406678199768066, -6.180412769317627, -5.9541473388671875, -5.727882385253906, -5.501616477966309, -5.275351524353027, -5.049086093902588, -4.822820663452148, -4.596555233001709, -4.3702898025512695, -4.14402437210083, -3.9177591800689697, -3.6914937496185303, -3.4652280807495117, -3.2389626502990723, -3.012697219848633, -2.7864317893981934, -2.560166358947754, -2.3339009284973145, -2.107635736465454, -1.8813703060150146, -1.6551048755645752, -1.4288394451141357, -1.2025740146636963, -0.9763087034225464, -0.7500432729721069, -0.5237778425216675, -0.2975125312805176, -0.07124710083007812, 0.15501880645751953, 0.3812842071056366, 0.6075496077537537, 0.8338149785995483, 1.0600804090499878, 1.2863458395004272, 1.5126111507415771, 1.7388765811920166, 1.965142011642456, 2.1914074420928955, 2.417672872543335, 2.6439380645751953, 2.8702034950256348, 3.096468925476074, 3.3227343559265137, 3.548999786376953, 3.7752652168273926, 4.001530647277832, 4.2277960777282715, 4.454061508178711, 4.68032693862915, 4.90659236907959, 5.132857322692871, 5.359123229980469, 5.58538818359375, 5.8116536140441895, 6.037919044494629, 6.264184474945068, 6.490449905395508, 6.716715335845947, 6.942980766296387, 7.169245719909668, 7.395511627197266]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 12.0, 15.0, 22.0, 29.0, 52.0, 84.0, 110.0, 173.0, 232.0, 402.0, 600.0, 944.0, 1493.0, 2454.0, 3921.0, 6798.0, 12765.0, 27804.0, 76413.0, 295921.0, 1279726.0, 1804334.0, 496411.0, 111959.0, 35505.0, 15410.0, 7985.0, 4573.0, 2823.0, 1828.0, 1139.0, 749.0, 524.0, 334.0, 258.0, 135.0, 91.0, 60.0, 51.0, 43.0, 32.0, 21.0, 20.0, 4.0, 7.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-15.3125, -14.804931640625, -14.29736328125, -13.789794921875, -13.2822265625, -12.774658203125, -12.26708984375, -11.759521484375, -11.251953125, -10.744384765625, -10.23681640625, -9.729248046875, -9.2216796875, -8.714111328125, -8.20654296875, -7.698974609375, -7.19140625, -6.683837890625, -6.17626953125, -5.668701171875, -5.1611328125, -4.653564453125, -4.14599609375, -3.638427734375, -3.130859375, -2.623291015625, -2.11572265625, -1.608154296875, -1.1005859375, -0.593017578125, -0.08544921875, 0.422119140625, 0.9296875, 1.437255859375, 1.94482421875, 2.452392578125, 2.9599609375, 3.467529296875, 3.97509765625, 4.482666015625, 4.990234375, 5.497802734375, 6.00537109375, 6.512939453125, 7.0205078125, 7.528076171875, 8.03564453125, 8.543212890625, 9.05078125, 9.558349609375, 10.06591796875, 10.573486328125, 11.0810546875, 11.588623046875, 12.09619140625, 12.603759765625, 13.111328125, 13.618896484375, 14.12646484375, 14.634033203125, 15.1416015625, 15.649169921875, 16.15673828125, 16.664306640625, 17.171875]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 3.0, 3.0, 13.0, 10.0, 8.0, 11.0, 18.0, 12.0, 18.0, 21.0, 26.0, 23.0, 35.0, 42.0, 30.0, 46.0, 38.0, 53.0, 37.0, 59.0, 50.0, 45.0, 35.0, 42.0, 46.0, 41.0, 48.0, 38.0, 19.0, 21.0, 28.0, 12.0, 14.0, 8.0, 8.0, 9.0, 13.0, 5.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.6768798828125, -5.474853515625, -5.2728271484375, -5.07080078125, -4.8687744140625, -4.666748046875, -4.4647216796875, -4.2626953125, -4.0606689453125, -3.858642578125, -3.6566162109375, -3.45458984375, -3.2525634765625, -3.050537109375, -2.8485107421875, -2.646484375, -2.4444580078125, -2.242431640625, -2.0404052734375, -1.83837890625, -1.6363525390625, -1.434326171875, -1.2322998046875, -1.0302734375, -0.8282470703125, -0.626220703125, -0.4241943359375, -0.22216796875, -0.0201416015625, 0.181884765625, 0.3839111328125, 0.5859375, 0.7879638671875, 0.989990234375, 1.1920166015625, 1.39404296875, 1.5960693359375, 1.798095703125, 2.0001220703125, 2.2021484375, 2.4041748046875, 2.606201171875, 2.8082275390625, 3.01025390625, 3.2122802734375, 3.414306640625, 3.6163330078125, 3.818359375, 4.0203857421875, 4.222412109375, 4.4244384765625, 4.62646484375, 4.8284912109375, 5.030517578125, 5.2325439453125, 5.4345703125, 5.6365966796875, 5.838623046875, 6.0406494140625, 6.24267578125, 6.4447021484375, 6.646728515625, 6.8487548828125, 7.05078125]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 17.0, 29.0, 31.0, 49.0, 66.0, 110.0, 188.0, 245.0, 367.0, 566.0, 968.0, 1531.0, 2737.0, 4802.0, 8825.0, 16955.0, 36283.0, 89575.0, 298218.0, 1467608.0, 1722603.0, 358849.0, 102247.0, 40648.0, 18806.0, 9459.0, 5146.0, 2916.0, 1678.0, 978.0, 591.0, 397.0, 269.0, 164.0, 114.0, 80.0, 41.0, 37.0, 24.0, 11.0, 9.0, 12.0, 3.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.703125, -19.088623046875, -18.47412109375, -17.859619140625, -17.2451171875, -16.630615234375, -16.01611328125, -15.401611328125, -14.787109375, -14.172607421875, -13.55810546875, -12.943603515625, -12.3291015625, -11.714599609375, -11.10009765625, -10.485595703125, -9.87109375, -9.256591796875, -8.64208984375, -8.027587890625, -7.4130859375, -6.798583984375, -6.18408203125, -5.569580078125, -4.955078125, -4.340576171875, -3.72607421875, -3.111572265625, -2.4970703125, -1.882568359375, -1.26806640625, -0.653564453125, -0.0390625, 0.575439453125, 1.18994140625, 1.804443359375, 2.4189453125, 3.033447265625, 3.64794921875, 4.262451171875, 4.876953125, 5.491455078125, 6.10595703125, 6.720458984375, 7.3349609375, 7.949462890625, 8.56396484375, 9.178466796875, 9.79296875, 10.407470703125, 11.02197265625, 11.636474609375, 12.2509765625, 12.865478515625, 13.47998046875, 14.094482421875, 14.708984375, 15.323486328125, 15.93798828125, 16.552490234375, 17.1669921875, 17.781494140625, 18.39599609375, 19.010498046875, 19.625]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 9.0, 8.0, 8.0, 9.0, 15.0, 7.0, 16.0, 27.0, 40.0, 41.0, 62.0, 69.0, 111.0, 157.0, 211.0, 264.0, 361.0, 418.0, 463.0, 420.0, 324.0, 273.0, 218.0, 137.0, 93.0, 73.0, 57.0, 36.0, 38.0, 24.0, 20.0, 20.0, 12.0, 10.0, 9.0, 2.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.9296875, -4.79815673828125, -4.6666259765625, -4.53509521484375, -4.403564453125, -4.27203369140625, -4.1405029296875, -4.00897216796875, -3.87744140625, -3.74591064453125, -3.6143798828125, -3.48284912109375, -3.351318359375, -3.21978759765625, -3.0882568359375, -2.95672607421875, -2.8251953125, -2.69366455078125, -2.5621337890625, -2.43060302734375, -2.299072265625, -2.16754150390625, -2.0360107421875, -1.90447998046875, -1.77294921875, -1.64141845703125, -1.5098876953125, -1.37835693359375, -1.246826171875, -1.11529541015625, -0.9837646484375, -0.85223388671875, -0.720703125, -0.58917236328125, -0.4576416015625, -0.32611083984375, -0.194580078125, -0.06304931640625, 0.0684814453125, 0.20001220703125, 0.33154296875, 0.46307373046875, 0.5946044921875, 0.72613525390625, 0.857666015625, 0.98919677734375, 1.1207275390625, 1.25225830078125, 1.3837890625, 1.51531982421875, 1.6468505859375, 1.77838134765625, 1.909912109375, 2.04144287109375, 2.1729736328125, 2.30450439453125, 2.43603515625, 2.56756591796875, 2.6990966796875, 2.83062744140625, 2.962158203125, 3.09368896484375, 3.2252197265625, 3.35675048828125, 3.48828125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 7.0, 1.0, 7.0, 6.0, 5.0, 17.0, 18.0, 38.0, 38.0, 78.0, 84.0, 108.0, 133.0, 127.0, 95.0, 93.0, 49.0, 34.0, 19.0, 17.0, 13.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.147273063659668, -14.506760597229004, -13.86624813079834, -13.225735664367676, -12.585222244262695, -11.944709777832031, -11.304197311401367, -10.663684844970703, -10.023172378540039, -9.382659912109375, -8.742147445678711, -8.101634979248047, -7.461122035980225, -6.8206095695495605, -6.180096626281738, -5.539584159851074, -4.89907169342041, -4.258559226989746, -3.618046522140503, -2.9775338172912598, -2.3370213508605957, -1.6965088844299316, -1.0559961795806885, -0.4154834747314453, 0.22502899169921875, 0.8655415773391724, 1.506054162979126, 2.146566867828369, 2.787079334259033, 3.4275918006896973, 4.0681047439575195, 4.708617210388184, 5.349128723144531, 5.989641189575195, 6.630153656005859, 7.270666599273682, 7.911179065704346, 8.551691055297852, 9.192204475402832, 9.832716941833496, 10.47322940826416, 11.113741874694824, 11.754254341125488, 12.394766807556152, 13.035280227661133, 13.675792694091797, 14.316305160522461, 14.956817626953125, 15.597330093383789, 16.237842559814453, 16.878355026245117, 17.51886749267578, 18.159379959106445, 18.79989242553711, 19.440404891967773, 20.080917358398438, 20.721431732177734, 21.3619441986084, 22.002456665039062, 22.642969131469727, 23.28348159790039, 23.923994064331055, 24.56450653076172, 25.205020904541016, 25.845531463623047]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 4.0, 9.0, 10.0, 10.0, 10.0, 14.0, 17.0, 25.0, 24.0, 26.0, 32.0, 23.0, 32.0, 34.0, 35.0, 52.0, 44.0, 55.0, 52.0, 38.0, 43.0, 43.0, 44.0, 45.0, 32.0, 31.0, 26.0, 27.0, 20.0, 20.0, 28.0, 14.0, 19.0, 12.0, 11.0, 7.0, 6.0, 1.0, 3.0, 7.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.655154705047607, -6.415656089782715, -6.176156997680664, -5.9366583824157715, -5.697159767150879, -5.457660675048828, -5.2181620597839355, -4.978663444519043, -4.739164352416992, -4.4996657371521, -4.260166645050049, -4.020668029785156, -3.7811691761016846, -3.541670322418213, -3.3021717071533203, -3.0626728534698486, -2.823173999786377, -2.5836751461029053, -2.3441762924194336, -2.104677677154541, -1.8651788234710693, -1.6256799697875977, -1.3861812353134155, -1.1466825008392334, -0.9071836471557617, -0.6676848530769348, -0.4281860589981079, -0.188687264919281, 0.0508115291595459, 0.2903103828430176, 0.5298091173171997, 0.7693078517913818, 1.0088071823120117, 1.2483060359954834, 1.4878047704696655, 1.7273035049438477, 1.9668023586273193, 2.206301212310791, 2.4457998275756836, 2.6852986812591553, 2.924797534942627, 3.1642963886260986, 3.4037952423095703, 3.643293857574463, 3.8827927112579346, 4.122291564941406, 4.361790180206299, 4.601288795471191, 4.840787887573242, 5.080286502838135, 5.3197855949401855, 5.559284210205078, 5.798783302307129, 6.0382819175720215, 6.277780532836914, 6.517279624938965, 6.756778240203857, 6.99627685546875, 7.235775947570801, 7.475274562835693, 7.714773178100586, 7.954272270202637, 8.193771362304688, 8.433269500732422, 8.672768592834473]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 8.0, 14.0, 18.0, 15.0, 38.0, 50.0, 71.0, 107.0, 178.0, 276.0, 452.0, 660.0, 1188.0, 2036.0, 3606.0, 6637.0, 12279.0, 24365.0, 50243.0, 115224.0, 275033.0, 305359.0, 135156.0, 57700.0, 27067.0, 13886.0, 7289.0, 4082.0, 2178.0, 1255.0, 788.0, 448.0, 300.0, 183.0, 130.0, 78.0, 48.0, 34.0, 29.0, 7.0, 9.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.138671875, -1.0981292724609375, -1.057586669921875, -1.0170440673828125, -0.97650146484375, -0.9359588623046875, -0.895416259765625, -0.8548736572265625, -0.8143310546875, -0.7737884521484375, -0.733245849609375, -0.6927032470703125, -0.65216064453125, -0.6116180419921875, -0.571075439453125, -0.5305328369140625, -0.489990234375, -0.4494476318359375, -0.408905029296875, -0.3683624267578125, -0.32781982421875, -0.2872772216796875, -0.246734619140625, -0.2061920166015625, -0.1656494140625, -0.1251068115234375, -0.084564208984375, -0.0440216064453125, -0.00347900390625, 0.0370635986328125, 0.077606201171875, 0.1181488037109375, 0.15869140625, 0.1992340087890625, 0.239776611328125, 0.2803192138671875, 0.32086181640625, 0.3614044189453125, 0.401947021484375, 0.4424896240234375, 0.4830322265625, 0.5235748291015625, 0.564117431640625, 0.6046600341796875, 0.64520263671875, 0.6857452392578125, 0.726287841796875, 0.7668304443359375, 0.807373046875, 0.8479156494140625, 0.888458251953125, 0.9290008544921875, 0.96954345703125, 1.0100860595703125, 1.050628662109375, 1.0911712646484375, 1.1317138671875, 1.1722564697265625, 1.212799072265625, 1.2533416748046875, 1.29388427734375, 1.3344268798828125, 1.374969482421875, 1.4155120849609375, 1.4560546875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 2.0, 4.0, 13.0, 14.0, 8.0, 13.0, 11.0, 21.0, 27.0, 30.0, 31.0, 29.0, 30.0, 33.0, 44.0, 52.0, 56.0, 49.0, 38.0, 54.0, 38.0, 58.0, 43.0, 36.0, 30.0, 31.0, 31.0, 26.0, 21.0, 27.0, 19.0, 20.0, 15.0, 11.0, 5.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.1171875, -7.8360595703125, -7.554931640625, -7.2738037109375, -6.99267578125, -6.7115478515625, -6.430419921875, -6.1492919921875, -5.8681640625, -5.5870361328125, -5.305908203125, -5.0247802734375, -4.74365234375, -4.4625244140625, -4.181396484375, -3.9002685546875, -3.619140625, -3.3380126953125, -3.056884765625, -2.7757568359375, -2.49462890625, -2.2135009765625, -1.932373046875, -1.6512451171875, -1.3701171875, -1.0889892578125, -0.807861328125, -0.5267333984375, -0.24560546875, 0.0355224609375, 0.316650390625, 0.5977783203125, 0.87890625, 1.1600341796875, 1.441162109375, 1.7222900390625, 2.00341796875, 2.2845458984375, 2.565673828125, 2.8468017578125, 3.1279296875, 3.4090576171875, 3.690185546875, 3.9713134765625, 4.25244140625, 4.5335693359375, 4.814697265625, 5.0958251953125, 5.376953125, 5.6580810546875, 5.939208984375, 6.2203369140625, 6.50146484375, 6.7825927734375, 7.063720703125, 7.3448486328125, 7.6259765625, 7.9071044921875, 8.188232421875, 8.4693603515625, 8.75048828125, 9.0316162109375, 9.312744140625, 9.5938720703125, 9.875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 10.0, 6.0, 12.0, 8.0, 18.0, 19.0, 29.0, 31.0, 38.0, 84.0, 85.0, 144.0, 222.0, 276.0, 396.0, 655.0, 982.0, 1679.0, 3083.0, 6009.0, 12757.0, 35007.0, 790684.0, 152523.0, 23178.0, 9758.0, 4556.0, 2397.0, 1333.0, 792.0, 553.0, 351.0, 248.0, 164.0, 122.0, 90.0, 66.0, 54.0, 38.0, 19.0, 15.0, 15.0, 18.0, 7.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-3.11328125, -3.021209716796875, -2.92913818359375, -2.837066650390625, -2.7449951171875, -2.652923583984375, -2.56085205078125, -2.468780517578125, -2.376708984375, -2.284637451171875, -2.19256591796875, -2.100494384765625, -2.0084228515625, -1.916351318359375, -1.82427978515625, -1.732208251953125, -1.64013671875, -1.548065185546875, -1.45599365234375, -1.363922119140625, -1.2718505859375, -1.179779052734375, -1.08770751953125, -0.995635986328125, -0.903564453125, -0.811492919921875, -0.71942138671875, -0.627349853515625, -0.5352783203125, -0.443206787109375, -0.35113525390625, -0.259063720703125, -0.1669921875, -0.074920654296875, 0.01715087890625, 0.109222412109375, 0.2012939453125, 0.293365478515625, 0.38543701171875, 0.477508544921875, 0.569580078125, 0.661651611328125, 0.75372314453125, 0.845794677734375, 0.9378662109375, 1.029937744140625, 1.12200927734375, 1.214080810546875, 1.30615234375, 1.398223876953125, 1.49029541015625, 1.582366943359375, 1.6744384765625, 1.766510009765625, 1.85858154296875, 1.950653076171875, 2.042724609375, 2.134796142578125, 2.22686767578125, 2.318939208984375, 2.4110107421875, 2.503082275390625, 2.59515380859375, 2.687225341796875, 2.779296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 8.0, 12.0, 7.0, 9.0, 14.0, 20.0, 22.0, 25.0, 27.0, 24.0, 22.0, 30.0, 33.0, 33.0, 53.0, 42.0, 43.0, 38.0, 32.0, 46.0, 47.0, 48.0, 43.0, 36.0, 35.0, 40.0, 34.0, 21.0, 19.0, 17.0, 22.0, 14.0, 17.0, 16.0, 10.0, 8.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.15234375, -5.0015869140625, -4.850830078125, -4.7000732421875, -4.54931640625, -4.3985595703125, -4.247802734375, -4.0970458984375, -3.9462890625, -3.7955322265625, -3.644775390625, -3.4940185546875, -3.34326171875, -3.1925048828125, -3.041748046875, -2.8909912109375, -2.740234375, -2.5894775390625, -2.438720703125, -2.2879638671875, -2.13720703125, -1.9864501953125, -1.835693359375, -1.6849365234375, -1.5341796875, -1.3834228515625, -1.232666015625, -1.0819091796875, -0.93115234375, -0.7803955078125, -0.629638671875, -0.4788818359375, -0.328125, -0.1773681640625, -0.026611328125, 0.1241455078125, 0.27490234375, 0.4256591796875, 0.576416015625, 0.7271728515625, 0.8779296875, 1.0286865234375, 1.179443359375, 1.3302001953125, 1.48095703125, 1.6317138671875, 1.782470703125, 1.9332275390625, 2.083984375, 2.2347412109375, 2.385498046875, 2.5362548828125, 2.68701171875, 2.8377685546875, 2.988525390625, 3.1392822265625, 3.2900390625, 3.4407958984375, 3.591552734375, 3.7423095703125, 3.89306640625, 4.0438232421875, 4.194580078125, 4.3453369140625, 4.49609375]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 17.0, 27.0, 37.0, 51.0, 71.0, 116.0, 179.0, 291.0, 556.0, 951.0, 1931.0, 4432.0, 11935.0, 47029.0, 930650.0, 33030.0, 9643.0, 3793.0, 1748.0, 877.0, 432.0, 256.0, 173.0, 90.0, 72.0, 45.0, 27.0, 26.0, 14.0, 12.0, 3.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87353515625, -0.8416519165039062, -0.8097686767578125, -0.7778854370117188, -0.746002197265625, -0.7141189575195312, -0.6822357177734375, -0.6503524780273438, -0.61846923828125, -0.5865859985351562, -0.5547027587890625, -0.5228195190429688, -0.490936279296875, -0.45905303955078125, -0.4271697998046875, -0.39528656005859375, -0.3634033203125, -0.33152008056640625, -0.2996368408203125, -0.26775360107421875, -0.235870361328125, -0.20398712158203125, -0.1721038818359375, -0.14022064208984375, -0.10833740234375, -0.07645416259765625, -0.0445709228515625, -0.01268768310546875, 0.019195556640625, 0.05107879638671875, 0.0829620361328125, 0.11484527587890625, 0.146728515625, 0.17861175537109375, 0.2104949951171875, 0.24237823486328125, 0.274261474609375, 0.30614471435546875, 0.3380279541015625, 0.36991119384765625, 0.40179443359375, 0.43367767333984375, 0.4655609130859375, 0.49744415283203125, 0.529327392578125, 0.5612106323242188, 0.5930938720703125, 0.6249771118164062, 0.6568603515625, 0.6887435913085938, 0.7206268310546875, 0.7525100708007812, 0.784393310546875, 0.8162765502929688, 0.8481597900390625, 0.8800430297851562, 0.91192626953125, 0.9438095092773438, 0.9756927490234375, 1.0075759887695312, 1.039459228515625, 1.0713424682617188, 1.1032257080078125, 1.1351089477539062, 1.1669921875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 6.0, 10.0, 9.0, 15.0, 17.0, 15.0, 24.0, 21.0, 30.0, 36.0, 30.0, 36.0, 49.0, 36.0, 61.0, 46.0, 68.0, 62.0, 54.0, 53.0, 29.0, 49.0, 44.0, 30.0, 23.0, 22.0, 20.0, 23.0, 17.0, 14.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.7147274017333984e-05, -4.558078944683075e-05, -4.4014304876327515e-05, -4.244782030582428e-05, -4.0881335735321045e-05, -3.931485116481781e-05, -3.7748366594314575e-05, -3.618188202381134e-05, -3.4615397453308105e-05, -3.304891288280487e-05, -3.1482428312301636e-05, -2.99159437417984e-05, -2.8349459171295166e-05, -2.678297460079193e-05, -2.5216490030288696e-05, -2.365000545978546e-05, -2.2083520889282227e-05, -2.0517036318778992e-05, -1.8950551748275757e-05, -1.7384067177772522e-05, -1.5817582607269287e-05, -1.4251098036766052e-05, -1.2684613466262817e-05, -1.1118128895759583e-05, -9.551644325256348e-06, -7.985159754753113e-06, -6.418675184249878e-06, -4.852190613746643e-06, -3.285706043243408e-06, -1.7192214727401733e-06, -1.5273690223693848e-07, 1.4137476682662964e-06, 2.9802322387695312e-06, 4.546716809272766e-06, 6.113201379776001e-06, 7.679685950279236e-06, 9.24617052078247e-06, 1.0812655091285706e-05, 1.237913966178894e-05, 1.3945624232292175e-05, 1.551210880279541e-05, 1.7078593373298645e-05, 1.864507794380188e-05, 2.0211562514305115e-05, 2.177804708480835e-05, 2.3344531655311584e-05, 2.491101622581482e-05, 2.6477500796318054e-05, 2.804398536682129e-05, 2.9610469937324524e-05, 3.117695450782776e-05, 3.2743439078330994e-05, 3.430992364883423e-05, 3.587640821933746e-05, 3.74428927898407e-05, 3.900937736034393e-05, 4.057586193084717e-05, 4.21423465013504e-05, 4.370883107185364e-05, 4.527531564235687e-05, 4.684180021286011e-05, 4.840828478336334e-05, 4.997476935386658e-05, 5.154125392436981e-05, 5.310773849487305e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 11.0, 13.0, 12.0, 18.0, 31.0, 40.0, 54.0, 71.0, 102.0, 164.0, 257.0, 383.0, 672.0, 1065.0, 1951.0, 3895.0, 8779.0, 22267.0, 65904.0, 230195.0, 456617.0, 172668.0, 50732.0, 17817.0, 7153.0, 3324.0, 1717.0, 937.0, 620.0, 371.0, 235.0, 130.0, 109.0, 70.0, 43.0, 35.0, 25.0, 21.0, 10.0, 9.0, 10.0, 4.0, 5.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.379638671875, -0.3671455383300781, -0.35465240478515625, -0.3421592712402344, -0.3296661376953125, -0.3171730041503906, -0.30467987060546875, -0.2921867370605469, -0.279693603515625, -0.2672004699707031, -0.25470733642578125, -0.24221420288085938, -0.2297210693359375, -0.21722793579101562, -0.20473480224609375, -0.19224166870117188, -0.17974853515625, -0.16725540161132812, -0.15476226806640625, -0.14226913452148438, -0.1297760009765625, -0.11728286743164062, -0.10478973388671875, -0.09229660034179688, -0.079803466796875, -0.06731033325195312, -0.05481719970703125, -0.042324066162109375, -0.0298309326171875, -0.017337799072265625, -0.00484466552734375, 0.007648468017578125, 0.0201416015625, 0.032634735107421875, 0.04512786865234375, 0.057621002197265625, 0.0701141357421875, 0.08260726928710938, 0.09510040283203125, 0.10759353637695312, 0.120086669921875, 0.13257980346679688, 0.14507293701171875, 0.15756607055664062, 0.1700592041015625, 0.18255233764648438, 0.19504547119140625, 0.20753860473632812, 0.22003173828125, 0.23252487182617188, 0.24501800537109375, 0.2575111389160156, 0.2700042724609375, 0.2824974060058594, 0.29499053955078125, 0.3074836730957031, 0.319976806640625, 0.3324699401855469, 0.34496307373046875, 0.3574562072753906, 0.3699493408203125, 0.3824424743652344, 0.39493560791015625, 0.4074287414550781, 0.419921875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 13.0, 17.0, 19.0, 31.0, 42.0, 45.0, 60.0, 75.0, 103.0, 108.0, 92.0, 103.0, 72.0, 63.0, 41.0, 31.0, 23.0, 11.0, 10.0, 10.0, 7.0, 5.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09588623046875, -0.0928792953491211, -0.08987236022949219, -0.08686542510986328, -0.08385848999023438, -0.08085155487060547, -0.07784461975097656, -0.07483768463134766, -0.07183074951171875, -0.06882381439208984, -0.06581687927246094, -0.06280994415283203, -0.059803009033203125, -0.05679607391357422, -0.05378913879394531, -0.050782203674316406, -0.0477752685546875, -0.044768333435058594, -0.04176139831542969, -0.03875446319580078, -0.035747528076171875, -0.03274059295654297, -0.029733657836914062, -0.026726722717285156, -0.02371978759765625, -0.020712852478027344, -0.017705917358398438, -0.014698982238769531, -0.011692047119140625, -0.008685111999511719, -0.0056781768798828125, -0.0026712417602539062, 0.000335693359375, 0.0033426284790039062, 0.0063495635986328125, 0.009356498718261719, 0.012363433837890625, 0.015370368957519531, 0.018377304077148438, 0.021384239196777344, 0.02439117431640625, 0.027398109436035156, 0.030405044555664062, 0.03341197967529297, 0.036418914794921875, 0.03942584991455078, 0.04243278503417969, 0.045439720153808594, 0.0484466552734375, 0.051453590393066406, 0.05446052551269531, 0.05746746063232422, 0.060474395751953125, 0.06348133087158203, 0.06648826599121094, 0.06949520111083984, 0.07250213623046875, 0.07550907135009766, 0.07851600646972656, 0.08152294158935547, 0.08452987670898438, 0.08753681182861328, 0.09054374694824219, 0.0935506820678711, 0.0965576171875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 2.0, 9.0, 6.0, 16.0, 16.0, 26.0, 44.0, 60.0, 82.0, 102.0, 114.0, 143.0, 104.0, 94.0, 62.0, 39.0, 26.0, 15.0, 12.0, 13.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.588719367980957, -13.953987121582031, -13.319253921508789, -12.684521675109863, -12.049788475036621, -11.415056228637695, -10.780323028564453, -10.145590782165527, -9.510858535766602, -8.876126289367676, -8.241393089294434, -7.606660842895508, -6.971927642822266, -6.33719539642334, -5.702462673187256, -5.067729949951172, -4.43299674987793, -3.7982640266418457, -3.1635313034057617, -2.528798818588257, -1.8940660953521729, -1.2593333721160889, -0.624600887298584, 0.0101318359375, 0.644864559173584, 1.279597282409668, 1.9143298864364624, 2.549062490463257, 3.183795213699341, 3.818527936935425, 4.45326042175293, 5.087993144989014, 5.722724914550781, 6.357457637786865, 6.992190361022949, 7.626922607421875, 8.261655807495117, 8.896388053894043, 9.531120300292969, 10.165853500366211, 10.800586700439453, 11.435318946838379, 12.070052146911621, 12.704784393310547, 13.339517593383789, 13.974249839782715, 14.60898208618164, 15.243715286254883, 15.878447532653809, 16.513179779052734, 17.147912979125977, 17.78264617919922, 18.417377471923828, 19.05211067199707, 19.686843872070312, 20.321575164794922, 20.956308364868164, 21.591041564941406, 22.225772857666016, 22.860506057739258, 23.4952392578125, 24.129972457885742, 24.76470375061035, 25.399436950683594, 26.034170150756836]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 11.0, 9.0, 10.0, 10.0, 16.0, 16.0, 26.0, 24.0, 24.0, 35.0, 23.0, 31.0, 37.0, 32.0, 53.0, 43.0, 62.0, 47.0, 41.0, 41.0, 46.0, 45.0, 37.0, 34.0, 28.0, 30.0, 27.0, 18.0, 21.0, 26.0, 15.0, 17.0, 14.0, 11.0, 6.0, 5.0, 0.0, 4.0, 6.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.627356052398682, -6.388107776641846, -6.148859977722168, -5.909611701965332, -5.670363426208496, -5.431115627288818, -5.191867351531982, -4.952619552612305, -4.713371276855469, -4.474123001098633, -4.234875202178955, -3.995626926422119, -3.7563788890838623, -3.5171308517456055, -3.2778825759887695, -3.0386345386505127, -2.799386501312256, -2.560138463973999, -2.320890426635742, -2.0816421508789062, -1.8423941135406494, -1.6031460762023926, -1.3638979196548462, -1.1246497631072998, -0.885401725769043, -0.6461536288261414, -0.40690553188323975, -0.16765743494033813, 0.07159066200256348, 0.3108386993408203, 0.5500868558883667, 0.7893350124359131, 1.0285835266113281, 1.267831563949585, 1.5070797204971313, 1.7463278770446777, 1.9855759143829346, 2.2248239517211914, 2.4640722274780273, 2.703320264816284, 2.942568302154541, 3.181816339492798, 3.4210643768310547, 3.6603126525878906, 3.8995606899261475, 4.138808727264404, 4.37805700302124, 4.617304801940918, 4.856553077697754, 5.09580135345459, 5.335049152374268, 5.5742974281311035, 5.813545227050781, 6.052793502807617, 6.292041778564453, 6.531290054321289, 6.770537853240967, 7.009786128997803, 7.2490339279174805, 7.488282203674316, 7.727530479431152, 7.96677827835083, 8.206026077270508, 8.445274353027344, 8.68452262878418]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 4.0, 5.0, 12.0, 13.0, 19.0, 29.0, 46.0, 80.0, 107.0, 163.0, 242.0, 358.0, 672.0, 1049.0, 1715.0, 2896.0, 5204.0, 9498.0, 17750.0, 34878.0, 71154.0, 145050.0, 248303.0, 239778.0, 134232.0, 65391.0, 32074.0, 16744.0, 8894.0, 4968.0, 2841.0, 1582.0, 1056.0, 614.0, 403.0, 241.0, 158.0, 123.0, 71.0, 52.0, 32.0, 19.0, 13.0, 12.0, 4.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.5234375, -9.25091552734375, -8.9783935546875, -8.70587158203125, -8.433349609375, -8.16082763671875, -7.8883056640625, -7.61578369140625, -7.34326171875, -7.07073974609375, -6.7982177734375, -6.52569580078125, -6.253173828125, -5.98065185546875, -5.7081298828125, -5.43560791015625, -5.1630859375, -4.89056396484375, -4.6180419921875, -4.34552001953125, -4.072998046875, -3.80047607421875, -3.5279541015625, -3.25543212890625, -2.98291015625, -2.71038818359375, -2.4378662109375, -2.16534423828125, -1.892822265625, -1.62030029296875, -1.3477783203125, -1.07525634765625, -0.802734375, -0.53021240234375, -0.2576904296875, 0.01483154296875, 0.287353515625, 0.55987548828125, 0.8323974609375, 1.10491943359375, 1.37744140625, 1.64996337890625, 1.9224853515625, 2.19500732421875, 2.467529296875, 2.74005126953125, 3.0125732421875, 3.28509521484375, 3.5576171875, 3.83013916015625, 4.1026611328125, 4.37518310546875, 4.647705078125, 4.92022705078125, 5.1927490234375, 5.46527099609375, 5.73779296875, 6.01031494140625, 6.2828369140625, 6.55535888671875, 6.827880859375, 7.10040283203125, 7.3729248046875, 7.64544677734375, 7.91796875]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 3.0, 8.0, 8.0, 8.0, 11.0, 19.0, 14.0, 28.0, 26.0, 26.0, 25.0, 29.0, 30.0, 30.0, 53.0, 41.0, 39.0, 55.0, 52.0, 47.0, 56.0, 43.0, 41.0, 35.0, 39.0, 37.0, 30.0, 24.0, 24.0, 15.0, 16.0, 16.0, 11.0, 11.0, 9.0, 5.0, 4.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.30047607421875, -7.0345458984375, -6.76861572265625, -6.502685546875, -6.23675537109375, -5.9708251953125, -5.70489501953125, -5.43896484375, -5.17303466796875, -4.9071044921875, -4.64117431640625, -4.375244140625, -4.10931396484375, -3.8433837890625, -3.57745361328125, -3.3115234375, -3.04559326171875, -2.7796630859375, -2.51373291015625, -2.247802734375, -1.98187255859375, -1.7159423828125, -1.45001220703125, -1.18408203125, -0.91815185546875, -0.6522216796875, -0.38629150390625, -0.120361328125, 0.14556884765625, 0.4114990234375, 0.67742919921875, 0.943359375, 1.20928955078125, 1.4752197265625, 1.74114990234375, 2.007080078125, 2.27301025390625, 2.5389404296875, 2.80487060546875, 3.07080078125, 3.33673095703125, 3.6026611328125, 3.86859130859375, 4.134521484375, 4.40045166015625, 4.6663818359375, 4.93231201171875, 5.1982421875, 5.46417236328125, 5.7301025390625, 5.99603271484375, 6.261962890625, 6.52789306640625, 6.7938232421875, 7.05975341796875, 7.32568359375, 7.59161376953125, 7.8575439453125, 8.12347412109375, 8.389404296875, 8.65533447265625, 8.9212646484375, 9.18719482421875, 9.453125]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 11.0, 15.0, 23.0, 29.0, 48.0, 67.0, 108.0, 156.0, 259.0, 324.0, 518.0, 797.0, 1240.0, 1878.0, 2730.0, 4375.0, 6557.0, 10335.0, 16234.0, 26215.0, 43157.0, 71229.0, 114211.0, 163437.0, 181417.0, 148112.0, 97363.0, 59813.0, 36363.0, 22178.0, 13986.0, 8948.0, 5573.0, 3695.0, 2457.0, 1557.0, 1042.0, 675.0, 470.0, 313.0, 228.0, 149.0, 86.0, 59.0, 36.0, 27.0, 17.0, 16.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.09765625, -5.90301513671875, -5.7083740234375, -5.51373291015625, -5.319091796875, -5.12445068359375, -4.9298095703125, -4.73516845703125, -4.54052734375, -4.34588623046875, -4.1512451171875, -3.95660400390625, -3.761962890625, -3.56732177734375, -3.3726806640625, -3.17803955078125, -2.9833984375, -2.78875732421875, -2.5941162109375, -2.39947509765625, -2.204833984375, -2.01019287109375, -1.8155517578125, -1.62091064453125, -1.42626953125, -1.23162841796875, -1.0369873046875, -0.84234619140625, -0.647705078125, -0.45306396484375, -0.2584228515625, -0.06378173828125, 0.130859375, 0.32550048828125, 0.5201416015625, 0.71478271484375, 0.909423828125, 1.10406494140625, 1.2987060546875, 1.49334716796875, 1.68798828125, 1.88262939453125, 2.0772705078125, 2.27191162109375, 2.466552734375, 2.66119384765625, 2.8558349609375, 3.05047607421875, 3.2451171875, 3.43975830078125, 3.6343994140625, 3.82904052734375, 4.023681640625, 4.21832275390625, 4.4129638671875, 4.60760498046875, 4.80224609375, 4.99688720703125, 5.1915283203125, 5.38616943359375, 5.580810546875, 5.77545166015625, 5.9700927734375, 6.16473388671875, 6.359375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 9.0, 8.0, 11.0, 15.0, 12.0, 10.0, 27.0, 13.0, 19.0, 20.0, 25.0, 23.0, 30.0, 23.0, 36.0, 23.0, 39.0, 47.0, 34.0, 41.0, 47.0, 39.0, 47.0, 28.0, 28.0, 30.0, 35.0, 34.0, 30.0, 28.0, 25.0, 18.0, 18.0, 13.0, 17.0, 11.0, 9.0, 11.0, 11.0, 9.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.96875, -3.847015380859375, -3.72528076171875, -3.603546142578125, -3.4818115234375, -3.360076904296875, -3.23834228515625, -3.116607666015625, -2.994873046875, -2.873138427734375, -2.75140380859375, -2.629669189453125, -2.5079345703125, -2.386199951171875, -2.26446533203125, -2.142730712890625, -2.02099609375, -1.899261474609375, -1.77752685546875, -1.655792236328125, -1.5340576171875, -1.412322998046875, -1.29058837890625, -1.168853759765625, -1.047119140625, -0.925384521484375, -0.80364990234375, -0.681915283203125, -0.5601806640625, -0.438446044921875, -0.31671142578125, -0.194976806640625, -0.0732421875, 0.048492431640625, 0.17022705078125, 0.291961669921875, 0.4136962890625, 0.535430908203125, 0.65716552734375, 0.778900146484375, 0.900634765625, 1.022369384765625, 1.14410400390625, 1.265838623046875, 1.3875732421875, 1.509307861328125, 1.63104248046875, 1.752777099609375, 1.87451171875, 1.996246337890625, 2.11798095703125, 2.239715576171875, 2.3614501953125, 2.483184814453125, 2.60491943359375, 2.726654052734375, 2.848388671875, 2.970123291015625, 3.09185791015625, 3.213592529296875, 3.3353271484375, 3.457061767578125, 3.57879638671875, 3.700531005859375, 3.822265625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 10.0, 12.0, 20.0, 39.0, 53.0, 88.0, 106.0, 172.0, 239.0, 333.0, 574.0, 928.0, 1454.0, 2335.0, 3787.0, 6661.0, 11949.0, 22954.0, 46275.0, 97682.0, 194068.0, 265135.0, 195199.0, 99131.0, 46929.0, 23364.0, 12135.0, 6716.0, 3775.0, 2344.0, 1466.0, 918.0, 556.0, 366.0, 236.0, 169.0, 108.0, 83.0, 58.0, 41.0, 21.0, 16.0, 21.0, 8.0, 6.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-4.59765625, -4.46044921875, -4.3232421875, -4.18603515625, -4.048828125, -3.91162109375, -3.7744140625, -3.63720703125, -3.5, -3.36279296875, -3.2255859375, -3.08837890625, -2.951171875, -2.81396484375, -2.6767578125, -2.53955078125, -2.40234375, -2.26513671875, -2.1279296875, -1.99072265625, -1.853515625, -1.71630859375, -1.5791015625, -1.44189453125, -1.3046875, -1.16748046875, -1.0302734375, -0.89306640625, -0.755859375, -0.61865234375, -0.4814453125, -0.34423828125, -0.20703125, -0.06982421875, 0.0673828125, 0.20458984375, 0.341796875, 0.47900390625, 0.6162109375, 0.75341796875, 0.890625, 1.02783203125, 1.1650390625, 1.30224609375, 1.439453125, 1.57666015625, 1.7138671875, 1.85107421875, 1.98828125, 2.12548828125, 2.2626953125, 2.39990234375, 2.537109375, 2.67431640625, 2.8115234375, 2.94873046875, 3.0859375, 3.22314453125, 3.3603515625, 3.49755859375, 3.634765625, 3.77197265625, 3.9091796875, 4.04638671875, 4.18359375]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 2.0, 4.0, 10.0, 12.0, 17.0, 23.0, 44.0, 34.0, 48.0, 67.0, 78.0, 85.0, 104.0, 91.0, 92.0, 68.0, 58.0, 32.0, 34.0, 22.0, 18.0, 14.0, 11.0, 12.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041365623474121094, -0.0003996603190898895, -0.0003856644034385681, -0.0003716684877872467, -0.0003576725721359253, -0.0003436766564846039, -0.00032968074083328247, -0.00031568482518196106, -0.00030168890953063965, -0.00028769299387931824, -0.0002736970782279968, -0.0002597011625766754, -0.000245705246925354, -0.0002317093312740326, -0.00021771341562271118, -0.00020371749997138977, -0.00018972158432006836, -0.00017572566866874695, -0.00016172975301742554, -0.00014773383736610413, -0.00013373792171478271, -0.0001197420060634613, -0.00010574609041213989, -9.175017476081848e-05, -7.775425910949707e-05, -6.375834345817566e-05, -4.976242780685425e-05, -3.576651215553284e-05, -2.1770596504211426e-05, -7.774680852890015e-06, 6.2212347984313965e-06, 2.0217150449752808e-05, 3.421306610107422e-05, 4.820898175239563e-05, 6.220489740371704e-05, 7.620081305503845e-05, 9.019672870635986e-05, 0.00010419264435768127, 0.00011818856000900269, 0.0001321844756603241, 0.0001461803913116455, 0.00016017630696296692, 0.00017417222261428833, 0.00018816813826560974, 0.00020216405391693115, 0.00021615996956825256, 0.00023015588521957397, 0.0002441518008708954, 0.0002581477165222168, 0.0002721436321735382, 0.0002861395478248596, 0.00030013546347618103, 0.00031413137912750244, 0.00032812729477882385, 0.00034212321043014526, 0.0003561191260814667, 0.0003701150417327881, 0.0003841109573841095, 0.0003981068730354309, 0.0004121027886867523, 0.00042609870433807373, 0.00044009461998939514, 0.00045409053564071655, 0.00046808645129203796, 0.0004820823669433594]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 12.0, 14.0, 22.0, 29.0, 40.0, 59.0, 83.0, 137.0, 216.0, 314.0, 484.0, 826.0, 1247.0, 2237.0, 3868.0, 7039.0, 13234.0, 26406.0, 55344.0, 115264.0, 207341.0, 250776.0, 179669.0, 93236.0, 44256.0, 21498.0, 10867.0, 5733.0, 3310.0, 1858.0, 1153.0, 701.0, 446.0, 271.0, 201.0, 108.0, 81.0, 44.0, 49.0, 27.0, 17.0, 12.0, 4.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.98046875, -3.864593505859375, -3.74871826171875, -3.632843017578125, -3.5169677734375, -3.401092529296875, -3.28521728515625, -3.169342041015625, -3.053466796875, -2.937591552734375, -2.82171630859375, -2.705841064453125, -2.5899658203125, -2.474090576171875, -2.35821533203125, -2.242340087890625, -2.12646484375, -2.010589599609375, -1.89471435546875, -1.778839111328125, -1.6629638671875, -1.547088623046875, -1.43121337890625, -1.315338134765625, -1.199462890625, -1.083587646484375, -0.96771240234375, -0.851837158203125, -0.7359619140625, -0.620086669921875, -0.50421142578125, -0.388336181640625, -0.2724609375, -0.156585693359375, -0.04071044921875, 0.075164794921875, 0.1910400390625, 0.306915283203125, 0.42279052734375, 0.538665771484375, 0.654541015625, 0.770416259765625, 0.88629150390625, 1.002166748046875, 1.1180419921875, 1.233917236328125, 1.34979248046875, 1.465667724609375, 1.58154296875, 1.697418212890625, 1.81329345703125, 1.929168701171875, 2.0450439453125, 2.160919189453125, 2.27679443359375, 2.392669677734375, 2.508544921875, 2.624420166015625, 2.74029541015625, 2.856170654296875, 2.9720458984375, 3.087921142578125, 3.20379638671875, 3.319671630859375, 3.435546875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 2.0, 7.0, 6.0, 6.0, 14.0, 21.0, 20.0, 22.0, 18.0, 19.0, 42.0, 38.0, 43.0, 47.0, 41.0, 56.0, 47.0, 41.0, 64.0, 49.0, 54.0, 40.0, 46.0, 42.0, 36.0, 19.0, 30.0, 20.0, 18.0, 11.0, 12.0, 10.0, 8.0, 9.0, 8.0, 5.0, 4.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78759765625, -0.763946533203125, -0.74029541015625, -0.716644287109375, -0.6929931640625, -0.669342041015625, -0.64569091796875, -0.622039794921875, -0.598388671875, -0.574737548828125, -0.55108642578125, -0.527435302734375, -0.5037841796875, -0.480133056640625, -0.45648193359375, -0.432830810546875, -0.4091796875, -0.385528564453125, -0.36187744140625, -0.338226318359375, -0.3145751953125, -0.290924072265625, -0.26727294921875, -0.243621826171875, -0.219970703125, -0.196319580078125, -0.17266845703125, -0.149017333984375, -0.1253662109375, -0.101715087890625, -0.07806396484375, -0.054412841796875, -0.03076171875, -0.007110595703125, 0.01654052734375, 0.040191650390625, 0.0638427734375, 0.087493896484375, 0.11114501953125, 0.134796142578125, 0.158447265625, 0.182098388671875, 0.20574951171875, 0.229400634765625, 0.2530517578125, 0.276702880859375, 0.30035400390625, 0.324005126953125, 0.34765625, 0.371307373046875, 0.39495849609375, 0.418609619140625, 0.4422607421875, 0.465911865234375, 0.48956298828125, 0.513214111328125, 0.536865234375, 0.560516357421875, 0.58416748046875, 0.607818603515625, 0.6314697265625, 0.655120849609375, 0.67877197265625, 0.702423095703125, 0.72607421875]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 9.0, 18.0, 15.0, 30.0, 53.0, 66.0, 73.0, 103.0, 124.0, 144.0, 108.0, 86.0, 53.0, 33.0, 21.0, 17.0, 15.0, 7.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.656908988952637, -15.024646759033203, -14.392385482788086, -13.760123252868652, -13.127861022949219, -12.495599746704102, -11.863337516784668, -11.231075286865234, -10.598814010620117, -9.966551780700684, -9.334290504455566, -8.702028274536133, -8.0697660446167, -7.437504291534424, -6.805242538452148, -6.172980308532715, -5.540718078613281, -4.908456325531006, -4.276194095611572, -3.643932342529297, -3.0116703510284424, -2.379408359527588, -1.7471466064453125, -1.114884376525879, -0.4826226234436035, 0.1496393084526062, 0.7819012403488159, 1.4141631126403809, 2.0464251041412354, 2.67868709564209, 3.3109488487243652, 3.943211078643799, 4.575471878051758, 5.207733631134033, 5.839995861053467, 6.472257614135742, 7.104519844055176, 7.736781597137451, 8.369043350219727, 9.00130558013916, 9.633567810058594, 10.265830039978027, 10.898091316223145, 11.530353546142578, 12.162615776062012, 12.794878005981445, 13.427139282226562, 14.059401512145996, 14.691662788391113, 15.323925018310547, 15.956186294555664, 16.58844757080078, 17.22071075439453, 17.85297203063965, 18.485233306884766, 19.117496490478516, 19.749757766723633, 20.38201904296875, 21.0142822265625, 21.646543502807617, 22.278804779052734, 22.911067962646484, 23.5433292388916, 24.17559051513672, 24.80785369873047]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 6.0, 2.0, 5.0, 6.0, 3.0, 5.0, 6.0, 6.0, 13.0, 12.0, 20.0, 16.0, 22.0, 26.0, 22.0, 29.0, 30.0, 33.0, 30.0, 42.0, 25.0, 39.0, 36.0, 40.0, 42.0, 44.0, 53.0, 37.0, 45.0, 41.0, 28.0, 31.0, 21.0, 30.0, 17.0, 22.0, 22.0, 19.0, 12.0, 18.0, 12.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.366284370422363, -6.142533779144287, -5.918783187866211, -5.695032596588135, -5.471282005310059, -5.247531414031982, -5.023780822753906, -4.800029754638672, -4.576279640197754, -4.352529048919678, -4.128778457641602, -3.9050278663635254, -3.681277275085449, -3.457526683807373, -3.2337758541107178, -3.0100252628326416, -2.7862744331359863, -2.56252384185791, -2.338773250579834, -2.115022659301758, -1.891271948814392, -1.667521357536316, -1.4437706470489502, -1.220020055770874, -0.9962694644927979, -0.7725188732147217, -0.5487682223320007, -0.3250175714492798, -0.10126698017120361, 0.12248361110687256, 0.3462343215942383, 0.5699849128723145, 0.7937350273132324, 1.0174856185913086, 1.2412362098693848, 1.4649869203567505, 1.6887375116348267, 1.9124881029129028, 2.1362388134002686, 2.3599894046783447, 2.583739995956421, 2.807490587234497, 3.0312411785125732, 3.2549920082092285, 3.4787425994873047, 3.702493190765381, 3.926243782043457, 4.149994373321533, 4.373744964599609, 4.5974955558776855, 4.821246147155762, 5.044996738433838, 5.268747329711914, 5.49249792098999, 5.716248512268066, 5.939999580383301, 6.163749694824219, 6.387500286102295, 6.611250877380371, 6.835001468658447, 7.058752059936523, 7.2825026512146, 7.506253242492676, 7.73000431060791, 7.953754901885986]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 12.0, 19.0, 18.0, 42.0, 50.0, 101.0, 115.0, 199.0, 270.0, 372.0, 583.0, 933.0, 1434.0, 2381.0, 3874.0, 6789.0, 13418.0, 30001.0, 82840.0, 313856.0, 1295830.0, 1748907.0, 496010.0, 118915.0, 38436.0, 16816.0, 8548.0, 4890.0, 2946.0, 1876.0, 1238.0, 778.0, 570.0, 375.0, 221.0, 177.0, 143.0, 72.0, 46.0, 57.0, 38.0, 22.0, 23.0, 12.0, 8.0, 8.0, 7.0, 3.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.65625, -14.1357421875, -13.615234375, -13.0947265625, -12.57421875, -12.0537109375, -11.533203125, -11.0126953125, -10.4921875, -9.9716796875, -9.451171875, -8.9306640625, -8.41015625, -7.8896484375, -7.369140625, -6.8486328125, -6.328125, -5.8076171875, -5.287109375, -4.7666015625, -4.24609375, -3.7255859375, -3.205078125, -2.6845703125, -2.1640625, -1.6435546875, -1.123046875, -0.6025390625, -0.08203125, 0.4384765625, 0.958984375, 1.4794921875, 2.0, 2.5205078125, 3.041015625, 3.5615234375, 4.08203125, 4.6025390625, 5.123046875, 5.6435546875, 6.1640625, 6.6845703125, 7.205078125, 7.7255859375, 8.24609375, 8.7666015625, 9.287109375, 9.8076171875, 10.328125, 10.8486328125, 11.369140625, 11.8896484375, 12.41015625, 12.9306640625, 13.451171875, 13.9716796875, 14.4921875, 15.0126953125, 15.533203125, 16.0537109375, 16.57421875, 17.0947265625, 17.615234375, 18.1357421875, 18.65625]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 3.0, 4.0, 6.0, 7.0, 10.0, 15.0, 13.0, 12.0, 20.0, 24.0, 27.0, 28.0, 21.0, 28.0, 24.0, 33.0, 27.0, 36.0, 47.0, 37.0, 32.0, 39.0, 44.0, 46.0, 40.0, 40.0, 42.0, 28.0, 31.0, 27.0, 25.0, 19.0, 20.0, 17.0, 22.0, 15.0, 10.0, 13.0, 10.0, 6.0, 7.0, 7.0, 7.0, 4.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5234375, -5.3424072265625, -5.161376953125, -4.9803466796875, -4.79931640625, -4.6182861328125, -4.437255859375, -4.2562255859375, -4.0751953125, -3.8941650390625, -3.713134765625, -3.5321044921875, -3.35107421875, -3.1700439453125, -2.989013671875, -2.8079833984375, -2.626953125, -2.4459228515625, -2.264892578125, -2.0838623046875, -1.90283203125, -1.7218017578125, -1.540771484375, -1.3597412109375, -1.1787109375, -0.9976806640625, -0.816650390625, -0.6356201171875, -0.45458984375, -0.2735595703125, -0.092529296875, 0.0885009765625, 0.26953125, 0.4505615234375, 0.631591796875, 0.8126220703125, 0.99365234375, 1.1746826171875, 1.355712890625, 1.5367431640625, 1.7177734375, 1.8988037109375, 2.079833984375, 2.2608642578125, 2.44189453125, 2.6229248046875, 2.803955078125, 2.9849853515625, 3.166015625, 3.3470458984375, 3.528076171875, 3.7091064453125, 3.89013671875, 4.0711669921875, 4.252197265625, 4.4332275390625, 4.6142578125, 4.7952880859375, 4.976318359375, 5.1573486328125, 5.33837890625, 5.5194091796875, 5.700439453125, 5.8814697265625, 6.0625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 3.0, 2.0, 11.0, 7.0, 16.0, 14.0, 30.0, 47.0, 59.0, 68.0, 101.0, 134.0, 197.0, 283.0, 367.0, 532.0, 805.0, 1185.0, 1698.0, 2613.0, 3829.0, 6059.0, 9797.0, 16906.0, 30493.0, 62119.0, 148453.0, 444945.0, 1461128.0, 1340481.0, 396857.0, 135225.0, 58186.0, 29285.0, 15972.0, 9180.0, 5807.0, 3801.0, 2335.0, 1605.0, 1046.0, 729.0, 513.0, 389.0, 262.0, 174.0, 145.0, 118.0, 80.0, 58.0, 42.0, 27.0, 25.0, 21.0, 10.0, 5.0, 3.0, 4.0, 4.0, 5.0, 1.0], "bins": [-15.8671875, -15.37060546875, -14.8740234375, -14.37744140625, -13.880859375, -13.38427734375, -12.8876953125, -12.39111328125, -11.89453125, -11.39794921875, -10.9013671875, -10.40478515625, -9.908203125, -9.41162109375, -8.9150390625, -8.41845703125, -7.921875, -7.42529296875, -6.9287109375, -6.43212890625, -5.935546875, -5.43896484375, -4.9423828125, -4.44580078125, -3.94921875, -3.45263671875, -2.9560546875, -2.45947265625, -1.962890625, -1.46630859375, -0.9697265625, -0.47314453125, 0.0234375, 0.52001953125, 1.0166015625, 1.51318359375, 2.009765625, 2.50634765625, 3.0029296875, 3.49951171875, 3.99609375, 4.49267578125, 4.9892578125, 5.48583984375, 5.982421875, 6.47900390625, 6.9755859375, 7.47216796875, 7.96875, 8.46533203125, 8.9619140625, 9.45849609375, 9.955078125, 10.45166015625, 10.9482421875, 11.44482421875, 11.94140625, 12.43798828125, 12.9345703125, 13.43115234375, 13.927734375, 14.42431640625, 14.9208984375, 15.41748046875, 15.9140625]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 2.0, 4.0, 10.0, 7.0, 10.0, 9.0, 24.0, 23.0, 24.0, 30.0, 60.0, 61.0, 86.0, 112.0, 162.0, 163.0, 225.0, 325.0, 387.0, 411.0, 405.0, 361.0, 278.0, 223.0, 157.0, 114.0, 94.0, 80.0, 47.0, 43.0, 29.0, 21.0, 15.0, 15.0, 6.0, 14.0, 5.0, 7.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0], "bins": [-4.015625, -3.889404296875, -3.76318359375, -3.636962890625, -3.5107421875, -3.384521484375, -3.25830078125, -3.132080078125, -3.005859375, -2.879638671875, -2.75341796875, -2.627197265625, -2.5009765625, -2.374755859375, -2.24853515625, -2.122314453125, -1.99609375, -1.869873046875, -1.74365234375, -1.617431640625, -1.4912109375, -1.364990234375, -1.23876953125, -1.112548828125, -0.986328125, -0.860107421875, -0.73388671875, -0.607666015625, -0.4814453125, -0.355224609375, -0.22900390625, -0.102783203125, 0.0234375, 0.149658203125, 0.27587890625, 0.402099609375, 0.5283203125, 0.654541015625, 0.78076171875, 0.906982421875, 1.033203125, 1.159423828125, 1.28564453125, 1.411865234375, 1.5380859375, 1.664306640625, 1.79052734375, 1.916748046875, 2.04296875, 2.169189453125, 2.29541015625, 2.421630859375, 2.5478515625, 2.674072265625, 2.80029296875, 2.926513671875, 3.052734375, 3.178955078125, 3.30517578125, 3.431396484375, 3.5576171875, 3.683837890625, 3.81005859375, 3.936279296875, 4.0625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 12.0, 3.0, 15.0, 20.0, 26.0, 22.0, 39.0, 62.0, 58.0, 88.0, 98.0, 110.0, 89.0, 78.0, 66.0, 53.0, 28.0, 27.0, 24.0, 15.0, 9.0, 14.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.730976104736328, -17.2108154296875, -16.690654754638672, -16.170494079589844, -15.6503324508667, -15.130171775817871, -14.610010147094727, -14.089849472045898, -13.56968879699707, -13.049528121948242, -12.529367446899414, -12.00920581817627, -11.489045143127441, -10.968884468078613, -10.448722839355469, -9.92856216430664, -9.408401489257812, -8.888240814208984, -8.368080139160156, -7.847918510437012, -7.327757835388184, -6.8075971603393555, -6.287436008453369, -5.767274856567383, -5.247114181518555, -4.726953506469727, -4.20679235458374, -3.686631441116333, -3.166470527648926, -2.6463096141815186, -2.1261487007141113, -1.605987787246704, -1.0858268737792969, -0.5656659603118896, -0.04550504684448242, 0.4746558666229248, 0.994816780090332, 1.5149776935577393, 2.0351386070251465, 2.5552995204925537, 3.075460433959961, 3.595621347427368, 4.115782260894775, 4.635943412780762, 5.15610408782959, 5.676264762878418, 6.196425914764404, 6.716587066650391, 7.236747741699219, 7.756908416748047, 8.277069091796875, 8.79723072052002, 9.317391395568848, 9.837552070617676, 10.35771369934082, 10.877874374389648, 11.398035049438477, 11.918195724487305, 12.438356399536133, 12.958518028259277, 13.478678703308105, 13.998839378356934, 14.519001007080078, 15.039161682128906, 15.559322357177734]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 2.0, 3.0, 9.0, 12.0, 18.0, 15.0, 22.0, 21.0, 22.0, 26.0, 22.0, 38.0, 27.0, 40.0, 39.0, 41.0, 31.0, 49.0, 42.0, 32.0, 42.0, 36.0, 45.0, 47.0, 33.0, 31.0, 29.0, 35.0, 25.0, 25.0, 25.0, 16.0, 18.0, 11.0, 15.0, 15.0, 8.0, 9.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.691618919372559, -7.438811302185059, -7.186003684997559, -6.9331955909729, -6.6803879737854, -6.4275803565979, -6.174772262573242, -5.921964645385742, -5.669157028198242, -5.416349411010742, -5.163541793823242, -4.910733699798584, -4.657926082611084, -4.405118465423584, -4.152310371398926, -3.899502754211426, -3.646695137023926, -3.393887519836426, -3.1410796642303467, -2.8882718086242676, -2.6354641914367676, -2.3826565742492676, -2.1298487186431885, -1.877040982246399, -1.6242332458496094, -1.3714255094528198, -1.1186177730560303, -0.8658100366592407, -0.6130023002624512, -0.3601945638656616, -0.10738682746887207, 0.14542090892791748, 0.39822864532470703, 0.6510363817214966, 0.9038441181182861, 1.1566518545150757, 1.4094595909118652, 1.6622673273086548, 1.9150750637054443, 2.1678829193115234, 2.4206905364990234, 2.6734981536865234, 2.9263060092926025, 3.1791138648986816, 3.4319214820861816, 3.6847290992736816, 3.9375369548797607, 4.19034481048584, 4.44315242767334, 4.69596004486084, 4.94876766204834, 5.201575756072998, 5.454383373260498, 5.707190990447998, 5.959999084472656, 6.212806701660156, 6.465614318847656, 6.718421936035156, 6.971229553222656, 7.2240376472473145, 7.4768452644348145, 7.7296528816223145, 7.982460975646973, 8.235268592834473, 8.488076210021973]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 12.0, 12.0, 9.0, 35.0, 37.0, 54.0, 87.0, 121.0, 188.0, 275.0, 453.0, 644.0, 1156.0, 1943.0, 3002.0, 5279.0, 9391.0, 16388.0, 30784.0, 59803.0, 126620.0, 267534.0, 267713.0, 127072.0, 59942.0, 31037.0, 16417.0, 9161.0, 5160.0, 3147.0, 1895.0, 1182.0, 658.0, 465.0, 303.0, 190.0, 131.0, 79.0, 55.0, 48.0, 21.0, 16.0, 11.0, 7.0, 8.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.205078125, -1.1685638427734375, -1.132049560546875, -1.0955352783203125, -1.05902099609375, -1.0225067138671875, -0.985992431640625, -0.9494781494140625, -0.9129638671875, -0.8764495849609375, -0.839935302734375, -0.8034210205078125, -0.76690673828125, -0.7303924560546875, -0.693878173828125, -0.6573638916015625, -0.620849609375, -0.5843353271484375, -0.547821044921875, -0.5113067626953125, -0.47479248046875, -0.4382781982421875, -0.401763916015625, -0.3652496337890625, -0.3287353515625, -0.2922210693359375, -0.255706787109375, -0.2191925048828125, -0.18267822265625, -0.1461639404296875, -0.109649658203125, -0.0731353759765625, -0.03662109375, -0.0001068115234375, 0.036407470703125, 0.0729217529296875, 0.10943603515625, 0.1459503173828125, 0.182464599609375, 0.2189788818359375, 0.2554931640625, 0.2920074462890625, 0.328521728515625, 0.3650360107421875, 0.40155029296875, 0.4380645751953125, 0.474578857421875, 0.5110931396484375, 0.547607421875, 0.5841217041015625, 0.620635986328125, 0.6571502685546875, 0.69366455078125, 0.7301788330078125, 0.766693115234375, 0.8032073974609375, 0.8397216796875, 0.8762359619140625, 0.912750244140625, 0.9492645263671875, 0.98577880859375, 1.0222930908203125, 1.058807373046875, 1.0953216552734375, 1.1318359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 7.0, 6.0, 7.0, 8.0, 14.0, 25.0, 17.0, 20.0, 20.0, 26.0, 31.0, 32.0, 28.0, 34.0, 37.0, 38.0, 31.0, 40.0, 49.0, 36.0, 32.0, 36.0, 41.0, 52.0, 35.0, 36.0, 26.0, 35.0, 27.0, 29.0, 14.0, 24.0, 16.0, 14.0, 15.0, 10.0, 9.0, 5.0, 13.0, 9.0, 3.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.4765625, -8.20458984375, -7.9326171875, -7.66064453125, -7.388671875, -7.11669921875, -6.8447265625, -6.57275390625, -6.30078125, -6.02880859375, -5.7568359375, -5.48486328125, -5.212890625, -4.94091796875, -4.6689453125, -4.39697265625, -4.125, -3.85302734375, -3.5810546875, -3.30908203125, -3.037109375, -2.76513671875, -2.4931640625, -2.22119140625, -1.94921875, -1.67724609375, -1.4052734375, -1.13330078125, -0.861328125, -0.58935546875, -0.3173828125, -0.04541015625, 0.2265625, 0.49853515625, 0.7705078125, 1.04248046875, 1.314453125, 1.58642578125, 1.8583984375, 2.13037109375, 2.40234375, 2.67431640625, 2.9462890625, 3.21826171875, 3.490234375, 3.76220703125, 4.0341796875, 4.30615234375, 4.578125, 4.85009765625, 5.1220703125, 5.39404296875, 5.666015625, 5.93798828125, 6.2099609375, 6.48193359375, 6.75390625, 7.02587890625, 7.2978515625, 7.56982421875, 7.841796875, 8.11376953125, 8.3857421875, 8.65771484375, 8.9296875]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 6.0, 5.0, 9.0, 14.0, 20.0, 13.0, 26.0, 45.0, 67.0, 64.0, 83.0, 116.0, 177.0, 243.0, 348.0, 558.0, 776.0, 1236.0, 2053.0, 3426.0, 6235.0, 12705.0, 29797.0, 390431.0, 539497.0, 31813.0, 12850.0, 6423.0, 3489.0, 2044.0, 1189.0, 883.0, 537.0, 376.0, 264.0, 198.0, 147.0, 94.0, 87.0, 47.0, 38.0, 38.0, 29.0, 16.0, 11.0, 5.0, 8.0, 7.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.560546875, -2.47802734375, -2.3955078125, -2.31298828125, -2.23046875, -2.14794921875, -2.0654296875, -1.98291015625, -1.900390625, -1.81787109375, -1.7353515625, -1.65283203125, -1.5703125, -1.48779296875, -1.4052734375, -1.32275390625, -1.240234375, -1.15771484375, -1.0751953125, -0.99267578125, -0.91015625, -0.82763671875, -0.7451171875, -0.66259765625, -0.580078125, -0.49755859375, -0.4150390625, -0.33251953125, -0.25, -0.16748046875, -0.0849609375, -0.00244140625, 0.080078125, 0.16259765625, 0.2451171875, 0.32763671875, 0.41015625, 0.49267578125, 0.5751953125, 0.65771484375, 0.740234375, 0.82275390625, 0.9052734375, 0.98779296875, 1.0703125, 1.15283203125, 1.2353515625, 1.31787109375, 1.400390625, 1.48291015625, 1.5654296875, 1.64794921875, 1.73046875, 1.81298828125, 1.8955078125, 1.97802734375, 2.060546875, 2.14306640625, 2.2255859375, 2.30810546875, 2.390625, 2.47314453125, 2.5556640625, 2.63818359375, 2.720703125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 4.0, 6.0, 2.0, 11.0, 8.0, 11.0, 19.0, 16.0, 20.0, 29.0, 19.0, 19.0, 34.0, 30.0, 35.0, 23.0, 30.0, 34.0, 39.0, 41.0, 39.0, 42.0, 45.0, 37.0, 29.0, 35.0, 34.0, 39.0, 34.0, 31.0, 32.0, 24.0, 19.0, 20.0, 16.0, 11.0, 11.0, 19.0, 17.0, 9.0, 7.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.40625, -5.24871826171875, -5.0911865234375, -4.93365478515625, -4.776123046875, -4.61859130859375, -4.4610595703125, -4.30352783203125, -4.14599609375, -3.98846435546875, -3.8309326171875, -3.67340087890625, -3.515869140625, -3.35833740234375, -3.2008056640625, -3.04327392578125, -2.8857421875, -2.72821044921875, -2.5706787109375, -2.41314697265625, -2.255615234375, -2.09808349609375, -1.9405517578125, -1.78302001953125, -1.62548828125, -1.46795654296875, -1.3104248046875, -1.15289306640625, -0.995361328125, -0.83782958984375, -0.6802978515625, -0.52276611328125, -0.365234375, -0.20770263671875, -0.0501708984375, 0.10736083984375, 0.264892578125, 0.42242431640625, 0.5799560546875, 0.73748779296875, 0.89501953125, 1.05255126953125, 1.2100830078125, 1.36761474609375, 1.525146484375, 1.68267822265625, 1.8402099609375, 1.99774169921875, 2.1552734375, 2.31280517578125, 2.4703369140625, 2.62786865234375, 2.785400390625, 2.94293212890625, 3.1004638671875, 3.25799560546875, 3.41552734375, 3.57305908203125, 3.7305908203125, 3.88812255859375, 4.045654296875, 4.20318603515625, 4.3607177734375, 4.51824951171875, 4.67578125]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 19.0, 20.0, 33.0, 43.0, 78.0, 107.0, 169.0, 244.0, 421.0, 731.0, 1217.0, 2271.0, 4854.0, 10589.0, 28562.0, 879573.0, 85427.0, 18429.0, 7571.0, 3644.0, 1859.0, 1043.0, 582.0, 396.0, 207.0, 141.0, 105.0, 55.0, 38.0, 35.0, 21.0, 22.0, 7.0, 6.0, 5.0, 3.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.77880859375, -0.7576446533203125, -0.736480712890625, -0.7153167724609375, -0.69415283203125, -0.6729888916015625, -0.651824951171875, -0.6306610107421875, -0.6094970703125, -0.5883331298828125, -0.567169189453125, -0.5460052490234375, -0.52484130859375, -0.5036773681640625, -0.482513427734375, -0.4613494873046875, -0.440185546875, -0.4190216064453125, -0.397857666015625, -0.3766937255859375, -0.35552978515625, -0.3343658447265625, -0.313201904296875, -0.2920379638671875, -0.2708740234375, -0.2497100830078125, -0.228546142578125, -0.2073822021484375, -0.18621826171875, -0.1650543212890625, -0.143890380859375, -0.1227264404296875, -0.1015625, -0.0803985595703125, -0.059234619140625, -0.0380706787109375, -0.01690673828125, 0.0042572021484375, 0.025421142578125, 0.0465850830078125, 0.0677490234375, 0.0889129638671875, 0.110076904296875, 0.1312408447265625, 0.15240478515625, 0.1735687255859375, 0.194732666015625, 0.2158966064453125, 0.237060546875, 0.2582244873046875, 0.279388427734375, 0.3005523681640625, 0.32171630859375, 0.3428802490234375, 0.364044189453125, 0.3852081298828125, 0.4063720703125, 0.4275360107421875, 0.448699951171875, 0.4698638916015625, 0.49102783203125, 0.5121917724609375, 0.533355712890625, 0.5545196533203125, 0.57568359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 7.0, 2.0, 7.0, 5.0, 11.0, 8.0, 11.0, 13.0, 19.0, 14.0, 28.0, 18.0, 24.0, 37.0, 29.0, 26.0, 32.0, 35.0, 33.0, 49.0, 52.0, 53.0, 45.0, 43.0, 48.0, 39.0, 32.0, 37.0, 40.0, 27.0, 26.0, 26.0, 12.0, 15.0, 20.0, 17.0, 14.0, 8.0, 6.0, 5.0, 8.0, 2.0, 6.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.166364669799805e-05, -4.036352038383484e-05, -3.906339406967163e-05, -3.776326775550842e-05, -3.6463141441345215e-05, -3.516301512718201e-05, -3.38628888130188e-05, -3.256276249885559e-05, -3.126263618469238e-05, -2.9962509870529175e-05, -2.8662383556365967e-05, -2.736225724220276e-05, -2.606213092803955e-05, -2.4762004613876343e-05, -2.3461878299713135e-05, -2.2161751985549927e-05, -2.086162567138672e-05, -1.956149935722351e-05, -1.8261373043060303e-05, -1.6961246728897095e-05, -1.5661120414733887e-05, -1.4360994100570679e-05, -1.306086778640747e-05, -1.1760741472244263e-05, -1.0460615158081055e-05, -9.160488843917847e-06, -7.860362529754639e-06, -6.560236215591431e-06, -5.260109901428223e-06, -3.959983587265015e-06, -2.6598572731018066e-06, -1.3597309589385986e-06, -5.960464477539063e-08, 1.2405216693878174e-06, 2.5406479835510254e-06, 3.840774297714233e-06, 5.140900611877441e-06, 6.441026926040649e-06, 7.741153240203857e-06, 9.041279554367065e-06, 1.0341405868530273e-05, 1.1641532182693481e-05, 1.294165849685669e-05, 1.4241784811019897e-05, 1.5541911125183105e-05, 1.6842037439346313e-05, 1.814216375350952e-05, 1.944229006767273e-05, 2.0742416381835938e-05, 2.2042542695999146e-05, 2.3342669010162354e-05, 2.464279532432556e-05, 2.594292163848877e-05, 2.7243047952651978e-05, 2.8543174266815186e-05, 2.9843300580978394e-05, 3.11434268951416e-05, 3.244355320930481e-05, 3.374367952346802e-05, 3.5043805837631226e-05, 3.6343932151794434e-05, 3.764405846595764e-05, 3.894418478012085e-05, 4.024431109428406e-05, 4.1544437408447266e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 14.0, 11.0, 18.0, 24.0, 33.0, 56.0, 59.0, 97.0, 107.0, 199.0, 329.0, 449.0, 643.0, 978.0, 1475.0, 2514.0, 4079.0, 6763.0, 12121.0, 22717.0, 44433.0, 91264.0, 189691.0, 286513.0, 193168.0, 92751.0, 44871.0, 22773.0, 12330.0, 6949.0, 4033.0, 2460.0, 1608.0, 964.0, 662.0, 430.0, 279.0, 214.0, 134.0, 101.0, 70.0, 40.0, 31.0, 29.0, 24.0, 8.0, 6.0, 9.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.2039794921875, -0.19750595092773438, -0.19103240966796875, -0.18455886840820312, -0.1780853271484375, -0.17161178588867188, -0.16513824462890625, -0.15866470336914062, -0.152191162109375, -0.14571762084960938, -0.13924407958984375, -0.13277053833007812, -0.1262969970703125, -0.11982345581054688, -0.11334991455078125, -0.10687637329101562, -0.10040283203125, -0.09392929077148438, -0.08745574951171875, -0.08098220825195312, -0.0745086669921875, -0.06803512573242188, -0.06156158447265625, -0.055088043212890625, -0.048614501953125, -0.042140960693359375, -0.03566741943359375, -0.029193878173828125, -0.0227203369140625, -0.016246795654296875, -0.00977325439453125, -0.003299713134765625, 0.003173828125, 0.009647369384765625, 0.01612091064453125, 0.022594451904296875, 0.0290679931640625, 0.035541534423828125, 0.04201507568359375, 0.048488616943359375, 0.054962158203125, 0.061435699462890625, 0.06790924072265625, 0.07438278198242188, 0.0808563232421875, 0.08732986450195312, 0.09380340576171875, 0.10027694702148438, 0.10675048828125, 0.11322402954101562, 0.11969757080078125, 0.12617111206054688, 0.1326446533203125, 0.13911819458007812, 0.14559173583984375, 0.15206527709960938, 0.158538818359375, 0.16501235961914062, 0.17148590087890625, 0.17795944213867188, 0.1844329833984375, 0.19090652465820312, 0.19738006591796875, 0.20385360717773438, 0.2103271484375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 0.0, 6.0, 5.0, 7.0, 10.0, 13.0, 18.0, 21.0, 22.0, 30.0, 39.0, 57.0, 47.0, 59.0, 72.0, 70.0, 77.0, 60.0, 62.0, 51.0, 56.0, 49.0, 26.0, 22.0, 22.0, 18.0, 15.0, 15.0, 6.0, 10.0, 10.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0582275390625, -0.05665731430053711, -0.05508708953857422, -0.05351686477661133, -0.05194664001464844, -0.05037641525268555, -0.048806190490722656, -0.047235965728759766, -0.045665740966796875, -0.044095516204833984, -0.042525291442871094, -0.0409550666809082, -0.03938484191894531, -0.03781461715698242, -0.03624439239501953, -0.03467416763305664, -0.03310394287109375, -0.03153371810913086, -0.02996349334716797, -0.028393268585205078, -0.026823043823242188, -0.025252819061279297, -0.023682594299316406, -0.022112369537353516, -0.020542144775390625, -0.018971920013427734, -0.017401695251464844, -0.015831470489501953, -0.014261245727539062, -0.012691020965576172, -0.011120796203613281, -0.00955057144165039, -0.0079803466796875, -0.006410121917724609, -0.004839897155761719, -0.003269672393798828, -0.0016994476318359375, -0.00012922286987304688, 0.0014410018920898438, 0.0030112266540527344, 0.004581451416015625, 0.006151676177978516, 0.007721900939941406, 0.009292125701904297, 0.010862350463867188, 0.012432575225830078, 0.014002799987792969, 0.01557302474975586, 0.01714324951171875, 0.01871347427368164, 0.02028369903564453, 0.021853923797607422, 0.023424148559570312, 0.024994373321533203, 0.026564598083496094, 0.028134822845458984, 0.029705047607421875, 0.031275272369384766, 0.032845497131347656, 0.03441572189331055, 0.03598594665527344, 0.03755617141723633, 0.03912639617919922, 0.04069662094116211, 0.042266845703125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 11.0, 3.0, 13.0, 25.0, 23.0, 27.0, 45.0, 58.0, 58.0, 102.0, 100.0, 107.0, 91.0, 78.0, 57.0, 46.0, 29.0, 27.0, 25.0, 11.0, 9.0, 14.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.82588768005371, -17.2995662689209, -16.773244857788086, -16.246923446655273, -15.720602035522461, -15.194280624389648, -14.66795825958252, -14.141636848449707, -13.615315437316895, -13.088994026184082, -12.56267261505127, -12.036351203918457, -11.510028839111328, -10.983707427978516, -10.457386016845703, -9.93106460571289, -9.404743194580078, -8.878421783447266, -8.352100372314453, -7.825778484344482, -7.29945707321167, -6.773135662078857, -6.246813774108887, -5.720492362976074, -5.194170951843262, -4.667849540710449, -4.141528129577637, -3.615206241607666, -3.0888848304748535, -2.562563419342041, -2.0362417697906494, -1.5099201202392578, -0.9835996627807617, -0.45727813243865967, 0.06904339790344238, 0.5953649282455444, 1.1216864585876465, 1.648007869720459, 2.1743295192718506, 2.700651168823242, 3.2269725799560547, 3.753293991088867, 4.27961540222168, 4.80593729019165, 5.332258701324463, 5.858580112457275, 6.384902000427246, 6.911223411560059, 7.437544822692871, 7.963866233825684, 8.490187644958496, 9.016509056091309, 9.542831420898438, 10.06915283203125, 10.595474243164062, 11.121795654296875, 11.648117065429688, 12.1744384765625, 12.700759887695312, 13.227081298828125, 13.753402709960938, 14.27972412109375, 14.806046485900879, 15.332367897033691, 15.858689308166504]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 2.0, 5.0, 8.0, 14.0, 17.0, 15.0, 25.0, 18.0, 24.0, 25.0, 23.0, 36.0, 28.0, 42.0, 39.0, 40.0, 31.0, 50.0, 42.0, 35.0, 38.0, 40.0, 39.0, 45.0, 36.0, 31.0, 30.0, 34.0, 25.0, 26.0, 23.0, 15.0, 18.0, 11.0, 16.0, 13.0, 10.0, 7.0, 9.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.627758026123047, -7.376899719238281, -7.126041412353516, -6.87518310546875, -6.624324798583984, -6.373466491699219, -6.122607707977295, -5.871749401092529, -5.620891094207764, -5.370032787322998, -5.119174480438232, -4.868316173553467, -4.617457389831543, -4.366599082946777, -4.115740776062012, -3.864882469177246, -3.6140241622924805, -3.363165855407715, -3.112307548522949, -2.8614490032196045, -2.610590696334839, -2.3597323894500732, -2.1088738441467285, -1.858015537261963, -1.6071572303771973, -1.3562989234924316, -1.1054404973983765, -0.8545821309089661, -0.6037237644195557, -0.35286545753479004, -0.10200703144073486, 0.1488513946533203, 0.39970874786376953, 0.6505671143531799, 0.9014254808425903, 1.1522839069366455, 1.4031422138214111, 1.6540005207061768, 1.904858946800232, 2.155717372894287, 2.4065756797790527, 2.6574339866638184, 2.908292293548584, 3.1591508388519287, 3.4100091457366943, 3.66086745262146, 3.9117259979248047, 4.16258430480957, 4.413442611694336, 4.664300918579102, 4.915159225463867, 5.166017532348633, 5.416875839233398, 5.667734146118164, 5.918592929840088, 6.1694512367248535, 6.420309543609619, 6.671167850494385, 6.92202615737915, 7.172884464263916, 7.42374324798584, 7.6746015548706055, 7.925459861755371, 8.176318168640137, 8.427176475524902]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 6.0, 10.0, 13.0, 18.0, 23.0, 32.0, 45.0, 61.0, 78.0, 105.0, 166.0, 227.0, 307.0, 431.0, 631.0, 885.0, 1303.0, 1952.0, 2894.0, 4561.0, 7126.0, 11671.0, 20547.0, 37452.0, 74222.0, 154584.0, 261518.0, 224996.0, 114411.0, 55493.0, 29471.0, 16116.0, 9656.0, 5874.0, 3798.0, 2511.0, 1612.0, 1124.0, 819.0, 501.0, 375.0, 261.0, 188.0, 135.0, 96.0, 81.0, 43.0, 43.0, 26.0, 12.0, 15.0, 12.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-10.09375, -9.7550048828125, -9.416259765625, -9.0775146484375, -8.73876953125, -8.4000244140625, -8.061279296875, -7.7225341796875, -7.3837890625, -7.0450439453125, -6.706298828125, -6.3675537109375, -6.02880859375, -5.6900634765625, -5.351318359375, -5.0125732421875, -4.673828125, -4.3350830078125, -3.996337890625, -3.6575927734375, -3.31884765625, -2.9801025390625, -2.641357421875, -2.3026123046875, -1.9638671875, -1.6251220703125, -1.286376953125, -0.9476318359375, -0.60888671875, -0.2701416015625, 0.068603515625, 0.4073486328125, 0.74609375, 1.0848388671875, 1.423583984375, 1.7623291015625, 2.10107421875, 2.4398193359375, 2.778564453125, 3.1173095703125, 3.4560546875, 3.7947998046875, 4.133544921875, 4.4722900390625, 4.81103515625, 5.1497802734375, 5.488525390625, 5.8272705078125, 6.166015625, 6.5047607421875, 6.843505859375, 7.1822509765625, 7.52099609375, 7.8597412109375, 8.198486328125, 8.5372314453125, 8.8759765625, 9.2147216796875, 9.553466796875, 9.8922119140625, 10.23095703125, 10.5697021484375, 10.908447265625, 11.2471923828125, 11.5859375]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 3.0, 13.0, 19.0, 20.0, 17.0, 25.0, 18.0, 27.0, 36.0, 32.0, 41.0, 42.0, 40.0, 41.0, 46.0, 40.0, 39.0, 44.0, 56.0, 33.0, 51.0, 40.0, 38.0, 25.0, 32.0, 23.0, 29.0, 13.0, 21.0, 19.0, 18.0, 11.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6751708984375, -8.381591796875, -8.0880126953125, -7.79443359375, -7.5008544921875, -7.207275390625, -6.9136962890625, -6.6201171875, -6.3265380859375, -6.032958984375, -5.7393798828125, -5.44580078125, -5.1522216796875, -4.858642578125, -4.5650634765625, -4.271484375, -3.9779052734375, -3.684326171875, -3.3907470703125, -3.09716796875, -2.8035888671875, -2.510009765625, -2.2164306640625, -1.9228515625, -1.6292724609375, -1.335693359375, -1.0421142578125, -0.74853515625, -0.4549560546875, -0.161376953125, 0.1322021484375, 0.42578125, 0.7193603515625, 1.012939453125, 1.3065185546875, 1.60009765625, 1.8936767578125, 2.187255859375, 2.4808349609375, 2.7744140625, 3.0679931640625, 3.361572265625, 3.6551513671875, 3.94873046875, 4.2423095703125, 4.535888671875, 4.8294677734375, 5.123046875, 5.4166259765625, 5.710205078125, 6.0037841796875, 6.29736328125, 6.5909423828125, 6.884521484375, 7.1781005859375, 7.4716796875, 7.7652587890625, 8.058837890625, 8.3524169921875, 8.64599609375, 8.9395751953125, 9.233154296875, 9.5267333984375, 9.8203125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 3.0, 5.0, 5.0, 7.0, 4.0, 17.0, 9.0, 23.0, 28.0, 28.0, 58.0, 73.0, 84.0, 111.0, 204.0, 258.0, 366.0, 526.0, 823.0, 1439.0, 2447.0, 4429.0, 8691.0, 18171.0, 43191.0, 107132.0, 266592.0, 326695.0, 156947.0, 60295.0, 24942.0, 11400.0, 5694.0, 3019.0, 1724.0, 1063.0, 624.0, 458.0, 318.0, 191.0, 130.0, 78.0, 67.0, 49.0, 28.0, 28.0, 24.0, 16.0, 13.0, 9.0, 14.0, 5.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-14.3125, -13.8536376953125, -13.394775390625, -12.9359130859375, -12.47705078125, -12.0181884765625, -11.559326171875, -11.1004638671875, -10.6416015625, -10.1827392578125, -9.723876953125, -9.2650146484375, -8.80615234375, -8.3472900390625, -7.888427734375, -7.4295654296875, -6.970703125, -6.5118408203125, -6.052978515625, -5.5941162109375, -5.13525390625, -4.6763916015625, -4.217529296875, -3.7586669921875, -3.2998046875, -2.8409423828125, -2.382080078125, -1.9232177734375, -1.46435546875, -1.0054931640625, -0.546630859375, -0.0877685546875, 0.37109375, 0.8299560546875, 1.288818359375, 1.7476806640625, 2.20654296875, 2.6654052734375, 3.124267578125, 3.5831298828125, 4.0419921875, 4.5008544921875, 4.959716796875, 5.4185791015625, 5.87744140625, 6.3363037109375, 6.795166015625, 7.2540283203125, 7.712890625, 8.1717529296875, 8.630615234375, 9.0894775390625, 9.54833984375, 10.0072021484375, 10.466064453125, 10.9249267578125, 11.3837890625, 11.8426513671875, 12.301513671875, 12.7603759765625, 13.21923828125, 13.6781005859375, 14.136962890625, 14.5958251953125, 15.0546875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 12.0, 5.0, 6.0, 7.0, 12.0, 9.0, 14.0, 13.0, 25.0, 32.0, 20.0, 25.0, 28.0, 25.0, 39.0, 33.0, 42.0, 41.0, 42.0, 51.0, 50.0, 34.0, 39.0, 37.0, 45.0, 24.0, 38.0, 36.0, 22.0, 26.0, 19.0, 19.0, 19.0, 16.0, 19.0, 20.0, 7.0, 15.0, 7.0, 5.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.3138427734375, -4.166748046875, -4.0196533203125, -3.87255859375, -3.7254638671875, -3.578369140625, -3.4312744140625, -3.2841796875, -3.1370849609375, -2.989990234375, -2.8428955078125, -2.69580078125, -2.5487060546875, -2.401611328125, -2.2545166015625, -2.107421875, -1.9603271484375, -1.813232421875, -1.6661376953125, -1.51904296875, -1.3719482421875, -1.224853515625, -1.0777587890625, -0.9306640625, -0.7835693359375, -0.636474609375, -0.4893798828125, -0.34228515625, -0.1951904296875, -0.048095703125, 0.0989990234375, 0.24609375, 0.3931884765625, 0.540283203125, 0.6873779296875, 0.83447265625, 0.9815673828125, 1.128662109375, 1.2757568359375, 1.4228515625, 1.5699462890625, 1.717041015625, 1.8641357421875, 2.01123046875, 2.1583251953125, 2.305419921875, 2.4525146484375, 2.599609375, 2.7467041015625, 2.893798828125, 3.0408935546875, 3.18798828125, 3.3350830078125, 3.482177734375, 3.6292724609375, 3.7763671875, 3.9234619140625, 4.070556640625, 4.2176513671875, 4.36474609375, 4.5118408203125, 4.658935546875, 4.8060302734375, 4.953125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 1.0, 3.0, 5.0, 14.0, 13.0, 20.0, 22.0, 30.0, 35.0, 64.0, 89.0, 100.0, 125.0, 177.0, 263.0, 397.0, 543.0, 788.0, 1086.0, 1757.0, 2787.0, 4407.0, 7637.0, 14197.0, 27098.0, 55963.0, 120122.0, 227026.0, 263005.0, 162389.0, 77765.0, 36690.0, 18519.0, 9696.0, 5716.0, 3445.0, 2114.0, 1354.0, 924.0, 599.0, 452.0, 316.0, 187.0, 157.0, 135.0, 75.0, 70.0, 47.0, 29.0, 34.0, 19.0, 14.0, 12.0, 9.0, 4.0, 4.0, 5.0, 2.0, 6.0, 2.0], "bins": [-5.31640625, -5.1513671875, -4.986328125, -4.8212890625, -4.65625, -4.4912109375, -4.326171875, -4.1611328125, -3.99609375, -3.8310546875, -3.666015625, -3.5009765625, -3.3359375, -3.1708984375, -3.005859375, -2.8408203125, -2.67578125, -2.5107421875, -2.345703125, -2.1806640625, -2.015625, -1.8505859375, -1.685546875, -1.5205078125, -1.35546875, -1.1904296875, -1.025390625, -0.8603515625, -0.6953125, -0.5302734375, -0.365234375, -0.2001953125, -0.03515625, 0.1298828125, 0.294921875, 0.4599609375, 0.625, 0.7900390625, 0.955078125, 1.1201171875, 1.28515625, 1.4501953125, 1.615234375, 1.7802734375, 1.9453125, 2.1103515625, 2.275390625, 2.4404296875, 2.60546875, 2.7705078125, 2.935546875, 3.1005859375, 3.265625, 3.4306640625, 3.595703125, 3.7607421875, 3.92578125, 4.0908203125, 4.255859375, 4.4208984375, 4.5859375, 4.7509765625, 4.916015625, 5.0810546875, 5.24609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 12.0, 11.0, 24.0, 21.0, 38.0, 57.0, 85.0, 104.0, 142.0, 138.0, 90.0, 76.0, 48.0, 37.0, 23.0, 8.0, 13.0, 10.0, 7.0, 7.0, 6.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007276535034179688, -0.0007023364305496216, -0.0006770193576812744, -0.0006517022848129272, -0.0006263852119445801, -0.0006010681390762329, -0.0005757510662078857, -0.0005504339933395386, -0.0005251169204711914, -0.0004997998476028442, -0.00047448277473449707, -0.0004491657018661499, -0.00042384862899780273, -0.00039853155612945557, -0.0003732144832611084, -0.00034789741039276123, -0.00032258033752441406, -0.0002972632646560669, -0.0002719461917877197, -0.00024662911891937256, -0.0002213120460510254, -0.00019599497318267822, -0.00017067790031433105, -0.0001453608274459839, -0.00012004375457763672, -9.472668170928955e-05, -6.940960884094238e-05, -4.4092535972595215e-05, -1.8775463104248047e-05, 6.541609764099121e-06, 3.185868263244629e-05, 5.717575550079346e-05, 8.249282836914062e-05, 0.00010780990123748779, 0.00013312697410583496, 0.00015844404697418213, 0.0001837611198425293, 0.00020907819271087646, 0.00023439526557922363, 0.0002597123384475708, 0.00028502941131591797, 0.00031034648418426514, 0.0003356635570526123, 0.00036098062992095947, 0.00038629770278930664, 0.0004116147756576538, 0.000436931848526001, 0.00046224892139434814, 0.0004875659942626953, 0.0005128830671310425, 0.0005382001399993896, 0.0005635172128677368, 0.000588834285736084, 0.0006141513586044312, 0.0006394684314727783, 0.0006647855043411255, 0.0006901025772094727, 0.0007154196500778198, 0.000740736722946167, 0.0007660537958145142, 0.0007913708686828613, 0.0008166879415512085, 0.0008420050144195557, 0.0008673220872879028, 0.00089263916015625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 9.0, 9.0, 17.0, 15.0, 23.0, 39.0, 60.0, 80.0, 112.0, 158.0, 226.0, 315.0, 445.0, 670.0, 1099.0, 1568.0, 2485.0, 3854.0, 6568.0, 10989.0, 20051.0, 37162.0, 72053.0, 134115.0, 210083.0, 219837.0, 148986.0, 81232.0, 42325.0, 22320.0, 12494.0, 7044.0, 4380.0, 2679.0, 1664.0, 1047.0, 729.0, 509.0, 363.0, 204.0, 164.0, 107.0, 75.0, 63.0, 41.0, 22.0, 16.0, 23.0, 9.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 3.0], "bins": [-4.140625, -4.0155029296875, -3.890380859375, -3.7652587890625, -3.64013671875, -3.5150146484375, -3.389892578125, -3.2647705078125, -3.1396484375, -3.0145263671875, -2.889404296875, -2.7642822265625, -2.63916015625, -2.5140380859375, -2.388916015625, -2.2637939453125, -2.138671875, -2.0135498046875, -1.888427734375, -1.7633056640625, -1.63818359375, -1.5130615234375, -1.387939453125, -1.2628173828125, -1.1376953125, -1.0125732421875, -0.887451171875, -0.7623291015625, -0.63720703125, -0.5120849609375, -0.386962890625, -0.2618408203125, -0.13671875, -0.0115966796875, 0.113525390625, 0.2386474609375, 0.36376953125, 0.4888916015625, 0.614013671875, 0.7391357421875, 0.8642578125, 0.9893798828125, 1.114501953125, 1.2396240234375, 1.36474609375, 1.4898681640625, 1.614990234375, 1.7401123046875, 1.865234375, 1.9903564453125, 2.115478515625, 2.2406005859375, 2.36572265625, 2.4908447265625, 2.615966796875, 2.7410888671875, 2.8662109375, 2.9913330078125, 3.116455078125, 3.2415771484375, 3.36669921875, 3.4918212890625, 3.616943359375, 3.7420654296875, 3.8671875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 9.0, 1.0, 6.0, 4.0, 9.0, 7.0, 18.0, 12.0, 22.0, 20.0, 33.0, 27.0, 29.0, 34.0, 46.0, 52.0, 53.0, 51.0, 56.0, 57.0, 50.0, 62.0, 46.0, 46.0, 35.0, 37.0, 34.0, 28.0, 19.0, 21.0, 19.0, 14.0, 7.0, 9.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9638671875, -0.9335708618164062, -0.9032745361328125, -0.8729782104492188, -0.842681884765625, -0.8123855590820312, -0.7820892333984375, -0.7517929077148438, -0.72149658203125, -0.6912002563476562, -0.6609039306640625, -0.6306076049804688, -0.600311279296875, -0.5700149536132812, -0.5397186279296875, -0.5094223022460938, -0.4791259765625, -0.44882965087890625, -0.4185333251953125, -0.38823699951171875, -0.357940673828125, -0.32764434814453125, -0.2973480224609375, -0.26705169677734375, -0.23675537109375, -0.20645904541015625, -0.1761627197265625, -0.14586639404296875, -0.115570068359375, -0.08527374267578125, -0.0549774169921875, -0.02468109130859375, 0.005615234375, 0.03591156005859375, 0.0662078857421875, 0.09650421142578125, 0.126800537109375, 0.15709686279296875, 0.1873931884765625, 0.21768951416015625, 0.24798583984375, 0.27828216552734375, 0.3085784912109375, 0.33887481689453125, 0.369171142578125, 0.39946746826171875, 0.4297637939453125, 0.46006011962890625, 0.4903564453125, 0.5206527709960938, 0.5509490966796875, 0.5812454223632812, 0.611541748046875, 0.6418380737304688, 0.6721343994140625, 0.7024307250976562, 0.73272705078125, 0.7630233764648438, 0.7933197021484375, 0.8236160278320312, 0.853912353515625, 0.8842086791992188, 0.9145050048828125, 0.9448013305664062, 0.97509765625]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 9.0, 9.0, 9.0, 16.0, 29.0, 27.0, 39.0, 46.0, 69.0, 72.0, 95.0, 96.0, 96.0, 86.0, 66.0, 56.0, 37.0, 35.0, 22.0, 19.0, 10.0, 9.0, 13.0, 2.0, 3.0, 5.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.54611587524414, -16.035640716552734, -15.525167465209961, -15.014693260192871, -14.504219055175781, -13.993744850158691, -13.483270645141602, -12.972795486450195, -12.462322235107422, -11.951848030090332, -11.441373825073242, -10.930899620056152, -10.420425415039062, -9.909951210021973, -9.399477005004883, -8.889001846313477, -8.378527641296387, -7.868053436279297, -7.357579231262207, -6.847105026245117, -6.336630821228027, -5.8261566162109375, -5.3156819343566895, -4.8052077293396, -4.29473352432251, -3.78425931930542, -3.27378511428833, -2.763310670852661, -2.2528364658355713, -1.7423622608184814, -1.2318878173828125, -0.7214136123657227, -0.2109394073486328, 0.2995348572731018, 0.8100091218948364, 1.3204834461212158, 1.8309576511383057, 2.3414318561553955, 2.8519062995910645, 3.3623805046081543, 3.872854709625244, 4.383328914642334, 4.893803119659424, 5.404277801513672, 5.914752006530762, 6.425226211547852, 6.935700416564941, 7.446174621582031, 7.956648826599121, 8.467123031616211, 8.9775972366333, 9.48807144165039, 9.99854564666748, 10.50901985168457, 11.019495010375977, 11.52996826171875, 12.040443420410156, 12.550917625427246, 13.061391830444336, 13.571866035461426, 14.082340240478516, 14.592814445495605, 15.103288650512695, 15.613763809204102, 16.124237060546875]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 10.0, 8.0, 5.0, 15.0, 23.0, 16.0, 15.0, 29.0, 27.0, 29.0, 30.0, 28.0, 29.0, 39.0, 34.0, 34.0, 33.0, 39.0, 33.0, 34.0, 46.0, 46.0, 36.0, 41.0, 44.0, 28.0, 20.0, 29.0, 30.0, 34.0, 18.0, 15.0, 17.0, 19.0, 11.0, 9.0, 10.0, 8.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.740115642547607, -7.496506690979004, -7.2528977394104, -7.009288787841797, -6.765679836273193, -6.52207088470459, -6.278461456298828, -6.034852981567383, -5.791243553161621, -5.547634601593018, -5.304025650024414, -5.0604166984558105, -4.816807746887207, -4.5731987953186035, -4.32958984375, -4.085980415344238, -3.842371940612793, -3.5987629890441895, -3.355154037475586, -3.1115450859069824, -2.867936134338379, -2.6243271827697754, -2.3807179927825928, -2.1371090412139893, -1.8935000896453857, -1.6498911380767822, -1.4062821865081787, -1.1626731157302856, -0.9190641641616821, -0.6754552125930786, -0.43184614181518555, -0.18823719024658203, 0.055371761322021484, 0.2989807426929474, 0.5425897240638733, 0.7861987352371216, 1.029807686805725, 1.2734166383743286, 1.5170257091522217, 1.7606346607208252, 2.0042436122894287, 2.2478525638580322, 2.4914615154266357, 2.7350707054138184, 2.978679656982422, 3.2222886085510254, 3.465897560119629, 3.7095065116882324, 3.953115463256836, 4.1967244148254395, 4.440333366394043, 4.6839423179626465, 4.92755126953125, 5.1711602210998535, 5.414769172668457, 5.658378601074219, 5.901987075805664, 6.145596027374268, 6.389204978942871, 6.632813930511475, 6.876422882080078, 7.120031833648682, 7.363640785217285, 7.607250213623047, 7.85085916519165]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 14.0, 17.0, 26.0, 25.0, 33.0, 65.0, 95.0, 131.0, 197.0, 319.0, 413.0, 651.0, 977.0, 1581.0, 2575.0, 4425.0, 7744.0, 15102.0, 34919.0, 108108.0, 476173.0, 1744033.0, 1353702.0, 306179.0, 77718.0, 28156.0, 13089.0, 7003.0, 4102.0, 2443.0, 1439.0, 937.0, 602.0, 388.0, 270.0, 205.0, 126.0, 93.0, 52.0, 36.0, 34.0, 19.0, 21.0, 4.0, 11.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.6875, -18.08203125, -17.4765625, -16.87109375, -16.265625, -15.66015625, -15.0546875, -14.44921875, -13.84375, -13.23828125, -12.6328125, -12.02734375, -11.421875, -10.81640625, -10.2109375, -9.60546875, -9.0, -8.39453125, -7.7890625, -7.18359375, -6.578125, -5.97265625, -5.3671875, -4.76171875, -4.15625, -3.55078125, -2.9453125, -2.33984375, -1.734375, -1.12890625, -0.5234375, 0.08203125, 0.6875, 1.29296875, 1.8984375, 2.50390625, 3.109375, 3.71484375, 4.3203125, 4.92578125, 5.53125, 6.13671875, 6.7421875, 7.34765625, 7.953125, 8.55859375, 9.1640625, 9.76953125, 10.375, 10.98046875, 11.5859375, 12.19140625, 12.796875, 13.40234375, 14.0078125, 14.61328125, 15.21875, 15.82421875, 16.4296875, 17.03515625, 17.640625, 18.24609375, 18.8515625, 19.45703125, 20.0625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 7.0, 6.0, 11.0, 14.0, 21.0, 12.0, 15.0, 19.0, 25.0, 26.0, 23.0, 26.0, 35.0, 35.0, 45.0, 52.0, 32.0, 40.0, 42.0, 40.0, 42.0, 41.0, 29.0, 36.0, 44.0, 28.0, 21.0, 32.0, 35.0, 26.0, 20.0, 28.0, 12.0, 18.0, 9.0, 8.0, 11.0, 10.0, 8.0, 2.0, 0.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.0390625, -6.81292724609375, -6.5867919921875, -6.36065673828125, -6.134521484375, -5.90838623046875, -5.6822509765625, -5.45611572265625, -5.22998046875, -5.00384521484375, -4.7777099609375, -4.55157470703125, -4.325439453125, -4.09930419921875, -3.8731689453125, -3.64703369140625, -3.4208984375, -3.19476318359375, -2.9686279296875, -2.74249267578125, -2.516357421875, -2.29022216796875, -2.0640869140625, -1.83795166015625, -1.61181640625, -1.38568115234375, -1.1595458984375, -0.93341064453125, -0.707275390625, -0.48114013671875, -0.2550048828125, -0.02886962890625, 0.197265625, 0.42340087890625, 0.6495361328125, 0.87567138671875, 1.101806640625, 1.32794189453125, 1.5540771484375, 1.78021240234375, 2.00634765625, 2.23248291015625, 2.4586181640625, 2.68475341796875, 2.910888671875, 3.13702392578125, 3.3631591796875, 3.58929443359375, 3.8154296875, 4.04156494140625, 4.2677001953125, 4.49383544921875, 4.719970703125, 4.94610595703125, 5.1722412109375, 5.39837646484375, 5.62451171875, 5.85064697265625, 6.0767822265625, 6.30291748046875, 6.529052734375, 6.75518798828125, 6.9813232421875, 7.20745849609375, 7.43359375]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 9.0, 13.0, 31.0, 37.0, 46.0, 85.0, 110.0, 239.0, 367.0, 589.0, 996.0, 1696.0, 2972.0, 5126.0, 9878.0, 19212.0, 43755.0, 123768.0, 520762.0, 2161183.0, 987201.0, 200071.0, 62775.0, 25648.0, 12452.0, 6636.0, 3563.0, 2075.0, 1224.0, 692.0, 390.0, 272.0, 166.0, 98.0, 44.0, 37.0, 20.0, 15.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.046875, -22.2705078125, -21.494140625, -20.7177734375, -19.94140625, -19.1650390625, -18.388671875, -17.6123046875, -16.8359375, -16.0595703125, -15.283203125, -14.5068359375, -13.73046875, -12.9541015625, -12.177734375, -11.4013671875, -10.625, -9.8486328125, -9.072265625, -8.2958984375, -7.51953125, -6.7431640625, -5.966796875, -5.1904296875, -4.4140625, -3.6376953125, -2.861328125, -2.0849609375, -1.30859375, -0.5322265625, 0.244140625, 1.0205078125, 1.796875, 2.5732421875, 3.349609375, 4.1259765625, 4.90234375, 5.6787109375, 6.455078125, 7.2314453125, 8.0078125, 8.7841796875, 9.560546875, 10.3369140625, 11.11328125, 11.8896484375, 12.666015625, 13.4423828125, 14.21875, 14.9951171875, 15.771484375, 16.5478515625, 17.32421875, 18.1005859375, 18.876953125, 19.6533203125, 20.4296875, 21.2060546875, 21.982421875, 22.7587890625, 23.53515625, 24.3115234375, 25.087890625, 25.8642578125, 26.640625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 7.0, 3.0, 7.0, 9.0, 9.0, 7.0, 22.0, 24.0, 25.0, 27.0, 49.0, 59.0, 85.0, 144.0, 182.0, 237.0, 343.0, 382.0, 482.0, 434.0, 398.0, 305.0, 223.0, 168.0, 118.0, 81.0, 63.0, 40.0, 41.0, 17.0, 17.0, 18.0, 12.0, 8.0, 7.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.42578125, -4.26171875, -4.09765625, -3.93359375, -3.76953125, -3.60546875, -3.44140625, -3.27734375, -3.11328125, -2.94921875, -2.78515625, -2.62109375, -2.45703125, -2.29296875, -2.12890625, -1.96484375, -1.80078125, -1.63671875, -1.47265625, -1.30859375, -1.14453125, -0.98046875, -0.81640625, -0.65234375, -0.48828125, -0.32421875, -0.16015625, 0.00390625, 0.16796875, 0.33203125, 0.49609375, 0.66015625, 0.82421875, 0.98828125, 1.15234375, 1.31640625, 1.48046875, 1.64453125, 1.80859375, 1.97265625, 2.13671875, 2.30078125, 2.46484375, 2.62890625, 2.79296875, 2.95703125, 3.12109375, 3.28515625, 3.44921875, 3.61328125, 3.77734375, 3.94140625, 4.10546875, 4.26953125, 4.43359375, 4.59765625, 4.76171875, 4.92578125, 5.08984375, 5.25390625, 5.41796875, 5.58203125, 5.74609375, 5.91015625, 6.07421875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 7.0, 8.0, 6.0, 7.0, 12.0, 16.0, 19.0, 25.0, 39.0, 48.0, 53.0, 70.0, 78.0, 97.0, 99.0, 90.0, 81.0, 57.0, 33.0, 37.0, 22.0, 23.0, 13.0, 13.0, 10.0, 12.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-18.979957580566406, -18.450641632080078, -17.921327590942383, -17.392011642456055, -16.86269760131836, -16.33338165283203, -15.804067611694336, -15.274751663208008, -14.745437622070312, -14.2161226272583, -13.686807632446289, -13.157492637634277, -12.628177642822266, -12.098862648010254, -11.569547653198242, -11.040231704711914, -10.510916709899902, -9.98160171508789, -9.452286720275879, -8.922971725463867, -8.393656730651855, -7.864341735839844, -7.335026264190674, -6.805711269378662, -6.27639627456665, -5.747081279754639, -5.217766284942627, -4.688450813293457, -4.159135818481445, -3.6298210620880127, -3.100505828857422, -2.57119083404541, -2.041874885559082, -1.5125598907470703, -0.983244776725769, -0.4539296627044678, 0.07538533210754395, 0.6047003269195557, 1.1340155601501465, 1.6633305549621582, 2.19264554977417, 2.7219605445861816, 3.2512755393981934, 3.780590772628784, 4.309906005859375, 4.839221000671387, 5.368535995483398, 5.89785099029541, 6.427165985107422, 6.956480979919434, 7.485795974731445, 8.015110969543457, 8.544425964355469, 9.07374095916748, 9.603055953979492, 10.13237190246582, 10.661685943603516, 11.191000938415527, 11.720315933227539, 12.24963092803955, 12.778945922851562, 13.308260917663574, 13.837575912475586, 14.366891860961914, 14.896206855773926]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 14.0, 12.0, 14.0, 21.0, 17.0, 20.0, 24.0, 27.0, 28.0, 25.0, 42.0, 31.0, 37.0, 40.0, 43.0, 49.0, 39.0, 44.0, 36.0, 38.0, 39.0, 38.0, 43.0, 41.0, 21.0, 35.0, 25.0, 26.0, 24.0, 18.0, 12.0, 15.0, 13.0, 6.0, 10.0, 7.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.096246719360352, -8.802926063537598, -8.509605407714844, -8.21628475189209, -7.922963619232178, -7.629642963409424, -7.336321830749512, -7.043001174926758, -6.749680519104004, -6.45635986328125, -6.163039207458496, -5.869718074798584, -5.57639741897583, -5.283076763153076, -4.989755630493164, -4.69643497467041, -4.403114318847656, -4.109793663024902, -3.8164727687835693, -3.5231518745422363, -3.2298312187194824, -2.9365105628967285, -2.6431896686553955, -2.3498687744140625, -2.0565481185913086, -1.7632273435592651, -1.4699065685272217, -1.1765857934951782, -0.8832650184631348, -0.5899442434310913, -0.29662346839904785, -0.0033025741577148438, 0.29001712799072266, 0.5833379030227661, 0.8766586780548096, 1.169979453086853, 1.4633002281188965, 1.75662100315094, 2.0499417781829834, 2.3432626724243164, 2.6365833282470703, 2.929903984069824, 3.2232248783111572, 3.5165457725524902, 3.809866428375244, 4.103187084197998, 4.39650821685791, 4.689828872680664, 4.983149528503418, 5.276470184326172, 5.569790840148926, 5.863111972808838, 6.156432628631592, 6.449753284454346, 6.743074417114258, 7.036395072937012, 7.329715728759766, 7.6230363845825195, 7.916357040405273, 8.209677696228027, 8.502998352050781, 8.796319961547852, 9.089640617370605, 9.38296127319336, 9.676281929016113]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 2.0, 10.0, 9.0, 17.0, 17.0, 24.0, 53.0, 63.0, 109.0, 164.0, 238.0, 331.0, 487.0, 741.0, 1129.0, 1682.0, 2495.0, 3875.0, 6016.0, 9796.0, 15798.0, 27004.0, 47687.0, 90335.0, 180417.0, 275459.0, 177794.0, 89645.0, 47297.0, 26711.0, 15677.0, 9974.0, 5984.0, 3912.0, 2530.0, 1712.0, 1108.0, 687.0, 526.0, 340.0, 222.0, 129.0, 116.0, 75.0, 53.0, 30.0, 24.0, 24.0, 17.0, 8.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0849609375, -1.04937744140625, -1.0137939453125, -0.97821044921875, -0.942626953125, -0.90704345703125, -0.8714599609375, -0.83587646484375, -0.80029296875, -0.76470947265625, -0.7291259765625, -0.69354248046875, -0.657958984375, -0.62237548828125, -0.5867919921875, -0.55120849609375, -0.515625, -0.48004150390625, -0.4444580078125, -0.40887451171875, -0.373291015625, -0.33770751953125, -0.3021240234375, -0.26654052734375, -0.23095703125, -0.19537353515625, -0.1597900390625, -0.12420654296875, -0.088623046875, -0.05303955078125, -0.0174560546875, 0.01812744140625, 0.0537109375, 0.08929443359375, 0.1248779296875, 0.16046142578125, 0.196044921875, 0.23162841796875, 0.2672119140625, 0.30279541015625, 0.33837890625, 0.37396240234375, 0.4095458984375, 0.44512939453125, 0.480712890625, 0.51629638671875, 0.5518798828125, 0.58746337890625, 0.623046875, 0.65863037109375, 0.6942138671875, 0.72979736328125, 0.765380859375, 0.80096435546875, 0.8365478515625, 0.87213134765625, 0.90771484375, 0.94329833984375, 0.9788818359375, 1.01446533203125, 1.050048828125, 1.08563232421875, 1.1212158203125, 1.15679931640625, 1.1923828125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 8.0, 10.0, 15.0, 9.0, 19.0, 15.0, 19.0, 21.0, 20.0, 28.0, 38.0, 37.0, 32.0, 43.0, 44.0, 48.0, 41.0, 47.0, 50.0, 45.0, 46.0, 47.0, 43.0, 29.0, 36.0, 30.0, 27.0, 21.0, 27.0, 21.0, 24.0, 8.0, 12.0, 6.0, 11.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5390625, -10.1951904296875, -9.851318359375, -9.5074462890625, -9.16357421875, -8.8197021484375, -8.475830078125, -8.1319580078125, -7.7880859375, -7.4442138671875, -7.100341796875, -6.7564697265625, -6.41259765625, -6.0687255859375, -5.724853515625, -5.3809814453125, -5.037109375, -4.6932373046875, -4.349365234375, -4.0054931640625, -3.66162109375, -3.3177490234375, -2.973876953125, -2.6300048828125, -2.2861328125, -1.9422607421875, -1.598388671875, -1.2545166015625, -0.91064453125, -0.5667724609375, -0.222900390625, 0.1209716796875, 0.46484375, 0.8087158203125, 1.152587890625, 1.4964599609375, 1.84033203125, 2.1842041015625, 2.528076171875, 2.8719482421875, 3.2158203125, 3.5596923828125, 3.903564453125, 4.2474365234375, 4.59130859375, 4.9351806640625, 5.279052734375, 5.6229248046875, 5.966796875, 6.3106689453125, 6.654541015625, 6.9984130859375, 7.34228515625, 7.6861572265625, 8.030029296875, 8.3739013671875, 8.7177734375, 9.0616455078125, 9.405517578125, 9.7493896484375, 10.09326171875, 10.4371337890625, 10.781005859375, 11.1248779296875, 11.46875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 14.0, 10.0, 21.0, 33.0, 38.0, 44.0, 79.0, 124.0, 161.0, 260.0, 419.0, 681.0, 1074.0, 1922.0, 3637.0, 7211.0, 17486.0, 74097.0, 869761.0, 43800.0, 14161.0, 6093.0, 3071.0, 1708.0, 974.0, 575.0, 380.0, 223.0, 164.0, 90.0, 73.0, 43.0, 42.0, 21.0, 27.0, 12.0, 12.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.888671875, -3.764739990234375, -3.64080810546875, -3.516876220703125, -3.3929443359375, -3.269012451171875, -3.14508056640625, -3.021148681640625, -2.897216796875, -2.773284912109375, -2.64935302734375, -2.525421142578125, -2.4014892578125, -2.277557373046875, -2.15362548828125, -2.029693603515625, -1.90576171875, -1.781829833984375, -1.65789794921875, -1.533966064453125, -1.4100341796875, -1.286102294921875, -1.16217041015625, -1.038238525390625, -0.914306640625, -0.790374755859375, -0.66644287109375, -0.542510986328125, -0.4185791015625, -0.294647216796875, -0.17071533203125, -0.046783447265625, 0.0771484375, 0.201080322265625, 0.32501220703125, 0.448944091796875, 0.5728759765625, 0.696807861328125, 0.82073974609375, 0.944671630859375, 1.068603515625, 1.192535400390625, 1.31646728515625, 1.440399169921875, 1.5643310546875, 1.688262939453125, 1.81219482421875, 1.936126708984375, 2.06005859375, 2.183990478515625, 2.30792236328125, 2.431854248046875, 2.5557861328125, 2.679718017578125, 2.80364990234375, 2.927581787109375, 3.051513671875, 3.175445556640625, 3.29937744140625, 3.423309326171875, 3.5472412109375, 3.671173095703125, 3.79510498046875, 3.919036865234375, 4.04296875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 4.0, 7.0, 7.0, 17.0, 19.0, 21.0, 18.0, 14.0, 17.0, 28.0, 23.0, 29.0, 41.0, 47.0, 33.0, 40.0, 33.0, 59.0, 37.0, 42.0, 42.0, 43.0, 44.0, 35.0, 45.0, 32.0, 26.0, 30.0, 26.0, 14.0, 18.0, 14.0, 19.0, 15.0, 15.0, 5.0, 6.0, 10.0, 10.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.50177001953125, -5.3160400390625, -5.13031005859375, -4.944580078125, -4.75885009765625, -4.5731201171875, -4.38739013671875, -4.20166015625, -4.01593017578125, -3.8302001953125, -3.64447021484375, -3.458740234375, -3.27301025390625, -3.0872802734375, -2.90155029296875, -2.7158203125, -2.53009033203125, -2.3443603515625, -2.15863037109375, -1.972900390625, -1.78717041015625, -1.6014404296875, -1.41571044921875, -1.22998046875, -1.04425048828125, -0.8585205078125, -0.67279052734375, -0.487060546875, -0.30133056640625, -0.1156005859375, 0.07012939453125, 0.255859375, 0.44158935546875, 0.6273193359375, 0.81304931640625, 0.998779296875, 1.18450927734375, 1.3702392578125, 1.55596923828125, 1.74169921875, 1.92742919921875, 2.1131591796875, 2.29888916015625, 2.484619140625, 2.67034912109375, 2.8560791015625, 3.04180908203125, 3.2275390625, 3.41326904296875, 3.5989990234375, 3.78472900390625, 3.970458984375, 4.15618896484375, 4.3419189453125, 4.52764892578125, 4.71337890625, 4.89910888671875, 5.0848388671875, 5.27056884765625, 5.456298828125, 5.64202880859375, 5.8277587890625, 6.01348876953125, 6.19921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 5.0, 11.0, 18.0, 16.0, 34.0, 46.0, 60.0, 92.0, 127.0, 222.0, 333.0, 572.0, 941.0, 1655.0, 3089.0, 6345.0, 15176.0, 53920.0, 909320.0, 34017.0, 11604.0, 5077.0, 2497.0, 1311.0, 782.0, 436.0, 303.0, 154.0, 114.0, 73.0, 45.0, 39.0, 31.0, 25.0, 9.0, 14.0, 9.0, 3.0, 4.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8203125, -0.7923736572265625, -0.764434814453125, -0.7364959716796875, -0.70855712890625, -0.6806182861328125, -0.652679443359375, -0.6247406005859375, -0.5968017578125, -0.5688629150390625, -0.540924072265625, -0.5129852294921875, -0.48504638671875, -0.4571075439453125, -0.429168701171875, -0.4012298583984375, -0.373291015625, -0.3453521728515625, -0.317413330078125, -0.2894744873046875, -0.26153564453125, -0.2335968017578125, -0.205657958984375, -0.1777191162109375, -0.1497802734375, -0.1218414306640625, -0.093902587890625, -0.0659637451171875, -0.03802490234375, -0.0100860595703125, 0.017852783203125, 0.0457916259765625, 0.07373046875, 0.1016693115234375, 0.129608154296875, 0.1575469970703125, 0.18548583984375, 0.2134246826171875, 0.241363525390625, 0.2693023681640625, 0.2972412109375, 0.3251800537109375, 0.353118896484375, 0.3810577392578125, 0.40899658203125, 0.4369354248046875, 0.464874267578125, 0.4928131103515625, 0.520751953125, 0.5486907958984375, 0.576629638671875, 0.6045684814453125, 0.63250732421875, 0.6604461669921875, 0.688385009765625, 0.7163238525390625, 0.7442626953125, 0.7722015380859375, 0.800140380859375, 0.8280792236328125, 0.85601806640625, 0.8839569091796875, 0.911895751953125, 0.9398345947265625, 0.9677734375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 4.0, 6.0, 12.0, 11.0, 14.0, 12.0, 21.0, 17.0, 25.0, 38.0, 30.0, 45.0, 32.0, 39.0, 40.0, 38.0, 50.0, 38.0, 57.0, 40.0, 48.0, 34.0, 53.0, 37.0, 35.0, 43.0, 28.0, 28.0, 22.0, 13.0, 17.0, 12.0, 10.0, 6.0, 7.0, 8.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.38690185546875e-05, -4.2584724724292755e-05, -4.130043089389801e-05, -4.0016137063503265e-05, -3.873184323310852e-05, -3.7447549402713776e-05, -3.616325557231903e-05, -3.4878961741924286e-05, -3.359466791152954e-05, -3.2310374081134796e-05, -3.102608025074005e-05, -2.9741786420345306e-05, -2.845749258995056e-05, -2.7173198759555817e-05, -2.5888904929161072e-05, -2.4604611098766327e-05, -2.3320317268371582e-05, -2.2036023437976837e-05, -2.0751729607582092e-05, -1.9467435777187347e-05, -1.8183141946792603e-05, -1.6898848116397858e-05, -1.5614554286003113e-05, -1.4330260455608368e-05, -1.3045966625213623e-05, -1.1761672794818878e-05, -1.0477378964424133e-05, -9.193085134029388e-06, -7.908791303634644e-06, -6.624497473239899e-06, -5.340203642845154e-06, -4.055909812450409e-06, -2.771615982055664e-06, -1.4873221516609192e-06, -2.0302832126617432e-07, 1.0812655091285706e-06, 2.3655593395233154e-06, 3.6498531699180603e-06, 4.934147000312805e-06, 6.21844083070755e-06, 7.502734661102295e-06, 8.78702849149704e-06, 1.0071322321891785e-05, 1.135561615228653e-05, 1.2639909982681274e-05, 1.392420381307602e-05, 1.5208497643470764e-05, 1.649279147386551e-05, 1.7777085304260254e-05, 1.9061379134655e-05, 2.0345672965049744e-05, 2.162996679544449e-05, 2.2914260625839233e-05, 2.4198554456233978e-05, 2.5482848286628723e-05, 2.6767142117023468e-05, 2.8051435947418213e-05, 2.9335729777812958e-05, 3.06200236082077e-05, 3.190431743860245e-05, 3.318861126899719e-05, 3.447290509939194e-05, 3.575719892978668e-05, 3.704149276018143e-05, 3.832578659057617e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 7.0, 14.0, 18.0, 32.0, 32.0, 58.0, 72.0, 112.0, 177.0, 229.0, 350.0, 539.0, 822.0, 1278.0, 1940.0, 3103.0, 5086.0, 8348.0, 14969.0, 27527.0, 54318.0, 115063.0, 233305.0, 275589.0, 152712.0, 71931.0, 35401.0, 18593.0, 10472.0, 6026.0, 3750.0, 2299.0, 1432.0, 926.0, 649.0, 423.0, 304.0, 176.0, 160.0, 92.0, 63.0, 48.0, 40.0, 21.0, 12.0, 11.0, 6.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0], "bins": [-0.26220703125, -0.25453758239746094, -0.24686813354492188, -0.2391986846923828, -0.23152923583984375, -0.2238597869873047, -0.21619033813476562, -0.20852088928222656, -0.2008514404296875, -0.19318199157714844, -0.18551254272460938, -0.1778430938720703, -0.17017364501953125, -0.1625041961669922, -0.15483474731445312, -0.14716529846191406, -0.139495849609375, -0.13182640075683594, -0.12415695190429688, -0.11648750305175781, -0.10881805419921875, -0.10114860534667969, -0.09347915649414062, -0.08580970764160156, -0.0781402587890625, -0.07047080993652344, -0.06280136108398438, -0.05513191223144531, -0.04746246337890625, -0.03979301452636719, -0.032123565673828125, -0.024454116821289062, -0.01678466796875, -0.009115219116210938, -0.001445770263671875, 0.0062236785888671875, 0.01389312744140625, 0.021562576293945312, 0.029232025146484375, 0.03690147399902344, 0.0445709228515625, 0.05224037170410156, 0.059909820556640625, 0.06757926940917969, 0.07524871826171875, 0.08291816711425781, 0.09058761596679688, 0.09825706481933594, 0.105926513671875, 0.11359596252441406, 0.12126541137695312, 0.1289348602294922, 0.13660430908203125, 0.1442737579345703, 0.15194320678710938, 0.15961265563964844, 0.1672821044921875, 0.17495155334472656, 0.18262100219726562, 0.1902904510498047, 0.19795989990234375, 0.2056293487548828, 0.21329879760742188, 0.22096824645996094, 0.2286376953125]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 6.0, 5.0, 2.0, 8.0, 5.0, 11.0, 15.0, 12.0, 17.0, 28.0, 21.0, 23.0, 49.0, 42.0, 55.0, 53.0, 50.0, 64.0, 61.0, 51.0, 48.0, 64.0, 54.0, 41.0, 44.0, 26.0, 23.0, 18.0, 18.0, 17.0, 14.0, 11.0, 11.0, 8.0, 7.0, 3.0, 7.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05859375, -0.05691099166870117, -0.055228233337402344, -0.053545475006103516, -0.05186271667480469, -0.05017995834350586, -0.04849720001220703, -0.0468144416809082, -0.045131683349609375, -0.04344892501831055, -0.04176616668701172, -0.04008340835571289, -0.03840065002441406, -0.036717891693115234, -0.035035133361816406, -0.03335237503051758, -0.03166961669921875, -0.029986858367919922, -0.028304100036621094, -0.026621341705322266, -0.024938583374023438, -0.02325582504272461, -0.02157306671142578, -0.019890308380126953, -0.018207550048828125, -0.016524791717529297, -0.014842033386230469, -0.01315927505493164, -0.011476516723632812, -0.009793758392333984, -0.008111000061035156, -0.006428241729736328, -0.0047454833984375, -0.003062725067138672, -0.0013799667358398438, 0.0003027915954589844, 0.0019855499267578125, 0.0036683082580566406, 0.005351066589355469, 0.007033824920654297, 0.008716583251953125, 0.010399341583251953, 0.012082099914550781, 0.01376485824584961, 0.015447616577148438, 0.017130374908447266, 0.018813133239746094, 0.020495891571044922, 0.02217864990234375, 0.023861408233642578, 0.025544166564941406, 0.027226924896240234, 0.028909683227539062, 0.03059244155883789, 0.03227519989013672, 0.03395795822143555, 0.035640716552734375, 0.0373234748840332, 0.03900623321533203, 0.04068899154663086, 0.04237174987792969, 0.044054508209228516, 0.045737266540527344, 0.04742002487182617, 0.049102783203125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 7.0, 7.0, 6.0, 14.0, 12.0, 19.0, 24.0, 38.0, 39.0, 59.0, 55.0, 86.0, 88.0, 105.0, 84.0, 88.0, 62.0, 35.0, 32.0, 30.0, 27.0, 14.0, 12.0, 13.0, 10.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-18.870174407958984, -18.34699821472168, -17.823820114135742, -17.300643920898438, -16.777467727661133, -16.254291534423828, -15.73111343383789, -15.207937240600586, -14.684760093688965, -14.161582946777344, -13.638406753540039, -13.115229606628418, -12.592052459716797, -12.068876266479492, -11.545699119567871, -11.02252197265625, -10.499345779418945, -9.976168632507324, -9.45299243927002, -8.929815292358398, -8.406639099121094, -7.883461952209473, -7.360284805297852, -6.837108135223389, -6.313931465148926, -5.790754795074463, -5.267578125, -4.744400978088379, -4.221224308013916, -3.698047637939453, -3.174870729446411, -2.651693820953369, -2.1285152435302734, -1.605338454246521, -1.0821616649627686, -0.5589848756790161, -0.03580808639526367, 0.4873685836791992, 1.0105454921722412, 1.5337224006652832, 2.056899070739746, 2.580075740814209, 3.103252649307251, 3.626429557800293, 4.149606227874756, 4.672782897949219, 5.19596004486084, 5.719136714935303, 6.242313385009766, 6.7654900550842285, 7.288666725158691, 7.8118438720703125, 8.335020065307617, 8.858197212219238, 9.38137435913086, 9.904550552368164, 10.427727699279785, 10.950904846191406, 11.474081039428711, 11.997258186340332, 12.520435333251953, 13.043611526489258, 13.566788673400879, 14.0899658203125, 14.613142013549805]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 15.0, 11.0, 16.0, 19.0, 15.0, 20.0, 25.0, 28.0, 28.0, 26.0, 39.0, 35.0, 32.0, 44.0, 42.0, 50.0, 37.0, 45.0, 35.0, 38.0, 39.0, 38.0, 41.0, 44.0, 23.0, 33.0, 23.0, 29.0, 24.0, 18.0, 10.0, 16.0, 12.0, 7.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.051680564880371, -8.760268211364746, -8.468855857849121, -8.177443504333496, -7.886031150817871, -7.594618797302246, -7.303206443786621, -7.011794090270996, -6.720381736755371, -6.428969383239746, -6.137557029724121, -5.846144676208496, -5.554732322692871, -5.263319969177246, -4.971907615661621, -4.680495262145996, -4.389082908630371, -4.097670555114746, -3.806258201599121, -3.514845848083496, -3.223433494567871, -2.932021141052246, -2.640608787536621, -2.349196434020996, -2.057784080505371, -1.766371726989746, -1.474959373474121, -1.183547019958496, -0.8921346664428711, -0.6007223129272461, -0.3093099594116211, -0.017897605895996094, 0.2735157012939453, 0.5649280548095703, 0.8563404083251953, 1.1477527618408203, 1.4391651153564453, 1.7305774688720703, 2.0219898223876953, 2.3134021759033203, 2.6048145294189453, 2.8962268829345703, 3.1876392364501953, 3.4790515899658203, 3.7704639434814453, 4.06187629699707, 4.353288650512695, 4.64470100402832, 4.936113357543945, 5.22752571105957, 5.518938064575195, 5.81035041809082, 6.101762771606445, 6.39317512512207, 6.684587478637695, 6.97599983215332, 7.267412185668945, 7.55882453918457, 7.850236892700195, 8.14164924621582, 8.433061599731445, 8.72447395324707, 9.015886306762695, 9.30729866027832, 9.598711013793945]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 7.0, 9.0, 14.0, 19.0, 32.0, 60.0, 80.0, 91.0, 167.0, 237.0, 394.0, 559.0, 864.0, 1527.0, 2319.0, 3641.0, 6144.0, 10286.0, 18243.0, 34409.0, 69496.0, 151954.0, 279049.0, 237990.0, 113670.0, 53116.0, 27429.0, 14814.0, 8476.0, 4997.0, 3082.0, 1969.0, 1216.0, 770.0, 470.0, 344.0, 165.0, 147.0, 104.0, 62.0, 50.0, 29.0, 12.0, 16.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.78125, -15.2852783203125, -14.789306640625, -14.2933349609375, -13.79736328125, -13.3013916015625, -12.805419921875, -12.3094482421875, -11.8134765625, -11.3175048828125, -10.821533203125, -10.3255615234375, -9.82958984375, -9.3336181640625, -8.837646484375, -8.3416748046875, -7.845703125, -7.3497314453125, -6.853759765625, -6.3577880859375, -5.86181640625, -5.3658447265625, -4.869873046875, -4.3739013671875, -3.8779296875, -3.3819580078125, -2.885986328125, -2.3900146484375, -1.89404296875, -1.3980712890625, -0.902099609375, -0.4061279296875, 0.08984375, 0.5858154296875, 1.081787109375, 1.5777587890625, 2.07373046875, 2.5697021484375, 3.065673828125, 3.5616455078125, 4.0576171875, 4.5535888671875, 5.049560546875, 5.5455322265625, 6.04150390625, 6.5374755859375, 7.033447265625, 7.5294189453125, 8.025390625, 8.5213623046875, 9.017333984375, 9.5133056640625, 10.00927734375, 10.5052490234375, 11.001220703125, 11.4971923828125, 11.9931640625, 12.4891357421875, 12.985107421875, 13.4810791015625, 13.97705078125, 14.4730224609375, 14.968994140625, 15.4649658203125, 15.9609375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 3.0, 10.0, 12.0, 15.0, 22.0, 16.0, 16.0, 20.0, 28.0, 25.0, 27.0, 32.0, 36.0, 41.0, 38.0, 48.0, 56.0, 41.0, 39.0, 40.0, 49.0, 49.0, 35.0, 39.0, 35.0, 31.0, 31.0, 22.0, 21.0, 20.0, 17.0, 25.0, 9.0, 11.0, 6.0, 5.0, 5.0, 7.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.783447265625, -9.44970703125, -9.115966796875, -8.7822265625, -8.448486328125, -8.11474609375, -7.781005859375, -7.447265625, -7.113525390625, -6.77978515625, -6.446044921875, -6.1123046875, -5.778564453125, -5.44482421875, -5.111083984375, -4.77734375, -4.443603515625, -4.10986328125, -3.776123046875, -3.4423828125, -3.108642578125, -2.77490234375, -2.441162109375, -2.107421875, -1.773681640625, -1.43994140625, -1.106201171875, -0.7724609375, -0.438720703125, -0.10498046875, 0.228759765625, 0.5625, 0.896240234375, 1.22998046875, 1.563720703125, 1.8974609375, 2.231201171875, 2.56494140625, 2.898681640625, 3.232421875, 3.566162109375, 3.89990234375, 4.233642578125, 4.5673828125, 4.901123046875, 5.23486328125, 5.568603515625, 5.90234375, 6.236083984375, 6.56982421875, 6.903564453125, 7.2373046875, 7.571044921875, 7.90478515625, 8.238525390625, 8.572265625, 8.906005859375, 9.23974609375, 9.573486328125, 9.9072265625, 10.240966796875, 10.57470703125, 10.908447265625, 11.2421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 6.0, 12.0, 12.0, 19.0, 28.0, 43.0, 72.0, 100.0, 147.0, 232.0, 339.0, 549.0, 764.0, 1188.0, 1896.0, 3075.0, 5190.0, 8948.0, 15952.0, 29942.0, 59274.0, 120194.0, 222198.0, 254294.0, 157849.0, 78769.0, 39336.0, 20270.0, 11108.0, 6399.0, 3780.0, 2274.0, 1465.0, 953.0, 602.0, 423.0, 274.0, 193.0, 138.0, 78.0, 53.0, 40.0, 26.0, 23.0, 9.0, 10.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.765625, -13.309814453125, -12.85400390625, -12.398193359375, -11.9423828125, -11.486572265625, -11.03076171875, -10.574951171875, -10.119140625, -9.663330078125, -9.20751953125, -8.751708984375, -8.2958984375, -7.840087890625, -7.38427734375, -6.928466796875, -6.47265625, -6.016845703125, -5.56103515625, -5.105224609375, -4.6494140625, -4.193603515625, -3.73779296875, -3.281982421875, -2.826171875, -2.370361328125, -1.91455078125, -1.458740234375, -1.0029296875, -0.547119140625, -0.09130859375, 0.364501953125, 0.8203125, 1.276123046875, 1.73193359375, 2.187744140625, 2.6435546875, 3.099365234375, 3.55517578125, 4.010986328125, 4.466796875, 4.922607421875, 5.37841796875, 5.834228515625, 6.2900390625, 6.745849609375, 7.20166015625, 7.657470703125, 8.11328125, 8.569091796875, 9.02490234375, 9.480712890625, 9.9365234375, 10.392333984375, 10.84814453125, 11.303955078125, 11.759765625, 12.215576171875, 12.67138671875, 13.127197265625, 13.5830078125, 14.038818359375, 14.49462890625, 14.950439453125, 15.40625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 2.0, 7.0, 5.0, 5.0, 4.0, 9.0, 10.0, 13.0, 20.0, 25.0, 24.0, 28.0, 25.0, 28.0, 40.0, 40.0, 41.0, 32.0, 45.0, 43.0, 54.0, 36.0, 45.0, 48.0, 39.0, 38.0, 33.0, 24.0, 30.0, 25.0, 30.0, 20.0, 21.0, 27.0, 10.0, 19.0, 11.0, 8.0, 9.0, 8.0, 3.0, 0.0, 6.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-6.08984375, -5.9114990234375, -5.733154296875, -5.5548095703125, -5.37646484375, -5.1981201171875, -5.019775390625, -4.8414306640625, -4.6630859375, -4.4847412109375, -4.306396484375, -4.1280517578125, -3.94970703125, -3.7713623046875, -3.593017578125, -3.4146728515625, -3.236328125, -3.0579833984375, -2.879638671875, -2.7012939453125, -2.52294921875, -2.3446044921875, -2.166259765625, -1.9879150390625, -1.8095703125, -1.6312255859375, -1.452880859375, -1.2745361328125, -1.09619140625, -0.9178466796875, -0.739501953125, -0.5611572265625, -0.3828125, -0.2044677734375, -0.026123046875, 0.1522216796875, 0.33056640625, 0.5089111328125, 0.687255859375, 0.8656005859375, 1.0439453125, 1.2222900390625, 1.400634765625, 1.5789794921875, 1.75732421875, 1.9356689453125, 2.114013671875, 2.2923583984375, 2.470703125, 2.6490478515625, 2.827392578125, 3.0057373046875, 3.18408203125, 3.3624267578125, 3.540771484375, 3.7191162109375, 3.8974609375, 4.0758056640625, 4.254150390625, 4.4324951171875, 4.61083984375, 4.7891845703125, 4.967529296875, 5.1458740234375, 5.32421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 11.0, 11.0, 17.0, 17.0, 26.0, 38.0, 49.0, 79.0, 93.0, 123.0, 181.0, 220.0, 327.0, 395.0, 545.0, 768.0, 1145.0, 1640.0, 2664.0, 4765.0, 9880.0, 23740.0, 75593.0, 292805.0, 434059.0, 131783.0, 37566.0, 13820.0, 6198.0, 3390.0, 1920.0, 1285.0, 920.0, 695.0, 466.0, 348.0, 254.0, 174.0, 141.0, 131.0, 85.0, 52.0, 35.0, 42.0, 18.0, 13.0, 8.0, 9.0, 8.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.328125, -15.83642578125, -15.3447265625, -14.85302734375, -14.361328125, -13.86962890625, -13.3779296875, -12.88623046875, -12.39453125, -11.90283203125, -11.4111328125, -10.91943359375, -10.427734375, -9.93603515625, -9.4443359375, -8.95263671875, -8.4609375, -7.96923828125, -7.4775390625, -6.98583984375, -6.494140625, -6.00244140625, -5.5107421875, -5.01904296875, -4.52734375, -4.03564453125, -3.5439453125, -3.05224609375, -2.560546875, -2.06884765625, -1.5771484375, -1.08544921875, -0.59375, -0.10205078125, 0.3896484375, 0.88134765625, 1.373046875, 1.86474609375, 2.3564453125, 2.84814453125, 3.33984375, 3.83154296875, 4.3232421875, 4.81494140625, 5.306640625, 5.79833984375, 6.2900390625, 6.78173828125, 7.2734375, 7.76513671875, 8.2568359375, 8.74853515625, 9.240234375, 9.73193359375, 10.2236328125, 10.71533203125, 11.20703125, 11.69873046875, 12.1904296875, 12.68212890625, 13.173828125, 13.66552734375, 14.1572265625, 14.64892578125, 15.140625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 5.0, 4.0, 2.0, 8.0, 10.0, 13.0, 21.0, 22.0, 41.0, 65.0, 96.0, 114.0, 131.0, 138.0, 90.0, 60.0, 46.0, 30.0, 32.0, 23.0, 13.0, 7.0, 9.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00122833251953125, -0.0011882781982421875, -0.001148223876953125, -0.0011081695556640625, -0.001068115234375, -0.0010280609130859375, -0.000988006591796875, -0.0009479522705078125, -0.00090789794921875, -0.0008678436279296875, -0.000827789306640625, -0.0007877349853515625, -0.0007476806640625, -0.0007076263427734375, -0.000667572021484375, -0.0006275177001953125, -0.00058746337890625, -0.0005474090576171875, -0.000507354736328125, -0.0004673004150390625, -0.00042724609375, -0.0003871917724609375, -0.000347137451171875, -0.0003070831298828125, -0.00026702880859375, -0.0002269744873046875, -0.000186920166015625, -0.0001468658447265625, -0.0001068115234375, -6.67572021484375e-05, -2.6702880859375e-05, 1.33514404296875e-05, 5.340576171875e-05, 9.34600830078125e-05, 0.000133514404296875, 0.0001735687255859375, 0.000213623046875, 0.0002536773681640625, 0.000293731689453125, 0.0003337860107421875, 0.00037384033203125, 0.0004138946533203125, 0.000453948974609375, 0.0004940032958984375, 0.0005340576171875, 0.0005741119384765625, 0.000614166259765625, 0.0006542205810546875, 0.00069427490234375, 0.0007343292236328125, 0.000774383544921875, 0.0008144378662109375, 0.0008544921875, 0.0008945465087890625, 0.000934600830078125, 0.0009746551513671875, 0.00101470947265625, 0.0010547637939453125, 0.001094818115234375, 0.0011348724365234375, 0.0011749267578125, 0.0012149810791015625, 0.001255035400390625, 0.0012950897216796875, 0.00133514404296875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 11.0, 24.0, 30.0, 51.0, 69.0, 81.0, 107.0, 154.0, 207.0, 308.0, 415.0, 558.0, 835.0, 1111.0, 1708.0, 2592.0, 4154.0, 8297.0, 22189.0, 88855.0, 422350.0, 378159.0, 76786.0, 19745.0, 7789.0, 4001.0, 2426.0, 1609.0, 1151.0, 820.0, 556.0, 401.0, 275.0, 193.0, 149.0, 97.0, 84.0, 61.0, 53.0, 23.0, 23.0, 16.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-17.765625, -17.271484375, -16.77734375, -16.283203125, -15.7890625, -15.294921875, -14.80078125, -14.306640625, -13.8125, -13.318359375, -12.82421875, -12.330078125, -11.8359375, -11.341796875, -10.84765625, -10.353515625, -9.859375, -9.365234375, -8.87109375, -8.376953125, -7.8828125, -7.388671875, -6.89453125, -6.400390625, -5.90625, -5.412109375, -4.91796875, -4.423828125, -3.9296875, -3.435546875, -2.94140625, -2.447265625, -1.953125, -1.458984375, -0.96484375, -0.470703125, 0.0234375, 0.517578125, 1.01171875, 1.505859375, 2.0, 2.494140625, 2.98828125, 3.482421875, 3.9765625, 4.470703125, 4.96484375, 5.458984375, 5.953125, 6.447265625, 6.94140625, 7.435546875, 7.9296875, 8.423828125, 8.91796875, 9.412109375, 9.90625, 10.400390625, 10.89453125, 11.388671875, 11.8828125, 12.376953125, 12.87109375, 13.365234375, 13.859375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 3.0, 4.0, 6.0, 11.0, 12.0, 23.0, 29.0, 42.0, 68.0, 79.0, 96.0, 100.0, 104.0, 99.0, 84.0, 57.0, 48.0, 39.0, 15.0, 13.0, 9.0, 9.0, 8.0, 6.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.080078125, -2.994964599609375, -2.90985107421875, -2.824737548828125, -2.7396240234375, -2.654510498046875, -2.56939697265625, -2.484283447265625, -2.399169921875, -2.314056396484375, -2.22894287109375, -2.143829345703125, -2.0587158203125, -1.973602294921875, -1.88848876953125, -1.803375244140625, -1.71826171875, -1.633148193359375, -1.54803466796875, -1.462921142578125, -1.3778076171875, -1.292694091796875, -1.20758056640625, -1.122467041015625, -1.037353515625, -0.952239990234375, -0.86712646484375, -0.782012939453125, -0.6968994140625, -0.611785888671875, -0.52667236328125, -0.441558837890625, -0.3564453125, -0.271331787109375, -0.18621826171875, -0.101104736328125, -0.0159912109375, 0.069122314453125, 0.15423583984375, 0.239349365234375, 0.324462890625, 0.409576416015625, 0.49468994140625, 0.579803466796875, 0.6649169921875, 0.750030517578125, 0.83514404296875, 0.920257568359375, 1.00537109375, 1.090484619140625, 1.17559814453125, 1.260711669921875, 1.3458251953125, 1.430938720703125, 1.51605224609375, 1.601165771484375, 1.686279296875, 1.771392822265625, 1.85650634765625, 1.941619873046875, 2.0267333984375, 2.111846923828125, 2.19696044921875, 2.282073974609375, 2.3671875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 4.0, 6.0, 6.0, 10.0, 4.0, 16.0, 22.0, 16.0, 18.0, 24.0, 42.0, 50.0, 67.0, 56.0, 65.0, 67.0, 78.0, 79.0, 55.0, 72.0, 49.0, 37.0, 32.0, 29.0, 21.0, 16.0, 10.0, 7.0, 8.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.805541038513184, -15.328680038452148, -14.851818084716797, -14.374957084655762, -13.898096084594727, -13.421234130859375, -12.94437313079834, -12.467512130737305, -11.990650177001953, -11.513789176940918, -11.036927223205566, -10.560066223144531, -10.08320426940918, -9.606343269348145, -9.12948226928711, -8.652620315551758, -8.175759315490723, -7.698897838592529, -7.222036361694336, -6.745175361633301, -6.268313884735107, -5.791452407836914, -5.314591407775879, -4.8377299308776855, -4.360868453979492, -3.884006977081299, -3.4071457386016846, -2.9302845001220703, -2.453423023223877, -1.9765615463256836, -1.4997003078460693, -1.022839069366455, -0.5459766387939453, -0.0691152811050415, 0.4077460765838623, 0.8846074342727661, 1.36146879196167, 1.8383302688598633, 2.3151915073394775, 2.792052745819092, 3.268914222717285, 3.7457756996154785, 4.222637176513672, 4.699498176574707, 5.1763596534729, 5.653221130371094, 6.130082130432129, 6.606943607330322, 7.083805084228516, 7.560666561126709, 8.037528038024902, 8.514389038085938, 8.991250991821289, 9.468111991882324, 9.94497299194336, 10.421834945678711, 10.898695945739746, 11.375556945800781, 11.852418899536133, 12.329279899597168, 12.806140899658203, 13.283002853393555, 13.75986385345459, 14.236724853515625, 14.713586807250977]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 7.0, 8.0, 7.0, 13.0, 13.0, 14.0, 13.0, 16.0, 23.0, 25.0, 29.0, 22.0, 36.0, 37.0, 44.0, 46.0, 41.0, 38.0, 39.0, 39.0, 34.0, 41.0, 43.0, 41.0, 39.0, 35.0, 36.0, 23.0, 27.0, 28.0, 26.0, 17.0, 21.0, 17.0, 13.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.661446571350098, -9.361954689025879, -9.062463760375977, -8.762971878051758, -8.463479995727539, -8.16398811340332, -7.86449670791626, -7.565005302429199, -7.2655134201049805, -6.966021537780762, -6.666530132293701, -6.367038726806641, -6.067546844482422, -5.768054962158203, -5.468563556671143, -5.169072151184082, -4.869580268859863, -4.5700883865356445, -4.270596981048584, -3.9711053371429443, -3.6716136932373047, -3.372122049331665, -3.0726304054260254, -2.7731387615203857, -2.473647117614746, -2.1741554737091064, -1.8746638298034668, -1.5751721858978271, -1.2756805419921875, -0.9761888980865479, -0.6766972541809082, -0.37720561027526855, -0.0777130126953125, 0.22177863121032715, 0.5212702751159668, 0.8207619190216064, 1.120253562927246, 1.4197452068328857, 1.7192368507385254, 2.018728494644165, 2.3182201385498047, 2.6177117824554443, 2.917203426361084, 3.2166950702667236, 3.5161867141723633, 3.815678358078003, 4.115170001983643, 4.414661407470703, 4.714153289794922, 5.013645172119141, 5.313136577606201, 5.612627983093262, 5.9121198654174805, 6.211611747741699, 6.51110315322876, 6.81059455871582, 7.110086441040039, 7.409578323364258, 7.709069728851318, 8.008561134338379, 8.308053016662598, 8.607544898986816, 8.907035827636719, 9.206527709960938, 9.506019592285156]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 7.0, 2.0, 3.0, 7.0, 13.0, 11.0, 25.0, 55.0, 63.0, 96.0, 118.0, 172.0, 272.0, 387.0, 553.0, 852.0, 1294.0, 1984.0, 3049.0, 5068.0, 9006.0, 18194.0, 44898.0, 150475.0, 673512.0, 1933525.0, 1014158.0, 224598.0, 60183.0, 22892.0, 11244.0, 6246.0, 3801.0, 2455.0, 1556.0, 1051.0, 732.0, 480.0, 369.0, 278.0, 174.0, 132.0, 65.0, 53.0, 55.0, 42.0, 36.0, 15.0, 11.0, 12.0, 8.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.828125, -18.14697265625, -17.4658203125, -16.78466796875, -16.103515625, -15.42236328125, -14.7412109375, -14.06005859375, -13.37890625, -12.69775390625, -12.0166015625, -11.33544921875, -10.654296875, -9.97314453125, -9.2919921875, -8.61083984375, -7.9296875, -7.24853515625, -6.5673828125, -5.88623046875, -5.205078125, -4.52392578125, -3.8427734375, -3.16162109375, -2.48046875, -1.79931640625, -1.1181640625, -0.43701171875, 0.244140625, 0.92529296875, 1.6064453125, 2.28759765625, 2.96875, 3.64990234375, 4.3310546875, 5.01220703125, 5.693359375, 6.37451171875, 7.0556640625, 7.73681640625, 8.41796875, 9.09912109375, 9.7802734375, 10.46142578125, 11.142578125, 11.82373046875, 12.5048828125, 13.18603515625, 13.8671875, 14.54833984375, 15.2294921875, 15.91064453125, 16.591796875, 17.27294921875, 17.9541015625, 18.63525390625, 19.31640625, 19.99755859375, 20.6787109375, 21.35986328125, 22.041015625, 22.72216796875, 23.4033203125, 24.08447265625, 24.765625]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 1.0, 10.0, 6.0, 6.0, 8.0, 15.0, 12.0, 14.0, 21.0, 29.0, 23.0, 19.0, 31.0, 34.0, 33.0, 48.0, 40.0, 41.0, 47.0, 48.0, 62.0, 44.0, 35.0, 38.0, 42.0, 41.0, 23.0, 39.0, 36.0, 26.0, 24.0, 15.0, 18.0, 17.0, 8.0, 10.0, 9.0, 6.0, 2.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046875, -6.775390625, -6.50390625, -6.232421875, -5.9609375, -5.689453125, -5.41796875, -5.146484375, -4.875, -4.603515625, -4.33203125, -4.060546875, -3.7890625, -3.517578125, -3.24609375, -2.974609375, -2.703125, -2.431640625, -2.16015625, -1.888671875, -1.6171875, -1.345703125, -1.07421875, -0.802734375, -0.53125, -0.259765625, 0.01171875, 0.283203125, 0.5546875, 0.826171875, 1.09765625, 1.369140625, 1.640625, 1.912109375, 2.18359375, 2.455078125, 2.7265625, 2.998046875, 3.26953125, 3.541015625, 3.8125, 4.083984375, 4.35546875, 4.626953125, 4.8984375, 5.169921875, 5.44140625, 5.712890625, 5.984375, 6.255859375, 6.52734375, 6.798828125, 7.0703125, 7.341796875, 7.61328125, 7.884765625, 8.15625, 8.427734375, 8.69921875, 8.970703125, 9.2421875, 9.513671875, 9.78515625, 10.056640625, 10.328125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 4.0, 4.0, 1.0, 6.0, 6.0, 6.0, 12.0, 26.0, 31.0, 61.0, 77.0, 112.0, 170.0, 262.0, 407.0, 682.0, 1139.0, 1840.0, 3151.0, 5452.0, 10019.0, 19483.0, 42338.0, 107970.0, 374573.0, 1624338.0, 1487252.0, 334399.0, 99329.0, 39779.0, 18571.0, 9830.0, 5268.0, 3021.0, 1782.0, 1033.0, 684.0, 410.0, 260.0, 155.0, 119.0, 74.0, 52.0, 40.0, 33.0, 7.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-29.140625, -28.30712890625, -27.4736328125, -26.64013671875, -25.806640625, -24.97314453125, -24.1396484375, -23.30615234375, -22.47265625, -21.63916015625, -20.8056640625, -19.97216796875, -19.138671875, -18.30517578125, -17.4716796875, -16.63818359375, -15.8046875, -14.97119140625, -14.1376953125, -13.30419921875, -12.470703125, -11.63720703125, -10.8037109375, -9.97021484375, -9.13671875, -8.30322265625, -7.4697265625, -6.63623046875, -5.802734375, -4.96923828125, -4.1357421875, -3.30224609375, -2.46875, -1.63525390625, -0.8017578125, 0.03173828125, 0.865234375, 1.69873046875, 2.5322265625, 3.36572265625, 4.19921875, 5.03271484375, 5.8662109375, 6.69970703125, 7.533203125, 8.36669921875, 9.2001953125, 10.03369140625, 10.8671875, 11.70068359375, 12.5341796875, 13.36767578125, 14.201171875, 15.03466796875, 15.8681640625, 16.70166015625, 17.53515625, 18.36865234375, 19.2021484375, 20.03564453125, 20.869140625, 21.70263671875, 22.5361328125, 23.36962890625, 24.203125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 3.0, 19.0, 14.0, 19.0, 33.0, 44.0, 58.0, 60.0, 74.0, 122.0, 188.0, 256.0, 315.0, 362.0, 436.0, 412.0, 373.0, 330.0, 228.0, 167.0, 143.0, 88.0, 69.0, 48.0, 41.0, 29.0, 21.0, 20.0, 12.0, 17.0, 11.0, 13.0, 9.0, 5.0, 1.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.0625, -5.87847900390625, -5.6944580078125, -5.51043701171875, -5.326416015625, -5.14239501953125, -4.9583740234375, -4.77435302734375, -4.59033203125, -4.40631103515625, -4.2222900390625, -4.03826904296875, -3.854248046875, -3.67022705078125, -3.4862060546875, -3.30218505859375, -3.1181640625, -2.93414306640625, -2.7501220703125, -2.56610107421875, -2.382080078125, -2.19805908203125, -2.0140380859375, -1.83001708984375, -1.64599609375, -1.46197509765625, -1.2779541015625, -1.09393310546875, -0.909912109375, -0.72589111328125, -0.5418701171875, -0.35784912109375, -0.173828125, 0.01019287109375, 0.1942138671875, 0.37823486328125, 0.562255859375, 0.74627685546875, 0.9302978515625, 1.11431884765625, 1.29833984375, 1.48236083984375, 1.6663818359375, 1.85040283203125, 2.034423828125, 2.21844482421875, 2.4024658203125, 2.58648681640625, 2.7705078125, 2.95452880859375, 3.1385498046875, 3.32257080078125, 3.506591796875, 3.69061279296875, 3.8746337890625, 4.05865478515625, 4.24267578125, 4.42669677734375, 4.6107177734375, 4.79473876953125, 4.978759765625, 5.16278076171875, 5.3468017578125, 5.53082275390625, 5.71484375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 5.0, 2.0, 4.0, 4.0, 9.0, 10.0, 17.0, 22.0, 26.0, 31.0, 48.0, 55.0, 74.0, 86.0, 97.0, 70.0, 89.0, 69.0, 65.0, 49.0, 32.0, 43.0, 30.0, 14.0, 14.0, 12.0, 3.0, 9.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.391027450561523, -20.763254165649414, -20.135480880737305, -19.507709503173828, -18.87993621826172, -18.25216293334961, -17.6243896484375, -16.99661636352539, -16.368844985961914, -15.741071701049805, -15.113299369812012, -14.485526084899902, -13.85775375366211, -13.22998046875, -12.60220718383789, -11.974434852600098, -11.346661567687988, -10.718888282775879, -10.091115951538086, -9.463342666625977, -8.835570335388184, -8.207797050476074, -7.580024242401123, -6.952251434326172, -6.324478626251221, -5.6967058181762695, -5.068933010101318, -4.441160202026367, -3.813387155532837, -3.1856143474578857, -2.5578413009643555, -1.9300684928894043, -1.3022956848144531, -0.6745228171348572, -0.04674994945526123, 0.5810229778289795, 1.2087957859039307, 1.8365685939788818, 2.464341640472412, 3.0921144485473633, 3.7198872566223145, 4.347660064697266, 4.975432872772217, 5.603205680847168, 6.230978965759277, 6.85875129699707, 7.48652458190918, 8.114297866821289, 8.742070198059082, 9.369843482971191, 9.997615814208984, 10.625389099121094, 11.253161430358887, 11.880934715270996, 12.508707046508789, 13.136480331420898, 13.764253616333008, 14.392026901245117, 15.01979923248291, 15.64757251739502, 16.275344848632812, 16.903118133544922, 17.53089141845703, 18.15866470336914, 18.786436080932617]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 7.0, 10.0, 11.0, 6.0, 12.0, 15.0, 20.0, 18.0, 22.0, 24.0, 33.0, 37.0, 38.0, 40.0, 41.0, 49.0, 35.0, 32.0, 41.0, 41.0, 41.0, 29.0, 47.0, 46.0, 38.0, 35.0, 31.0, 28.0, 29.0, 25.0, 19.0, 20.0, 13.0, 11.0, 14.0, 14.0, 7.0, 9.0, 5.0, 8.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.964448928833008, -10.612944602966309, -10.261439323425293, -9.909934997558594, -9.558429718017578, -9.206925392150879, -8.85542106628418, -8.503915786743164, -8.152411460876465, -7.800906658172607, -7.44940185546875, -7.097897529602051, -6.746392726898193, -6.394887924194336, -6.0433831214904785, -5.691878318786621, -5.340373516082764, -4.988868713378906, -4.637363910675049, -4.285859107971191, -3.934354782104492, -3.5828499794006348, -3.2313451766967773, -2.879840612411499, -2.5283358097076416, -2.176831007003784, -1.8253264427185059, -1.4738216400146484, -1.1223169565200806, -0.7708122730255127, -0.4193074703216553, -0.06780290603637695, 0.28370189666748047, 0.6352065801620483, 0.986711323261261, 1.3382160663604736, 1.6897207498550415, 2.0412254333496094, 2.392730236053467, 2.744234800338745, 3.0957396030426025, 3.44724440574646, 3.7987489700317383, 4.150253772735596, 4.501758575439453, 4.853262901306152, 5.204768180847168, 5.556272506713867, 5.907777309417725, 6.259282112121582, 6.6107869148254395, 6.962291717529297, 7.313796043395996, 7.6653008460998535, 8.016805648803711, 8.36830997467041, 8.719815254211426, 9.071319580078125, 9.42282485961914, 9.77432918548584, 10.125834465026855, 10.477338790893555, 10.82884407043457, 11.18034839630127, 11.531852722167969]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 7.0, 4.0, 12.0, 17.0, 22.0, 30.0, 44.0, 63.0, 101.0, 195.0, 278.0, 434.0, 722.0, 1207.0, 2200.0, 4099.0, 7764.0, 16456.0, 37332.0, 101118.0, 327947.0, 359878.0, 112214.0, 40658.0, 17488.0, 8283.0, 4324.0, 2299.0, 1281.0, 786.0, 470.0, 294.0, 167.0, 129.0, 84.0, 43.0, 37.0, 21.0, 12.0, 14.0, 10.0, 8.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1953125, -3.088958740234375, -2.98260498046875, -2.876251220703125, -2.7698974609375, -2.663543701171875, -2.55718994140625, -2.450836181640625, -2.344482421875, -2.238128662109375, -2.13177490234375, -2.025421142578125, -1.9190673828125, -1.812713623046875, -1.70635986328125, -1.600006103515625, -1.49365234375, -1.387298583984375, -1.28094482421875, -1.174591064453125, -1.0682373046875, -0.961883544921875, -0.85552978515625, -0.749176025390625, -0.642822265625, -0.536468505859375, -0.43011474609375, -0.323760986328125, -0.2174072265625, -0.111053466796875, -0.00469970703125, 0.101654052734375, 0.2080078125, 0.314361572265625, 0.42071533203125, 0.527069091796875, 0.6334228515625, 0.739776611328125, 0.84613037109375, 0.952484130859375, 1.058837890625, 1.165191650390625, 1.27154541015625, 1.377899169921875, 1.4842529296875, 1.590606689453125, 1.69696044921875, 1.803314208984375, 1.90966796875, 2.016021728515625, 2.12237548828125, 2.228729248046875, 2.3350830078125, 2.441436767578125, 2.54779052734375, 2.654144287109375, 2.760498046875, 2.866851806640625, 2.97320556640625, 3.079559326171875, 3.1859130859375, 3.292266845703125, 3.39862060546875, 3.504974365234375, 3.611328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 10.0, 10.0, 14.0, 12.0, 14.0, 15.0, 28.0, 31.0, 35.0, 38.0, 38.0, 43.0, 45.0, 38.0, 43.0, 42.0, 43.0, 37.0, 45.0, 49.0, 44.0, 40.0, 28.0, 37.0, 40.0, 16.0, 26.0, 17.0, 18.0, 16.0, 16.0, 11.0, 13.0, 8.0, 12.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.4453125, -12.0531005859375, -11.660888671875, -11.2686767578125, -10.87646484375, -10.4842529296875, -10.092041015625, -9.6998291015625, -9.3076171875, -8.9154052734375, -8.523193359375, -8.1309814453125, -7.73876953125, -7.3465576171875, -6.954345703125, -6.5621337890625, -6.169921875, -5.7777099609375, -5.385498046875, -4.9932861328125, -4.60107421875, -4.2088623046875, -3.816650390625, -3.4244384765625, -3.0322265625, -2.6400146484375, -2.247802734375, -1.8555908203125, -1.46337890625, -1.0711669921875, -0.678955078125, -0.2867431640625, 0.10546875, 0.4976806640625, 0.889892578125, 1.2821044921875, 1.67431640625, 2.0665283203125, 2.458740234375, 2.8509521484375, 3.2431640625, 3.6353759765625, 4.027587890625, 4.4197998046875, 4.81201171875, 5.2042236328125, 5.596435546875, 5.9886474609375, 6.380859375, 6.7730712890625, 7.165283203125, 7.5574951171875, 7.94970703125, 8.3419189453125, 8.734130859375, 9.1263427734375, 9.5185546875, 9.9107666015625, 10.302978515625, 10.6951904296875, 11.08740234375, 11.4796142578125, 11.871826171875, 12.2640380859375, 12.65625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 9.0, 9.0, 13.0, 21.0, 22.0, 30.0, 58.0, 60.0, 103.0, 136.0, 223.0, 311.0, 470.0, 769.0, 1212.0, 1930.0, 3387.0, 6834.0, 16266.0, 77220.0, 886076.0, 30709.0, 10672.0, 4907.0, 2707.0, 1539.0, 953.0, 605.0, 430.0, 275.0, 165.0, 117.0, 86.0, 51.0, 44.0, 40.0, 23.0, 24.0, 10.0, 11.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.359375, -8.100341796875, -7.84130859375, -7.582275390625, -7.3232421875, -7.064208984375, -6.80517578125, -6.546142578125, -6.287109375, -6.028076171875, -5.76904296875, -5.510009765625, -5.2509765625, -4.991943359375, -4.73291015625, -4.473876953125, -4.21484375, -3.955810546875, -3.69677734375, -3.437744140625, -3.1787109375, -2.919677734375, -2.66064453125, -2.401611328125, -2.142578125, -1.883544921875, -1.62451171875, -1.365478515625, -1.1064453125, -0.847412109375, -0.58837890625, -0.329345703125, -0.0703125, 0.188720703125, 0.44775390625, 0.706787109375, 0.9658203125, 1.224853515625, 1.48388671875, 1.742919921875, 2.001953125, 2.260986328125, 2.52001953125, 2.779052734375, 3.0380859375, 3.297119140625, 3.55615234375, 3.815185546875, 4.07421875, 4.333251953125, 4.59228515625, 4.851318359375, 5.1103515625, 5.369384765625, 5.62841796875, 5.887451171875, 6.146484375, 6.405517578125, 6.66455078125, 6.923583984375, 7.1826171875, 7.441650390625, 7.70068359375, 7.959716796875, 8.21875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 5.0, 4.0, 13.0, 7.0, 8.0, 9.0, 20.0, 30.0, 17.0, 28.0, 29.0, 33.0, 28.0, 33.0, 53.0, 43.0, 28.0, 40.0, 53.0, 35.0, 41.0, 44.0, 37.0, 27.0, 31.0, 38.0, 22.0, 24.0, 28.0, 26.0, 29.0, 17.0, 21.0, 17.0, 10.0, 8.0, 14.0, 3.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.890625, -6.67822265625, -6.4658203125, -6.25341796875, -6.041015625, -5.82861328125, -5.6162109375, -5.40380859375, -5.19140625, -4.97900390625, -4.7666015625, -4.55419921875, -4.341796875, -4.12939453125, -3.9169921875, -3.70458984375, -3.4921875, -3.27978515625, -3.0673828125, -2.85498046875, -2.642578125, -2.43017578125, -2.2177734375, -2.00537109375, -1.79296875, -1.58056640625, -1.3681640625, -1.15576171875, -0.943359375, -0.73095703125, -0.5185546875, -0.30615234375, -0.09375, 0.11865234375, 0.3310546875, 0.54345703125, 0.755859375, 0.96826171875, 1.1806640625, 1.39306640625, 1.60546875, 1.81787109375, 2.0302734375, 2.24267578125, 2.455078125, 2.66748046875, 2.8798828125, 3.09228515625, 3.3046875, 3.51708984375, 3.7294921875, 3.94189453125, 4.154296875, 4.36669921875, 4.5791015625, 4.79150390625, 5.00390625, 5.21630859375, 5.4287109375, 5.64111328125, 5.853515625, 6.06591796875, 6.2783203125, 6.49072265625, 6.703125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 3.0, 11.0, 6.0, 9.0, 11.0, 14.0, 17.0, 33.0, 35.0, 52.0, 53.0, 94.0, 110.0, 187.0, 260.0, 404.0, 605.0, 952.0, 1665.0, 2884.0, 6086.0, 14469.0, 72995.0, 902989.0, 26079.0, 8715.0, 4067.0, 2148.0, 1255.0, 795.0, 542.0, 305.0, 185.0, 123.0, 111.0, 69.0, 55.0, 38.0, 25.0, 24.0, 18.0, 19.0, 11.0, 10.0, 6.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.822265625, -1.7657623291015625, -1.709259033203125, -1.6527557373046875, -1.59625244140625, -1.5397491455078125, -1.483245849609375, -1.4267425537109375, -1.3702392578125, -1.3137359619140625, -1.257232666015625, -1.2007293701171875, -1.14422607421875, -1.0877227783203125, -1.031219482421875, -0.9747161865234375, -0.918212890625, -0.8617095947265625, -0.805206298828125, -0.7487030029296875, -0.69219970703125, -0.6356964111328125, -0.579193115234375, -0.5226898193359375, -0.4661865234375, -0.4096832275390625, -0.353179931640625, -0.2966766357421875, -0.24017333984375, -0.1836700439453125, -0.127166748046875, -0.0706634521484375, -0.01416015625, 0.0423431396484375, 0.098846435546875, 0.1553497314453125, 0.21185302734375, 0.2683563232421875, 0.324859619140625, 0.3813629150390625, 0.4378662109375, 0.4943695068359375, 0.550872802734375, 0.6073760986328125, 0.66387939453125, 0.7203826904296875, 0.776885986328125, 0.8333892822265625, 0.889892578125, 0.9463958740234375, 1.002899169921875, 1.0594024658203125, 1.11590576171875, 1.1724090576171875, 1.228912353515625, 1.2854156494140625, 1.3419189453125, 1.3984222412109375, 1.454925537109375, 1.5114288330078125, 1.56793212890625, 1.6244354248046875, 1.680938720703125, 1.7374420166015625, 1.7939453125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 7.0, 7.0, 9.0, 5.0, 20.0, 21.0, 43.0, 51.0, 65.0, 102.0, 106.0, 112.0, 96.0, 84.0, 71.0, 58.0, 34.0, 29.0, 22.0, 13.0, 11.0, 9.0, 9.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.52346420288086e-05, -8.202530443668365e-05, -7.881596684455872e-05, -7.560662925243378e-05, -7.239729166030884e-05, -6.91879540681839e-05, -6.597861647605896e-05, -6.276927888393402e-05, -5.955994129180908e-05, -5.635060369968414e-05, -5.3141266107559204e-05, -4.9931928515434265e-05, -4.6722590923309326e-05, -4.351325333118439e-05, -4.030391573905945e-05, -3.709457814693451e-05, -3.388524055480957e-05, -3.067590296268463e-05, -2.7466565370559692e-05, -2.4257227778434753e-05, -2.1047890186309814e-05, -1.7838552594184875e-05, -1.4629215002059937e-05, -1.1419877409934998e-05, -8.210539817810059e-06, -5.00120222568512e-06, -1.7918646335601807e-06, 1.4174729585647583e-06, 4.626810550689697e-06, 7.836148142814636e-06, 1.1045485734939575e-05, 1.4254823327064514e-05, 1.7464160919189453e-05, 2.0673498511314392e-05, 2.388283610343933e-05, 2.709217369556427e-05, 3.030151128768921e-05, 3.351084887981415e-05, 3.672018647193909e-05, 3.9929524064064026e-05, 4.3138861656188965e-05, 4.6348199248313904e-05, 4.955753684043884e-05, 5.276687443256378e-05, 5.597621202468872e-05, 5.918554961681366e-05, 6.23948872089386e-05, 6.560422480106354e-05, 6.881356239318848e-05, 7.202289998531342e-05, 7.523223757743835e-05, 7.84415751695633e-05, 8.165091276168823e-05, 8.486025035381317e-05, 8.806958794593811e-05, 9.127892553806305e-05, 9.448826313018799e-05, 9.769760072231293e-05, 0.00010090693831443787, 0.0001041162759065628, 0.00010732561349868774, 0.00011053495109081268, 0.00011374428868293762, 0.00011695362627506256, 0.0001201629638671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 12.0, 5.0, 19.0, 12.0, 23.0, 43.0, 35.0, 54.0, 85.0, 113.0, 179.0, 226.0, 353.0, 538.0, 804.0, 1279.0, 1993.0, 3524.0, 6345.0, 12133.0, 24820.0, 57555.0, 165692.0, 441438.0, 204679.0, 67031.0, 28557.0, 13707.0, 7160.0, 3898.0, 2315.0, 1388.0, 853.0, 539.0, 370.0, 215.0, 160.0, 107.0, 79.0, 65.0, 38.0, 39.0, 19.0, 19.0, 12.0, 5.0, 4.0, 6.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.71728515625, -0.6938323974609375, -0.670379638671875, -0.6469268798828125, -0.62347412109375, -0.6000213623046875, -0.576568603515625, -0.5531158447265625, -0.5296630859375, -0.5062103271484375, -0.482757568359375, -0.4593048095703125, -0.43585205078125, -0.4123992919921875, -0.388946533203125, -0.3654937744140625, -0.342041015625, -0.3185882568359375, -0.295135498046875, -0.2716827392578125, -0.24822998046875, -0.2247772216796875, -0.201324462890625, -0.1778717041015625, -0.1544189453125, -0.1309661865234375, -0.107513427734375, -0.0840606689453125, -0.06060791015625, -0.0371551513671875, -0.013702392578125, 0.0097503662109375, 0.033203125, 0.0566558837890625, 0.080108642578125, 0.1035614013671875, 0.12701416015625, 0.1504669189453125, 0.173919677734375, 0.1973724365234375, 0.2208251953125, 0.2442779541015625, 0.267730712890625, 0.2911834716796875, 0.31463623046875, 0.3380889892578125, 0.361541748046875, 0.3849945068359375, 0.408447265625, 0.4319000244140625, 0.455352783203125, 0.4788055419921875, 0.50225830078125, 0.5257110595703125, 0.549163818359375, 0.5726165771484375, 0.5960693359375, 0.6195220947265625, 0.642974853515625, 0.6664276123046875, 0.68988037109375, 0.7133331298828125, 0.736785888671875, 0.7602386474609375, 0.78369140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 15.0, 15.0, 28.0, 33.0, 39.0, 41.0, 61.0, 94.0, 101.0, 116.0, 96.0, 93.0, 66.0, 45.0, 48.0, 22.0, 19.0, 22.0, 13.0, 7.0, 8.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1453857421875, -0.1401042938232422, -0.13482284545898438, -0.12954139709472656, -0.12425994873046875, -0.11897850036621094, -0.11369705200195312, -0.10841560363769531, -0.1031341552734375, -0.09785270690917969, -0.09257125854492188, -0.08728981018066406, -0.08200836181640625, -0.07672691345214844, -0.07144546508789062, -0.06616401672363281, -0.060882568359375, -0.05560111999511719, -0.050319671630859375, -0.04503822326660156, -0.03975677490234375, -0.03447532653808594, -0.029193878173828125, -0.023912429809570312, -0.0186309814453125, -0.013349533081054688, -0.008068084716796875, -0.0027866363525390625, 0.00249481201171875, 0.0077762603759765625, 0.013057708740234375, 0.018339157104492188, 0.02362060546875, 0.028902053833007812, 0.034183502197265625, 0.03946495056152344, 0.04474639892578125, 0.05002784729003906, 0.055309295654296875, 0.06059074401855469, 0.0658721923828125, 0.07115364074707031, 0.07643508911132812, 0.08171653747558594, 0.08699798583984375, 0.09227943420410156, 0.09756088256835938, 0.10284233093261719, 0.108123779296875, 0.11340522766113281, 0.11868667602539062, 0.12396812438964844, 0.12924957275390625, 0.13453102111816406, 0.13981246948242188, 0.1450939178466797, 0.1503753662109375, 0.1556568145751953, 0.16093826293945312, 0.16621971130371094, 0.17150115966796875, 0.17678260803222656, 0.18206405639648438, 0.1873455047607422, 0.192626953125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 7.0, 9.0, 17.0, 18.0, 23.0, 32.0, 31.0, 55.0, 66.0, 87.0, 90.0, 76.0, 87.0, 79.0, 63.0, 55.0, 46.0, 30.0, 36.0, 26.0, 17.0, 11.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.638803482055664, -21.012712478637695, -20.386619567871094, -19.760528564453125, -19.134437561035156, -18.508346557617188, -17.88225555419922, -17.256162643432617, -16.63007164001465, -16.00398063659668, -15.377888679504395, -14.75179672241211, -14.12570571899414, -13.499614715576172, -12.873522758483887, -12.247430801391602, -11.621339797973633, -10.995248794555664, -10.369156837463379, -9.743064880371094, -9.116973876953125, -8.490882873535156, -7.864790916442871, -7.238699436187744, -6.612607955932617, -5.98651647567749, -5.360424995422363, -4.734333515167236, -4.108242034912109, -3.4821505546569824, -2.8560590744018555, -2.2299675941467285, -1.6038742065429688, -0.9777827262878418, -0.35169124603271484, 0.2744002342224121, 0.9004917144775391, 1.526583194732666, 2.152674674987793, 2.77876615524292, 3.404857635498047, 4.030949115753174, 4.657040596008301, 5.283132076263428, 5.909223556518555, 6.535315036773682, 7.161406517028809, 7.7874979972839355, 8.413589477539062, 9.039680480957031, 9.665772438049316, 10.291864395141602, 10.91795539855957, 11.544046401977539, 12.170138359069824, 12.79623031616211, 13.422321319580078, 14.048412322998047, 14.674504280090332, 15.300596237182617, 15.926687240600586, 16.552778244018555, 17.178871154785156, 17.804962158203125, 18.431053161621094]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 1.0, 7.0, 10.0, 10.0, 5.0, 13.0, 16.0, 19.0, 18.0, 22.0, 25.0, 31.0, 37.0, 37.0, 42.0, 36.0, 49.0, 39.0, 33.0, 40.0, 41.0, 41.0, 31.0, 44.0, 45.0, 42.0, 34.0, 33.0, 28.0, 30.0, 22.0, 20.0, 20.0, 13.0, 11.0, 12.0, 14.0, 9.0, 8.0, 6.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.989212989807129, -10.639248847961426, -10.289283752441406, -9.939319610595703, -9.58935546875, -9.239391326904297, -8.889427185058594, -8.539462089538574, -8.189497947692871, -7.839533805847168, -7.489569187164307, -7.139604568481445, -6.789640426635742, -6.439676284790039, -6.089711666107178, -5.739747047424316, -5.389782905578613, -5.03981876373291, -4.689854145050049, -4.3398895263671875, -3.9899253845214844, -3.639961004257202, -3.28999662399292, -2.9400322437286377, -2.5900678634643555, -2.2401034832000732, -1.890139102935791, -1.5401747226715088, -1.1902103424072266, -0.8402459621429443, -0.4902815818786621, -0.14031720161437988, 0.20964717864990234, 0.5596115589141846, 0.9095759391784668, 1.259540319442749, 1.6095046997070312, 1.9594690799713135, 2.3094334602355957, 2.659397840499878, 3.00936222076416, 3.3593266010284424, 3.7092909812927246, 4.059255599975586, 4.409219741821289, 4.759183883666992, 5.1091485023498535, 5.459113121032715, 5.809077262878418, 6.159041404724121, 6.509006023406982, 6.858970642089844, 7.208934783935547, 7.55889892578125, 7.908863544464111, 8.258828163146973, 8.608792304992676, 8.958756446838379, 9.308721542358398, 9.658685684204102, 10.008649826049805, 10.358613967895508, 10.708578109741211, 11.05854320526123, 11.408507347106934]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 11.0, 16.0, 13.0, 27.0, 54.0, 79.0, 115.0, 150.0, 243.0, 352.0, 546.0, 902.0, 1358.0, 2034.0, 3412.0, 5581.0, 9774.0, 17305.0, 32833.0, 70718.0, 166962.0, 307939.0, 231285.0, 99250.0, 44767.0, 22249.0, 12210.0, 7019.0, 4114.0, 2587.0, 1659.0, 1016.0, 681.0, 397.0, 289.0, 193.0, 138.0, 88.0, 64.0, 40.0, 25.0, 16.0, 13.0, 9.0, 7.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.15625, -19.5205078125, -18.884765625, -18.2490234375, -17.61328125, -16.9775390625, -16.341796875, -15.7060546875, -15.0703125, -14.4345703125, -13.798828125, -13.1630859375, -12.52734375, -11.8916015625, -11.255859375, -10.6201171875, -9.984375, -9.3486328125, -8.712890625, -8.0771484375, -7.44140625, -6.8056640625, -6.169921875, -5.5341796875, -4.8984375, -4.2626953125, -3.626953125, -2.9912109375, -2.35546875, -1.7197265625, -1.083984375, -0.4482421875, 0.1875, 0.8232421875, 1.458984375, 2.0947265625, 2.73046875, 3.3662109375, 4.001953125, 4.6376953125, 5.2734375, 5.9091796875, 6.544921875, 7.1806640625, 7.81640625, 8.4521484375, 9.087890625, 9.7236328125, 10.359375, 10.9951171875, 11.630859375, 12.2666015625, 12.90234375, 13.5380859375, 14.173828125, 14.8095703125, 15.4453125, 16.0810546875, 16.716796875, 17.3525390625, 17.98828125, 18.6240234375, 19.259765625, 19.8955078125, 20.53125]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 3.0, 10.0, 6.0, 4.0, 9.0, 13.0, 21.0, 19.0, 20.0, 25.0, 23.0, 37.0, 32.0, 47.0, 36.0, 47.0, 42.0, 31.0, 44.0, 40.0, 37.0, 42.0, 39.0, 51.0, 40.0, 39.0, 39.0, 27.0, 32.0, 31.0, 21.0, 9.0, 16.0, 14.0, 10.0, 11.0, 12.0, 6.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.156005859375, -10.78076171875, -10.405517578125, -10.0302734375, -9.655029296875, -9.27978515625, -8.904541015625, -8.529296875, -8.154052734375, -7.77880859375, -7.403564453125, -7.0283203125, -6.653076171875, -6.27783203125, -5.902587890625, -5.52734375, -5.152099609375, -4.77685546875, -4.401611328125, -4.0263671875, -3.651123046875, -3.27587890625, -2.900634765625, -2.525390625, -2.150146484375, -1.77490234375, -1.399658203125, -1.0244140625, -0.649169921875, -0.27392578125, 0.101318359375, 0.4765625, 0.851806640625, 1.22705078125, 1.602294921875, 1.9775390625, 2.352783203125, 2.72802734375, 3.103271484375, 3.478515625, 3.853759765625, 4.22900390625, 4.604248046875, 4.9794921875, 5.354736328125, 5.72998046875, 6.105224609375, 6.48046875, 6.855712890625, 7.23095703125, 7.606201171875, 7.9814453125, 8.356689453125, 8.73193359375, 9.107177734375, 9.482421875, 9.857666015625, 10.23291015625, 10.608154296875, 10.9833984375, 11.358642578125, 11.73388671875, 12.109130859375, 12.484375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 10.0, 17.0, 17.0, 45.0, 50.0, 58.0, 101.0, 129.0, 184.0, 236.0, 376.0, 568.0, 873.0, 1311.0, 2049.0, 3169.0, 5287.0, 9233.0, 15911.0, 29088.0, 56978.0, 116787.0, 222139.0, 259801.0, 158534.0, 77409.0, 38598.0, 20386.0, 11418.0, 6538.0, 3869.0, 2500.0, 1639.0, 1020.0, 701.0, 483.0, 327.0, 234.0, 138.0, 96.0, 76.0, 57.0, 37.0, 30.0, 16.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.328125, -17.740966796875, -17.15380859375, -16.566650390625, -15.9794921875, -15.392333984375, -14.80517578125, -14.218017578125, -13.630859375, -13.043701171875, -12.45654296875, -11.869384765625, -11.2822265625, -10.695068359375, -10.10791015625, -9.520751953125, -8.93359375, -8.346435546875, -7.75927734375, -7.172119140625, -6.5849609375, -5.997802734375, -5.41064453125, -4.823486328125, -4.236328125, -3.649169921875, -3.06201171875, -2.474853515625, -1.8876953125, -1.300537109375, -0.71337890625, -0.126220703125, 0.4609375, 1.048095703125, 1.63525390625, 2.222412109375, 2.8095703125, 3.396728515625, 3.98388671875, 4.571044921875, 5.158203125, 5.745361328125, 6.33251953125, 6.919677734375, 7.5068359375, 8.093994140625, 8.68115234375, 9.268310546875, 9.85546875, 10.442626953125, 11.02978515625, 11.616943359375, 12.2041015625, 12.791259765625, 13.37841796875, 13.965576171875, 14.552734375, 15.139892578125, 15.72705078125, 16.314208984375, 16.9013671875, 17.488525390625, 18.07568359375, 18.662841796875, 19.25]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 9.0, 5.0, 7.0, 13.0, 6.0, 4.0, 11.0, 19.0, 21.0, 28.0, 19.0, 31.0, 32.0, 29.0, 38.0, 38.0, 52.0, 42.0, 35.0, 38.0, 41.0, 45.0, 35.0, 45.0, 46.0, 36.0, 54.0, 32.0, 33.0, 33.0, 27.0, 21.0, 18.0, 13.0, 9.0, 8.0, 8.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.10870361328125, -6.8775634765625, -6.64642333984375, -6.415283203125, -6.18414306640625, -5.9530029296875, -5.72186279296875, -5.49072265625, -5.25958251953125, -5.0284423828125, -4.79730224609375, -4.566162109375, -4.33502197265625, -4.1038818359375, -3.87274169921875, -3.6416015625, -3.41046142578125, -3.1793212890625, -2.94818115234375, -2.717041015625, -2.48590087890625, -2.2547607421875, -2.02362060546875, -1.79248046875, -1.56134033203125, -1.3302001953125, -1.09906005859375, -0.867919921875, -0.63677978515625, -0.4056396484375, -0.17449951171875, 0.056640625, 0.28778076171875, 0.5189208984375, 0.75006103515625, 0.981201171875, 1.21234130859375, 1.4434814453125, 1.67462158203125, 1.90576171875, 2.13690185546875, 2.3680419921875, 2.59918212890625, 2.830322265625, 3.06146240234375, 3.2926025390625, 3.52374267578125, 3.7548828125, 3.98602294921875, 4.2171630859375, 4.44830322265625, 4.679443359375, 4.91058349609375, 5.1417236328125, 5.37286376953125, 5.60400390625, 5.83514404296875, 6.0662841796875, 6.29742431640625, 6.528564453125, 6.75970458984375, 6.9908447265625, 7.22198486328125, 7.453125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 5.0, 2.0, 3.0, 10.0, 21.0, 27.0, 31.0, 59.0, 84.0, 111.0, 205.0, 296.0, 402.0, 510.0, 775.0, 1075.0, 1604.0, 2426.0, 3898.0, 6582.0, 11863.0, 23247.0, 53327.0, 145915.0, 361184.0, 264978.0, 92024.0, 36595.0, 17299.0, 9186.0, 5159.0, 3119.0, 2106.0, 1329.0, 970.0, 633.0, 459.0, 344.0, 220.0, 162.0, 109.0, 54.0, 52.0, 26.0, 27.0, 17.0, 13.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.125, -13.63427734375, -13.1435546875, -12.65283203125, -12.162109375, -11.67138671875, -11.1806640625, -10.68994140625, -10.19921875, -9.70849609375, -9.2177734375, -8.72705078125, -8.236328125, -7.74560546875, -7.2548828125, -6.76416015625, -6.2734375, -5.78271484375, -5.2919921875, -4.80126953125, -4.310546875, -3.81982421875, -3.3291015625, -2.83837890625, -2.34765625, -1.85693359375, -1.3662109375, -0.87548828125, -0.384765625, 0.10595703125, 0.5966796875, 1.08740234375, 1.578125, 2.06884765625, 2.5595703125, 3.05029296875, 3.541015625, 4.03173828125, 4.5224609375, 5.01318359375, 5.50390625, 5.99462890625, 6.4853515625, 6.97607421875, 7.466796875, 7.95751953125, 8.4482421875, 8.93896484375, 9.4296875, 9.92041015625, 10.4111328125, 10.90185546875, 11.392578125, 11.88330078125, 12.3740234375, 12.86474609375, 13.35546875, 13.84619140625, 14.3369140625, 14.82763671875, 15.318359375, 15.80908203125, 16.2998046875, 16.79052734375, 17.28125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 6.0, 6.0, 13.0, 17.0, 9.0, 34.0, 52.0, 87.0, 151.0, 181.0, 153.0, 116.0, 57.0, 33.0, 21.0, 10.0, 9.0, 10.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0026874542236328125, -0.002614140510559082, -0.0025408267974853516, -0.002467513084411621, -0.0023941993713378906, -0.00232088565826416, -0.0022475719451904297, -0.0021742582321166992, -0.0021009445190429688, -0.0020276308059692383, -0.001954317092895508, -0.0018810033798217773, -0.0018076896667480469, -0.0017343759536743164, -0.001661062240600586, -0.0015877485275268555, -0.001514434814453125, -0.0014411211013793945, -0.001367807388305664, -0.0012944936752319336, -0.0012211799621582031, -0.0011478662490844727, -0.0010745525360107422, -0.0010012388229370117, -0.0009279251098632812, -0.0008546113967895508, -0.0007812976837158203, -0.0007079839706420898, -0.0006346702575683594, -0.0005613565444946289, -0.00048804283142089844, -0.00041472911834716797, -0.0003414154052734375, -0.00026810169219970703, -0.00019478797912597656, -0.0001214742660522461, -4.8160552978515625e-05, 2.5153160095214844e-05, 9.846687316894531e-05, 0.00017178058624267578, 0.00024509429931640625, 0.0003184080123901367, 0.0003917217254638672, 0.00046503543853759766, 0.0005383491516113281, 0.0006116628646850586, 0.0006849765777587891, 0.0007582902908325195, 0.00083160400390625, 0.0009049177169799805, 0.000978231430053711, 0.0010515451431274414, 0.0011248588562011719, 0.0011981725692749023, 0.0012714862823486328, 0.0013447999954223633, 0.0014181137084960938, 0.0014914274215698242, 0.0015647411346435547, 0.0016380548477172852, 0.0017113685607910156, 0.001784682273864746, 0.0018579959869384766, 0.001931309700012207, 0.0020046234130859375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 7.0, 15.0, 22.0, 37.0, 39.0, 61.0, 79.0, 119.0, 176.0, 225.0, 355.0, 436.0, 648.0, 949.0, 1473.0, 2348.0, 3851.0, 6599.0, 12102.0, 24571.0, 55136.0, 132238.0, 274642.0, 280079.0, 138797.0, 57547.0, 25798.0, 12470.0, 6773.0, 3868.0, 2266.0, 1594.0, 1010.0, 678.0, 426.0, 334.0, 226.0, 154.0, 124.0, 73.0, 57.0, 50.0, 30.0, 32.0, 11.0, 9.0, 9.0, 1.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.5, -9.18359375, -8.8671875, -8.55078125, -8.234375, -7.91796875, -7.6015625, -7.28515625, -6.96875, -6.65234375, -6.3359375, -6.01953125, -5.703125, -5.38671875, -5.0703125, -4.75390625, -4.4375, -4.12109375, -3.8046875, -3.48828125, -3.171875, -2.85546875, -2.5390625, -2.22265625, -1.90625, -1.58984375, -1.2734375, -0.95703125, -0.640625, -0.32421875, -0.0078125, 0.30859375, 0.625, 0.94140625, 1.2578125, 1.57421875, 1.890625, 2.20703125, 2.5234375, 2.83984375, 3.15625, 3.47265625, 3.7890625, 4.10546875, 4.421875, 4.73828125, 5.0546875, 5.37109375, 5.6875, 6.00390625, 6.3203125, 6.63671875, 6.953125, 7.26953125, 7.5859375, 7.90234375, 8.21875, 8.53515625, 8.8515625, 9.16796875, 9.484375, 9.80078125, 10.1171875, 10.43359375, 10.75]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 4.0, 9.0, 7.0, 17.0, 13.0, 18.0, 19.0, 30.0, 37.0, 35.0, 49.0, 49.0, 83.0, 70.0, 75.0, 70.0, 79.0, 59.0, 54.0, 51.0, 32.0, 26.0, 24.0, 26.0, 12.0, 8.0, 10.0, 6.0, 3.0, 6.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.322265625, -2.237945556640625, -2.15362548828125, -2.069305419921875, -1.9849853515625, -1.900665283203125, -1.81634521484375, -1.732025146484375, -1.647705078125, -1.563385009765625, -1.47906494140625, -1.394744873046875, -1.3104248046875, -1.226104736328125, -1.14178466796875, -1.057464599609375, -0.97314453125, -0.888824462890625, -0.80450439453125, -0.720184326171875, -0.6358642578125, -0.551544189453125, -0.46722412109375, -0.382904052734375, -0.298583984375, -0.214263916015625, -0.12994384765625, -0.045623779296875, 0.0386962890625, 0.123016357421875, 0.20733642578125, 0.291656494140625, 0.3759765625, 0.460296630859375, 0.54461669921875, 0.628936767578125, 0.7132568359375, 0.797576904296875, 0.88189697265625, 0.966217041015625, 1.050537109375, 1.134857177734375, 1.21917724609375, 1.303497314453125, 1.3878173828125, 1.472137451171875, 1.55645751953125, 1.640777587890625, 1.72509765625, 1.809417724609375, 1.89373779296875, 1.978057861328125, 2.0623779296875, 2.146697998046875, 2.23101806640625, 2.315338134765625, 2.399658203125, 2.483978271484375, 2.56829833984375, 2.652618408203125, 2.7369384765625, 2.821258544921875, 2.90557861328125, 2.989898681640625, 3.07421875]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 17.0, 10.0, 17.0, 20.0, 22.0, 30.0, 49.0, 52.0, 69.0, 70.0, 79.0, 60.0, 62.0, 68.0, 65.0, 53.0, 63.0, 38.0, 31.0, 27.0, 23.0, 12.0, 7.0, 14.0, 5.0, 3.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.94780921936035, -18.386795043945312, -17.825782775878906, -17.264768600463867, -16.70375633239746, -16.142742156982422, -15.5817289352417, -15.020715713500977, -14.459702491760254, -13.898689270019531, -13.337676048278809, -12.776662826538086, -12.215648651123047, -11.65463638305664, -11.093622207641602, -10.532608985900879, -9.971595764160156, -9.410582542419434, -8.849569320678711, -8.288556098937988, -7.727542400360107, -7.166529178619385, -6.605515480041504, -6.044502258300781, -5.483489036560059, -4.922475814819336, -4.361462593078613, -3.8004488945007324, -3.2394356727600098, -2.678422451019287, -2.1174089908599854, -1.5563955307006836, -0.9953842163085938, -0.43437087535858154, 0.12664246559143066, 0.6876558065414429, 1.248669147491455, 1.8096823692321777, 2.3706958293914795, 2.9317092895507812, 3.492722511291504, 4.053735733032227, 4.614748954772949, 5.17576265335083, 5.736775875091553, 6.297789096832275, 6.858802795410156, 7.419816017150879, 7.980829238891602, 8.541842460632324, 9.102855682373047, 9.66386890411377, 10.224882125854492, 10.785896301269531, 11.346909523010254, 11.907922744750977, 12.4689359664917, 13.029949188232422, 13.590962409973145, 14.151975631713867, 14.712989807128906, 15.274002075195312, 15.835016250610352, 16.39603042602539, 16.957042694091797]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 4.0, 7.0, 10.0, 12.0, 20.0, 17.0, 13.0, 11.0, 19.0, 16.0, 18.0, 26.0, 29.0, 18.0, 29.0, 34.0, 38.0, 37.0, 41.0, 48.0, 44.0, 31.0, 36.0, 36.0, 29.0, 28.0, 37.0, 42.0, 37.0, 26.0, 31.0, 24.0, 21.0, 22.0, 17.0, 15.0, 10.0, 11.0, 9.0, 4.0, 8.0, 6.0, 10.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.496525764465332, -9.181788444519043, -8.867051124572754, -8.552313804626465, -8.237576484680176, -7.922839164733887, -7.608101844787598, -7.293364524841309, -6.9786272048950195, -6.6638898849487305, -6.349152565002441, -6.034415245056152, -5.719677925109863, -5.404940605163574, -5.090203285217285, -4.775465965270996, -4.460728645324707, -4.145991325378418, -3.831254005432129, -3.51651668548584, -3.201779365539551, -2.8870420455932617, -2.5723047256469727, -2.2575674057006836, -1.9428300857543945, -1.6280927658081055, -1.3133554458618164, -0.9986181259155273, -0.6838808059692383, -0.3691434860229492, -0.054406166076660156, 0.2603311538696289, 0.575068473815918, 0.889805793762207, 1.204543113708496, 1.5192804336547852, 1.8340177536010742, 2.1487550735473633, 2.4634923934936523, 2.7782297134399414, 3.0929670333862305, 3.4077043533325195, 3.7224416732788086, 4.037178993225098, 4.351916313171387, 4.666653633117676, 4.981390953063965, 5.296128273010254, 5.610865592956543, 5.925602912902832, 6.240340232849121, 6.55507755279541, 6.869814872741699, 7.184552192687988, 7.499289512634277, 7.814026832580566, 8.128764152526855, 8.443501472473145, 8.758238792419434, 9.072976112365723, 9.387713432312012, 9.7024507522583, 10.01718807220459, 10.331925392150879, 10.646662712097168]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 3.0, 7.0, 11.0, 11.0, 23.0, 23.0, 32.0, 46.0, 54.0, 94.0, 118.0, 189.0, 289.0, 392.0, 552.0, 829.0, 1293.0, 1939.0, 3137.0, 5065.0, 9039.0, 17727.0, 40845.0, 118583.0, 432753.0, 1426083.0, 1464039.0, 465348.0, 122545.0, 41236.0, 17972.0, 9070.0, 5138.0, 3180.0, 2081.0, 1341.0, 949.0, 642.0, 464.0, 319.0, 225.0, 168.0, 114.0, 87.0, 59.0, 58.0, 31.0, 21.0, 16.0, 14.0, 8.0, 10.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-20.015625, -19.325927734375, -18.63623046875, -17.946533203125, -17.2568359375, -16.567138671875, -15.87744140625, -15.187744140625, -14.498046875, -13.808349609375, -13.11865234375, -12.428955078125, -11.7392578125, -11.049560546875, -10.35986328125, -9.670166015625, -8.98046875, -8.290771484375, -7.60107421875, -6.911376953125, -6.2216796875, -5.531982421875, -4.84228515625, -4.152587890625, -3.462890625, -2.773193359375, -2.08349609375, -1.393798828125, -0.7041015625, -0.014404296875, 0.67529296875, 1.364990234375, 2.0546875, 2.744384765625, 3.43408203125, 4.123779296875, 4.8134765625, 5.503173828125, 6.19287109375, 6.882568359375, 7.572265625, 8.261962890625, 8.95166015625, 9.641357421875, 10.3310546875, 11.020751953125, 11.71044921875, 12.400146484375, 13.08984375, 13.779541015625, 14.46923828125, 15.158935546875, 15.8486328125, 16.538330078125, 17.22802734375, 17.917724609375, 18.607421875, 19.297119140625, 19.98681640625, 20.676513671875, 21.3662109375, 22.055908203125, 22.74560546875, 23.435302734375, 24.125]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 11.0, 4.0, 9.0, 12.0, 20.0, 11.0, 14.0, 13.0, 20.0, 23.0, 25.0, 27.0, 39.0, 30.0, 36.0, 35.0, 33.0, 40.0, 48.0, 55.0, 36.0, 46.0, 36.0, 32.0, 37.0, 31.0, 32.0, 39.0, 26.0, 18.0, 28.0, 29.0, 16.0, 16.0, 16.0, 13.0, 5.0, 9.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.46875, -8.1826171875, -7.896484375, -7.6103515625, -7.32421875, -7.0380859375, -6.751953125, -6.4658203125, -6.1796875, -5.8935546875, -5.607421875, -5.3212890625, -5.03515625, -4.7490234375, -4.462890625, -4.1767578125, -3.890625, -3.6044921875, -3.318359375, -3.0322265625, -2.74609375, -2.4599609375, -2.173828125, -1.8876953125, -1.6015625, -1.3154296875, -1.029296875, -0.7431640625, -0.45703125, -0.1708984375, 0.115234375, 0.4013671875, 0.6875, 0.9736328125, 1.259765625, 1.5458984375, 1.83203125, 2.1181640625, 2.404296875, 2.6904296875, 2.9765625, 3.2626953125, 3.548828125, 3.8349609375, 4.12109375, 4.4072265625, 4.693359375, 4.9794921875, 5.265625, 5.5517578125, 5.837890625, 6.1240234375, 6.41015625, 6.6962890625, 6.982421875, 7.2685546875, 7.5546875, 7.8408203125, 8.126953125, 8.4130859375, 8.69921875, 8.9853515625, 9.271484375, 9.5576171875, 9.84375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 1.0, 3.0, 7.0, 7.0, 14.0, 27.0, 27.0, 34.0, 33.0, 70.0, 94.0, 150.0, 202.0, 249.0, 377.0, 574.0, 808.0, 1246.0, 1894.0, 3042.0, 4786.0, 7941.0, 13545.0, 23799.0, 45590.0, 96957.0, 244010.0, 735148.0, 1590932.0, 898852.0, 294284.0, 112620.0, 51694.0, 26790.0, 14883.0, 8765.0, 5332.0, 3275.0, 2084.0, 1316.0, 879.0, 581.0, 447.0, 313.0, 193.0, 104.0, 99.0, 57.0, 55.0, 37.0, 21.0, 12.0, 8.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-22.28125, -21.575927734375, -20.87060546875, -20.165283203125, -19.4599609375, -18.754638671875, -18.04931640625, -17.343994140625, -16.638671875, -15.933349609375, -15.22802734375, -14.522705078125, -13.8173828125, -13.112060546875, -12.40673828125, -11.701416015625, -10.99609375, -10.290771484375, -9.58544921875, -8.880126953125, -8.1748046875, -7.469482421875, -6.76416015625, -6.058837890625, -5.353515625, -4.648193359375, -3.94287109375, -3.237548828125, -2.5322265625, -1.826904296875, -1.12158203125, -0.416259765625, 0.2890625, 0.994384765625, 1.69970703125, 2.405029296875, 3.1103515625, 3.815673828125, 4.52099609375, 5.226318359375, 5.931640625, 6.636962890625, 7.34228515625, 8.047607421875, 8.7529296875, 9.458251953125, 10.16357421875, 10.868896484375, 11.57421875, 12.279541015625, 12.98486328125, 13.690185546875, 14.3955078125, 15.100830078125, 15.80615234375, 16.511474609375, 17.216796875, 17.922119140625, 18.62744140625, 19.332763671875, 20.0380859375, 20.743408203125, 21.44873046875, 22.154052734375, 22.859375]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 9.0, 6.0, 6.0, 9.0, 13.0, 19.0, 23.0, 26.0, 31.0, 32.0, 43.0, 55.0, 84.0, 109.0, 158.0, 202.0, 273.0, 306.0, 387.0, 386.0, 397.0, 326.0, 272.0, 211.0, 174.0, 97.0, 109.0, 68.0, 50.0, 37.0, 29.0, 34.0, 29.0, 12.0, 11.0, 13.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.87890625, -6.68572998046875, -6.4925537109375, -6.29937744140625, -6.106201171875, -5.91302490234375, -5.7198486328125, -5.52667236328125, -5.33349609375, -5.14031982421875, -4.9471435546875, -4.75396728515625, -4.560791015625, -4.36761474609375, -4.1744384765625, -3.98126220703125, -3.7880859375, -3.59490966796875, -3.4017333984375, -3.20855712890625, -3.015380859375, -2.82220458984375, -2.6290283203125, -2.43585205078125, -2.24267578125, -2.04949951171875, -1.8563232421875, -1.66314697265625, -1.469970703125, -1.27679443359375, -1.0836181640625, -0.89044189453125, -0.697265625, -0.50408935546875, -0.3109130859375, -0.11773681640625, 0.075439453125, 0.26861572265625, 0.4617919921875, 0.65496826171875, 0.84814453125, 1.04132080078125, 1.2344970703125, 1.42767333984375, 1.620849609375, 1.81402587890625, 2.0072021484375, 2.20037841796875, 2.3935546875, 2.58673095703125, 2.7799072265625, 2.97308349609375, 3.166259765625, 3.35943603515625, 3.5526123046875, 3.74578857421875, 3.93896484375, 4.13214111328125, 4.3253173828125, 4.51849365234375, 4.711669921875, 4.90484619140625, 5.0980224609375, 5.29119873046875, 5.484375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 8.0, 9.0, 7.0, 17.0, 19.0, 30.0, 25.0, 40.0, 43.0, 73.0, 64.0, 108.0, 74.0, 92.0, 73.0, 77.0, 55.0, 36.0, 37.0, 27.0, 15.0, 14.0, 14.0, 11.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.690162658691406, -21.97059440612793, -21.251026153564453, -20.531457901000977, -19.8118896484375, -19.09231948852539, -18.372751235961914, -17.653182983398438, -16.93361473083496, -16.214046478271484, -15.494478225708008, -14.774909019470215, -14.055340766906738, -13.335772514343262, -12.616203308105469, -11.896635055541992, -11.177066802978516, -10.457498550415039, -9.737930297851562, -9.01836109161377, -8.298792839050293, -7.579224586486816, -6.859655857086182, -6.140087127685547, -5.42051887512207, -4.700950622558594, -3.981381893157959, -3.2618134021759033, -2.5422449111938477, -1.822676420211792, -1.1031079292297363, -0.38353919982910156, 0.3360309600830078, 1.0555994510650635, 1.7751679420471191, 2.494736433029175, 3.2143049240112305, 3.933873414993286, 4.653441905975342, 5.373010635375977, 6.092578887939453, 6.81214714050293, 7.5317158699035645, 8.2512845993042, 8.970852851867676, 9.690421104431152, 10.409990310668945, 11.129558563232422, 11.849126815795898, 12.568695068359375, 13.288263320922852, 14.007832527160645, 14.727400779724121, 15.446969032287598, 16.16653823852539, 16.886106491088867, 17.605674743652344, 18.32524299621582, 19.044811248779297, 19.764379501342773, 20.48394775390625, 21.20351791381836, 21.923086166381836, 22.642654418945312, 23.36222267150879]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 4.0, 5.0, 2.0, 10.0, 7.0, 10.0, 17.0, 19.0, 15.0, 13.0, 21.0, 19.0, 16.0, 25.0, 28.0, 25.0, 24.0, 28.0, 27.0, 41.0, 31.0, 40.0, 37.0, 33.0, 45.0, 36.0, 39.0, 34.0, 39.0, 36.0, 30.0, 28.0, 20.0, 26.0, 24.0, 25.0, 16.0, 13.0, 13.0, 15.0, 10.0, 13.0, 10.0, 7.0, 4.0, 8.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.780592918395996, -10.445493698120117, -10.110394477844238, -9.77529525756836, -9.44019603729248, -9.105096817016602, -8.769998550415039, -8.434898376464844, -8.099800109863281, -7.764700889587402, -7.429601669311523, -7.0945024490356445, -6.759403228759766, -6.424304008483887, -6.089205265045166, -5.754106044769287, -5.41900634765625, -5.083907127380371, -4.748807907104492, -4.413708686828613, -4.078609466552734, -3.7435104846954346, -3.4084115028381348, -3.073312282562256, -2.738213062286377, -2.403113842010498, -2.068014621734619, -1.7329156398773193, -1.3978164196014404, -1.0627171993255615, -0.7276182174682617, -0.3925189971923828, -0.0574188232421875, 0.27768033742904663, 0.6127794981002808, 0.9478785991668701, 1.282977819442749, 1.618077039718628, 1.9531760215759277, 2.2882752418518066, 2.6233744621276855, 2.9584736824035645, 3.2935729026794434, 3.628671884536743, 3.963771104812622, 4.298870086669922, 4.633969306945801, 4.96906852722168, 5.304167747497559, 5.6392669677734375, 5.974366188049316, 6.309465408325195, 6.644564628601074, 6.979663848876953, 7.314762592315674, 7.649861812591553, 7.984961032867432, 8.320059776306152, 8.655158996582031, 8.99025821685791, 9.325357437133789, 9.660456657409668, 9.995555877685547, 10.330655097961426, 10.665754318237305]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 3.0, 10.0, 6.0, 18.0, 22.0, 41.0, 55.0, 71.0, 112.0, 152.0, 221.0, 322.0, 479.0, 779.0, 1129.0, 1640.0, 2720.0, 4325.0, 7123.0, 12486.0, 23552.0, 51391.0, 128853.0, 364635.0, 270785.0, 93090.0, 38890.0, 19162.0, 10148.0, 6004.0, 3556.0, 2273.0, 1612.0, 900.0, 600.0, 424.0, 306.0, 187.0, 163.0, 82.0, 75.0, 55.0, 26.0, 23.0, 19.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.5, -3.393402099609375, -3.28680419921875, -3.180206298828125, -3.0736083984375, -2.967010498046875, -2.86041259765625, -2.753814697265625, -2.647216796875, -2.540618896484375, -2.43402099609375, -2.327423095703125, -2.2208251953125, -2.114227294921875, -2.00762939453125, -1.901031494140625, -1.79443359375, -1.687835693359375, -1.58123779296875, -1.474639892578125, -1.3680419921875, -1.261444091796875, -1.15484619140625, -1.048248291015625, -0.941650390625, -0.835052490234375, -0.72845458984375, -0.621856689453125, -0.5152587890625, -0.408660888671875, -0.30206298828125, -0.195465087890625, -0.0888671875, 0.017730712890625, 0.12432861328125, 0.230926513671875, 0.3375244140625, 0.444122314453125, 0.55072021484375, 0.657318115234375, 0.763916015625, 0.870513916015625, 0.97711181640625, 1.083709716796875, 1.1903076171875, 1.296905517578125, 1.40350341796875, 1.510101318359375, 1.61669921875, 1.723297119140625, 1.82989501953125, 1.936492919921875, 2.0430908203125, 2.149688720703125, 2.25628662109375, 2.362884521484375, 2.469482421875, 2.576080322265625, 2.68267822265625, 2.789276123046875, 2.8958740234375, 3.002471923828125, 3.10906982421875, 3.215667724609375, 3.322265625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 1.0, 6.0, 6.0, 7.0, 4.0, 6.0, 11.0, 10.0, 12.0, 11.0, 16.0, 13.0, 24.0, 25.0, 24.0, 26.0, 24.0, 31.0, 44.0, 36.0, 41.0, 45.0, 49.0, 38.0, 45.0, 41.0, 48.0, 45.0, 29.0, 34.0, 29.0, 22.0, 29.0, 25.0, 22.0, 14.0, 19.0, 14.0, 16.0, 16.0, 11.0, 11.0, 2.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.9921875, -12.593017578125, -12.19384765625, -11.794677734375, -11.3955078125, -10.996337890625, -10.59716796875, -10.197998046875, -9.798828125, -9.399658203125, -9.00048828125, -8.601318359375, -8.2021484375, -7.802978515625, -7.40380859375, -7.004638671875, -6.60546875, -6.206298828125, -5.80712890625, -5.407958984375, -5.0087890625, -4.609619140625, -4.21044921875, -3.811279296875, -3.412109375, -3.012939453125, -2.61376953125, -2.214599609375, -1.8154296875, -1.416259765625, -1.01708984375, -0.617919921875, -0.21875, 0.180419921875, 0.57958984375, 0.978759765625, 1.3779296875, 1.777099609375, 2.17626953125, 2.575439453125, 2.974609375, 3.373779296875, 3.77294921875, 4.172119140625, 4.5712890625, 4.970458984375, 5.36962890625, 5.768798828125, 6.16796875, 6.567138671875, 6.96630859375, 7.365478515625, 7.7646484375, 8.163818359375, 8.56298828125, 8.962158203125, 9.361328125, 9.760498046875, 10.15966796875, 10.558837890625, 10.9580078125, 11.357177734375, 11.75634765625, 12.155517578125, 12.5546875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 4.0, 6.0, 8.0, 4.0, 9.0, 12.0, 6.0, 22.0, 20.0, 38.0, 54.0, 56.0, 87.0, 109.0, 160.0, 267.0, 469.0, 663.0, 1091.0, 1876.0, 3411.0, 7134.0, 18173.0, 179339.0, 794229.0, 23304.0, 8479.0, 4031.0, 2078.0, 1197.0, 680.0, 504.0, 288.0, 186.0, 162.0, 100.0, 73.0, 53.0, 35.0, 29.0, 29.0, 16.0, 10.0, 14.0, 10.0, 6.0, 9.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.34375, -10.049072265625, -9.75439453125, -9.459716796875, -9.1650390625, -8.870361328125, -8.57568359375, -8.281005859375, -7.986328125, -7.691650390625, -7.39697265625, -7.102294921875, -6.8076171875, -6.512939453125, -6.21826171875, -5.923583984375, -5.62890625, -5.334228515625, -5.03955078125, -4.744873046875, -4.4501953125, -4.155517578125, -3.86083984375, -3.566162109375, -3.271484375, -2.976806640625, -2.68212890625, -2.387451171875, -2.0927734375, -1.798095703125, -1.50341796875, -1.208740234375, -0.9140625, -0.619384765625, -0.32470703125, -0.030029296875, 0.2646484375, 0.559326171875, 0.85400390625, 1.148681640625, 1.443359375, 1.738037109375, 2.03271484375, 2.327392578125, 2.6220703125, 2.916748046875, 3.21142578125, 3.506103515625, 3.80078125, 4.095458984375, 4.39013671875, 4.684814453125, 4.9794921875, 5.274169921875, 5.56884765625, 5.863525390625, 6.158203125, 6.452880859375, 6.74755859375, 7.042236328125, 7.3369140625, 7.631591796875, 7.92626953125, 8.220947265625, 8.515625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 4.0, 9.0, 8.0, 10.0, 6.0, 14.0, 10.0, 12.0, 6.0, 23.0, 12.0, 23.0, 25.0, 27.0, 29.0, 24.0, 37.0, 24.0, 40.0, 41.0, 46.0, 48.0, 40.0, 39.0, 49.0, 49.0, 37.0, 24.0, 20.0, 29.0, 27.0, 36.0, 26.0, 23.0, 21.0, 21.0, 13.0, 19.0, 11.0, 15.0, 10.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.8359375, -7.5924072265625, -7.348876953125, -7.1053466796875, -6.86181640625, -6.6182861328125, -6.374755859375, -6.1312255859375, -5.8876953125, -5.6441650390625, -5.400634765625, -5.1571044921875, -4.91357421875, -4.6700439453125, -4.426513671875, -4.1829833984375, -3.939453125, -3.6959228515625, -3.452392578125, -3.2088623046875, -2.96533203125, -2.7218017578125, -2.478271484375, -2.2347412109375, -1.9912109375, -1.7476806640625, -1.504150390625, -1.2606201171875, -1.01708984375, -0.7735595703125, -0.530029296875, -0.2864990234375, -0.04296875, 0.2005615234375, 0.444091796875, 0.6876220703125, 0.93115234375, 1.1746826171875, 1.418212890625, 1.6617431640625, 1.9052734375, 2.1488037109375, 2.392333984375, 2.6358642578125, 2.87939453125, 3.1229248046875, 3.366455078125, 3.6099853515625, 3.853515625, 4.0970458984375, 4.340576171875, 4.5841064453125, 4.82763671875, 5.0711669921875, 5.314697265625, 5.5582275390625, 5.8017578125, 6.0452880859375, 6.288818359375, 6.5323486328125, 6.77587890625, 7.0194091796875, 7.262939453125, 7.5064697265625, 7.75]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 11.0, 14.0, 11.0, 14.0, 21.0, 33.0, 52.0, 61.0, 130.0, 167.0, 254.0, 444.0, 1056.0, 5908.0, 1023490.0, 14070.0, 1453.0, 532.0, 303.0, 166.0, 112.0, 73.0, 37.0, 35.0, 29.0, 22.0, 10.0, 8.0, 9.0, 14.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -10.1588134765625, -9.856689453125, -9.5545654296875, -9.25244140625, -8.9503173828125, -8.648193359375, -8.3460693359375, -8.0439453125, -7.7418212890625, -7.439697265625, -7.1375732421875, -6.83544921875, -6.5333251953125, -6.231201171875, -5.9290771484375, -5.626953125, -5.3248291015625, -5.022705078125, -4.7205810546875, -4.41845703125, -4.1163330078125, -3.814208984375, -3.5120849609375, -3.2099609375, -2.9078369140625, -2.605712890625, -2.3035888671875, -2.00146484375, -1.6993408203125, -1.397216796875, -1.0950927734375, -0.79296875, -0.4908447265625, -0.188720703125, 0.1134033203125, 0.41552734375, 0.7176513671875, 1.019775390625, 1.3218994140625, 1.6240234375, 1.9261474609375, 2.228271484375, 2.5303955078125, 2.83251953125, 3.1346435546875, 3.436767578125, 3.7388916015625, 4.041015625, 4.3431396484375, 4.645263671875, 4.9473876953125, 5.24951171875, 5.5516357421875, 5.853759765625, 6.1558837890625, 6.4580078125, 6.7601318359375, 7.062255859375, 7.3643798828125, 7.66650390625, 7.9686279296875, 8.270751953125, 8.5728759765625, 8.875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 5.0, 2.0, 5.0, 27.0, 114.0, 327.0, 337.0, 127.0, 28.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00033593177795410156, -0.00032475218176841736, -0.00031357258558273315, -0.00030239298939704895, -0.00029121339321136475, -0.00028003379702568054, -0.00026885420083999634, -0.00025767460465431213, -0.00024649500846862793, -0.00023531541228294373, -0.00022413581609725952, -0.00021295621991157532, -0.0002017766237258911, -0.0001905970275402069, -0.0001794174313545227, -0.0001682378351688385, -0.0001570582389831543, -0.0001458786427974701, -0.0001346990466117859, -0.00012351945042610168, -0.00011233985424041748, -0.00010116025805473328, -8.998066186904907e-05, -7.880106568336487e-05, -6.762146949768066e-05, -5.644187331199646e-05, -4.5262277126312256e-05, -3.408268094062805e-05, -2.2903084754943848e-05, -1.1723488569259644e-05, -5.438923835754395e-07, 1.0635703802108765e-05, 2.181529998779297e-05, 3.299489617347717e-05, 4.417449235916138e-05, 5.535408854484558e-05, 6.653368473052979e-05, 7.771328091621399e-05, 8.88928771018982e-05, 0.0001000724732875824, 0.0001112520694732666, 0.0001224316656589508, 0.000133611261844635, 0.00014479085803031921, 0.00015597045421600342, 0.00016715005040168762, 0.00017832964658737183, 0.00018950924277305603, 0.00020068883895874023, 0.00021186843514442444, 0.00022304803133010864, 0.00023422762751579285, 0.00024540722370147705, 0.00025658681988716125, 0.00026776641607284546, 0.00027894601225852966, 0.00029012560844421387, 0.00030130520462989807, 0.0003124848008155823, 0.0003236643970012665, 0.0003348439931869507, 0.0003460235893726349, 0.0003572031855583191, 0.0003683827817440033, 0.0003795623779296875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 8.0, 29.0, 20.0, 37.0, 45.0, 74.0, 113.0, 152.0, 217.0, 304.0, 430.0, 624.0, 923.0, 1374.0, 2019.0, 3137.0, 5607.0, 13655.0, 81552.0, 759016.0, 144343.0, 17979.0, 6555.0, 3582.0, 2124.0, 1396.0, 980.0, 636.0, 472.0, 329.0, 208.0, 163.0, 122.0, 79.0, 74.0, 55.0, 31.0, 31.0, 8.0, 14.0, 3.0, 10.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.75, -1.690887451171875, -1.63177490234375, -1.572662353515625, -1.5135498046875, -1.454437255859375, -1.39532470703125, -1.336212158203125, -1.277099609375, -1.217987060546875, -1.15887451171875, -1.099761962890625, -1.0406494140625, -0.981536865234375, -0.92242431640625, -0.863311767578125, -0.80419921875, -0.745086669921875, -0.68597412109375, -0.626861572265625, -0.5677490234375, -0.508636474609375, -0.44952392578125, -0.390411376953125, -0.331298828125, -0.272186279296875, -0.21307373046875, -0.153961181640625, -0.0948486328125, -0.035736083984375, 0.02337646484375, 0.082489013671875, 0.1416015625, 0.200714111328125, 0.25982666015625, 0.318939208984375, 0.3780517578125, 0.437164306640625, 0.49627685546875, 0.555389404296875, 0.614501953125, 0.673614501953125, 0.73272705078125, 0.791839599609375, 0.8509521484375, 0.910064697265625, 0.96917724609375, 1.028289794921875, 1.08740234375, 1.146514892578125, 1.20562744140625, 1.264739990234375, 1.3238525390625, 1.382965087890625, 1.44207763671875, 1.501190185546875, 1.560302734375, 1.619415283203125, 1.67852783203125, 1.737640380859375, 1.7967529296875, 1.855865478515625, 1.91497802734375, 1.974090576171875, 2.033203125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 7.0, 5.0, 12.0, 14.0, 15.0, 31.0, 59.0, 108.0, 143.0, 159.0, 143.0, 103.0, 78.0, 40.0, 22.0, 19.0, 11.0, 13.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.255859375, -0.2480010986328125, -0.240142822265625, -0.2322845458984375, -0.22442626953125, -0.2165679931640625, -0.208709716796875, -0.2008514404296875, -0.1929931640625, -0.1851348876953125, -0.177276611328125, -0.1694183349609375, -0.16156005859375, -0.1537017822265625, -0.145843505859375, -0.1379852294921875, -0.130126953125, -0.1222686767578125, -0.114410400390625, -0.1065521240234375, -0.09869384765625, -0.0908355712890625, -0.082977294921875, -0.0751190185546875, -0.0672607421875, -0.0594024658203125, -0.051544189453125, -0.0436859130859375, -0.03582763671875, -0.0279693603515625, -0.020111083984375, -0.0122528076171875, -0.00439453125, 0.0034637451171875, 0.011322021484375, 0.0191802978515625, 0.02703857421875, 0.0348968505859375, 0.042755126953125, 0.0506134033203125, 0.0584716796875, 0.0663299560546875, 0.074188232421875, 0.0820465087890625, 0.08990478515625, 0.0977630615234375, 0.105621337890625, 0.1134796142578125, 0.121337890625, 0.1291961669921875, 0.137054443359375, 0.1449127197265625, 0.15277099609375, 0.1606292724609375, 0.168487548828125, 0.1763458251953125, 0.1842041015625, 0.1920623779296875, 0.199920654296875, 0.2077789306640625, 0.21563720703125, 0.2234954833984375, 0.231353759765625, 0.2392120361328125, 0.2470703125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 8.0, 10.0, 10.0, 18.0, 20.0, 30.0, 33.0, 39.0, 56.0, 67.0, 75.0, 101.0, 73.0, 89.0, 75.0, 65.0, 53.0, 39.0, 35.0, 21.0, 12.0, 19.0, 15.0, 6.0, 5.0, 3.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.992338180541992, -22.279550552368164, -21.56676483154297, -20.85397720336914, -20.141189575195312, -19.428401947021484, -18.715614318847656, -18.00282859802246, -17.290040969848633, -16.577253341674805, -15.864466667175293, -15.151679992675781, -14.438892364501953, -13.726104736328125, -13.013318061828613, -12.300531387329102, -11.587743759155273, -10.874956130981445, -10.162169456481934, -9.449382781982422, -8.736595153808594, -8.023807525634766, -7.311020851135254, -6.598233699798584, -5.885446548461914, -5.172659397125244, -4.459872245788574, -3.7470850944519043, -3.0342979431152344, -2.3215107917785645, -1.6087236404418945, -0.8959364891052246, -0.1831512451171875, 0.5296359062194824, 1.2424230575561523, 1.9552102088928223, 2.667997360229492, 3.380784511566162, 4.093571662902832, 4.806358814239502, 5.519145965576172, 6.231933116912842, 6.944720268249512, 7.657507419586182, 8.370294570922852, 9.08308219909668, 9.795868873596191, 10.508655548095703, 11.221443176269531, 11.93423080444336, 12.647017478942871, 13.359804153442383, 14.072591781616211, 14.785379409790039, 15.49816608428955, 16.210952758789062, 16.92374038696289, 17.63652801513672, 18.349315643310547, 19.062101364135742, 19.77488899230957, 20.4876766204834, 21.200462341308594, 21.913249969482422, 22.62603759765625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 4.0, 4.0, 7.0, 7.0, 6.0, 12.0, 16.0, 22.0, 12.0, 13.0, 27.0, 13.0, 18.0, 25.0, 29.0, 25.0, 19.0, 31.0, 29.0, 38.0, 35.0, 38.0, 40.0, 37.0, 40.0, 37.0, 41.0, 34.0, 38.0, 35.0, 29.0, 23.0, 21.0, 26.0, 26.0, 20.0, 19.0, 13.0, 11.0, 18.0, 12.0, 12.0, 8.0, 6.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-10.666050910949707, -10.33454704284668, -10.003042221069336, -9.671538352966309, -9.340033531188965, -9.008529663085938, -8.677024841308594, -8.345520973205566, -8.014016151428223, -7.682511806488037, -7.351007461547852, -7.019503116607666, -6.6879987716674805, -6.356494426727295, -6.024990081787109, -5.693486213684082, -5.3619818687438965, -5.030477523803711, -4.698973178863525, -4.36746883392334, -4.035964488983154, -3.7044601440429688, -3.3729560375213623, -3.0414516925811768, -2.709947347640991, -2.3784430027008057, -2.04693865776062, -1.7154344320297241, -1.3839300870895386, -1.052425742149353, -0.720921516418457, -0.3894171714782715, -0.05791282653808594, 0.2735914885997772, 0.6050958037376404, 0.9366000890731812, 1.2681044340133667, 1.5996087789535522, 1.9311130046844482, 2.262617349624634, 2.5941216945648193, 2.925626039505005, 3.2571303844451904, 3.588634490966797, 3.9201388359069824, 4.251643180847168, 4.5831475257873535, 4.914651870727539, 5.246156215667725, 5.57766056060791, 5.909164905548096, 6.240669250488281, 6.572173595428467, 6.903677940368652, 7.23518180847168, 7.566686630249023, 7.898190498352051, 8.229694366455078, 8.561199188232422, 8.89270305633545, 9.224207878112793, 9.55571174621582, 9.887216567993164, 10.218720436096191, 10.550225257873535]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 7.0, 11.0, 23.0, 26.0, 35.0, 65.0, 79.0, 125.0, 204.0, 275.0, 414.0, 588.0, 937.0, 1365.0, 2029.0, 3001.0, 4609.0, 6860.0, 10811.0, 16665.0, 26949.0, 45907.0, 80410.0, 139603.0, 200666.0, 194490.0, 127771.0, 73196.0, 42013.0, 25237.0, 15286.0, 9756.0, 6456.0, 4183.0, 2769.0, 1864.0, 1188.0, 867.0, 585.0, 406.0, 267.0, 166.0, 131.0, 89.0, 62.0, 31.0, 28.0, 26.0, 10.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.3671875, -11.9671630859375, -11.567138671875, -11.1671142578125, -10.76708984375, -10.3670654296875, -9.967041015625, -9.5670166015625, -9.1669921875, -8.7669677734375, -8.366943359375, -7.9669189453125, -7.56689453125, -7.1668701171875, -6.766845703125, -6.3668212890625, -5.966796875, -5.5667724609375, -5.166748046875, -4.7667236328125, -4.36669921875, -3.9666748046875, -3.566650390625, -3.1666259765625, -2.7666015625, -2.3665771484375, -1.966552734375, -1.5665283203125, -1.16650390625, -0.7664794921875, -0.366455078125, 0.0335693359375, 0.43359375, 0.8336181640625, 1.233642578125, 1.6336669921875, 2.03369140625, 2.4337158203125, 2.833740234375, 3.2337646484375, 3.6337890625, 4.0338134765625, 4.433837890625, 4.8338623046875, 5.23388671875, 5.6339111328125, 6.033935546875, 6.4339599609375, 6.833984375, 7.2340087890625, 7.634033203125, 8.0340576171875, 8.43408203125, 8.8341064453125, 9.234130859375, 9.6341552734375, 10.0341796875, 10.4342041015625, 10.834228515625, 11.2342529296875, 11.63427734375, 12.0343017578125, 12.434326171875, 12.8343505859375, 13.234375]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 8.0, 4.0, 8.0, 10.0, 9.0, 15.0, 9.0, 24.0, 19.0, 12.0, 25.0, 20.0, 22.0, 18.0, 34.0, 31.0, 22.0, 39.0, 30.0, 38.0, 30.0, 45.0, 40.0, 52.0, 40.0, 35.0, 34.0, 33.0, 36.0, 29.0, 27.0, 21.0, 25.0, 24.0, 18.0, 9.0, 13.0, 21.0, 4.0, 15.0, 10.0, 10.0, 7.0, 5.0, 3.0, 5.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.0390625, -10.695068359375, -10.35107421875, -10.007080078125, -9.6630859375, -9.319091796875, -8.97509765625, -8.631103515625, -8.287109375, -7.943115234375, -7.59912109375, -7.255126953125, -6.9111328125, -6.567138671875, -6.22314453125, -5.879150390625, -5.53515625, -5.191162109375, -4.84716796875, -4.503173828125, -4.1591796875, -3.815185546875, -3.47119140625, -3.127197265625, -2.783203125, -2.439208984375, -2.09521484375, -1.751220703125, -1.4072265625, -1.063232421875, -0.71923828125, -0.375244140625, -0.03125, 0.312744140625, 0.65673828125, 1.000732421875, 1.3447265625, 1.688720703125, 2.03271484375, 2.376708984375, 2.720703125, 3.064697265625, 3.40869140625, 3.752685546875, 4.0966796875, 4.440673828125, 4.78466796875, 5.128662109375, 5.47265625, 5.816650390625, 6.16064453125, 6.504638671875, 6.8486328125, 7.192626953125, 7.53662109375, 7.880615234375, 8.224609375, 8.568603515625, 8.91259765625, 9.256591796875, 9.6005859375, 9.944580078125, 10.28857421875, 10.632568359375, 10.9765625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 12.0, 6.0, 8.0, 11.0, 28.0, 27.0, 50.0, 92.0, 116.0, 161.0, 252.0, 365.0, 575.0, 810.0, 1169.0, 1706.0, 2521.0, 3623.0, 5522.0, 8188.0, 12617.0, 19937.0, 31509.0, 51146.0, 83261.0, 130364.0, 171845.0, 171071.0, 128930.0, 83088.0, 50851.0, 31472.0, 19774.0, 12517.0, 8101.0, 5498.0, 3608.0, 2395.0, 1742.0, 1120.0, 783.0, 589.0, 356.0, 237.0, 163.0, 103.0, 90.0, 59.0, 32.0, 29.0, 10.0, 13.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.5546875, -10.2027587890625, -9.850830078125, -9.4989013671875, -9.14697265625, -8.7950439453125, -8.443115234375, -8.0911865234375, -7.7392578125, -7.3873291015625, -7.035400390625, -6.6834716796875, -6.33154296875, -5.9796142578125, -5.627685546875, -5.2757568359375, -4.923828125, -4.5718994140625, -4.219970703125, -3.8680419921875, -3.51611328125, -3.1641845703125, -2.812255859375, -2.4603271484375, -2.1083984375, -1.7564697265625, -1.404541015625, -1.0526123046875, -0.70068359375, -0.3487548828125, 0.003173828125, 0.3551025390625, 0.70703125, 1.0589599609375, 1.410888671875, 1.7628173828125, 2.11474609375, 2.4666748046875, 2.818603515625, 3.1705322265625, 3.5224609375, 3.8743896484375, 4.226318359375, 4.5782470703125, 4.93017578125, 5.2821044921875, 5.634033203125, 5.9859619140625, 6.337890625, 6.6898193359375, 7.041748046875, 7.3936767578125, 7.74560546875, 8.0975341796875, 8.449462890625, 8.8013916015625, 9.1533203125, 9.5052490234375, 9.857177734375, 10.2091064453125, 10.56103515625, 10.9129638671875, 11.264892578125, 11.6168212890625, 11.96875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 8.0, 8.0, 17.0, 16.0, 19.0, 13.0, 17.0, 21.0, 21.0, 27.0, 33.0, 34.0, 40.0, 32.0, 41.0, 42.0, 59.0, 40.0, 38.0, 43.0, 48.0, 45.0, 30.0, 35.0, 26.0, 23.0, 28.0, 25.0, 27.0, 19.0, 18.0, 16.0, 16.0, 8.0, 17.0, 10.0, 7.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.10546875, -6.874267578125, -6.64306640625, -6.411865234375, -6.1806640625, -5.949462890625, -5.71826171875, -5.487060546875, -5.255859375, -5.024658203125, -4.79345703125, -4.562255859375, -4.3310546875, -4.099853515625, -3.86865234375, -3.637451171875, -3.40625, -3.175048828125, -2.94384765625, -2.712646484375, -2.4814453125, -2.250244140625, -2.01904296875, -1.787841796875, -1.556640625, -1.325439453125, -1.09423828125, -0.863037109375, -0.6318359375, -0.400634765625, -0.16943359375, 0.061767578125, 0.29296875, 0.524169921875, 0.75537109375, 0.986572265625, 1.2177734375, 1.448974609375, 1.68017578125, 1.911376953125, 2.142578125, 2.373779296875, 2.60498046875, 2.836181640625, 3.0673828125, 3.298583984375, 3.52978515625, 3.760986328125, 3.9921875, 4.223388671875, 4.45458984375, 4.685791015625, 4.9169921875, 5.148193359375, 5.37939453125, 5.610595703125, 5.841796875, 6.072998046875, 6.30419921875, 6.535400390625, 6.7666015625, 6.997802734375, 7.22900390625, 7.460205078125, 7.69140625]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 23.0, 20.0, 30.0, 69.0, 80.0, 101.0, 156.0, 238.0, 339.0, 567.0, 923.0, 1563.0, 2680.0, 4878.0, 9351.0, 19877.0, 45967.0, 115522.0, 262603.0, 309746.0, 158599.0, 62495.0, 26155.0, 12292.0, 6096.0, 3268.0, 1918.0, 1093.0, 711.0, 427.0, 220.0, 204.0, 93.0, 73.0, 46.0, 36.0, 26.0, 17.0, 14.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.953125, -11.61328125, -11.2734375, -10.93359375, -10.59375, -10.25390625, -9.9140625, -9.57421875, -9.234375, -8.89453125, -8.5546875, -8.21484375, -7.875, -7.53515625, -7.1953125, -6.85546875, -6.515625, -6.17578125, -5.8359375, -5.49609375, -5.15625, -4.81640625, -4.4765625, -4.13671875, -3.796875, -3.45703125, -3.1171875, -2.77734375, -2.4375, -2.09765625, -1.7578125, -1.41796875, -1.078125, -0.73828125, -0.3984375, -0.05859375, 0.28125, 0.62109375, 0.9609375, 1.30078125, 1.640625, 1.98046875, 2.3203125, 2.66015625, 3.0, 3.33984375, 3.6796875, 4.01953125, 4.359375, 4.69921875, 5.0390625, 5.37890625, 5.71875, 6.05859375, 6.3984375, 6.73828125, 7.078125, 7.41796875, 7.7578125, 8.09765625, 8.4375, 8.77734375, 9.1171875, 9.45703125, 9.796875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 1.0, 7.0, 6.0, 12.0, 8.0, 11.0, 20.0, 21.0, 34.0, 49.0, 38.0, 75.0, 80.0, 92.0, 114.0, 94.0, 85.0, 61.0, 35.0, 28.0, 27.0, 16.0, 17.0, 13.0, 13.0, 9.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006551742553710938, -0.0006268620491027832, -0.0005985498428344727, -0.0005702376365661621, -0.0005419254302978516, -0.000513613224029541, -0.00048530101776123047, -0.0004569888114929199, -0.0004286766052246094, -0.00040036439895629883, -0.0003720521926879883, -0.00034373998641967773, -0.0003154277801513672, -0.00028711557388305664, -0.0002588033676147461, -0.00023049116134643555, -0.000202178955078125, -0.00017386674880981445, -0.0001455545425415039, -0.00011724233627319336, -8.893013000488281e-05, -6.0617923736572266e-05, -3.230571746826172e-05, -3.993511199951172e-06, 2.4318695068359375e-05, 5.263090133666992e-05, 8.094310760498047e-05, 0.00010925531387329102, 0.00013756752014160156, 0.0001658797264099121, 0.00019419193267822266, 0.0002225041389465332, 0.00025081634521484375, 0.0002791285514831543, 0.00030744075775146484, 0.0003357529640197754, 0.00036406517028808594, 0.0003923773765563965, 0.00042068958282470703, 0.0004490017890930176, 0.0004773139953613281, 0.0005056262016296387, 0.0005339384078979492, 0.0005622506141662598, 0.0005905628204345703, 0.0006188750267028809, 0.0006471872329711914, 0.000675499439239502, 0.0007038116455078125, 0.000732123851776123, 0.0007604360580444336, 0.0007887482643127441, 0.0008170604705810547, 0.0008453726768493652, 0.0008736848831176758, 0.0009019970893859863, 0.0009303092956542969, 0.0009586215019226074, 0.000986933708190918, 0.0010152459144592285, 0.001043558120727539, 0.0010718703269958496, 0.0011001825332641602, 0.0011284947395324707, 0.0011568069458007812]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 8.0, 7.0, 11.0, 18.0, 19.0, 25.0, 19.0, 43.0, 72.0, 98.0, 133.0, 221.0, 330.0, 605.0, 1068.0, 2032.0, 3868.0, 9056.0, 23960.0, 70518.0, 207120.0, 368436.0, 232700.0, 81171.0, 27375.0, 10278.0, 4350.0, 2126.0, 1106.0, 684.0, 377.0, 245.0, 156.0, 97.0, 67.0, 44.0, 31.0, 30.0, 22.0, 8.0, 6.0, 10.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.0625, -12.6845703125, -12.306640625, -11.9287109375, -11.55078125, -11.1728515625, -10.794921875, -10.4169921875, -10.0390625, -9.6611328125, -9.283203125, -8.9052734375, -8.52734375, -8.1494140625, -7.771484375, -7.3935546875, -7.015625, -6.6376953125, -6.259765625, -5.8818359375, -5.50390625, -5.1259765625, -4.748046875, -4.3701171875, -3.9921875, -3.6142578125, -3.236328125, -2.8583984375, -2.48046875, -2.1025390625, -1.724609375, -1.3466796875, -0.96875, -0.5908203125, -0.212890625, 0.1650390625, 0.54296875, 0.9208984375, 1.298828125, 1.6767578125, 2.0546875, 2.4326171875, 2.810546875, 3.1884765625, 3.56640625, 3.9443359375, 4.322265625, 4.7001953125, 5.078125, 5.4560546875, 5.833984375, 6.2119140625, 6.58984375, 6.9677734375, 7.345703125, 7.7236328125, 8.1015625, 8.4794921875, 8.857421875, 9.2353515625, 9.61328125, 9.9912109375, 10.369140625, 10.7470703125, 11.125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 11.0, 9.0, 6.0, 13.0, 21.0, 24.0, 24.0, 32.0, 40.0, 48.0, 68.0, 69.0, 92.0, 79.0, 86.0, 90.0, 64.0, 61.0, 45.0, 34.0, 31.0, 15.0, 11.0, 6.0, 7.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.2421875, -3.167755126953125, -3.09332275390625, -3.018890380859375, -2.9444580078125, -2.870025634765625, -2.79559326171875, -2.721160888671875, -2.646728515625, -2.572296142578125, -2.49786376953125, -2.423431396484375, -2.3489990234375, -2.274566650390625, -2.20013427734375, -2.125701904296875, -2.05126953125, -1.976837158203125, -1.90240478515625, -1.827972412109375, -1.7535400390625, -1.679107666015625, -1.60467529296875, -1.530242919921875, -1.455810546875, -1.381378173828125, -1.30694580078125, -1.232513427734375, -1.1580810546875, -1.083648681640625, -1.00921630859375, -0.934783935546875, -0.8603515625, -0.785919189453125, -0.71148681640625, -0.637054443359375, -0.5626220703125, -0.488189697265625, -0.41375732421875, -0.339324951171875, -0.264892578125, -0.190460205078125, -0.11602783203125, -0.041595458984375, 0.0328369140625, 0.107269287109375, 0.18170166015625, 0.256134033203125, 0.33056640625, 0.404998779296875, 0.47943115234375, 0.553863525390625, 0.6282958984375, 0.702728271484375, 0.77716064453125, 0.851593017578125, 0.926025390625, 1.000457763671875, 1.07489013671875, 1.149322509765625, 1.2237548828125, 1.298187255859375, 1.37261962890625, 1.447052001953125, 1.521484375]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 1.0, 4.0, 7.0, 5.0, 10.0, 15.0, 19.0, 23.0, 24.0, 43.0, 55.0, 65.0, 74.0, 86.0, 93.0, 79.0, 86.0, 50.0, 63.0, 41.0, 34.0, 26.0, 18.0, 24.0, 10.0, 10.0, 5.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.651029586791992, -22.96807098388672, -22.285112380981445, -21.602153778076172, -20.91919708251953, -20.236238479614258, -19.553279876708984, -18.87032127380371, -18.187362670898438, -17.504404067993164, -16.82144546508789, -16.138486862182617, -15.45552921295166, -14.772570610046387, -14.08961296081543, -13.406654357910156, -12.723695755004883, -12.04073715209961, -11.357778549194336, -10.674820899963379, -9.991862297058105, -9.308903694152832, -8.625946044921875, -7.942987442016602, -7.260028839111328, -6.577070236206055, -5.8941121101379395, -5.211153984069824, -4.528195381164551, -3.8452370166778564, -3.162278652191162, -2.479320526123047, -1.7963600158691406, -1.1134016513824463, -0.43044328689575195, 0.2525150775909424, 0.9354734420776367, 1.618431806564331, 2.3013901710510254, 2.9843482971191406, 3.667306900024414, 4.3502655029296875, 5.033223628997803, 5.716181755065918, 6.399140357971191, 7.082098960876465, 7.76505708694458, 8.448015213012695, 9.130973815917969, 9.813932418823242, 10.496891021728516, 11.179848670959473, 11.862807273864746, 12.54576587677002, 13.228723526000977, 13.91168212890625, 14.594640731811523, 15.277599334716797, 15.96055793762207, 16.643516540527344, 17.326473236083984, 18.009431838989258, 18.69239044189453, 19.375349044799805, 20.058307647705078]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 1.0, 9.0, 1.0, 3.0, 9.0, 8.0, 11.0, 14.0, 7.0, 25.0, 12.0, 11.0, 19.0, 21.0, 21.0, 21.0, 33.0, 32.0, 36.0, 31.0, 32.0, 33.0, 45.0, 30.0, 42.0, 52.0, 50.0, 38.0, 40.0, 45.0, 29.0, 38.0, 22.0, 30.0, 21.0, 27.0, 22.0, 13.0, 8.0, 14.0, 10.0, 8.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.097762107849121, -9.739550590515137, -9.381340026855469, -9.023128509521484, -8.6649169921875, -8.306705474853516, -7.948494911193848, -7.590283393859863, -7.232072353363037, -6.873861312866211, -6.515649795532227, -6.1574387550354, -5.799227714538574, -5.44101619720459, -5.082805156707764, -4.7245941162109375, -4.366382598876953, -4.008171558380127, -3.6499600410461426, -3.2917490005493164, -2.933537721633911, -2.575326442718506, -2.2171154022216797, -1.8589041233062744, -1.5006928443908691, -1.1424815654754639, -0.7842704057693481, -0.4260592460632324, -0.06784796714782715, 0.2903633117675781, 0.6485743522644043, 1.0067856311798096, 1.3649959564208984, 1.7232072353363037, 2.081418514251709, 2.439629554748535, 2.7978408336639404, 3.1560521125793457, 3.514263153076172, 3.872474431991577, 4.230685710906982, 4.588896751403809, 4.947108268737793, 5.305319309234619, 5.663530349731445, 6.02174186706543, 6.379952907562256, 6.738163948059082, 7.096375465393066, 7.454586505889893, 7.812798023223877, 8.171009063720703, 8.529220581054688, 8.887432098388672, 9.24564266204834, 9.603854179382324, 9.962064743041992, 10.320276260375977, 10.678486824035645, 11.036698341369629, 11.394909858703613, 11.753120422363281, 12.111331939697266, 12.46954345703125, 12.827754974365234]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 9.0, 14.0, 27.0, 49.0, 43.0, 81.0, 111.0, 190.0, 244.0, 371.0, 490.0, 711.0, 1081.0, 1641.0, 2644.0, 4069.0, 6623.0, 11100.0, 20427.0, 42687.0, 109454.0, 343493.0, 1062037.0, 1514611.0, 711693.0, 220636.0, 72366.0, 29650.0, 14865.0, 8313.0, 5153.0, 3092.0, 2022.0, 1354.0, 905.0, 564.0, 427.0, 305.0, 202.0, 146.0, 129.0, 73.0, 62.0, 35.0, 27.0, 14.0, 14.0, 13.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.890625, -20.201171875, -19.51171875, -18.822265625, -18.1328125, -17.443359375, -16.75390625, -16.064453125, -15.375, -14.685546875, -13.99609375, -13.306640625, -12.6171875, -11.927734375, -11.23828125, -10.548828125, -9.859375, -9.169921875, -8.48046875, -7.791015625, -7.1015625, -6.412109375, -5.72265625, -5.033203125, -4.34375, -3.654296875, -2.96484375, -2.275390625, -1.5859375, -0.896484375, -0.20703125, 0.482421875, 1.171875, 1.861328125, 2.55078125, 3.240234375, 3.9296875, 4.619140625, 5.30859375, 5.998046875, 6.6875, 7.376953125, 8.06640625, 8.755859375, 9.4453125, 10.134765625, 10.82421875, 11.513671875, 12.203125, 12.892578125, 13.58203125, 14.271484375, 14.9609375, 15.650390625, 16.33984375, 17.029296875, 17.71875, 18.408203125, 19.09765625, 19.787109375, 20.4765625, 21.166015625, 21.85546875, 22.544921875, 23.234375]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 11.0, 5.0, 8.0, 12.0, 15.0, 11.0, 14.0, 15.0, 18.0, 22.0, 27.0, 28.0, 38.0, 26.0, 21.0, 35.0, 37.0, 32.0, 39.0, 35.0, 48.0, 51.0, 44.0, 47.0, 45.0, 38.0, 40.0, 26.0, 35.0, 23.0, 22.0, 22.0, 19.0, 18.0, 15.0, 10.0, 11.0, 11.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5335693359375, -9.207763671875, -8.8819580078125, -8.55615234375, -8.2303466796875, -7.904541015625, -7.5787353515625, -7.2529296875, -6.9271240234375, -6.601318359375, -6.2755126953125, -5.94970703125, -5.6239013671875, -5.298095703125, -4.9722900390625, -4.646484375, -4.3206787109375, -3.994873046875, -3.6690673828125, -3.34326171875, -3.0174560546875, -2.691650390625, -2.3658447265625, -2.0400390625, -1.7142333984375, -1.388427734375, -1.0626220703125, -0.73681640625, -0.4110107421875, -0.085205078125, 0.2406005859375, 0.56640625, 0.8922119140625, 1.218017578125, 1.5438232421875, 1.86962890625, 2.1954345703125, 2.521240234375, 2.8470458984375, 3.1728515625, 3.4986572265625, 3.824462890625, 4.1502685546875, 4.47607421875, 4.8018798828125, 5.127685546875, 5.4534912109375, 5.779296875, 6.1051025390625, 6.430908203125, 6.7567138671875, 7.08251953125, 7.4083251953125, 7.734130859375, 8.0599365234375, 8.3857421875, 8.7115478515625, 9.037353515625, 9.3631591796875, 9.68896484375, 10.0147705078125, 10.340576171875, 10.6663818359375, 10.9921875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 8.0, 16.0, 23.0, 20.0, 40.0, 45.0, 94.0, 149.0, 200.0, 387.0, 565.0, 910.0, 1402.0, 2303.0, 3802.0, 6795.0, 12623.0, 24286.0, 51701.0, 126460.0, 377896.0, 1276650.0, 1535595.0, 492353.0, 156982.0, 61855.0, 28149.0, 13988.0, 7730.0, 4437.0, 2643.0, 1572.0, 927.0, 577.0, 343.0, 249.0, 142.0, 108.0, 79.0, 54.0, 31.0, 23.0, 23.0, 10.0, 6.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-27.953125, -27.024658203125, -26.09619140625, -25.167724609375, -24.2392578125, -23.310791015625, -22.38232421875, -21.453857421875, -20.525390625, -19.596923828125, -18.66845703125, -17.739990234375, -16.8115234375, -15.883056640625, -14.95458984375, -14.026123046875, -13.09765625, -12.169189453125, -11.24072265625, -10.312255859375, -9.3837890625, -8.455322265625, -7.52685546875, -6.598388671875, -5.669921875, -4.741455078125, -3.81298828125, -2.884521484375, -1.9560546875, -1.027587890625, -0.09912109375, 0.829345703125, 1.7578125, 2.686279296875, 3.61474609375, 4.543212890625, 5.4716796875, 6.400146484375, 7.32861328125, 8.257080078125, 9.185546875, 10.114013671875, 11.04248046875, 11.970947265625, 12.8994140625, 13.827880859375, 14.75634765625, 15.684814453125, 16.61328125, 17.541748046875, 18.47021484375, 19.398681640625, 20.3271484375, 21.255615234375, 22.18408203125, 23.112548828125, 24.041015625, 24.969482421875, 25.89794921875, 26.826416015625, 27.7548828125, 28.683349609375, 29.61181640625, 30.540283203125, 31.46875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 9.0, 8.0, 14.0, 23.0, 15.0, 27.0, 21.0, 38.0, 59.0, 79.0, 132.0, 144.0, 204.0, 281.0, 348.0, 469.0, 442.0, 428.0, 349.0, 254.0, 190.0, 125.0, 112.0, 70.0, 59.0, 39.0, 27.0, 18.0, 33.0, 15.0, 14.0, 5.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.484375, -6.2271728515625, -5.969970703125, -5.7127685546875, -5.45556640625, -5.1983642578125, -4.941162109375, -4.6839599609375, -4.4267578125, -4.1695556640625, -3.912353515625, -3.6551513671875, -3.39794921875, -3.1407470703125, -2.883544921875, -2.6263427734375, -2.369140625, -2.1119384765625, -1.854736328125, -1.5975341796875, -1.34033203125, -1.0831298828125, -0.825927734375, -0.5687255859375, -0.3115234375, -0.0543212890625, 0.202880859375, 0.4600830078125, 0.71728515625, 0.9744873046875, 1.231689453125, 1.4888916015625, 1.74609375, 2.0032958984375, 2.260498046875, 2.5177001953125, 2.77490234375, 3.0321044921875, 3.289306640625, 3.5465087890625, 3.8037109375, 4.0609130859375, 4.318115234375, 4.5753173828125, 4.83251953125, 5.0897216796875, 5.346923828125, 5.6041259765625, 5.861328125, 6.1185302734375, 6.375732421875, 6.6329345703125, 6.89013671875, 7.1473388671875, 7.404541015625, 7.6617431640625, 7.9189453125, 8.1761474609375, 8.433349609375, 8.6905517578125, 8.94775390625, 9.2049560546875, 9.462158203125, 9.7193603515625, 9.9765625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 6.0, 4.0, 13.0, 13.0, 18.0, 23.0, 27.0, 27.0, 33.0, 34.0, 61.0, 76.0, 67.0, 79.0, 84.0, 86.0, 60.0, 58.0, 49.0, 38.0, 32.0, 25.0, 16.0, 18.0, 13.0, 9.0, 8.0, 4.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-26.38346290588379, -25.65020179748535, -24.91693878173828, -24.183677673339844, -23.450416564941406, -22.71715545654297, -21.9838924407959, -21.25063133239746, -20.51736831665039, -19.784107208251953, -19.050844192504883, -18.317583084106445, -17.584321975708008, -16.851058959960938, -16.1177978515625, -15.384536743164062, -14.651275634765625, -13.918013572692871, -13.184752464294434, -12.45149040222168, -11.718229293823242, -10.984967231750488, -10.251705169677734, -9.518444061279297, -8.785181999206543, -8.051919937133789, -7.318658828735352, -6.585396766662598, -5.852135181427002, -5.118873596191406, -4.385611534118652, -3.6523499488830566, -2.919088363647461, -2.1858267784118652, -1.4525649547576904, -0.7193031311035156, 0.013958454132080078, 0.7472200393676758, 1.4804821014404297, 2.2137436866760254, 2.947005271911621, 3.680266857147217, 4.4135284423828125, 5.146790504455566, 5.880052089691162, 6.613313674926758, 7.346575736999512, 8.079837799072266, 8.813098907470703, 9.546360969543457, 10.279622077941895, 11.012884140014648, 11.746145248413086, 12.47940731048584, 13.212669372558594, 13.945930480957031, 14.679192543029785, 15.412454605102539, 16.145715713500977, 16.878978729248047, 17.612239837646484, 18.345500946044922, 19.07876205444336, 19.81202507019043, 20.545286178588867]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 10.0, 5.0, 14.0, 11.0, 14.0, 13.0, 14.0, 17.0, 19.0, 19.0, 31.0, 30.0, 36.0, 34.0, 37.0, 36.0, 31.0, 39.0, 61.0, 34.0, 37.0, 20.0, 45.0, 30.0, 46.0, 31.0, 46.0, 28.0, 32.0, 24.0, 16.0, 16.0, 29.0, 11.0, 10.0, 11.0, 9.0, 7.0, 5.0, 11.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.10396957397461, -11.706006050109863, -11.3080415725708, -10.910078048706055, -10.512114524841309, -10.114151000976562, -9.7161865234375, -9.318222999572754, -8.920259475708008, -8.522295951843262, -8.1243314743042, -7.726367950439453, -7.328404426574707, -6.930440425872803, -6.532476425170898, -6.134512901306152, -5.73654842376709, -5.3385844230651855, -4.9406208992004395, -4.542656898498535, -4.144693374633789, -3.7467293739318848, -3.3487653732299805, -2.9508016109466553, -2.55283784866333, -2.154874086380005, -1.7569102048873901, -1.3589463233947754, -0.9609825611114502, -0.563018798828125, -0.1650547981262207, 0.2329089641571045, 0.6308727264404297, 1.0288364887237549, 1.4268003702163696, 1.8247642517089844, 2.2227280139923096, 2.6206917762756348, 3.018655776977539, 3.4166195392608643, 3.8145833015441895, 4.212547302246094, 4.61051082611084, 5.008474826812744, 5.406438827514648, 5.8044023513793945, 6.202366352081299, 6.600330352783203, 6.998293876647949, 7.3962578773498535, 7.7942214012146, 8.192185401916504, 8.59014892578125, 8.988113403320312, 9.386076927185059, 9.784040451049805, 10.182004928588867, 10.579968452453613, 10.977932929992676, 11.375896453857422, 11.773859977722168, 12.171823501586914, 12.569787979125977, 12.967751502990723, 13.365715026855469]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 9.0, 6.0, 5.0, 17.0, 26.0, 27.0, 41.0, 64.0, 88.0, 130.0, 184.0, 264.0, 372.0, 568.0, 869.0, 1272.0, 1999.0, 3128.0, 5272.0, 8721.0, 15538.0, 28913.0, 56981.0, 123806.0, 267378.0, 274880.0, 129237.0, 59255.0, 29582.0, 16071.0, 9121.0, 5332.0, 3398.0, 2059.0, 1313.0, 789.0, 564.0, 391.0, 281.0, 183.0, 150.0, 75.0, 50.0, 43.0, 41.0, 26.0, 10.0, 13.0, 7.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.50390625, -2.42572021484375, -2.3475341796875, -2.26934814453125, -2.191162109375, -2.11297607421875, -2.0347900390625, -1.95660400390625, -1.87841796875, -1.80023193359375, -1.7220458984375, -1.64385986328125, -1.565673828125, -1.48748779296875, -1.4093017578125, -1.33111572265625, -1.2529296875, -1.17474365234375, -1.0965576171875, -1.01837158203125, -0.940185546875, -0.86199951171875, -0.7838134765625, -0.70562744140625, -0.62744140625, -0.54925537109375, -0.4710693359375, -0.39288330078125, -0.314697265625, -0.23651123046875, -0.1583251953125, -0.08013916015625, -0.001953125, 0.07623291015625, 0.1544189453125, 0.23260498046875, 0.310791015625, 0.38897705078125, 0.4671630859375, 0.54534912109375, 0.62353515625, 0.70172119140625, 0.7799072265625, 0.85809326171875, 0.936279296875, 1.01446533203125, 1.0926513671875, 1.17083740234375, 1.2490234375, 1.32720947265625, 1.4053955078125, 1.48358154296875, 1.561767578125, 1.63995361328125, 1.7181396484375, 1.79632568359375, 1.87451171875, 1.95269775390625, 2.0308837890625, 2.10906982421875, 2.187255859375, 2.26544189453125, 2.3436279296875, 2.42181396484375, 2.5]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 8.0, 12.0, 7.0, 7.0, 10.0, 19.0, 14.0, 19.0, 30.0, 28.0, 25.0, 34.0, 45.0, 31.0, 35.0, 40.0, 47.0, 53.0, 47.0, 37.0, 33.0, 50.0, 38.0, 33.0, 39.0, 39.0, 29.0, 34.0, 20.0, 28.0, 24.0, 17.0, 13.0, 10.0, 6.0, 11.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8828125, -14.3988037109375, -13.914794921875, -13.4307861328125, -12.94677734375, -12.4627685546875, -11.978759765625, -11.4947509765625, -11.0107421875, -10.5267333984375, -10.042724609375, -9.5587158203125, -9.07470703125, -8.5906982421875, -8.106689453125, -7.6226806640625, -7.138671875, -6.6546630859375, -6.170654296875, -5.6866455078125, -5.20263671875, -4.7186279296875, -4.234619140625, -3.7506103515625, -3.2666015625, -2.7825927734375, -2.298583984375, -1.8145751953125, -1.33056640625, -0.8465576171875, -0.362548828125, 0.1214599609375, 0.60546875, 1.0894775390625, 1.573486328125, 2.0574951171875, 2.54150390625, 3.0255126953125, 3.509521484375, 3.9935302734375, 4.4775390625, 4.9615478515625, 5.445556640625, 5.9295654296875, 6.41357421875, 6.8975830078125, 7.381591796875, 7.8656005859375, 8.349609375, 8.8336181640625, 9.317626953125, 9.8016357421875, 10.28564453125, 10.7696533203125, 11.253662109375, 11.7376708984375, 12.2216796875, 12.7056884765625, 13.189697265625, 13.6737060546875, 14.15771484375, 14.6417236328125, 15.125732421875, 15.6097412109375, 16.09375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 10.0, 20.0, 32.0, 38.0, 40.0, 78.0, 105.0, 152.0, 224.0, 326.0, 547.0, 886.0, 1514.0, 2657.0, 4993.0, 10754.0, 28810.0, 761030.0, 195155.0, 22067.0, 8988.0, 4256.0, 2232.0, 1253.0, 795.0, 539.0, 336.0, 223.0, 147.0, 104.0, 66.0, 50.0, 36.0, 25.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.88671875, -6.67071533203125, -6.4547119140625, -6.23870849609375, -6.022705078125, -5.80670166015625, -5.5906982421875, -5.37469482421875, -5.15869140625, -4.94268798828125, -4.7266845703125, -4.51068115234375, -4.294677734375, -4.07867431640625, -3.8626708984375, -3.64666748046875, -3.4306640625, -3.21466064453125, -2.9986572265625, -2.78265380859375, -2.566650390625, -2.35064697265625, -2.1346435546875, -1.91864013671875, -1.70263671875, -1.48663330078125, -1.2706298828125, -1.05462646484375, -0.838623046875, -0.62261962890625, -0.4066162109375, -0.19061279296875, 0.025390625, 0.24139404296875, 0.4573974609375, 0.67340087890625, 0.889404296875, 1.10540771484375, 1.3214111328125, 1.53741455078125, 1.75341796875, 1.96942138671875, 2.1854248046875, 2.40142822265625, 2.617431640625, 2.83343505859375, 3.0494384765625, 3.26544189453125, 3.4814453125, 3.69744873046875, 3.9134521484375, 4.12945556640625, 4.345458984375, 4.56146240234375, 4.7774658203125, 4.99346923828125, 5.20947265625, 5.42547607421875, 5.6414794921875, 5.85748291015625, 6.073486328125, 6.28948974609375, 6.5054931640625, 6.72149658203125, 6.9375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 7.0, 3.0, 15.0, 9.0, 12.0, 10.0, 18.0, 19.0, 17.0, 24.0, 27.0, 40.0, 42.0, 30.0, 29.0, 32.0, 50.0, 49.0, 45.0, 32.0, 36.0, 43.0, 43.0, 40.0, 38.0, 32.0, 33.0, 24.0, 34.0, 17.0, 16.0, 26.0, 20.0, 17.0, 14.0, 12.0, 12.0, 10.0, 3.0, 3.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.97265625, -7.69573974609375, -7.4188232421875, -7.14190673828125, -6.864990234375, -6.58807373046875, -6.3111572265625, -6.03424072265625, -5.75732421875, -5.48040771484375, -5.2034912109375, -4.92657470703125, -4.649658203125, -4.37274169921875, -4.0958251953125, -3.81890869140625, -3.5419921875, -3.26507568359375, -2.9881591796875, -2.71124267578125, -2.434326171875, -2.15740966796875, -1.8804931640625, -1.60357666015625, -1.32666015625, -1.04974365234375, -0.7728271484375, -0.49591064453125, -0.218994140625, 0.05792236328125, 0.3348388671875, 0.61175537109375, 0.888671875, 1.16558837890625, 1.4425048828125, 1.71942138671875, 1.996337890625, 2.27325439453125, 2.5501708984375, 2.82708740234375, 3.10400390625, 3.38092041015625, 3.6578369140625, 3.93475341796875, 4.211669921875, 4.48858642578125, 4.7655029296875, 5.04241943359375, 5.3193359375, 5.59625244140625, 5.8731689453125, 6.15008544921875, 6.427001953125, 6.70391845703125, 6.9808349609375, 7.25775146484375, 7.53466796875, 7.81158447265625, 8.0885009765625, 8.36541748046875, 8.642333984375, 8.91925048828125, 9.1961669921875, 9.47308349609375, 9.75]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 10.0, 12.0, 22.0, 19.0, 31.0, 40.0, 69.0, 95.0, 97.0, 144.0, 160.0, 286.0, 376.0, 509.0, 787.0, 1237.0, 1930.0, 2937.0, 5059.0, 8906.0, 17155.0, 43168.0, 872530.0, 50801.0, 18520.0, 9356.0, 5244.0, 3075.0, 1972.0, 1286.0, 812.0, 550.0, 374.0, 263.0, 205.0, 120.0, 95.0, 86.0, 60.0, 39.0, 29.0, 21.0, 22.0, 15.0, 9.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.88818359375, -0.8617095947265625, -0.835235595703125, -0.8087615966796875, -0.78228759765625, -0.7558135986328125, -0.729339599609375, -0.7028656005859375, -0.6763916015625, -0.6499176025390625, -0.623443603515625, -0.5969696044921875, -0.57049560546875, -0.5440216064453125, -0.517547607421875, -0.4910736083984375, -0.464599609375, -0.4381256103515625, -0.411651611328125, -0.3851776123046875, -0.35870361328125, -0.3322296142578125, -0.305755615234375, -0.2792816162109375, -0.2528076171875, -0.2263336181640625, -0.199859619140625, -0.1733856201171875, -0.14691162109375, -0.1204376220703125, -0.093963623046875, -0.0674896240234375, -0.041015625, -0.0145416259765625, 0.011932373046875, 0.0384063720703125, 0.06488037109375, 0.0913543701171875, 0.117828369140625, 0.1443023681640625, 0.1707763671875, 0.1972503662109375, 0.223724365234375, 0.2501983642578125, 0.27667236328125, 0.3031463623046875, 0.329620361328125, 0.3560943603515625, 0.382568359375, 0.4090423583984375, 0.435516357421875, 0.4619903564453125, 0.48846435546875, 0.5149383544921875, 0.541412353515625, 0.5678863525390625, 0.5943603515625, 0.6208343505859375, 0.647308349609375, 0.6737823486328125, 0.70025634765625, 0.7267303466796875, 0.753204345703125, 0.7796783447265625, 0.80615234375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 13.0, 18.0, 21.0, 27.0, 43.0, 44.0, 62.0, 62.0, 77.0, 80.0, 80.0, 92.0, 74.0, 73.0, 61.0, 45.0, 32.0, 23.0, 23.0, 21.0, 11.0, 6.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.783008575439453e-05, -6.52708113193512e-05, -6.271153688430786e-05, -6.0152262449264526e-05, -5.759298801422119e-05, -5.5033713579177856e-05, -5.247443914413452e-05, -4.9915164709091187e-05, -4.735589027404785e-05, -4.4796615839004517e-05, -4.223734140396118e-05, -3.967806696891785e-05, -3.711879253387451e-05, -3.455951809883118e-05, -3.200024366378784e-05, -2.9440969228744507e-05, -2.6881694793701172e-05, -2.4322420358657837e-05, -2.1763145923614502e-05, -1.9203871488571167e-05, -1.6644597053527832e-05, -1.4085322618484497e-05, -1.1526048183441162e-05, -8.966773748397827e-06, -6.407499313354492e-06, -3.848224878311157e-06, -1.2889504432678223e-06, 1.2703239917755127e-06, 3.829598426818848e-06, 6.388872861862183e-06, 8.948147296905518e-06, 1.1507421731948853e-05, 1.4066696166992188e-05, 1.6625970602035522e-05, 1.9185245037078857e-05, 2.1744519472122192e-05, 2.4303793907165527e-05, 2.6863068342208862e-05, 2.9422342777252197e-05, 3.198161721229553e-05, 3.454089164733887e-05, 3.71001660823822e-05, 3.965944051742554e-05, 4.221871495246887e-05, 4.477798938751221e-05, 4.733726382255554e-05, 4.989653825759888e-05, 5.245581269264221e-05, 5.501508712768555e-05, 5.757436156272888e-05, 6.013363599777222e-05, 6.269291043281555e-05, 6.525218486785889e-05, 6.781145930290222e-05, 7.037073373794556e-05, 7.293000817298889e-05, 7.548928260803223e-05, 7.804855704307556e-05, 8.06078314781189e-05, 8.316710591316223e-05, 8.572638034820557e-05, 8.82856547832489e-05, 9.084492921829224e-05, 9.340420365333557e-05, 9.59634780883789e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 5.0, 8.0, 14.0, 14.0, 17.0, 46.0, 66.0, 74.0, 123.0, 144.0, 198.0, 286.0, 488.0, 597.0, 911.0, 1394.0, 2073.0, 3228.0, 4733.0, 7529.0, 11673.0, 19495.0, 32424.0, 54806.0, 93664.0, 159445.0, 216677.0, 175894.0, 106137.0, 61443.0, 35989.0, 21707.0, 13203.0, 8218.0, 5336.0, 3410.0, 2245.0, 1541.0, 1043.0, 728.0, 462.0, 323.0, 231.0, 129.0, 96.0, 92.0, 55.0, 46.0, 22.0, 31.0, 18.0, 7.0, 9.0, 6.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.353271484375, -0.342437744140625, -0.33160400390625, -0.320770263671875, -0.3099365234375, -0.299102783203125, -0.28826904296875, -0.277435302734375, -0.2666015625, -0.255767822265625, -0.24493408203125, -0.234100341796875, -0.2232666015625, -0.212432861328125, -0.20159912109375, -0.190765380859375, -0.179931640625, -0.169097900390625, -0.15826416015625, -0.147430419921875, -0.1365966796875, -0.125762939453125, -0.11492919921875, -0.104095458984375, -0.09326171875, -0.082427978515625, -0.07159423828125, -0.060760498046875, -0.0499267578125, -0.039093017578125, -0.02825927734375, -0.017425537109375, -0.006591796875, 0.004241943359375, 0.01507568359375, 0.025909423828125, 0.0367431640625, 0.047576904296875, 0.05841064453125, 0.069244384765625, 0.080078125, 0.090911865234375, 0.10174560546875, 0.112579345703125, 0.1234130859375, 0.134246826171875, 0.14508056640625, 0.155914306640625, 0.166748046875, 0.177581787109375, 0.18841552734375, 0.199249267578125, 0.2100830078125, 0.220916748046875, 0.23175048828125, 0.242584228515625, 0.25341796875, 0.264251708984375, 0.27508544921875, 0.285919189453125, 0.2967529296875, 0.307586669921875, 0.31842041015625, 0.329254150390625, 0.340087890625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 3.0, 4.0, 14.0, 15.0, 6.0, 13.0, 20.0, 22.0, 29.0, 23.0, 41.0, 43.0, 45.0, 56.0, 65.0, 77.0, 80.0, 68.0, 68.0, 57.0, 42.0, 47.0, 31.0, 28.0, 19.0, 15.0, 13.0, 10.0, 6.0, 9.0, 6.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.095947265625, -0.09211540222167969, -0.08828353881835938, -0.08445167541503906, -0.08061981201171875, -0.07678794860839844, -0.07295608520507812, -0.06912422180175781, -0.0652923583984375, -0.06146049499511719, -0.057628631591796875, -0.05379676818847656, -0.04996490478515625, -0.04613304138183594, -0.042301177978515625, -0.03846931457519531, -0.034637451171875, -0.030805587768554688, -0.026973724365234375, -0.023141860961914062, -0.01930999755859375, -0.015478134155273438, -0.011646270751953125, -0.007814407348632812, -0.0039825439453125, -0.0001506805419921875, 0.003681182861328125, 0.0075130462646484375, 0.01134490966796875, 0.015176773071289062, 0.019008636474609375, 0.022840499877929688, 0.02667236328125, 0.030504226684570312, 0.034336090087890625, 0.03816795349121094, 0.04199981689453125, 0.04583168029785156, 0.049663543701171875, 0.05349540710449219, 0.0573272705078125, 0.06115913391113281, 0.06499099731445312, 0.06882286071777344, 0.07265472412109375, 0.07648658752441406, 0.08031845092773438, 0.08415031433105469, 0.087982177734375, 0.09181404113769531, 0.09564590454101562, 0.09947776794433594, 0.10330963134765625, 0.10714149475097656, 0.11097335815429688, 0.11480522155761719, 0.1186370849609375, 0.12246894836425781, 0.12630081176757812, 0.13013267517089844, 0.13396453857421875, 0.13779640197753906, 0.14162826538085938, 0.1454601287841797, 0.1492919921875]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 14.0, 15.0, 31.0, 22.0, 27.0, 33.0, 35.0, 64.0, 71.0, 75.0, 87.0, 77.0, 77.0, 59.0, 60.0, 43.0, 45.0, 25.0, 28.0, 15.0, 23.0, 8.0, 8.0, 7.0, 4.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-25.956026077270508, -25.233850479125977, -24.511676788330078, -23.789501190185547, -23.06732749938965, -22.345151901245117, -21.62297821044922, -20.900802612304688, -20.178627014160156, -19.456451416015625, -18.734277725219727, -18.012102127075195, -17.289928436279297, -16.567752838134766, -15.84557819366455, -15.123403549194336, -14.401229858398438, -13.679055213928223, -12.956880569458008, -12.234704971313477, -11.512531280517578, -10.790355682373047, -10.068181037902832, -9.346006393432617, -8.623831748962402, -7.9016571044921875, -7.179482460021973, -6.4573073387146, -5.735132694244385, -5.01295804977417, -4.290782928466797, -3.568608283996582, -2.846433639526367, -2.1242589950561523, -1.4020841121673584, -0.6799092292785645, 0.04226541519165039, 0.7644400596618652, 1.4866151809692383, 2.208789825439453, 2.930964469909668, 3.653139114379883, 4.375313758850098, 5.097488880157471, 5.8196635246276855, 6.5418381690979, 7.264013290405273, 7.986187934875488, 8.708362579345703, 9.430537223815918, 10.152711868286133, 10.874887466430664, 11.597061157226562, 12.319236755371094, 13.041411399841309, 13.763586044311523, 14.485760688781738, 15.207935333251953, 15.930109977722168, 16.652284622192383, 17.374460220336914, 18.096633911132812, 18.818809509277344, 19.540985107421875, 20.263158798217773]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 7.0, 7.0, 9.0, 9.0, 7.0, 14.0, 11.0, 14.0, 15.0, 13.0, 17.0, 20.0, 20.0, 33.0, 29.0, 37.0, 35.0, 35.0, 36.0, 36.0, 50.0, 52.0, 35.0, 29.0, 27.0, 38.0, 38.0, 42.0, 35.0, 39.0, 30.0, 28.0, 23.0, 17.0, 16.0, 28.0, 10.0, 13.0, 8.0, 10.0, 5.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.024079322814941, -11.625411033630371, -11.226743698120117, -10.828075408935547, -10.429408073425293, -10.030739784240723, -9.632072448730469, -9.233404159545898, -8.834735870361328, -8.436067581176758, -8.037400245666504, -7.638731956481934, -7.24006462097168, -6.841396331787109, -6.442728519439697, -6.044060707092285, -5.645393371582031, -5.246725559234619, -4.848057746887207, -4.449389457702637, -4.050722122192383, -3.6520540714263916, -3.2533860206604004, -2.8547182083129883, -2.456050395965576, -2.057382583618164, -1.6587146520614624, -1.2600467205047607, -0.8613789081573486, -0.4627110958099365, -0.06404304504394531, 0.3346247673034668, 0.7332916259765625, 1.1319594383239746, 1.5306273698806763, 1.929295301437378, 2.32796311378479, 2.726630926132202, 3.1252989768981934, 3.5239667892456055, 3.9226346015930176, 4.32130241394043, 4.719970226287842, 5.118638038635254, 5.517306327819824, 5.915973663330078, 6.314641952514648, 6.7133097648620605, 7.111977577209473, 7.510645389556885, 7.909313201904297, 8.307981491088867, 8.706648826599121, 9.105317115783691, 9.503984451293945, 9.902652740478516, 10.301321029663086, 10.699989318847656, 11.09865665435791, 11.49732494354248, 11.895992279052734, 12.294660568237305, 12.693328857421875, 13.091996192932129, 13.490663528442383]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 14.0, 11.0, 18.0, 26.0, 33.0, 36.0, 59.0, 91.0, 190.0, 262.0, 400.0, 647.0, 1117.0, 1901.0, 3308.0, 5923.0, 10931.0, 19687.0, 38333.0, 75990.0, 150801.0, 239828.0, 226490.0, 132195.0, 66749.0, 33446.0, 17562.0, 9722.0, 5368.0, 3052.0, 1742.0, 987.0, 583.0, 388.0, 230.0, 135.0, 85.0, 74.0, 40.0, 33.0, 19.0, 11.0, 12.0, 6.0, 6.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.15625, -17.587158203125, -17.01806640625, -16.448974609375, -15.8798828125, -15.310791015625, -14.74169921875, -14.172607421875, -13.603515625, -13.034423828125, -12.46533203125, -11.896240234375, -11.3271484375, -10.758056640625, -10.18896484375, -9.619873046875, -9.05078125, -8.481689453125, -7.91259765625, -7.343505859375, -6.7744140625, -6.205322265625, -5.63623046875, -5.067138671875, -4.498046875, -3.928955078125, -3.35986328125, -2.790771484375, -2.2216796875, -1.652587890625, -1.08349609375, -0.514404296875, 0.0546875, 0.623779296875, 1.19287109375, 1.761962890625, 2.3310546875, 2.900146484375, 3.46923828125, 4.038330078125, 4.607421875, 5.176513671875, 5.74560546875, 6.314697265625, 6.8837890625, 7.452880859375, 8.02197265625, 8.591064453125, 9.16015625, 9.729248046875, 10.29833984375, 10.867431640625, 11.4365234375, 12.005615234375, 12.57470703125, 13.143798828125, 13.712890625, 14.281982421875, 14.85107421875, 15.420166015625, 15.9892578125, 16.558349609375, 17.12744140625, 17.696533203125, 18.265625]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 11.0, 6.0, 4.0, 9.0, 7.0, 15.0, 13.0, 12.0, 12.0, 14.0, 17.0, 27.0, 31.0, 26.0, 21.0, 30.0, 30.0, 42.0, 29.0, 37.0, 44.0, 31.0, 40.0, 34.0, 33.0, 36.0, 32.0, 43.0, 36.0, 37.0, 32.0, 24.0, 23.0, 22.0, 17.0, 18.0, 14.0, 11.0, 10.0, 11.0, 10.0, 7.0, 12.0, 6.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.3125, -12.92333984375, -12.5341796875, -12.14501953125, -11.755859375, -11.36669921875, -10.9775390625, -10.58837890625, -10.19921875, -9.81005859375, -9.4208984375, -9.03173828125, -8.642578125, -8.25341796875, -7.8642578125, -7.47509765625, -7.0859375, -6.69677734375, -6.3076171875, -5.91845703125, -5.529296875, -5.14013671875, -4.7509765625, -4.36181640625, -3.97265625, -3.58349609375, -3.1943359375, -2.80517578125, -2.416015625, -2.02685546875, -1.6376953125, -1.24853515625, -0.859375, -0.47021484375, -0.0810546875, 0.30810546875, 0.697265625, 1.08642578125, 1.4755859375, 1.86474609375, 2.25390625, 2.64306640625, 3.0322265625, 3.42138671875, 3.810546875, 4.19970703125, 4.5888671875, 4.97802734375, 5.3671875, 5.75634765625, 6.1455078125, 6.53466796875, 6.923828125, 7.31298828125, 7.7021484375, 8.09130859375, 8.48046875, 8.86962890625, 9.2587890625, 9.64794921875, 10.037109375, 10.42626953125, 10.8154296875, 11.20458984375, 11.59375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 7.0, 9.0, 11.0, 27.0, 31.0, 40.0, 84.0, 110.0, 136.0, 220.0, 344.0, 489.0, 774.0, 1135.0, 1805.0, 2671.0, 4246.0, 6521.0, 10263.0, 16933.0, 28152.0, 47590.0, 81499.0, 133369.0, 185538.0, 186846.0, 134688.0, 82518.0, 47975.0, 28489.0, 16857.0, 10397.0, 6724.0, 4249.0, 2690.0, 1746.0, 1145.0, 760.0, 482.0, 333.0, 224.0, 151.0, 98.0, 58.0, 43.0, 32.0, 16.0, 7.0, 13.0, 7.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8125, -14.3497314453125, -13.886962890625, -13.4241943359375, -12.96142578125, -12.4986572265625, -12.035888671875, -11.5731201171875, -11.1103515625, -10.6475830078125, -10.184814453125, -9.7220458984375, -9.25927734375, -8.7965087890625, -8.333740234375, -7.8709716796875, -7.408203125, -6.9454345703125, -6.482666015625, -6.0198974609375, -5.55712890625, -5.0943603515625, -4.631591796875, -4.1688232421875, -3.7060546875, -3.2432861328125, -2.780517578125, -2.3177490234375, -1.85498046875, -1.3922119140625, -0.929443359375, -0.4666748046875, -0.00390625, 0.4588623046875, 0.921630859375, 1.3843994140625, 1.84716796875, 2.3099365234375, 2.772705078125, 3.2354736328125, 3.6982421875, 4.1610107421875, 4.623779296875, 5.0865478515625, 5.54931640625, 6.0120849609375, 6.474853515625, 6.9376220703125, 7.400390625, 7.8631591796875, 8.325927734375, 8.7886962890625, 9.25146484375, 9.7142333984375, 10.177001953125, 10.6397705078125, 11.1025390625, 11.5653076171875, 12.028076171875, 12.4908447265625, 12.95361328125, 13.4163818359375, 13.879150390625, 14.3419189453125, 14.8046875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 6.0, 6.0, 2.0, 6.0, 3.0, 12.0, 8.0, 16.0, 16.0, 11.0, 21.0, 17.0, 22.0, 22.0, 41.0, 39.0, 33.0, 41.0, 32.0, 47.0, 52.0, 40.0, 35.0, 37.0, 37.0, 36.0, 37.0, 34.0, 32.0, 21.0, 34.0, 23.0, 29.0, 25.0, 23.0, 18.0, 11.0, 18.0, 7.0, 13.0, 6.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0], "bins": [-8.7734375, -8.5079345703125, -8.242431640625, -7.9769287109375, -7.71142578125, -7.4459228515625, -7.180419921875, -6.9149169921875, -6.6494140625, -6.3839111328125, -6.118408203125, -5.8529052734375, -5.58740234375, -5.3218994140625, -5.056396484375, -4.7908935546875, -4.525390625, -4.2598876953125, -3.994384765625, -3.7288818359375, -3.46337890625, -3.1978759765625, -2.932373046875, -2.6668701171875, -2.4013671875, -2.1358642578125, -1.870361328125, -1.6048583984375, -1.33935546875, -1.0738525390625, -0.808349609375, -0.5428466796875, -0.27734375, -0.0118408203125, 0.253662109375, 0.5191650390625, 0.78466796875, 1.0501708984375, 1.315673828125, 1.5811767578125, 1.8466796875, 2.1121826171875, 2.377685546875, 2.6431884765625, 2.90869140625, 3.1741943359375, 3.439697265625, 3.7052001953125, 3.970703125, 4.2362060546875, 4.501708984375, 4.7672119140625, 5.03271484375, 5.2982177734375, 5.563720703125, 5.8292236328125, 6.0947265625, 6.3602294921875, 6.625732421875, 6.8912353515625, 7.15673828125, 7.4222412109375, 7.687744140625, 7.9532470703125, 8.21875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 10.0, 14.0, 22.0, 26.0, 46.0, 72.0, 98.0, 136.0, 192.0, 266.0, 449.0, 639.0, 1013.0, 1610.0, 2603.0, 4580.0, 8487.0, 17178.0, 40013.0, 107261.0, 291275.0, 340000.0, 138239.0, 50188.0, 20851.0, 10021.0, 5303.0, 2881.0, 1785.0, 1132.0, 712.0, 467.0, 309.0, 195.0, 132.0, 97.0, 83.0, 56.0, 35.0, 30.0, 13.0, 12.0, 3.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.796875, -16.27392578125, -15.7509765625, -15.22802734375, -14.705078125, -14.18212890625, -13.6591796875, -13.13623046875, -12.61328125, -12.09033203125, -11.5673828125, -11.04443359375, -10.521484375, -9.99853515625, -9.4755859375, -8.95263671875, -8.4296875, -7.90673828125, -7.3837890625, -6.86083984375, -6.337890625, -5.81494140625, -5.2919921875, -4.76904296875, -4.24609375, -3.72314453125, -3.2001953125, -2.67724609375, -2.154296875, -1.63134765625, -1.1083984375, -0.58544921875, -0.0625, 0.46044921875, 0.9833984375, 1.50634765625, 2.029296875, 2.55224609375, 3.0751953125, 3.59814453125, 4.12109375, 4.64404296875, 5.1669921875, 5.68994140625, 6.212890625, 6.73583984375, 7.2587890625, 7.78173828125, 8.3046875, 8.82763671875, 9.3505859375, 9.87353515625, 10.396484375, 10.91943359375, 11.4423828125, 11.96533203125, 12.48828125, 13.01123046875, 13.5341796875, 14.05712890625, 14.580078125, 15.10302734375, 15.6259765625, 16.14892578125, 16.671875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 4.0, 14.0, 15.0, 18.0, 20.0, 39.0, 61.0, 63.0, 70.0, 110.0, 126.0, 109.0, 94.0, 54.0, 44.0, 26.0, 19.0, 32.0, 22.0, 15.0, 10.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013408660888671875, -0.0012966841459274292, -0.001252502202987671, -0.0012083202600479126, -0.0011641383171081543, -0.001119956374168396, -0.0010757744312286377, -0.0010315924882888794, -0.000987410545349121, -0.0009432286024093628, -0.0008990466594696045, -0.0008548647165298462, -0.0008106827735900879, -0.0007665008306503296, -0.0007223188877105713, -0.000678136944770813, -0.0006339550018310547, -0.0005897730588912964, -0.0005455911159515381, -0.0005014091730117798, -0.0004572272300720215, -0.0004130452871322632, -0.0003688633441925049, -0.0003246814012527466, -0.0002804994583129883, -0.00023631751537322998, -0.00019213557243347168, -0.00014795362949371338, -0.00010377168655395508, -5.958974361419678e-05, -1.5407800674438477e-05, 2.8774142265319824e-05, 7.295608520507812e-05, 0.00011713802814483643, 0.00016131997108459473, 0.00020550191402435303, 0.00024968385696411133, 0.00029386579990386963, 0.00033804774284362793, 0.00038222968578338623, 0.00042641162872314453, 0.00047059357166290283, 0.0005147755146026611, 0.0005589574575424194, 0.0006031394004821777, 0.000647321343421936, 0.0006915032863616943, 0.0007356852293014526, 0.0007798671722412109, 0.0008240491151809692, 0.0008682310581207275, 0.0009124130010604858, 0.0009565949440002441, 0.0010007768869400024, 0.0010449588298797607, 0.001089140772819519, 0.0011333227157592773, 0.0011775046586990356, 0.001221686601638794, 0.0012658685445785522, 0.0013100504875183105, 0.0013542324304580688, 0.0013984143733978271, 0.0014425963163375854, 0.0014867782592773438]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 2.0, 10.0, 9.0, 5.0, 21.0, 27.0, 23.0, 27.0, 57.0, 90.0, 117.0, 226.0, 403.0, 596.0, 1014.0, 1884.0, 3856.0, 8038.0, 19764.0, 59052.0, 212747.0, 447975.0, 201719.0, 55834.0, 19011.0, 7892.0, 3684.0, 1874.0, 1042.0, 567.0, 320.0, 196.0, 144.0, 106.0, 62.0, 43.0, 30.0, 25.0, 13.0, 12.0, 7.0, 3.0, 7.0, 11.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.21875, -20.5849609375, -19.951171875, -19.3173828125, -18.68359375, -18.0498046875, -17.416015625, -16.7822265625, -16.1484375, -15.5146484375, -14.880859375, -14.2470703125, -13.61328125, -12.9794921875, -12.345703125, -11.7119140625, -11.078125, -10.4443359375, -9.810546875, -9.1767578125, -8.54296875, -7.9091796875, -7.275390625, -6.6416015625, -6.0078125, -5.3740234375, -4.740234375, -4.1064453125, -3.47265625, -2.8388671875, -2.205078125, -1.5712890625, -0.9375, -0.3037109375, 0.330078125, 0.9638671875, 1.59765625, 2.2314453125, 2.865234375, 3.4990234375, 4.1328125, 4.7666015625, 5.400390625, 6.0341796875, 6.66796875, 7.3017578125, 7.935546875, 8.5693359375, 9.203125, 9.8369140625, 10.470703125, 11.1044921875, 11.73828125, 12.3720703125, 13.005859375, 13.6396484375, 14.2734375, 14.9072265625, 15.541015625, 16.1748046875, 16.80859375, 17.4423828125, 18.076171875, 18.7099609375, 19.34375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 6.0, 5.0, 10.0, 14.0, 19.0, 26.0, 38.0, 49.0, 57.0, 63.0, 58.0, 93.0, 99.0, 81.0, 59.0, 68.0, 52.0, 30.0, 37.0, 33.0, 17.0, 13.0, 20.0, 10.0, 6.0, 7.0, 7.0, 6.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.5546875, -4.43914794921875, -4.3236083984375, -4.20806884765625, -4.092529296875, -3.97698974609375, -3.8614501953125, -3.74591064453125, -3.63037109375, -3.51483154296875, -3.3992919921875, -3.28375244140625, -3.168212890625, -3.05267333984375, -2.9371337890625, -2.82159423828125, -2.7060546875, -2.59051513671875, -2.4749755859375, -2.35943603515625, -2.243896484375, -2.12835693359375, -2.0128173828125, -1.89727783203125, -1.78173828125, -1.66619873046875, -1.5506591796875, -1.43511962890625, -1.319580078125, -1.20404052734375, -1.0885009765625, -0.97296142578125, -0.857421875, -0.74188232421875, -0.6263427734375, -0.51080322265625, -0.395263671875, -0.27972412109375, -0.1641845703125, -0.04864501953125, 0.06689453125, 0.18243408203125, 0.2979736328125, 0.41351318359375, 0.529052734375, 0.64459228515625, 0.7601318359375, 0.87567138671875, 0.9912109375, 1.10675048828125, 1.2222900390625, 1.33782958984375, 1.453369140625, 1.56890869140625, 1.6844482421875, 1.79998779296875, 1.91552734375, 2.03106689453125, 2.1466064453125, 2.26214599609375, 2.377685546875, 2.49322509765625, 2.6087646484375, 2.72430419921875, 2.83984375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 6.0, 10.0, 11.0, 15.0, 11.0, 22.0, 21.0, 35.0, 33.0, 61.0, 60.0, 81.0, 81.0, 74.0, 88.0, 75.0, 67.0, 52.0, 45.0, 40.0, 27.0, 28.0, 11.0, 8.0, 3.0, 8.0, 7.0, 2.0, 1.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.318313598632812, -22.552827835083008, -21.787342071533203, -21.02185821533203, -20.256372451782227, -19.490886688232422, -18.725400924682617, -17.959915161132812, -17.19443130493164, -16.428945541381836, -15.663460731506348, -14.897974967956543, -14.132490158081055, -13.36700439453125, -12.601518630981445, -11.836033821105957, -11.070548057556152, -10.305062294006348, -9.53957748413086, -8.774091720581055, -8.008606910705566, -7.243121147155762, -6.477635860443115, -5.712150573730469, -4.946665287017822, -4.181180000305176, -3.4156947135925293, -2.6502091884613037, -1.8847239017486572, -1.1192386150360107, -0.35375308990478516, 0.41173219680786133, 1.1772174835205078, 1.9427027702331543, 2.708188056945801, 3.4736735820770264, 4.239158630371094, 5.004644393920898, 5.770129680633545, 6.535614967346191, 7.301100254058838, 8.066585540771484, 8.832071304321289, 9.597556114196777, 10.363041877746582, 11.12852668762207, 11.894012451171875, 12.65949821472168, 13.424983024597168, 14.190468788146973, 14.955953598022461, 15.721439361572266, 16.48692512512207, 17.252408981323242, 18.017894744873047, 18.78338050842285, 19.548866271972656, 20.31435203552246, 21.079837799072266, 21.845321655273438, 22.610807418823242, 23.376293182373047, 24.14177894592285, 24.907264709472656, 25.672748565673828]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 9.0, 10.0, 17.0, 12.0, 17.0, 17.0, 19.0, 16.0, 22.0, 29.0, 31.0, 22.0, 29.0, 33.0, 31.0, 39.0, 47.0, 43.0, 46.0, 51.0, 47.0, 43.0, 41.0, 38.0, 27.0, 36.0, 25.0, 29.0, 27.0, 21.0, 16.0, 18.0, 12.0, 12.0, 12.0, 12.0, 9.0, 6.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.170042991638184, -12.753195762634277, -12.336348533630371, -11.919501304626465, -11.502654075622559, -11.085806846618652, -10.668959617614746, -10.25211238861084, -9.835265159606934, -9.418417930603027, -9.001570701599121, -8.584723472595215, -8.167876243591309, -7.751029014587402, -7.334181785583496, -6.91733455657959, -6.500486850738525, -6.083639621734619, -5.666792392730713, -5.249945163726807, -4.8330979347229, -4.416250228881836, -3.999403238296509, -3.5825560092926025, -3.1657087802886963, -2.74886155128479, -2.332014322280884, -1.915166974067688, -1.4983197450637817, -1.081472396850586, -0.6646251678466797, -0.24777793884277344, 0.1690692901611328, 0.5859165191650391, 1.0027637481689453, 1.4196110963821411, 1.8364583253860474, 2.253305673599243, 2.6701529026031494, 3.0870001316070557, 3.503847360610962, 3.920694589614868, 4.3375420570373535, 4.75438928604126, 5.171236515045166, 5.588083744049072, 6.0049309730529785, 6.421778202056885, 6.838625431060791, 7.255472660064697, 7.6723198890686035, 8.089167594909668, 8.506014823913574, 8.92286205291748, 9.339709281921387, 9.756556510925293, 10.1734037399292, 10.590250968933105, 11.007098197937012, 11.423945426940918, 11.840792655944824, 12.25763988494873, 12.674487113952637, 13.091334342956543, 13.50818157196045]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 8.0, 13.0, 17.0, 20.0, 38.0, 40.0, 57.0, 97.0, 162.0, 210.0, 327.0, 492.0, 762.0, 1121.0, 1916.0, 3084.0, 5263.0, 9544.0, 18618.0, 39217.0, 100930.0, 320763.0, 1034923.0, 1586853.0, 722828.0, 212947.0, 71373.0, 29495.0, 14121.0, 7646.0, 4236.0, 2652.0, 1591.0, 974.0, 600.0, 445.0, 274.0, 197.0, 117.0, 85.0, 71.0, 48.0, 30.0, 23.0, 13.0, 9.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-25.984375, -25.127685546875, -24.27099609375, -23.414306640625, -22.5576171875, -21.700927734375, -20.84423828125, -19.987548828125, -19.130859375, -18.274169921875, -17.41748046875, -16.560791015625, -15.7041015625, -14.847412109375, -13.99072265625, -13.134033203125, -12.27734375, -11.420654296875, -10.56396484375, -9.707275390625, -8.8505859375, -7.993896484375, -7.13720703125, -6.280517578125, -5.423828125, -4.567138671875, -3.71044921875, -2.853759765625, -1.9970703125, -1.140380859375, -0.28369140625, 0.572998046875, 1.4296875, 2.286376953125, 3.14306640625, 3.999755859375, 4.8564453125, 5.713134765625, 6.56982421875, 7.426513671875, 8.283203125, 9.139892578125, 9.99658203125, 10.853271484375, 11.7099609375, 12.566650390625, 13.42333984375, 14.280029296875, 15.13671875, 15.993408203125, 16.85009765625, 17.706787109375, 18.5634765625, 19.420166015625, 20.27685546875, 21.133544921875, 21.990234375, 22.846923828125, 23.70361328125, 24.560302734375, 25.4169921875, 26.273681640625, 27.13037109375, 27.987060546875, 28.84375]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 14.0, 9.0, 19.0, 10.0, 13.0, 22.0, 19.0, 26.0, 25.0, 26.0, 27.0, 32.0, 32.0, 42.0, 34.0, 42.0, 54.0, 54.0, 49.0, 50.0, 34.0, 43.0, 41.0, 42.0, 37.0, 19.0, 29.0, 25.0, 18.0, 19.0, 12.0, 16.0, 17.0, 6.0, 3.0, 8.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.546875, -11.1680908203125, -10.789306640625, -10.4105224609375, -10.03173828125, -9.6529541015625, -9.274169921875, -8.8953857421875, -8.5166015625, -8.1378173828125, -7.759033203125, -7.3802490234375, -7.00146484375, -6.6226806640625, -6.243896484375, -5.8651123046875, -5.486328125, -5.1075439453125, -4.728759765625, -4.3499755859375, -3.97119140625, -3.5924072265625, -3.213623046875, -2.8348388671875, -2.4560546875, -2.0772705078125, -1.698486328125, -1.3197021484375, -0.94091796875, -0.5621337890625, -0.183349609375, 0.1954345703125, 0.57421875, 0.9530029296875, 1.331787109375, 1.7105712890625, 2.08935546875, 2.4681396484375, 2.846923828125, 3.2257080078125, 3.6044921875, 3.9832763671875, 4.362060546875, 4.7408447265625, 5.11962890625, 5.4984130859375, 5.877197265625, 6.2559814453125, 6.634765625, 7.0135498046875, 7.392333984375, 7.7711181640625, 8.14990234375, 8.5286865234375, 8.907470703125, 9.2862548828125, 9.6650390625, 10.0438232421875, 10.422607421875, 10.8013916015625, 11.18017578125, 11.5589599609375, 11.937744140625, 12.3165283203125, 12.6953125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 5.0, 9.0, 13.0, 11.0, 13.0, 20.0, 60.0, 61.0, 93.0, 102.0, 168.0, 282.0, 407.0, 629.0, 900.0, 1535.0, 2327.0, 3758.0, 5901.0, 10272.0, 18412.0, 34839.0, 71443.0, 165178.0, 441676.0, 1181697.0, 1341344.0, 542624.0, 198524.0, 82849.0, 39687.0, 20242.0, 11299.0, 6658.0, 4142.0, 2519.0, 1551.0, 1069.0, 648.0, 451.0, 276.0, 184.0, 141.0, 86.0, 72.0, 34.0, 30.0, 21.0, 4.0, 7.0, 9.0, 6.0, 2.0, 2.0, 1.0, 2.0], "bins": [-32.78125, -31.81982421875, -30.8583984375, -29.89697265625, -28.935546875, -27.97412109375, -27.0126953125, -26.05126953125, -25.08984375, -24.12841796875, -23.1669921875, -22.20556640625, -21.244140625, -20.28271484375, -19.3212890625, -18.35986328125, -17.3984375, -16.43701171875, -15.4755859375, -14.51416015625, -13.552734375, -12.59130859375, -11.6298828125, -10.66845703125, -9.70703125, -8.74560546875, -7.7841796875, -6.82275390625, -5.861328125, -4.89990234375, -3.9384765625, -2.97705078125, -2.015625, -1.05419921875, -0.0927734375, 0.86865234375, 1.830078125, 2.79150390625, 3.7529296875, 4.71435546875, 5.67578125, 6.63720703125, 7.5986328125, 8.56005859375, 9.521484375, 10.48291015625, 11.4443359375, 12.40576171875, 13.3671875, 14.32861328125, 15.2900390625, 16.25146484375, 17.212890625, 18.17431640625, 19.1357421875, 20.09716796875, 21.05859375, 22.02001953125, 22.9814453125, 23.94287109375, 24.904296875, 25.86572265625, 26.8271484375, 27.78857421875, 28.75]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 7.0, 1.0, 7.0, 10.0, 18.0, 14.0, 28.0, 14.0, 46.0, 32.0, 41.0, 59.0, 102.0, 102.0, 144.0, 192.0, 216.0, 291.0, 342.0, 369.0, 357.0, 344.0, 295.0, 240.0, 177.0, 147.0, 111.0, 97.0, 54.0, 40.0, 36.0, 35.0, 26.0, 18.0, 16.0, 6.0, 10.0, 9.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-8.9453125, -8.687744140625, -8.43017578125, -8.172607421875, -7.9150390625, -7.657470703125, -7.39990234375, -7.142333984375, -6.884765625, -6.627197265625, -6.36962890625, -6.112060546875, -5.8544921875, -5.596923828125, -5.33935546875, -5.081787109375, -4.82421875, -4.566650390625, -4.30908203125, -4.051513671875, -3.7939453125, -3.536376953125, -3.27880859375, -3.021240234375, -2.763671875, -2.506103515625, -2.24853515625, -1.990966796875, -1.7333984375, -1.475830078125, -1.21826171875, -0.960693359375, -0.703125, -0.445556640625, -0.18798828125, 0.069580078125, 0.3271484375, 0.584716796875, 0.84228515625, 1.099853515625, 1.357421875, 1.614990234375, 1.87255859375, 2.130126953125, 2.3876953125, 2.645263671875, 2.90283203125, 3.160400390625, 3.41796875, 3.675537109375, 3.93310546875, 4.190673828125, 4.4482421875, 4.705810546875, 4.96337890625, 5.220947265625, 5.478515625, 5.736083984375, 5.99365234375, 6.251220703125, 6.5087890625, 6.766357421875, 7.02392578125, 7.281494140625, 7.5390625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 9.0, 12.0, 12.0, 11.0, 15.0, 17.0, 18.0, 27.0, 35.0, 40.0, 47.0, 68.0, 65.0, 67.0, 79.0, 77.0, 56.0, 60.0, 55.0, 49.0, 28.0, 29.0, 22.0, 18.0, 14.0, 13.0, 7.0, 9.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.455156326293945, -22.683570861816406, -21.9119873046875, -21.14040184020996, -20.368816375732422, -19.597232818603516, -18.825647354125977, -18.054061889648438, -17.28247833251953, -16.510892868041992, -15.739309310913086, -14.967723846435547, -14.196139335632324, -13.424554824829102, -12.652969360351562, -11.88138484954834, -11.109800338745117, -10.338215827941895, -9.566631317138672, -8.795045852661133, -8.02346134185791, -7.2518768310546875, -6.480291843414307, -5.708706855773926, -4.937122344970703, -4.1655378341674805, -3.3939528465270996, -2.622368097305298, -1.850783348083496, -1.0791985988616943, -0.3076138496398926, 0.4639711380004883, 1.2355537414550781, 2.00713849067688, 2.7787232398986816, 3.5503079891204834, 4.321892738342285, 5.093477249145508, 5.865062236785889, 6.6366472244262695, 7.408231735229492, 8.179816246032715, 8.951400756835938, 9.722986221313477, 10.4945707321167, 11.266155242919922, 12.037740707397461, 12.809325218200684, 13.580909729003906, 14.352494239807129, 15.124078750610352, 15.89566421508789, 16.667247772216797, 17.438833236694336, 18.210418701171875, 18.98200225830078, 19.75358772277832, 20.52517318725586, 21.296756744384766, 22.068342208862305, 22.839927673339844, 23.61151123046875, 24.38309669494629, 25.154682159423828, 25.926265716552734]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 5.0, 4.0, 5.0, 9.0, 8.0, 5.0, 15.0, 17.0, 22.0, 26.0, 17.0, 18.0, 25.0, 25.0, 38.0, 29.0, 37.0, 30.0, 29.0, 35.0, 31.0, 40.0, 48.0, 47.0, 41.0, 44.0, 33.0, 45.0, 29.0, 31.0, 21.0, 23.0, 26.0, 27.0, 14.0, 14.0, 19.0, 17.0, 5.0, 11.0, 8.0, 9.0, 3.0, 2.0, 5.0, 4.0, 3.0, 1.0, 1.0, 5.0], "bins": [-16.431198120117188, -15.974394798278809, -15.517590522766113, -15.060787200927734, -14.603982925415039, -14.14717960357666, -13.690376281738281, -13.233572006225586, -12.776768684387207, -12.319965362548828, -11.863161087036133, -11.406357765197754, -10.949554443359375, -10.49275016784668, -10.0359468460083, -9.579143524169922, -9.122339248657227, -8.665535926818848, -8.208731651306152, -7.751928329467773, -7.295124530792236, -6.838320732116699, -6.38151741027832, -5.924713611602783, -5.467909812927246, -5.011106014251709, -4.554302215576172, -4.097498893737793, -3.640695095062256, -3.1838912963867188, -2.7270877361297607, -2.2702841758728027, -1.8134803771972656, -1.356676697731018, -0.8998730182647705, -0.44306933879852295, 0.01373434066772461, 0.4705381393432617, 0.9273416996002197, 1.3841452598571777, 1.8409490585327148, 2.297752857208252, 2.75455641746521, 3.211359977722168, 3.668163776397705, 4.124967575073242, 4.581770896911621, 5.038574695587158, 5.495378494262695, 5.952182292938232, 6.4089860916137695, 6.865789413452148, 7.3225932121276855, 7.779397010803223, 8.236200332641602, 8.693004608154297, 9.149807929992676, 9.606611251831055, 10.06341552734375, 10.520218849182129, 10.977022171020508, 11.433826446533203, 11.890629768371582, 12.347433090209961, 12.804237365722656]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 5.0, 4.0, 10.0, 10.0, 24.0, 26.0, 30.0, 48.0, 72.0, 103.0, 138.0, 215.0, 311.0, 458.0, 627.0, 932.0, 1443.0, 2086.0, 3233.0, 5022.0, 8001.0, 12571.0, 20173.0, 33852.0, 59010.0, 107119.0, 195611.0, 240482.0, 154540.0, 83129.0, 46292.0, 27279.0, 16446.0, 10269.0, 6518.0, 4157.0, 2637.0, 1831.0, 1218.0, 795.0, 610.0, 380.0, 242.0, 216.0, 130.0, 86.0, 59.0, 40.0, 25.0, 15.0, 11.0, 9.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.990234375, -1.924530029296875, -1.85882568359375, -1.793121337890625, -1.7274169921875, -1.661712646484375, -1.59600830078125, -1.530303955078125, -1.464599609375, -1.398895263671875, -1.33319091796875, -1.267486572265625, -1.2017822265625, -1.136077880859375, -1.07037353515625, -1.004669189453125, -0.93896484375, -0.873260498046875, -0.80755615234375, -0.741851806640625, -0.6761474609375, -0.610443115234375, -0.54473876953125, -0.479034423828125, -0.413330078125, -0.347625732421875, -0.28192138671875, -0.216217041015625, -0.1505126953125, -0.084808349609375, -0.01910400390625, 0.046600341796875, 0.1123046875, 0.178009033203125, 0.24371337890625, 0.309417724609375, 0.3751220703125, 0.440826416015625, 0.50653076171875, 0.572235107421875, 0.637939453125, 0.703643798828125, 0.76934814453125, 0.835052490234375, 0.9007568359375, 0.966461181640625, 1.03216552734375, 1.097869873046875, 1.16357421875, 1.229278564453125, 1.29498291015625, 1.360687255859375, 1.4263916015625, 1.492095947265625, 1.55780029296875, 1.623504638671875, 1.689208984375, 1.754913330078125, 1.82061767578125, 1.886322021484375, 1.9520263671875, 2.017730712890625, 2.08343505859375, 2.149139404296875, 2.21484375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 6.0, 7.0, 12.0, 5.0, 11.0, 8.0, 13.0, 23.0, 28.0, 24.0, 33.0, 32.0, 30.0, 43.0, 28.0, 28.0, 32.0, 32.0, 32.0, 40.0, 40.0, 50.0, 47.0, 43.0, 32.0, 37.0, 30.0, 32.0, 21.0, 28.0, 22.0, 21.0, 24.0, 13.0, 13.0, 8.0, 18.0, 7.0, 9.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0], "bins": [-16.9375, -16.4395751953125, -15.941650390625, -15.4437255859375, -14.94580078125, -14.4478759765625, -13.949951171875, -13.4520263671875, -12.9541015625, -12.4561767578125, -11.958251953125, -11.4603271484375, -10.96240234375, -10.4644775390625, -9.966552734375, -9.4686279296875, -8.970703125, -8.4727783203125, -7.974853515625, -7.4769287109375, -6.97900390625, -6.4810791015625, -5.983154296875, -5.4852294921875, -4.9873046875, -4.4893798828125, -3.991455078125, -3.4935302734375, -2.99560546875, -2.4976806640625, -1.999755859375, -1.5018310546875, -1.00390625, -0.5059814453125, -0.008056640625, 0.4898681640625, 0.98779296875, 1.4857177734375, 1.983642578125, 2.4815673828125, 2.9794921875, 3.4774169921875, 3.975341796875, 4.4732666015625, 4.97119140625, 5.4691162109375, 5.967041015625, 6.4649658203125, 6.962890625, 7.4608154296875, 7.958740234375, 8.4566650390625, 8.95458984375, 9.4525146484375, 9.950439453125, 10.4483642578125, 10.9462890625, 11.4442138671875, 11.942138671875, 12.4400634765625, 12.93798828125, 13.4359130859375, 13.933837890625, 14.4317626953125, 14.9296875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 5.0, 9.0, 9.0, 12.0, 19.0, 27.0, 35.0, 71.0, 114.0, 151.0, 238.0, 378.0, 600.0, 1082.0, 1914.0, 3714.0, 8130.0, 22784.0, 368084.0, 599098.0, 24623.0, 8727.0, 3904.0, 2010.0, 1096.0, 619.0, 383.0, 245.0, 152.0, 123.0, 63.0, 53.0, 31.0, 16.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.1015625, -8.8341064453125, -8.566650390625, -8.2991943359375, -8.03173828125, -7.7642822265625, -7.496826171875, -7.2293701171875, -6.9619140625, -6.6944580078125, -6.427001953125, -6.1595458984375, -5.89208984375, -5.6246337890625, -5.357177734375, -5.0897216796875, -4.822265625, -4.5548095703125, -4.287353515625, -4.0198974609375, -3.75244140625, -3.4849853515625, -3.217529296875, -2.9500732421875, -2.6826171875, -2.4151611328125, -2.147705078125, -1.8802490234375, -1.61279296875, -1.3453369140625, -1.077880859375, -0.8104248046875, -0.54296875, -0.2755126953125, -0.008056640625, 0.2593994140625, 0.52685546875, 0.7943115234375, 1.061767578125, 1.3292236328125, 1.5966796875, 1.8641357421875, 2.131591796875, 2.3990478515625, 2.66650390625, 2.9339599609375, 3.201416015625, 3.4688720703125, 3.736328125, 4.0037841796875, 4.271240234375, 4.5386962890625, 4.80615234375, 5.0736083984375, 5.341064453125, 5.6085205078125, 5.8759765625, 6.1434326171875, 6.410888671875, 6.6783447265625, 6.94580078125, 7.2132568359375, 7.480712890625, 7.7481689453125, 8.015625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 7.0, 8.0, 11.0, 13.0, 11.0, 7.0, 23.0, 24.0, 19.0, 31.0, 40.0, 27.0, 44.0, 40.0, 45.0, 44.0, 45.0, 41.0, 51.0, 55.0, 35.0, 36.0, 48.0, 40.0, 36.0, 33.0, 24.0, 26.0, 28.0, 16.0, 25.0, 13.0, 12.0, 6.0, 13.0, 7.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6953125, -10.33935546875, -9.9833984375, -9.62744140625, -9.271484375, -8.91552734375, -8.5595703125, -8.20361328125, -7.84765625, -7.49169921875, -7.1357421875, -6.77978515625, -6.423828125, -6.06787109375, -5.7119140625, -5.35595703125, -5.0, -4.64404296875, -4.2880859375, -3.93212890625, -3.576171875, -3.22021484375, -2.8642578125, -2.50830078125, -2.15234375, -1.79638671875, -1.4404296875, -1.08447265625, -0.728515625, -0.37255859375, -0.0166015625, 0.33935546875, 0.6953125, 1.05126953125, 1.4072265625, 1.76318359375, 2.119140625, 2.47509765625, 2.8310546875, 3.18701171875, 3.54296875, 3.89892578125, 4.2548828125, 4.61083984375, 4.966796875, 5.32275390625, 5.6787109375, 6.03466796875, 6.390625, 6.74658203125, 7.1025390625, 7.45849609375, 7.814453125, 8.17041015625, 8.5263671875, 8.88232421875, 9.23828125, 9.59423828125, 9.9501953125, 10.30615234375, 10.662109375, 11.01806640625, 11.3740234375, 11.72998046875, 12.0859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 7.0, 8.0, 8.0, 19.0, 31.0, 28.0, 52.0, 77.0, 86.0, 165.0, 219.0, 376.0, 557.0, 842.0, 1499.0, 2523.0, 4560.0, 8645.0, 18257.0, 50208.0, 884846.0, 40710.0, 16422.0, 7979.0, 4202.0, 2433.0, 1361.0, 858.0, 526.0, 353.0, 227.0, 135.0, 98.0, 79.0, 48.0, 42.0, 19.0, 19.0, 13.0, 9.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.2470703125, -1.2118682861328125, -1.176666259765625, -1.1414642333984375, -1.10626220703125, -1.0710601806640625, -1.035858154296875, -1.0006561279296875, -0.9654541015625, -0.9302520751953125, -0.895050048828125, -0.8598480224609375, -0.82464599609375, -0.7894439697265625, -0.754241943359375, -0.7190399169921875, -0.683837890625, -0.6486358642578125, -0.613433837890625, -0.5782318115234375, -0.54302978515625, -0.5078277587890625, -0.472625732421875, -0.4374237060546875, -0.4022216796875, -0.3670196533203125, -0.331817626953125, -0.2966156005859375, -0.26141357421875, -0.2262115478515625, -0.191009521484375, -0.1558074951171875, -0.12060546875, -0.0854034423828125, -0.050201416015625, -0.0149993896484375, 0.02020263671875, 0.0554046630859375, 0.090606689453125, 0.1258087158203125, 0.1610107421875, 0.1962127685546875, 0.231414794921875, 0.2666168212890625, 0.30181884765625, 0.3370208740234375, 0.372222900390625, 0.4074249267578125, 0.442626953125, 0.4778289794921875, 0.513031005859375, 0.5482330322265625, 0.58343505859375, 0.6186370849609375, 0.653839111328125, 0.6890411376953125, 0.7242431640625, 0.7594451904296875, 0.794647216796875, 0.8298492431640625, 0.86505126953125, 0.9002532958984375, 0.935455322265625, 0.9706573486328125, 1.005859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 7.0, 5.0, 6.0, 7.0, 8.0, 14.0, 11.0, 14.0, 18.0, 20.0, 25.0, 24.0, 29.0, 29.0, 28.0, 30.0, 43.0, 39.0, 45.0, 52.0, 55.0, 43.0, 34.0, 42.0, 37.0, 28.0, 33.0, 40.0, 20.0, 28.0, 20.0, 25.0, 33.0, 24.0, 11.0, 16.0, 16.0, 9.0, 9.0, 7.0, 7.0, 2.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.319978713989258e-05, -3.212597221136093e-05, -3.1052157282829285e-05, -2.9978342354297638e-05, -2.890452742576599e-05, -2.7830712497234344e-05, -2.6756897568702698e-05, -2.568308264017105e-05, -2.4609267711639404e-05, -2.3535452783107758e-05, -2.246163785457611e-05, -2.1387822926044464e-05, -2.0314007997512817e-05, -1.924019306898117e-05, -1.8166378140449524e-05, -1.7092563211917877e-05, -1.601874828338623e-05, -1.4944933354854584e-05, -1.3871118426322937e-05, -1.279730349779129e-05, -1.1723488569259644e-05, -1.0649673640727997e-05, -9.57585871219635e-06, -8.502043783664703e-06, -7.428228855133057e-06, -6.35441392660141e-06, -5.280598998069763e-06, -4.2067840695381165e-06, -3.1329691410064697e-06, -2.059154212474823e-06, -9.853392839431763e-07, 8.847564458847046e-08, 1.1622905731201172e-06, 2.236105501651764e-06, 3.3099204301834106e-06, 4.383735358715057e-06, 5.457550287246704e-06, 6.531365215778351e-06, 7.6051801443099976e-06, 8.678995072841644e-06, 9.752810001373291e-06, 1.0826624929904938e-05, 1.1900439858436584e-05, 1.2974254786968231e-05, 1.4048069715499878e-05, 1.5121884644031525e-05, 1.619569957256317e-05, 1.7269514501094818e-05, 1.8343329429626465e-05, 1.941714435815811e-05, 2.0490959286689758e-05, 2.1564774215221405e-05, 2.2638589143753052e-05, 2.37124040722847e-05, 2.4786219000816345e-05, 2.5860033929347992e-05, 2.693384885787964e-05, 2.8007663786411285e-05, 2.9081478714942932e-05, 3.015529364347458e-05, 3.1229108572006226e-05, 3.230292350053787e-05, 3.337673842906952e-05, 3.4450553357601166e-05, 3.552436828613281e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 6.0, 10.0, 7.0, 14.0, 36.0, 50.0, 71.0, 116.0, 177.0, 270.0, 451.0, 716.0, 1121.0, 1829.0, 3171.0, 5261.0, 9318.0, 17145.0, 31326.0, 62198.0, 122495.0, 221880.0, 250032.0, 153824.0, 78580.0, 40116.0, 20964.0, 11410.0, 6410.0, 3710.0, 2171.0, 1372.0, 867.0, 551.0, 317.0, 201.0, 129.0, 80.0, 52.0, 32.0, 24.0, 18.0, 12.0, 3.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.57275390625, -0.5554885864257812, -0.5382232666015625, -0.5209579467773438, -0.503692626953125, -0.48642730712890625, -0.4691619873046875, -0.45189666748046875, -0.43463134765625, -0.41736602783203125, -0.4001007080078125, -0.38283538818359375, -0.365570068359375, -0.34830474853515625, -0.3310394287109375, -0.31377410888671875, -0.2965087890625, -0.27924346923828125, -0.2619781494140625, -0.24471282958984375, -0.227447509765625, -0.21018218994140625, -0.1929168701171875, -0.17565155029296875, -0.15838623046875, -0.14112091064453125, -0.1238555908203125, -0.10659027099609375, -0.089324951171875, -0.07205963134765625, -0.0547943115234375, -0.03752899169921875, -0.020263671875, -0.00299835205078125, 0.0142669677734375, 0.03153228759765625, 0.048797607421875, 0.06606292724609375, 0.0833282470703125, 0.10059356689453125, 0.11785888671875, 0.13512420654296875, 0.1523895263671875, 0.16965484619140625, 0.186920166015625, 0.20418548583984375, 0.2214508056640625, 0.23871612548828125, 0.2559814453125, 0.27324676513671875, 0.2905120849609375, 0.30777740478515625, 0.325042724609375, 0.34230804443359375, 0.3595733642578125, 0.37683868408203125, 0.39410400390625, 0.41136932373046875, 0.4286346435546875, 0.44589996337890625, 0.463165283203125, 0.48043060302734375, 0.4976959228515625, 0.5149612426757812, 0.5322265625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 13.0, 8.0, 13.0, 14.0, 19.0, 25.0, 23.0, 37.0, 36.0, 37.0, 37.0, 42.0, 50.0, 50.0, 45.0, 59.0, 74.0, 56.0, 35.0, 64.0, 46.0, 29.0, 31.0, 26.0, 20.0, 17.0, 18.0, 12.0, 9.0, 11.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1551513671875, -0.1507396697998047, -0.14632797241210938, -0.14191627502441406, -0.13750457763671875, -0.13309288024902344, -0.12868118286132812, -0.12426948547363281, -0.1198577880859375, -0.11544609069824219, -0.11103439331054688, -0.10662269592285156, -0.10221099853515625, -0.09779930114746094, -0.09338760375976562, -0.08897590637207031, -0.084564208984375, -0.08015251159667969, -0.07574081420898438, -0.07132911682128906, -0.06691741943359375, -0.06250572204589844, -0.058094024658203125, -0.05368232727050781, -0.0492706298828125, -0.04485893249511719, -0.040447235107421875, -0.03603553771972656, -0.03162384033203125, -0.027212142944335938, -0.022800445556640625, -0.018388748168945312, -0.01397705078125, -0.009565353393554688, -0.005153656005859375, -0.0007419586181640625, 0.00366973876953125, 0.008081436157226562, 0.012493133544921875, 0.016904830932617188, 0.0213165283203125, 0.025728225708007812, 0.030139923095703125, 0.03455162048339844, 0.03896331787109375, 0.04337501525878906, 0.047786712646484375, 0.05219841003417969, 0.056610107421875, 0.06102180480957031, 0.06543350219726562, 0.06984519958496094, 0.07425689697265625, 0.07866859436035156, 0.08308029174804688, 0.08749198913574219, 0.0919036865234375, 0.09631538391113281, 0.10072708129882812, 0.10513877868652344, 0.10955047607421875, 0.11396217346191406, 0.11837387084960938, 0.12278556823730469, 0.127197265625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 7.0, 6.0, 11.0, 12.0, 9.0, 19.0, 15.0, 16.0, 22.0, 32.0, 33.0, 49.0, 61.0, 59.0, 74.0, 71.0, 72.0, 65.0, 52.0, 68.0, 46.0, 40.0, 23.0, 31.0, 18.0, 18.0, 14.0, 9.0, 5.0, 10.0, 4.0, 6.0, 3.0, 3.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.259902954101562, -22.505605697631836, -21.751306533813477, -20.99700927734375, -20.242712020874023, -19.488412857055664, -18.734115600585938, -17.979816436767578, -17.22551918029785, -16.471221923828125, -15.716923713684082, -14.962625503540039, -14.208327293395996, -13.454029083251953, -12.699731826782227, -11.945433616638184, -11.191136360168457, -10.436838150024414, -9.682540893554688, -8.928242683410645, -8.173944473266602, -7.419646739959717, -6.665349006652832, -5.911050796508789, -5.156753063201904, -4.4024553298950195, -3.6481571197509766, -2.893859386444092, -2.139561414718628, -1.385263442993164, -0.6309657096862793, 0.12333250045776367, 0.8776302337646484, 1.6319282054901123, 2.386226177215576, 3.140523910522461, 3.894821882247925, 4.649119853973389, 5.403417587280273, 6.157715797424316, 6.912013530731201, 7.666311264038086, 8.420609474182129, 9.174907684326172, 9.929204940795898, 10.683503150939941, 11.437801361083984, 12.192098617553711, 12.946396827697754, 13.700695037841797, 14.454992294311523, 15.209290504455566, 15.96358871459961, 16.717885971069336, 17.472183227539062, 18.226482391357422, 18.98077964782715, 19.735076904296875, 20.489376068115234, 21.24367332458496, 21.997970581054688, 22.752269744873047, 23.506567001342773, 24.2608642578125, 25.01516342163086]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 1.0, 3.0, 6.0, 4.0, 8.0, 8.0, 8.0, 13.0, 19.0, 19.0, 25.0, 20.0, 17.0, 27.0, 24.0, 30.0, 38.0, 36.0, 27.0, 29.0, 38.0, 29.0, 41.0, 51.0, 47.0, 41.0, 44.0, 34.0, 47.0, 26.0, 28.0, 25.0, 22.0, 29.0, 26.0, 12.0, 16.0, 16.0, 16.0, 7.0, 9.0, 8.0, 9.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0], "bins": [-16.475980758666992, -16.019094467163086, -15.562210083007812, -15.105324745178223, -14.648439407348633, -14.191553115844727, -13.734667778015137, -13.277782440185547, -12.820897102355957, -12.364011764526367, -11.907126426696777, -11.450241088867188, -10.993354797363281, -10.536470413208008, -10.079584121704102, -9.622698783874512, -9.165813446044922, -8.708928108215332, -8.252042770385742, -7.795156955718994, -7.338271617889404, -6.8813862800598145, -6.424500465393066, -5.967615127563477, -5.510729789733887, -5.053844451904297, -4.596959114074707, -4.140073299407959, -3.683187961578369, -3.2263026237487793, -2.7694170475006104, -2.3125314712524414, -1.8556461334228516, -1.3987606763839722, -0.9418752193450928, -0.4849897623062134, -0.028104305267333984, 0.42878103256225586, 0.8856666088104248, 1.3425521850585938, 1.7994375228881836, 2.2563228607177734, 2.7132084369659424, 3.1700940132141113, 3.626979351043701, 4.083864688873291, 4.540750503540039, 4.997635841369629, 5.454521179199219, 5.911406517028809, 6.368291854858398, 6.8251776695251465, 7.282063007354736, 7.738948345184326, 8.195834159851074, 8.652719497680664, 9.109604835510254, 9.566490173339844, 10.023375511169434, 10.480260848999023, 10.93714714050293, 11.394031524658203, 11.85091781616211, 12.3078031539917, 12.764688491821289]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 6.0, 3.0, 1.0, 2.0, 9.0, 14.0, 20.0, 25.0, 37.0, 66.0, 96.0, 110.0, 167.0, 254.0, 358.0, 495.0, 762.0, 1117.0, 1500.0, 2381.0, 3459.0, 5388.0, 8268.0, 12763.0, 19940.0, 31230.0, 49779.0, 75856.0, 110851.0, 142506.0, 155604.0, 134905.0, 100610.0, 67578.0, 43635.0, 27667.0, 17878.0, 11388.0, 7307.0, 4753.0, 3047.0, 2124.0, 1446.0, 956.0, 669.0, 473.0, 313.0, 242.0, 158.0, 122.0, 73.0, 68.0, 35.0, 19.0, 13.0, 10.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.984375, -9.666015625, -9.34765625, -9.029296875, -8.7109375, -8.392578125, -8.07421875, -7.755859375, -7.4375, -7.119140625, -6.80078125, -6.482421875, -6.1640625, -5.845703125, -5.52734375, -5.208984375, -4.890625, -4.572265625, -4.25390625, -3.935546875, -3.6171875, -3.298828125, -2.98046875, -2.662109375, -2.34375, -2.025390625, -1.70703125, -1.388671875, -1.0703125, -0.751953125, -0.43359375, -0.115234375, 0.203125, 0.521484375, 0.83984375, 1.158203125, 1.4765625, 1.794921875, 2.11328125, 2.431640625, 2.75, 3.068359375, 3.38671875, 3.705078125, 4.0234375, 4.341796875, 4.66015625, 4.978515625, 5.296875, 5.615234375, 5.93359375, 6.251953125, 6.5703125, 6.888671875, 7.20703125, 7.525390625, 7.84375, 8.162109375, 8.48046875, 8.798828125, 9.1171875, 9.435546875, 9.75390625, 10.072265625, 10.390625]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 5.0, 7.0, 6.0, 8.0, 14.0, 12.0, 10.0, 21.0, 24.0, 16.0, 22.0, 24.0, 30.0, 31.0, 38.0, 39.0, 37.0, 34.0, 30.0, 35.0, 38.0, 50.0, 38.0, 40.0, 46.0, 24.0, 51.0, 31.0, 29.0, 34.0, 28.0, 25.0, 19.0, 10.0, 18.0, 18.0, 13.0, 9.0, 5.0, 7.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 3.0], "bins": [-17.75, -17.2550048828125, -16.760009765625, -16.2650146484375, -15.77001953125, -15.2750244140625, -14.780029296875, -14.2850341796875, -13.7900390625, -13.2950439453125, -12.800048828125, -12.3050537109375, -11.81005859375, -11.3150634765625, -10.820068359375, -10.3250732421875, -9.830078125, -9.3350830078125, -8.840087890625, -8.3450927734375, -7.85009765625, -7.3551025390625, -6.860107421875, -6.3651123046875, -5.8701171875, -5.3751220703125, -4.880126953125, -4.3851318359375, -3.89013671875, -3.3951416015625, -2.900146484375, -2.4051513671875, -1.91015625, -1.4151611328125, -0.920166015625, -0.4251708984375, 0.06982421875, 0.5648193359375, 1.059814453125, 1.5548095703125, 2.0498046875, 2.5447998046875, 3.039794921875, 3.5347900390625, 4.02978515625, 4.5247802734375, 5.019775390625, 5.5147705078125, 6.009765625, 6.5047607421875, 6.999755859375, 7.4947509765625, 7.98974609375, 8.4847412109375, 8.979736328125, 9.4747314453125, 9.9697265625, 10.4647216796875, 10.959716796875, 11.4547119140625, 11.94970703125, 12.4447021484375, 12.939697265625, 13.4346923828125, 13.9296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 7.0, 10.0, 9.0, 17.0, 25.0, 32.0, 60.0, 79.0, 128.0, 177.0, 288.0, 418.0, 623.0, 961.0, 1463.0, 2162.0, 3371.0, 5229.0, 8107.0, 12687.0, 20421.0, 31771.0, 50904.0, 79081.0, 116657.0, 151173.0, 159561.0, 135078.0, 96306.0, 62787.0, 39622.0, 25039.0, 15817.0, 10045.0, 6371.0, 4186.0, 2692.0, 1715.0, 1165.0, 785.0, 508.0, 348.0, 245.0, 135.0, 96.0, 74.0, 51.0, 27.0, 17.0, 13.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-10.7109375, -10.356689453125, -10.00244140625, -9.648193359375, -9.2939453125, -8.939697265625, -8.58544921875, -8.231201171875, -7.876953125, -7.522705078125, -7.16845703125, -6.814208984375, -6.4599609375, -6.105712890625, -5.75146484375, -5.397216796875, -5.04296875, -4.688720703125, -4.33447265625, -3.980224609375, -3.6259765625, -3.271728515625, -2.91748046875, -2.563232421875, -2.208984375, -1.854736328125, -1.50048828125, -1.146240234375, -0.7919921875, -0.437744140625, -0.08349609375, 0.270751953125, 0.625, 0.979248046875, 1.33349609375, 1.687744140625, 2.0419921875, 2.396240234375, 2.75048828125, 3.104736328125, 3.458984375, 3.813232421875, 4.16748046875, 4.521728515625, 4.8759765625, 5.230224609375, 5.58447265625, 5.938720703125, 6.29296875, 6.647216796875, 7.00146484375, 7.355712890625, 7.7099609375, 8.064208984375, 8.41845703125, 8.772705078125, 9.126953125, 9.481201171875, 9.83544921875, 10.189697265625, 10.5439453125, 10.898193359375, 11.25244140625, 11.606689453125, 11.9609375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 9.0, 8.0, 9.0, 11.0, 8.0, 11.0, 15.0, 18.0, 25.0, 13.0, 26.0, 27.0, 27.0, 28.0, 35.0, 29.0, 27.0, 36.0, 37.0, 36.0, 45.0, 36.0, 33.0, 37.0, 40.0, 31.0, 41.0, 30.0, 28.0, 28.0, 25.0, 21.0, 21.0, 18.0, 14.0, 15.0, 11.0, 13.0, 9.0, 13.0, 10.0, 4.0, 10.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.375, -9.092041015625, -8.80908203125, -8.526123046875, -8.2431640625, -7.960205078125, -7.67724609375, -7.394287109375, -7.111328125, -6.828369140625, -6.54541015625, -6.262451171875, -5.9794921875, -5.696533203125, -5.41357421875, -5.130615234375, -4.84765625, -4.564697265625, -4.28173828125, -3.998779296875, -3.7158203125, -3.432861328125, -3.14990234375, -2.866943359375, -2.583984375, -2.301025390625, -2.01806640625, -1.735107421875, -1.4521484375, -1.169189453125, -0.88623046875, -0.603271484375, -0.3203125, -0.037353515625, 0.24560546875, 0.528564453125, 0.8115234375, 1.094482421875, 1.37744140625, 1.660400390625, 1.943359375, 2.226318359375, 2.50927734375, 2.792236328125, 3.0751953125, 3.358154296875, 3.64111328125, 3.924072265625, 4.20703125, 4.489990234375, 4.77294921875, 5.055908203125, 5.3388671875, 5.621826171875, 5.90478515625, 6.187744140625, 6.470703125, 6.753662109375, 7.03662109375, 7.319580078125, 7.6025390625, 7.885498046875, 8.16845703125, 8.451416015625, 8.734375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 12.0, 20.0, 24.0, 40.0, 60.0, 78.0, 131.0, 209.0, 323.0, 491.0, 826.0, 1189.0, 2008.0, 3810.0, 7492.0, 16206.0, 39180.0, 98465.0, 221888.0, 308913.0, 199068.0, 84869.0, 33701.0, 14450.0, 6667.0, 3328.0, 1937.0, 1151.0, 744.0, 456.0, 276.0, 184.0, 111.0, 77.0, 58.0, 38.0, 24.0, 20.0, 7.0, 11.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.046875, -11.67529296875, -11.3037109375, -10.93212890625, -10.560546875, -10.18896484375, -9.8173828125, -9.44580078125, -9.07421875, -8.70263671875, -8.3310546875, -7.95947265625, -7.587890625, -7.21630859375, -6.8447265625, -6.47314453125, -6.1015625, -5.72998046875, -5.3583984375, -4.98681640625, -4.615234375, -4.24365234375, -3.8720703125, -3.50048828125, -3.12890625, -2.75732421875, -2.3857421875, -2.01416015625, -1.642578125, -1.27099609375, -0.8994140625, -0.52783203125, -0.15625, 0.21533203125, 0.5869140625, 0.95849609375, 1.330078125, 1.70166015625, 2.0732421875, 2.44482421875, 2.81640625, 3.18798828125, 3.5595703125, 3.93115234375, 4.302734375, 4.67431640625, 5.0458984375, 5.41748046875, 5.7890625, 6.16064453125, 6.5322265625, 6.90380859375, 7.275390625, 7.64697265625, 8.0185546875, 8.39013671875, 8.76171875, 9.13330078125, 9.5048828125, 9.87646484375, 10.248046875, 10.61962890625, 10.9912109375, 11.36279296875, 11.734375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 8.0, 17.0, 22.0, 26.0, 28.0, 34.0, 45.0, 48.0, 64.0, 60.0, 80.0, 78.0, 98.0, 72.0, 63.0, 50.0, 49.0, 31.0, 33.0, 17.0, 18.0, 10.0, 12.0, 8.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006780624389648438, -0.000653386116027832, -0.0006287097930908203, -0.0006040334701538086, -0.0005793571472167969, -0.0005546808242797852, -0.0005300045013427734, -0.0005053281784057617, -0.00048065185546875, -0.0004559755325317383, -0.00043129920959472656, -0.00040662288665771484, -0.0003819465637207031, -0.0003572702407836914, -0.0003325939178466797, -0.00030791759490966797, -0.00028324127197265625, -0.00025856494903564453, -0.0002338886260986328, -0.0002092123031616211, -0.00018453598022460938, -0.00015985965728759766, -0.00013518333435058594, -0.00011050701141357422, -8.58306884765625e-05, -6.115436553955078e-05, -3.647804260253906e-05, -1.1801719665527344e-05, 1.2874603271484375e-05, 3.7550926208496094e-05, 6.222724914550781e-05, 8.690357208251953e-05, 0.00011157989501953125, 0.00013625621795654297, 0.0001609325408935547, 0.0001856088638305664, 0.00021028518676757812, 0.00023496150970458984, 0.00025963783264160156, 0.0002843141555786133, 0.000308990478515625, 0.0003336668014526367, 0.00035834312438964844, 0.00038301944732666016, 0.0004076957702636719, 0.0004323720932006836, 0.0004570484161376953, 0.00048172473907470703, 0.0005064010620117188, 0.0005310773849487305, 0.0005557537078857422, 0.0005804300308227539, 0.0006051063537597656, 0.0006297826766967773, 0.0006544589996337891, 0.0006791353225708008, 0.0007038116455078125, 0.0007284879684448242, 0.0007531642913818359, 0.0007778406143188477, 0.0008025169372558594, 0.0008271932601928711, 0.0008518695831298828, 0.0008765459060668945, 0.0009012222290039062]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 2.0, 10.0, 12.0, 17.0, 19.0, 28.0, 37.0, 52.0, 58.0, 98.0, 145.0, 187.0, 249.0, 340.0, 415.0, 662.0, 974.0, 1515.0, 2458.0, 4506.0, 8957.0, 19472.0, 44838.0, 107849.0, 223235.0, 286839.0, 190078.0, 86130.0, 35965.0, 15866.0, 7431.0, 3656.0, 2055.0, 1381.0, 853.0, 569.0, 410.0, 317.0, 210.0, 174.0, 112.0, 99.0, 59.0, 62.0, 44.0, 34.0, 23.0, 13.0, 7.0, 5.0, 7.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0], "bins": [-11.6953125, -11.333984375, -10.97265625, -10.611328125, -10.25, -9.888671875, -9.52734375, -9.166015625, -8.8046875, -8.443359375, -8.08203125, -7.720703125, -7.359375, -6.998046875, -6.63671875, -6.275390625, -5.9140625, -5.552734375, -5.19140625, -4.830078125, -4.46875, -4.107421875, -3.74609375, -3.384765625, -3.0234375, -2.662109375, -2.30078125, -1.939453125, -1.578125, -1.216796875, -0.85546875, -0.494140625, -0.1328125, 0.228515625, 0.58984375, 0.951171875, 1.3125, 1.673828125, 2.03515625, 2.396484375, 2.7578125, 3.119140625, 3.48046875, 3.841796875, 4.203125, 4.564453125, 4.92578125, 5.287109375, 5.6484375, 6.009765625, 6.37109375, 6.732421875, 7.09375, 7.455078125, 7.81640625, 8.177734375, 8.5390625, 8.900390625, 9.26171875, 9.623046875, 9.984375, 10.345703125, 10.70703125, 11.068359375, 11.4296875]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 14.0, 14.0, 24.0, 33.0, 36.0, 45.0, 33.0, 64.0, 70.0, 77.0, 62.0, 77.0, 73.0, 78.0, 57.0, 50.0, 31.0, 37.0, 30.0, 20.0, 11.0, 13.0, 8.0, 11.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.576171875, -3.488250732421875, -3.40032958984375, -3.312408447265625, -3.2244873046875, -3.136566162109375, -3.04864501953125, -2.960723876953125, -2.872802734375, -2.784881591796875, -2.69696044921875, -2.609039306640625, -2.5211181640625, -2.433197021484375, -2.34527587890625, -2.257354736328125, -2.16943359375, -2.081512451171875, -1.99359130859375, -1.905670166015625, -1.8177490234375, -1.729827880859375, -1.64190673828125, -1.553985595703125, -1.466064453125, -1.378143310546875, -1.29022216796875, -1.202301025390625, -1.1143798828125, -1.026458740234375, -0.93853759765625, -0.850616455078125, -0.7626953125, -0.674774169921875, -0.58685302734375, -0.498931884765625, -0.4110107421875, -0.323089599609375, -0.23516845703125, -0.147247314453125, -0.059326171875, 0.028594970703125, 0.11651611328125, 0.204437255859375, 0.2923583984375, 0.380279541015625, 0.46820068359375, 0.556121826171875, 0.64404296875, 0.731964111328125, 0.81988525390625, 0.907806396484375, 0.9957275390625, 1.083648681640625, 1.17156982421875, 1.259490966796875, 1.347412109375, 1.435333251953125, 1.52325439453125, 1.611175537109375, 1.6990966796875, 1.787017822265625, 1.87493896484375, 1.962860107421875, 2.05078125]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 4.0, 4.0, 5.0, 6.0, 13.0, 13.0, 15.0, 12.0, 20.0, 20.0, 26.0, 27.0, 46.0, 52.0, 55.0, 51.0, 72.0, 84.0, 81.0, 57.0, 64.0, 42.0, 45.0, 36.0, 29.0, 24.0, 15.0, 16.0, 9.0, 12.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.824419021606445, -22.07671546936035, -21.329011917114258, -20.581308364868164, -19.83360481262207, -19.085901260375977, -18.338197708129883, -17.59049415588379, -16.842790603637695, -16.0950870513916, -15.347383499145508, -14.599679946899414, -13.85197639465332, -13.104272842407227, -12.356569290161133, -11.608865737915039, -10.861163139343262, -10.113459587097168, -9.365756034851074, -8.61805248260498, -7.870348930358887, -7.122645378112793, -6.374942302703857, -5.627238750457764, -4.87953519821167, -4.131831645965576, -3.3841280937194824, -2.6364247798919678, -1.888721227645874, -1.1410176753997803, -0.3933143615722656, 0.3543891906738281, 1.1020927429199219, 1.8497962951660156, 2.5974998474121094, 3.345203161239624, 4.092906951904297, 4.840610504150391, 5.588313579559326, 6.33601713180542, 7.083720684051514, 7.831424236297607, 8.579127311706543, 9.326830863952637, 10.07453441619873, 10.822237968444824, 11.569941520690918, 12.317645072937012, 13.065348625183105, 13.8130521774292, 14.560755729675293, 15.308459281921387, 16.056161880493164, 16.803865432739258, 17.55156898498535, 18.299272537231445, 19.04697608947754, 19.794679641723633, 20.542383193969727, 21.29008674621582, 22.037790298461914, 22.785493850708008, 23.5331974029541, 24.280900955200195, 25.02860450744629]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 13.0, 15.0, 11.0, 14.0, 20.0, 22.0, 17.0, 30.0, 24.0, 28.0, 23.0, 29.0, 33.0, 43.0, 46.0, 34.0, 41.0, 49.0, 35.0, 39.0, 50.0, 42.0, 34.0, 34.0, 36.0, 18.0, 22.0, 21.0, 18.0, 27.0, 19.0, 15.0, 12.0, 6.0, 13.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.306543350219727, -14.836404800415039, -14.366265296936035, -13.896126747131348, -13.425987243652344, -12.955848693847656, -12.485710144042969, -12.015571594238281, -11.545432090759277, -11.07529354095459, -10.605154037475586, -10.135015487670898, -9.664876937866211, -9.194737434387207, -8.72459888458252, -8.254459381103516, -7.784320831298828, -7.314181804656982, -6.844042778015137, -6.373904228210449, -5.9037652015686035, -5.433626174926758, -4.96348762512207, -4.493348598480225, -4.023209571838379, -3.553070545196533, -3.0829317569732666, -2.61279296875, -2.1426539421081543, -1.6725149154663086, -1.202376127243042, -0.7322373390197754, -0.2620973587036133, 0.20804154872894287, 0.678180456161499, 1.1483193635940552, 1.6184582710266113, 2.088597297668457, 2.5587360858917236, 3.0288748741149902, 3.499013900756836, 3.9691529273986816, 4.439291954040527, 4.909430503845215, 5.3795695304870605, 5.849708557128906, 6.319847106933594, 6.7899861335754395, 7.260125160217285, 7.730264186859131, 8.200403213500977, 8.670541763305664, 9.140680313110352, 9.610819816589355, 10.080958366394043, 10.551097869873047, 11.021236419677734, 11.491374969482422, 11.961514472961426, 12.431653022766113, 12.901792526245117, 13.371931076049805, 13.842069625854492, 14.31220817565918, 14.782347679138184]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 12.0, 6.0, 19.0, 18.0, 52.0, 63.0, 90.0, 124.0, 193.0, 272.0, 365.0, 570.0, 763.0, 1081.0, 1692.0, 2424.0, 3622.0, 5703.0, 9381.0, 15621.0, 29835.0, 62590.0, 156653.0, 438123.0, 1087956.0, 1319231.0, 646261.0, 231917.0, 88965.0, 39467.0, 20240.0, 11375.0, 6731.0, 4264.0, 2825.0, 1916.0, 1264.0, 817.0, 557.0, 404.0, 264.0, 191.0, 131.0, 81.0, 58.0, 24.0, 19.0, 25.0, 10.0, 3.0, 8.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-29.109375, -28.232421875, -27.35546875, -26.478515625, -25.6015625, -24.724609375, -23.84765625, -22.970703125, -22.09375, -21.216796875, -20.33984375, -19.462890625, -18.5859375, -17.708984375, -16.83203125, -15.955078125, -15.078125, -14.201171875, -13.32421875, -12.447265625, -11.5703125, -10.693359375, -9.81640625, -8.939453125, -8.0625, -7.185546875, -6.30859375, -5.431640625, -4.5546875, -3.677734375, -2.80078125, -1.923828125, -1.046875, -0.169921875, 0.70703125, 1.583984375, 2.4609375, 3.337890625, 4.21484375, 5.091796875, 5.96875, 6.845703125, 7.72265625, 8.599609375, 9.4765625, 10.353515625, 11.23046875, 12.107421875, 12.984375, 13.861328125, 14.73828125, 15.615234375, 16.4921875, 17.369140625, 18.24609375, 19.123046875, 20.0, 20.876953125, 21.75390625, 22.630859375, 23.5078125, 24.384765625, 25.26171875, 26.138671875, 27.015625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 12.0, 8.0, 12.0, 12.0, 10.0, 22.0, 8.0, 20.0, 21.0, 26.0, 24.0, 26.0, 33.0, 37.0, 38.0, 39.0, 36.0, 48.0, 39.0, 46.0, 38.0, 63.0, 40.0, 26.0, 50.0, 36.0, 30.0, 29.0, 20.0, 17.0, 17.0, 19.0, 17.0, 21.0, 6.0, 9.0, 2.0, 4.0, 16.0, 5.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.734375, -14.2913818359375, -13.848388671875, -13.4053955078125, -12.96240234375, -12.5194091796875, -12.076416015625, -11.6334228515625, -11.1904296875, -10.7474365234375, -10.304443359375, -9.8614501953125, -9.41845703125, -8.9754638671875, -8.532470703125, -8.0894775390625, -7.646484375, -7.2034912109375, -6.760498046875, -6.3175048828125, -5.87451171875, -5.4315185546875, -4.988525390625, -4.5455322265625, -4.1025390625, -3.6595458984375, -3.216552734375, -2.7735595703125, -2.33056640625, -1.8875732421875, -1.444580078125, -1.0015869140625, -0.55859375, -0.1156005859375, 0.327392578125, 0.7703857421875, 1.21337890625, 1.6563720703125, 2.099365234375, 2.5423583984375, 2.9853515625, 3.4283447265625, 3.871337890625, 4.3143310546875, 4.75732421875, 5.2003173828125, 5.643310546875, 6.0863037109375, 6.529296875, 6.9722900390625, 7.415283203125, 7.8582763671875, 8.30126953125, 8.7442626953125, 9.187255859375, 9.6302490234375, 10.0732421875, 10.5162353515625, 10.959228515625, 11.4022216796875, 11.84521484375, 12.2882080078125, 12.731201171875, 13.1741943359375, 13.6171875]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 14.0, 16.0, 25.0, 24.0, 43.0, 58.0, 89.0, 109.0, 197.0, 261.0, 402.0, 640.0, 1060.0, 1662.0, 2727.0, 4760.0, 8523.0, 16382.0, 33378.0, 75769.0, 201817.0, 640171.0, 1580776.0, 1072896.0, 338727.0, 116024.0, 48307.0, 22393.0, 11555.0, 6221.0, 3549.0, 2129.0, 1263.0, 796.0, 493.0, 326.0, 217.0, 158.0, 89.0, 75.0, 51.0, 31.0, 27.0, 12.0, 9.0, 7.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-42.375, -41.03955078125, -39.7041015625, -38.36865234375, -37.033203125, -35.69775390625, -34.3623046875, -33.02685546875, -31.69140625, -30.35595703125, -29.0205078125, -27.68505859375, -26.349609375, -25.01416015625, -23.6787109375, -22.34326171875, -21.0078125, -19.67236328125, -18.3369140625, -17.00146484375, -15.666015625, -14.33056640625, -12.9951171875, -11.65966796875, -10.32421875, -8.98876953125, -7.6533203125, -6.31787109375, -4.982421875, -3.64697265625, -2.3115234375, -0.97607421875, 0.359375, 1.69482421875, 3.0302734375, 4.36572265625, 5.701171875, 7.03662109375, 8.3720703125, 9.70751953125, 11.04296875, 12.37841796875, 13.7138671875, 15.04931640625, 16.384765625, 17.72021484375, 19.0556640625, 20.39111328125, 21.7265625, 23.06201171875, 24.3974609375, 25.73291015625, 27.068359375, 28.40380859375, 29.7392578125, 31.07470703125, 32.41015625, 33.74560546875, 35.0810546875, 36.41650390625, 37.751953125, 39.08740234375, 40.4228515625, 41.75830078125, 43.09375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 7.0, 6.0, 6.0, 10.0, 21.0, 19.0, 28.0, 41.0, 57.0, 62.0, 98.0, 128.0, 130.0, 238.0, 303.0, 328.0, 383.0, 412.0, 382.0, 323.0, 274.0, 232.0, 155.0, 120.0, 77.0, 73.0, 37.0, 40.0, 15.0, 20.0, 18.0, 7.0, 5.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.4197998046875, -8.058349609375, -7.6968994140625, -7.33544921875, -6.9739990234375, -6.612548828125, -6.2510986328125, -5.8896484375, -5.5281982421875, -5.166748046875, -4.8052978515625, -4.44384765625, -4.0823974609375, -3.720947265625, -3.3594970703125, -2.998046875, -2.6365966796875, -2.275146484375, -1.9136962890625, -1.55224609375, -1.1907958984375, -0.829345703125, -0.4678955078125, -0.1064453125, 0.2550048828125, 0.616455078125, 0.9779052734375, 1.33935546875, 1.7008056640625, 2.062255859375, 2.4237060546875, 2.78515625, 3.1466064453125, 3.508056640625, 3.8695068359375, 4.23095703125, 4.5924072265625, 4.953857421875, 5.3153076171875, 5.6767578125, 6.0382080078125, 6.399658203125, 6.7611083984375, 7.12255859375, 7.4840087890625, 7.845458984375, 8.2069091796875, 8.568359375, 8.9298095703125, 9.291259765625, 9.6527099609375, 10.01416015625, 10.3756103515625, 10.737060546875, 11.0985107421875, 11.4599609375, 11.8214111328125, 12.182861328125, 12.5443115234375, 12.90576171875, 13.2672119140625, 13.628662109375, 13.9901123046875, 14.3515625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 7.0, 10.0, 10.0, 10.0, 15.0, 12.0, 11.0, 22.0, 29.0, 41.0, 37.0, 38.0, 52.0, 64.0, 62.0, 73.0, 67.0, 66.0, 59.0, 59.0, 43.0, 48.0, 40.0, 32.0, 16.0, 20.0, 13.0, 5.0, 8.0, 9.0, 5.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.897720336914062, -21.984949111938477, -21.07217788696289, -20.159404754638672, -19.246633529663086, -18.3338623046875, -17.421091079711914, -16.508319854736328, -15.595547676086426, -14.68277645111084, -13.770004272460938, -12.857233047485352, -11.944461822509766, -11.031689643859863, -10.118918418884277, -9.206146240234375, -8.293375015258789, -7.380603313446045, -6.467831611633301, -5.555060386657715, -4.642288684844971, -3.7295169830322266, -2.8167457580566406, -1.9039740562438965, -0.9912023544311523, -0.07843077182769775, 0.8343408107757568, 1.7471122741699219, 2.659883975982666, 3.57265567779541, 4.485426902770996, 5.39819860458374, 6.310970306396484, 7.2237420082092285, 8.136513710021973, 9.049284934997559, 9.962057113647461, 10.874828338623047, 11.787599563598633, 12.700370788574219, 13.613142967224121, 14.525914192199707, 15.43868637084961, 16.351457595825195, 17.26422882080078, 18.177001953125, 19.089771270751953, 20.002544403076172, 20.915315628051758, 21.828086853027344, 22.74085807800293, 23.653629302978516, 24.566402435302734, 25.47917366027832, 26.391944885253906, 27.304716110229492, 28.217487335205078, 29.130258560180664, 30.04302978515625, 30.95580291748047, 31.868574142456055, 32.78134536743164, 33.694114685058594, 34.60688781738281, 35.51966094970703]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 5.0, 12.0, 6.0, 13.0, 19.0, 21.0, 17.0, 23.0, 28.0, 21.0, 22.0, 34.0, 32.0, 41.0, 35.0, 40.0, 33.0, 57.0, 31.0, 41.0, 60.0, 37.0, 36.0, 46.0, 32.0, 45.0, 35.0, 24.0, 11.0, 22.0, 13.0, 20.0, 17.0, 14.0, 11.0, 9.0, 7.0, 11.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.416501998901367, -19.83499526977539, -19.253488540649414, -18.671979904174805, -18.090473175048828, -17.50896644592285, -16.927459716796875, -16.3459529876709, -15.764445304870605, -15.182938575744629, -14.601430892944336, -14.01992416381836, -13.438417434692383, -12.85690975189209, -12.275403022766113, -11.69389533996582, -11.112388610839844, -10.530881881713867, -9.949374198913574, -9.367867469787598, -8.786359786987305, -8.204853057861328, -7.623346328735352, -7.041839122772217, -6.460331916809082, -5.878824710845947, -5.2973175048828125, -4.715810775756836, -4.134303569793701, -3.5527963638305664, -2.9712893962860107, -2.389782428741455, -1.8082771301269531, -1.226770043373108, -0.6452629566192627, -0.06375586986541748, 0.5177512168884277, 1.0992584228515625, 1.6807653903961182, 2.262272357940674, 2.8437795639038086, 3.4252867698669434, 4.006793975830078, 4.588300704956055, 5.1698079109191895, 5.751315116882324, 6.332821846008301, 6.9143290519714355, 7.49583625793457, 8.077342987060547, 8.65885066986084, 9.240357398986816, 9.82186508178711, 10.403371810913086, 10.984878540039062, 11.566385269165039, 12.147892951965332, 12.729399681091309, 13.310907363891602, 13.892414093017578, 14.473920822143555, 15.055428504943848, 15.636935234069824, 16.218442916870117, 16.799949645996094]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 9.0, 7.0, 24.0, 28.0, 46.0, 47.0, 71.0, 113.0, 164.0, 263.0, 397.0, 586.0, 843.0, 1191.0, 1856.0, 2847.0, 4495.0, 6955.0, 11430.0, 18486.0, 30978.0, 54739.0, 100119.0, 181110.0, 241715.0, 169086.0, 92943.0, 51458.0, 29469.0, 17364.0, 10694.0, 6689.0, 4267.0, 2630.0, 1813.0, 1163.0, 828.0, 587.0, 328.0, 220.0, 141.0, 137.0, 81.0, 37.0, 34.0, 31.0, 8.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.365234375, -2.290008544921875, -2.21478271484375, -2.139556884765625, -2.0643310546875, -1.989105224609375, -1.91387939453125, -1.838653564453125, -1.763427734375, -1.688201904296875, -1.61297607421875, -1.537750244140625, -1.4625244140625, -1.387298583984375, -1.31207275390625, -1.236846923828125, -1.16162109375, -1.086395263671875, -1.01116943359375, -0.935943603515625, -0.8607177734375, -0.785491943359375, -0.71026611328125, -0.635040283203125, -0.559814453125, -0.484588623046875, -0.40936279296875, -0.334136962890625, -0.2589111328125, -0.183685302734375, -0.10845947265625, -0.033233642578125, 0.0419921875, 0.117218017578125, 0.19244384765625, 0.267669677734375, 0.3428955078125, 0.418121337890625, 0.49334716796875, 0.568572998046875, 0.643798828125, 0.719024658203125, 0.79425048828125, 0.869476318359375, 0.9447021484375, 1.019927978515625, 1.09515380859375, 1.170379638671875, 1.24560546875, 1.320831298828125, 1.39605712890625, 1.471282958984375, 1.5465087890625, 1.621734619140625, 1.69696044921875, 1.772186279296875, 1.847412109375, 1.922637939453125, 1.99786376953125, 2.073089599609375, 2.1483154296875, 2.223541259765625, 2.29876708984375, 2.373992919921875, 2.44921875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 4.0, 9.0, 9.0, 14.0, 11.0, 23.0, 22.0, 18.0, 24.0, 23.0, 22.0, 28.0, 33.0, 29.0, 40.0, 41.0, 38.0, 42.0, 37.0, 37.0, 40.0, 41.0, 41.0, 40.0, 36.0, 44.0, 35.0, 36.0, 28.0, 16.0, 8.0, 20.0, 17.0, 17.0, 13.0, 11.0, 7.0, 10.0, 7.0, 8.0, 3.0, 6.0, 5.0, 1.0, 3.0, 0.0, 4.0, 1.0], "bins": [-21.5, -20.894775390625, -20.28955078125, -19.684326171875, -19.0791015625, -18.473876953125, -17.86865234375, -17.263427734375, -16.658203125, -16.052978515625, -15.44775390625, -14.842529296875, -14.2373046875, -13.632080078125, -13.02685546875, -12.421630859375, -11.81640625, -11.211181640625, -10.60595703125, -10.000732421875, -9.3955078125, -8.790283203125, -8.18505859375, -7.579833984375, -6.974609375, -6.369384765625, -5.76416015625, -5.158935546875, -4.5537109375, -3.948486328125, -3.34326171875, -2.738037109375, -2.1328125, -1.527587890625, -0.92236328125, -0.317138671875, 0.2880859375, 0.893310546875, 1.49853515625, 2.103759765625, 2.708984375, 3.314208984375, 3.91943359375, 4.524658203125, 5.1298828125, 5.735107421875, 6.34033203125, 6.945556640625, 7.55078125, 8.156005859375, 8.76123046875, 9.366455078125, 9.9716796875, 10.576904296875, 11.18212890625, 11.787353515625, 12.392578125, 12.997802734375, 13.60302734375, 14.208251953125, 14.8134765625, 15.418701171875, 16.02392578125, 16.629150390625, 17.234375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 5.0, 7.0, 12.0, 20.0, 25.0, 25.0, 34.0, 46.0, 79.0, 92.0, 158.0, 187.0, 295.0, 412.0, 639.0, 1003.0, 1705.0, 2872.0, 5514.0, 11708.0, 30379.0, 686455.0, 259598.0, 25389.0, 10088.0, 4848.0, 2644.0, 1502.0, 910.0, 551.0, 388.0, 276.0, 198.0, 136.0, 80.0, 74.0, 60.0, 40.0, 28.0, 12.0, 13.0, 21.0, 12.0, 4.0, 8.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.88671875, -7.6470947265625, -7.407470703125, -7.1678466796875, -6.92822265625, -6.6885986328125, -6.448974609375, -6.2093505859375, -5.9697265625, -5.7301025390625, -5.490478515625, -5.2508544921875, -5.01123046875, -4.7716064453125, -4.531982421875, -4.2923583984375, -4.052734375, -3.8131103515625, -3.573486328125, -3.3338623046875, -3.09423828125, -2.8546142578125, -2.614990234375, -2.3753662109375, -2.1357421875, -1.8961181640625, -1.656494140625, -1.4168701171875, -1.17724609375, -0.9376220703125, -0.697998046875, -0.4583740234375, -0.21875, 0.0208740234375, 0.260498046875, 0.5001220703125, 0.73974609375, 0.9793701171875, 1.218994140625, 1.4586181640625, 1.6982421875, 1.9378662109375, 2.177490234375, 2.4171142578125, 2.65673828125, 2.8963623046875, 3.135986328125, 3.3756103515625, 3.615234375, 3.8548583984375, 4.094482421875, 4.3341064453125, 4.57373046875, 4.8133544921875, 5.052978515625, 5.2926025390625, 5.5322265625, 5.7718505859375, 6.011474609375, 6.2510986328125, 6.49072265625, 6.7303466796875, 6.969970703125, 7.2095947265625, 7.44921875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 8.0, 5.0, 8.0, 10.0, 12.0, 9.0, 9.0, 18.0, 15.0, 23.0, 20.0, 19.0, 26.0, 27.0, 27.0, 31.0, 23.0, 39.0, 26.0, 46.0, 32.0, 37.0, 41.0, 45.0, 52.0, 29.0, 32.0, 42.0, 24.0, 34.0, 27.0, 24.0, 29.0, 29.0, 17.0, 17.0, 17.0, 16.0, 12.0, 4.0, 11.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-13.171875, -12.7969970703125, -12.422119140625, -12.0472412109375, -11.67236328125, -11.2974853515625, -10.922607421875, -10.5477294921875, -10.1728515625, -9.7979736328125, -9.423095703125, -9.0482177734375, -8.67333984375, -8.2984619140625, -7.923583984375, -7.5487060546875, -7.173828125, -6.7989501953125, -6.424072265625, -6.0491943359375, -5.67431640625, -5.2994384765625, -4.924560546875, -4.5496826171875, -4.1748046875, -3.7999267578125, -3.425048828125, -3.0501708984375, -2.67529296875, -2.3004150390625, -1.925537109375, -1.5506591796875, -1.17578125, -0.8009033203125, -0.426025390625, -0.0511474609375, 0.32373046875, 0.6986083984375, 1.073486328125, 1.4483642578125, 1.8232421875, 2.1981201171875, 2.572998046875, 2.9478759765625, 3.32275390625, 3.6976318359375, 4.072509765625, 4.4473876953125, 4.822265625, 5.1971435546875, 5.572021484375, 5.9468994140625, 6.32177734375, 6.6966552734375, 7.071533203125, 7.4464111328125, 7.8212890625, 8.1961669921875, 8.571044921875, 8.9459228515625, 9.32080078125, 9.6956787109375, 10.070556640625, 10.4454345703125, 10.8203125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 4.0, 13.0, 10.0, 11.0, 27.0, 24.0, 29.0, 61.0, 79.0, 111.0, 154.0, 230.0, 345.0, 505.0, 752.0, 1163.0, 1884.0, 3222.0, 5798.0, 10795.0, 21907.0, 93199.0, 843763.0, 32293.0, 14330.0, 7308.0, 4067.0, 2372.0, 1403.0, 861.0, 613.0, 364.0, 287.0, 181.0, 127.0, 80.0, 56.0, 41.0, 27.0, 16.0, 9.0, 11.0, 7.0, 3.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.166015625, -1.1274261474609375, -1.088836669921875, -1.0502471923828125, -1.01165771484375, -0.9730682373046875, -0.934478759765625, -0.8958892822265625, -0.8572998046875, -0.8187103271484375, -0.780120849609375, -0.7415313720703125, -0.70294189453125, -0.6643524169921875, -0.625762939453125, -0.5871734619140625, -0.548583984375, -0.5099945068359375, -0.471405029296875, -0.4328155517578125, -0.39422607421875, -0.3556365966796875, -0.317047119140625, -0.2784576416015625, -0.2398681640625, -0.2012786865234375, -0.162689208984375, -0.1240997314453125, -0.08551025390625, -0.0469207763671875, -0.008331298828125, 0.0302581787109375, 0.06884765625, 0.1074371337890625, 0.146026611328125, 0.1846160888671875, 0.22320556640625, 0.2617950439453125, 0.300384521484375, 0.3389739990234375, 0.3775634765625, 0.4161529541015625, 0.454742431640625, 0.4933319091796875, 0.53192138671875, 0.5705108642578125, 0.609100341796875, 0.6476898193359375, 0.686279296875, 0.7248687744140625, 0.763458251953125, 0.8020477294921875, 0.84063720703125, 0.8792266845703125, 0.917816162109375, 0.9564056396484375, 0.9949951171875, 1.0335845947265625, 1.072174072265625, 1.1107635498046875, 1.14935302734375, 1.1879425048828125, 1.226531982421875, 1.2651214599609375, 1.3037109375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 3.0, 2.0, 10.0, 11.0, 11.0, 15.0, 10.0, 17.0, 14.0, 11.0, 32.0, 25.0, 31.0, 37.0, 37.0, 32.0, 35.0, 43.0, 32.0, 52.0, 52.0, 36.0, 48.0, 34.0, 36.0, 44.0, 35.0, 30.0, 28.0, 27.0, 26.0, 26.0, 18.0, 17.0, 9.0, 13.0, 10.0, 11.0, 6.0, 7.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-3.647804260253906e-05, -3.542844206094742e-05, -3.4378841519355774e-05, -3.332924097776413e-05, -3.2279640436172485e-05, -3.123003989458084e-05, -3.0180439352989197e-05, -2.9130838811397552e-05, -2.8081238269805908e-05, -2.7031637728214264e-05, -2.598203718662262e-05, -2.4932436645030975e-05, -2.388283610343933e-05, -2.2833235561847687e-05, -2.1783635020256042e-05, -2.0734034478664398e-05, -1.9684433937072754e-05, -1.863483339548111e-05, -1.7585232853889465e-05, -1.653563231229782e-05, -1.5486031770706177e-05, -1.4436431229114532e-05, -1.3386830687522888e-05, -1.2337230145931244e-05, -1.12876296043396e-05, -1.0238029062747955e-05, -9.188428521156311e-06, -8.138827979564667e-06, -7.0892274379730225e-06, -6.039626896381378e-06, -4.990026354789734e-06, -3.94042581319809e-06, -2.8908252716064453e-06, -1.841224730014801e-06, -7.916241884231567e-07, 2.5797635316848755e-07, 1.3075768947601318e-06, 2.357177436351776e-06, 3.4067779779434204e-06, 4.456378519535065e-06, 5.505979061126709e-06, 6.555579602718353e-06, 7.6051801443099976e-06, 8.654780685901642e-06, 9.704381227493286e-06, 1.075398176908493e-05, 1.1803582310676575e-05, 1.2853182852268219e-05, 1.3902783393859863e-05, 1.4952383935451508e-05, 1.6001984477043152e-05, 1.7051585018634796e-05, 1.810118556022644e-05, 1.9150786101818085e-05, 2.020038664340973e-05, 2.1249987185001373e-05, 2.2299587726593018e-05, 2.3349188268184662e-05, 2.4398788809776306e-05, 2.544838935136795e-05, 2.6497989892959595e-05, 2.754759043455124e-05, 2.8597190976142883e-05, 2.9646791517734528e-05, 3.069639205932617e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 5.0, 6.0, 7.0, 2.0, 2.0, 4.0, 7.0, 12.0, 21.0, 22.0, 47.0, 32.0, 63.0, 97.0, 122.0, 188.0, 239.0, 337.0, 593.0, 830.0, 1309.0, 2151.0, 3543.0, 6418.0, 12041.0, 23140.0, 46832.0, 100718.0, 208790.0, 282473.0, 184686.0, 87317.0, 41158.0, 20279.0, 10595.0, 5709.0, 3215.0, 1895.0, 1157.0, 745.0, 526.0, 351.0, 225.0, 170.0, 127.0, 97.0, 63.0, 49.0, 40.0, 38.0, 19.0, 9.0, 12.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.74072265625, -0.717864990234375, -0.69500732421875, -0.672149658203125, -0.6492919921875, -0.626434326171875, -0.60357666015625, -0.580718994140625, -0.557861328125, -0.535003662109375, -0.51214599609375, -0.489288330078125, -0.4664306640625, -0.443572998046875, -0.42071533203125, -0.397857666015625, -0.375, -0.352142333984375, -0.32928466796875, -0.306427001953125, -0.2835693359375, -0.260711669921875, -0.23785400390625, -0.214996337890625, -0.192138671875, -0.169281005859375, -0.14642333984375, -0.123565673828125, -0.1007080078125, -0.077850341796875, -0.05499267578125, -0.032135009765625, -0.00927734375, 0.013580322265625, 0.03643798828125, 0.059295654296875, 0.0821533203125, 0.105010986328125, 0.12786865234375, 0.150726318359375, 0.173583984375, 0.196441650390625, 0.21929931640625, 0.242156982421875, 0.2650146484375, 0.287872314453125, 0.31072998046875, 0.333587646484375, 0.3564453125, 0.379302978515625, 0.40216064453125, 0.425018310546875, 0.4478759765625, 0.470733642578125, 0.49359130859375, 0.516448974609375, 0.539306640625, 0.562164306640625, 0.58502197265625, 0.607879638671875, 0.6307373046875, 0.653594970703125, 0.67645263671875, 0.699310302734375, 0.72216796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 4.0, 5.0, 2.0, 4.0, 9.0, 10.0, 10.0, 30.0, 31.0, 25.0, 33.0, 29.0, 61.0, 54.0, 69.0, 76.0, 76.0, 73.0, 69.0, 67.0, 46.0, 37.0, 31.0, 26.0, 27.0, 24.0, 17.0, 12.0, 8.0, 9.0, 7.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.170166015625, -0.1641693115234375, -0.158172607421875, -0.1521759033203125, -0.14617919921875, -0.1401824951171875, -0.134185791015625, -0.1281890869140625, -0.1221923828125, -0.1161956787109375, -0.110198974609375, -0.1042022705078125, -0.09820556640625, -0.0922088623046875, -0.086212158203125, -0.0802154541015625, -0.07421875, -0.0682220458984375, -0.062225341796875, -0.0562286376953125, -0.05023193359375, -0.0442352294921875, -0.038238525390625, -0.0322418212890625, -0.0262451171875, -0.0202484130859375, -0.014251708984375, -0.0082550048828125, -0.00225830078125, 0.0037384033203125, 0.009735107421875, 0.0157318115234375, 0.021728515625, 0.0277252197265625, 0.033721923828125, 0.0397186279296875, 0.04571533203125, 0.0517120361328125, 0.057708740234375, 0.0637054443359375, 0.0697021484375, 0.0756988525390625, 0.081695556640625, 0.0876922607421875, 0.09368896484375, 0.0996856689453125, 0.105682373046875, 0.1116790771484375, 0.11767578125, 0.1236724853515625, 0.129669189453125, 0.1356658935546875, 0.14166259765625, 0.1476593017578125, 0.153656005859375, 0.1596527099609375, 0.1656494140625, 0.1716461181640625, 0.177642822265625, 0.1836395263671875, 0.18963623046875, 0.1956329345703125, 0.201629638671875, 0.2076263427734375, 0.213623046875]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 12.0, 8.0, 13.0, 10.0, 13.0, 17.0, 26.0, 29.0, 36.0, 40.0, 43.0, 52.0, 59.0, 68.0, 66.0, 74.0, 60.0, 53.0, 62.0, 46.0, 45.0, 36.0, 29.0, 14.0, 20.0, 9.0, 12.0, 4.0, 12.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.123144149780273, -21.229412078857422, -20.33568000793457, -19.44194793701172, -18.548215866088867, -17.654483795166016, -16.76074981689453, -15.867018699645996, -14.973286628723145, -14.079554557800293, -13.185822486877441, -12.292089462280273, -11.398357391357422, -10.50462532043457, -9.610893249511719, -8.717161178588867, -7.823429107666016, -6.929697036743164, -6.0359649658203125, -5.142232418060303, -4.248500347137451, -3.3547682762145996, -2.46103572845459, -1.5673036575317383, -0.6735715866088867, 0.2201606035232544, 1.1138927936553955, 2.007625102996826, 2.9013571739196777, 3.7950892448425293, 4.688821792602539, 5.582553863525391, 6.476284027099609, 7.370016098022461, 8.263748168945312, 9.157480239868164, 10.051212310791016, 10.944944381713867, 11.838677406311035, 12.732409477233887, 13.626141548156738, 14.51987361907959, 15.413605690002441, 16.30733871459961, 17.20107078552246, 18.094802856445312, 18.988534927368164, 19.882266998291016, 20.775999069213867, 21.66973114013672, 22.56346321105957, 23.457195281982422, 24.350927352905273, 25.244659423828125, 26.13839340209961, 27.032123565673828, 27.925857543945312, 28.819589614868164, 29.713321685791016, 30.607053756713867, 31.50078582763672, 32.3945198059082, 33.28824996948242, 34.181983947753906, 35.075714111328125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 6.0, 11.0, 20.0, 22.0, 16.0, 26.0, 28.0, 16.0, 29.0, 30.0, 36.0, 42.0, 33.0, 38.0, 38.0, 51.0, 34.0, 47.0, 57.0, 35.0, 37.0, 44.0, 32.0, 48.0, 31.0, 22.0, 12.0, 21.0, 15.0, 17.0, 20.0, 15.0, 10.0, 7.0, 8.0, 9.0, 7.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.156200408935547, -19.57650375366211, -18.996807098388672, -18.4171085357666, -17.837411880493164, -17.257715225219727, -16.67801856994629, -16.09832000732422, -15.518623352050781, -14.938926696777344, -14.35922908782959, -13.779532432556152, -13.199834823608398, -12.620138168334961, -12.040441513061523, -11.46074390411377, -10.881047248840332, -10.301350593566895, -9.72165298461914, -9.141956329345703, -8.56225872039795, -7.982562065124512, -7.402864933013916, -6.82316780090332, -6.243470668792725, -5.663773536682129, -5.084076404571533, -4.5043792724609375, -3.924682378768921, -3.344985246658325, -2.7652883529663086, -2.185591220855713, -1.6058940887451172, -1.0261969566345215, -0.44649994373321533, 0.13319706916809082, 0.7128942012786865, 1.2925913333892822, 1.8722882270812988, 2.4519853591918945, 3.0316824913024902, 3.611379623413086, 4.191076755523682, 4.770773887634277, 5.350470542907715, 5.930168151855469, 6.509864807128906, 7.089561939239502, 7.669259071350098, 8.248955726623535, 8.828653335571289, 9.408349990844727, 9.98804759979248, 10.567744255065918, 11.147441864013672, 11.72713851928711, 12.306835174560547, 12.886531829833984, 13.466229438781738, 14.045926094055176, 14.62562370300293, 15.205320358276367, 15.785017013549805, 16.364715576171875, 16.944412231445312]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 5.0, 10.0, 15.0, 30.0, 40.0, 49.0, 67.0, 111.0, 197.0, 264.0, 418.0, 590.0, 971.0, 1481.0, 2257.0, 3636.0, 5718.0, 9056.0, 14379.0, 23150.0, 37561.0, 59587.0, 91858.0, 131852.0, 159475.0, 156444.0, 122382.0, 83974.0, 53953.0, 33137.0, 20678.0, 12739.0, 8123.0, 5174.0, 3279.0, 2063.0, 1316.0, 868.0, 571.0, 343.0, 248.0, 156.0, 121.0, 73.0, 47.0, 33.0, 19.0, 15.0, 6.0, 7.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.8203125, -11.4495849609375, -11.078857421875, -10.7081298828125, -10.33740234375, -9.9666748046875, -9.595947265625, -9.2252197265625, -8.8544921875, -8.4837646484375, -8.113037109375, -7.7423095703125, -7.37158203125, -7.0008544921875, -6.630126953125, -6.2593994140625, -5.888671875, -5.5179443359375, -5.147216796875, -4.7764892578125, -4.40576171875, -4.0350341796875, -3.664306640625, -3.2935791015625, -2.9228515625, -2.5521240234375, -2.181396484375, -1.8106689453125, -1.43994140625, -1.0692138671875, -0.698486328125, -0.3277587890625, 0.04296875, 0.4136962890625, 0.784423828125, 1.1551513671875, 1.52587890625, 1.8966064453125, 2.267333984375, 2.6380615234375, 3.0087890625, 3.3795166015625, 3.750244140625, 4.1209716796875, 4.49169921875, 4.8624267578125, 5.233154296875, 5.6038818359375, 5.974609375, 6.3453369140625, 6.716064453125, 7.0867919921875, 7.45751953125, 7.8282470703125, 8.198974609375, 8.5697021484375, 8.9404296875, 9.3111572265625, 9.681884765625, 10.0526123046875, 10.42333984375, 10.7940673828125, 11.164794921875, 11.5355224609375, 11.90625]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 11.0, 12.0, 11.0, 17.0, 27.0, 28.0, 28.0, 32.0, 30.0, 24.0, 32.0, 31.0, 43.0, 35.0, 41.0, 30.0, 44.0, 67.0, 50.0, 39.0, 41.0, 43.0, 37.0, 35.0, 24.0, 20.0, 17.0, 20.0, 20.0, 15.0, 18.0, 17.0, 11.0, 5.0, 10.0, 8.0, 4.0, 0.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.625, -21.000732421875, -20.37646484375, -19.752197265625, -19.1279296875, -18.503662109375, -17.87939453125, -17.255126953125, -16.630859375, -16.006591796875, -15.38232421875, -14.758056640625, -14.1337890625, -13.509521484375, -12.88525390625, -12.260986328125, -11.63671875, -11.012451171875, -10.38818359375, -9.763916015625, -9.1396484375, -8.515380859375, -7.89111328125, -7.266845703125, -6.642578125, -6.018310546875, -5.39404296875, -4.769775390625, -4.1455078125, -3.521240234375, -2.89697265625, -2.272705078125, -1.6484375, -1.024169921875, -0.39990234375, 0.224365234375, 0.8486328125, 1.472900390625, 2.09716796875, 2.721435546875, 3.345703125, 3.969970703125, 4.59423828125, 5.218505859375, 5.8427734375, 6.467041015625, 7.09130859375, 7.715576171875, 8.33984375, 8.964111328125, 9.58837890625, 10.212646484375, 10.8369140625, 11.461181640625, 12.08544921875, 12.709716796875, 13.333984375, 13.958251953125, 14.58251953125, 15.206787109375, 15.8310546875, 16.455322265625, 17.07958984375, 17.703857421875, 18.328125]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 4.0, 17.0, 16.0, 15.0, 13.0, 48.0, 54.0, 67.0, 132.0, 187.0, 268.0, 346.0, 595.0, 884.0, 1314.0, 1980.0, 3005.0, 4623.0, 7186.0, 11171.0, 17405.0, 27846.0, 44273.0, 69004.0, 103461.0, 141765.0, 160524.0, 145168.0, 107552.0, 72483.0, 45931.0, 29535.0, 18285.0, 11586.0, 7617.0, 4816.0, 3133.0, 2098.0, 1425.0, 951.0, 583.0, 372.0, 250.0, 184.0, 122.0, 99.0, 68.0, 34.0, 20.0, 19.0, 8.0, 9.0, 5.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.21875, -11.8052978515625, -11.391845703125, -10.9783935546875, -10.56494140625, -10.1514892578125, -9.738037109375, -9.3245849609375, -8.9111328125, -8.4976806640625, -8.084228515625, -7.6707763671875, -7.25732421875, -6.8438720703125, -6.430419921875, -6.0169677734375, -5.603515625, -5.1900634765625, -4.776611328125, -4.3631591796875, -3.94970703125, -3.5362548828125, -3.122802734375, -2.7093505859375, -2.2958984375, -1.8824462890625, -1.468994140625, -1.0555419921875, -0.64208984375, -0.2286376953125, 0.184814453125, 0.5982666015625, 1.01171875, 1.4251708984375, 1.838623046875, 2.2520751953125, 2.66552734375, 3.0789794921875, 3.492431640625, 3.9058837890625, 4.3193359375, 4.7327880859375, 5.146240234375, 5.5596923828125, 5.97314453125, 6.3865966796875, 6.800048828125, 7.2135009765625, 7.626953125, 8.0404052734375, 8.453857421875, 8.8673095703125, 9.28076171875, 9.6942138671875, 10.107666015625, 10.5211181640625, 10.9345703125, 11.3480224609375, 11.761474609375, 12.1749267578125, 12.58837890625, 13.0018310546875, 13.415283203125, 13.8287353515625, 14.2421875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 3.0, 10.0, 6.0, 16.0, 17.0, 13.0, 28.0, 23.0, 26.0, 31.0, 23.0, 35.0, 35.0, 39.0, 31.0, 40.0, 53.0, 28.0, 58.0, 45.0, 51.0, 39.0, 34.0, 30.0, 33.0, 19.0, 37.0, 27.0, 26.0, 21.0, 19.0, 21.0, 12.0, 14.0, 9.0, 7.0, 8.0, 7.0, 4.0, 2.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.6689453125, -11.267578125, -10.8662109375, -10.46484375, -10.0634765625, -9.662109375, -9.2607421875, -8.859375, -8.4580078125, -8.056640625, -7.6552734375, -7.25390625, -6.8525390625, -6.451171875, -6.0498046875, -5.6484375, -5.2470703125, -4.845703125, -4.4443359375, -4.04296875, -3.6416015625, -3.240234375, -2.8388671875, -2.4375, -2.0361328125, -1.634765625, -1.2333984375, -0.83203125, -0.4306640625, -0.029296875, 0.3720703125, 0.7734375, 1.1748046875, 1.576171875, 1.9775390625, 2.37890625, 2.7802734375, 3.181640625, 3.5830078125, 3.984375, 4.3857421875, 4.787109375, 5.1884765625, 5.58984375, 5.9912109375, 6.392578125, 6.7939453125, 7.1953125, 7.5966796875, 7.998046875, 8.3994140625, 8.80078125, 9.2021484375, 9.603515625, 10.0048828125, 10.40625, 10.8076171875, 11.208984375, 11.6103515625, 12.01171875, 12.4130859375, 12.814453125, 13.2158203125, 13.6171875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 7.0, 9.0, 19.0, 16.0, 24.0, 23.0, 52.0, 64.0, 86.0, 145.0, 172.0, 276.0, 330.0, 502.0, 733.0, 1016.0, 1479.0, 2305.0, 3334.0, 5370.0, 8255.0, 13550.0, 22976.0, 38494.0, 65528.0, 107077.0, 157508.0, 184762.0, 158252.0, 108773.0, 66312.0, 39277.0, 23511.0, 13762.0, 8489.0, 5369.0, 3467.0, 2268.0, 1512.0, 1008.0, 740.0, 510.0, 358.0, 232.0, 175.0, 125.0, 87.0, 71.0, 47.0, 37.0, 18.0, 12.0, 14.0, 10.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-8.75, -8.4632568359375, -8.176513671875, -7.8897705078125, -7.60302734375, -7.3162841796875, -7.029541015625, -6.7427978515625, -6.4560546875, -6.1693115234375, -5.882568359375, -5.5958251953125, -5.30908203125, -5.0223388671875, -4.735595703125, -4.4488525390625, -4.162109375, -3.8753662109375, -3.588623046875, -3.3018798828125, -3.01513671875, -2.7283935546875, -2.441650390625, -2.1549072265625, -1.8681640625, -1.5814208984375, -1.294677734375, -1.0079345703125, -0.72119140625, -0.4344482421875, -0.147705078125, 0.1390380859375, 0.42578125, 0.7125244140625, 0.999267578125, 1.2860107421875, 1.57275390625, 1.8594970703125, 2.146240234375, 2.4329833984375, 2.7197265625, 3.0064697265625, 3.293212890625, 3.5799560546875, 3.86669921875, 4.1534423828125, 4.440185546875, 4.7269287109375, 5.013671875, 5.3004150390625, 5.587158203125, 5.8739013671875, 6.16064453125, 6.4473876953125, 6.734130859375, 7.0208740234375, 7.3076171875, 7.5943603515625, 7.881103515625, 8.1678466796875, 8.45458984375, 8.7413330078125, 9.028076171875, 9.3148193359375, 9.6015625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 3.0, 7.0, 15.0, 28.0, 41.0, 41.0, 67.0, 89.0, 105.0, 125.0, 128.0, 96.0, 77.0, 58.0, 32.0, 24.0, 17.0, 15.0, 13.0, 3.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012912750244140625, -0.001240953803062439, -0.0011906325817108154, -0.001140311360359192, -0.0010899901390075684, -0.0010396689176559448, -0.0009893476963043213, -0.0009390264749526978, -0.0008887052536010742, -0.0008383840322494507, -0.0007880628108978271, -0.0007377415895462036, -0.0006874203681945801, -0.0006370991468429565, -0.000586777925491333, -0.0005364567041397095, -0.00048613548278808594, -0.0004358142614364624, -0.00038549304008483887, -0.00033517181873321533, -0.0002848505973815918, -0.00023452937602996826, -0.00018420815467834473, -0.0001338869333267212, -8.356571197509766e-05, -3.324449062347412e-05, 1.7076730728149414e-05, 6.739795207977295e-05, 0.00011771917343139648, 0.00016804039478302002, 0.00021836161613464355, 0.0002686828374862671, 0.0003190040588378906, 0.00036932528018951416, 0.0004196465015411377, 0.00046996772289276123, 0.0005202889442443848, 0.0005706101655960083, 0.0006209313869476318, 0.0006712526082992554, 0.0007215738296508789, 0.0007718950510025024, 0.000822216272354126, 0.0008725374937057495, 0.000922858715057373, 0.0009731799364089966, 0.0010235011577606201, 0.0010738223791122437, 0.0011241436004638672, 0.0011744648218154907, 0.0012247860431671143, 0.0012751072645187378, 0.0013254284858703613, 0.0013757497072219849, 0.0014260709285736084, 0.001476392149925232, 0.0015267133712768555, 0.001577034592628479, 0.0016273558139801025, 0.001677677035331726, 0.0017279982566833496, 0.0017783194780349731, 0.0018286406993865967, 0.0018789619207382202, 0.0019292831420898438]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 10.0, 10.0, 11.0, 21.0, 46.0, 32.0, 57.0, 88.0, 135.0, 173.0, 244.0, 367.0, 615.0, 904.0, 1554.0, 2389.0, 4273.0, 7187.0, 13545.0, 25561.0, 50531.0, 100368.0, 179655.0, 237938.0, 192712.0, 110570.0, 56276.0, 28476.0, 14898.0, 8133.0, 4514.0, 2718.0, 1638.0, 984.0, 603.0, 385.0, 271.0, 201.0, 147.0, 97.0, 65.0, 41.0, 28.0, 28.0, 18.0, 13.0, 8.0, 11.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.21875, -12.8250732421875, -12.431396484375, -12.0377197265625, -11.64404296875, -11.2503662109375, -10.856689453125, -10.4630126953125, -10.0693359375, -9.6756591796875, -9.281982421875, -8.8883056640625, -8.49462890625, -8.1009521484375, -7.707275390625, -7.3135986328125, -6.919921875, -6.5262451171875, -6.132568359375, -5.7388916015625, -5.34521484375, -4.9515380859375, -4.557861328125, -4.1641845703125, -3.7705078125, -3.3768310546875, -2.983154296875, -2.5894775390625, -2.19580078125, -1.8021240234375, -1.408447265625, -1.0147705078125, -0.62109375, -0.2274169921875, 0.166259765625, 0.5599365234375, 0.95361328125, 1.3472900390625, 1.740966796875, 2.1346435546875, 2.5283203125, 2.9219970703125, 3.315673828125, 3.7093505859375, 4.10302734375, 4.4967041015625, 4.890380859375, 5.2840576171875, 5.677734375, 6.0714111328125, 6.465087890625, 6.8587646484375, 7.25244140625, 7.6461181640625, 8.039794921875, 8.4334716796875, 8.8271484375, 9.2208251953125, 9.614501953125, 10.0081787109375, 10.40185546875, 10.7955322265625, 11.189208984375, 11.5828857421875, 11.9765625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 7.0, 16.0, 20.0, 30.0, 22.0, 19.0, 27.0, 42.0, 41.0, 46.0, 52.0, 76.0, 54.0, 47.0, 71.0, 55.0, 62.0, 51.0, 46.0, 30.0, 32.0, 38.0, 18.0, 8.0, 14.0, 14.0, 6.0, 10.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0], "bins": [-3.34375, -3.25408935546875, -3.1644287109375, -3.07476806640625, -2.985107421875, -2.89544677734375, -2.8057861328125, -2.71612548828125, -2.62646484375, -2.53680419921875, -2.4471435546875, -2.35748291015625, -2.267822265625, -2.17816162109375, -2.0885009765625, -1.99884033203125, -1.9091796875, -1.81951904296875, -1.7298583984375, -1.64019775390625, -1.550537109375, -1.46087646484375, -1.3712158203125, -1.28155517578125, -1.19189453125, -1.10223388671875, -1.0125732421875, -0.92291259765625, -0.833251953125, -0.74359130859375, -0.6539306640625, -0.56427001953125, -0.474609375, -0.38494873046875, -0.2952880859375, -0.20562744140625, -0.115966796875, -0.02630615234375, 0.0633544921875, 0.15301513671875, 0.24267578125, 0.33233642578125, 0.4219970703125, 0.51165771484375, 0.601318359375, 0.69097900390625, 0.7806396484375, 0.87030029296875, 0.9599609375, 1.04962158203125, 1.1392822265625, 1.22894287109375, 1.318603515625, 1.40826416015625, 1.4979248046875, 1.58758544921875, 1.67724609375, 1.76690673828125, 1.8565673828125, 1.94622802734375, 2.035888671875, 2.12554931640625, 2.2152099609375, 2.30487060546875, 2.39453125]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 9.0, 5.0, 4.0, 11.0, 8.0, 11.0, 17.0, 18.0, 24.0, 25.0, 32.0, 42.0, 43.0, 57.0, 60.0, 55.0, 63.0, 65.0, 52.0, 66.0, 57.0, 60.0, 44.0, 38.0, 23.0, 26.0, 18.0, 12.0, 8.0, 12.0, 6.0, 5.0, 3.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.331640243530273, -21.446327209472656, -20.561012268066406, -19.67569923400879, -18.79038429260254, -17.905071258544922, -17.019756317138672, -16.134443283081055, -15.249129295349121, -14.363815307617188, -13.478501319885254, -12.59318733215332, -11.707874298095703, -10.822559356689453, -9.937246322631836, -9.051932334899902, -8.166618347167969, -7.281304359436035, -6.395990371704102, -5.510676860809326, -4.625362873077393, -3.740048885345459, -2.8547353744506836, -1.96942138671875, -1.0841073989868164, -0.19879353046417236, 0.6865203380584717, 1.5718340873718262, 2.4571480751037598, 3.3424620628356934, 4.227775573730469, 5.113089561462402, 5.998401641845703, 6.883715629577637, 7.76902961730957, 8.654342651367188, 9.539657592773438, 10.424970626831055, 11.310284614562988, 12.195598602294922, 13.080912590026855, 13.966226577758789, 14.851540565490723, 15.736854553222656, 16.622167587280273, 17.507482528686523, 18.39279556274414, 19.27811050415039, 20.163423538208008, 21.048736572265625, 21.934051513671875, 22.819364547729492, 23.704679489135742, 24.58999252319336, 25.47530746459961, 26.360620498657227, 27.245933532714844, 28.13124656677246, 29.01656150817871, 29.901874542236328, 30.787189483642578, 31.672502517700195, 32.55781555175781, 33.44313049316406, 34.32844543457031]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 9.0, 3.0, 4.0, 9.0, 6.0, 6.0, 7.0, 10.0, 17.0, 20.0, 20.0, 22.0, 20.0, 22.0, 20.0, 27.0, 24.0, 39.0, 39.0, 33.0, 33.0, 38.0, 40.0, 48.0, 26.0, 42.0, 28.0, 35.0, 24.0, 28.0, 41.0, 35.0, 22.0, 32.0, 24.0, 16.0, 16.0, 21.0, 15.0, 10.0, 20.0, 15.0, 9.0, 5.0, 5.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-18.31070899963379, -17.771915435791016, -17.233121871948242, -16.69432830810547, -16.155534744262695, -15.616741180419922, -15.077948570251465, -14.539155006408691, -14.000361442565918, -13.461567878723145, -12.922774314880371, -12.383980751037598, -11.84518814086914, -11.306394577026367, -10.767601013183594, -10.22880744934082, -9.690013885498047, -9.151220321655273, -8.6124267578125, -8.073633193969727, -7.534840106964111, -6.996046543121338, -6.457253456115723, -5.918459892272949, -5.379666328430176, -4.840872764587402, -4.302079200744629, -3.7632861137390137, -3.2244925498962402, -2.685698986053467, -2.1469056606292725, -1.6081123352050781, -1.0693168640136719, -0.530523419380188, 0.008270025253295898, 0.5470634698867798, 1.0858569145202637, 1.624650478363037, 2.1634438037872314, 2.702237129211426, 3.241030693054199, 3.7798242568969727, 4.318617820739746, 4.857410907745361, 5.396204471588135, 5.934998035430908, 6.473791122436523, 7.012584686279297, 7.55137825012207, 8.090171813964844, 8.628965377807617, 9.16775894165039, 9.706552505493164, 10.245346069335938, 10.784138679504395, 11.322932243347168, 11.861725807189941, 12.400519371032715, 12.939312934875488, 13.478106498718262, 14.016899108886719, 14.555692672729492, 15.094486236572266, 15.633279800415039, 16.172073364257812]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 8.0, 9.0, 11.0, 25.0, 28.0, 50.0, 80.0, 122.0, 180.0, 269.0, 439.0, 660.0, 1085.0, 1752.0, 2839.0, 4969.0, 8448.0, 15570.0, 32967.0, 82125.0, 251338.0, 837000.0, 1613108.0, 901103.0, 278263.0, 88459.0, 34502.0, 16757.0, 8865.0, 4981.0, 3008.0, 1880.0, 1164.0, 718.0, 500.0, 321.0, 231.0, 141.0, 97.0, 68.0, 47.0, 30.0, 16.0, 20.0, 7.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.4375, -41.091796875, -39.74609375, -38.400390625, -37.0546875, -35.708984375, -34.36328125, -33.017578125, -31.671875, -30.326171875, -28.98046875, -27.634765625, -26.2890625, -24.943359375, -23.59765625, -22.251953125, -20.90625, -19.560546875, -18.21484375, -16.869140625, -15.5234375, -14.177734375, -12.83203125, -11.486328125, -10.140625, -8.794921875, -7.44921875, -6.103515625, -4.7578125, -3.412109375, -2.06640625, -0.720703125, 0.625, 1.970703125, 3.31640625, 4.662109375, 6.0078125, 7.353515625, 8.69921875, 10.044921875, 11.390625, 12.736328125, 14.08203125, 15.427734375, 16.7734375, 18.119140625, 19.46484375, 20.810546875, 22.15625, 23.501953125, 24.84765625, 26.193359375, 27.5390625, 28.884765625, 30.23046875, 31.576171875, 32.921875, 34.267578125, 35.61328125, 36.958984375, 38.3046875, 39.650390625, 40.99609375, 42.341796875, 43.6875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 8.0, 14.0, 10.0, 17.0, 12.0, 18.0, 23.0, 19.0, 23.0, 19.0, 20.0, 30.0, 35.0, 32.0, 36.0, 31.0, 20.0, 51.0, 37.0, 40.0, 51.0, 35.0, 35.0, 30.0, 31.0, 38.0, 30.0, 32.0, 21.0, 26.0, 17.0, 22.0, 16.0, 15.0, 21.0, 14.0, 10.0, 7.0, 8.0, 8.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-17.359375, -16.8397216796875, -16.320068359375, -15.8004150390625, -15.28076171875, -14.7611083984375, -14.241455078125, -13.7218017578125, -13.2021484375, -12.6824951171875, -12.162841796875, -11.6431884765625, -11.12353515625, -10.6038818359375, -10.084228515625, -9.5645751953125, -9.044921875, -8.5252685546875, -8.005615234375, -7.4859619140625, -6.96630859375, -6.4466552734375, -5.927001953125, -5.4073486328125, -4.8876953125, -4.3680419921875, -3.848388671875, -3.3287353515625, -2.80908203125, -2.2894287109375, -1.769775390625, -1.2501220703125, -0.73046875, -0.2108154296875, 0.308837890625, 0.8284912109375, 1.34814453125, 1.8677978515625, 2.387451171875, 2.9071044921875, 3.4267578125, 3.9464111328125, 4.466064453125, 4.9857177734375, 5.50537109375, 6.0250244140625, 6.544677734375, 7.0643310546875, 7.583984375, 8.1036376953125, 8.623291015625, 9.1429443359375, 9.66259765625, 10.1822509765625, 10.701904296875, 11.2215576171875, 11.7412109375, 12.2608642578125, 12.780517578125, 13.3001708984375, 13.81982421875, 14.3394775390625, 14.859130859375, 15.3787841796875, 15.8984375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 2.0, 5.0, 12.0, 20.0, 34.0, 53.0, 54.0, 115.0, 158.0, 271.0, 437.0, 722.0, 1151.0, 1917.0, 2874.0, 4662.0, 7874.0, 13609.0, 23792.0, 46656.0, 100417.0, 254774.0, 736512.0, 1506795.0, 926732.0, 321650.0, 122436.0, 55058.0, 27839.0, 15302.0, 8668.0, 5240.0, 3105.0, 2064.0, 1186.0, 775.0, 473.0, 271.0, 198.0, 137.0, 86.0, 54.0, 34.0, 27.0, 8.0, 9.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.03125, -49.4169921875, -47.802734375, -46.1884765625, -44.57421875, -42.9599609375, -41.345703125, -39.7314453125, -38.1171875, -36.5029296875, -34.888671875, -33.2744140625, -31.66015625, -30.0458984375, -28.431640625, -26.8173828125, -25.203125, -23.5888671875, -21.974609375, -20.3603515625, -18.74609375, -17.1318359375, -15.517578125, -13.9033203125, -12.2890625, -10.6748046875, -9.060546875, -7.4462890625, -5.83203125, -4.2177734375, -2.603515625, -0.9892578125, 0.625, 2.2392578125, 3.853515625, 5.4677734375, 7.08203125, 8.6962890625, 10.310546875, 11.9248046875, 13.5390625, 15.1533203125, 16.767578125, 18.3818359375, 19.99609375, 21.6103515625, 23.224609375, 24.8388671875, 26.453125, 28.0673828125, 29.681640625, 31.2958984375, 32.91015625, 34.5244140625, 36.138671875, 37.7529296875, 39.3671875, 40.9814453125, 42.595703125, 44.2099609375, 45.82421875, 47.4384765625, 49.052734375, 50.6669921875, 52.28125]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 10.0, 3.0, 3.0, 8.0, 13.0, 24.0, 15.0, 25.0, 36.0, 31.0, 40.0, 55.0, 74.0, 89.0, 124.0, 163.0, 215.0, 233.0, 290.0, 325.0, 322.0, 325.0, 323.0, 280.0, 199.0, 183.0, 132.0, 129.0, 89.0, 85.0, 65.0, 38.0, 28.0, 26.0, 16.0, 16.0, 8.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.3203125, -13.908447265625, -13.49658203125, -13.084716796875, -12.6728515625, -12.260986328125, -11.84912109375, -11.437255859375, -11.025390625, -10.613525390625, -10.20166015625, -9.789794921875, -9.3779296875, -8.966064453125, -8.55419921875, -8.142333984375, -7.73046875, -7.318603515625, -6.90673828125, -6.494873046875, -6.0830078125, -5.671142578125, -5.25927734375, -4.847412109375, -4.435546875, -4.023681640625, -3.61181640625, -3.199951171875, -2.7880859375, -2.376220703125, -1.96435546875, -1.552490234375, -1.140625, -0.728759765625, -0.31689453125, 0.094970703125, 0.5068359375, 0.918701171875, 1.33056640625, 1.742431640625, 2.154296875, 2.566162109375, 2.97802734375, 3.389892578125, 3.8017578125, 4.213623046875, 4.62548828125, 5.037353515625, 5.44921875, 5.861083984375, 6.27294921875, 6.684814453125, 7.0966796875, 7.508544921875, 7.92041015625, 8.332275390625, 8.744140625, 9.156005859375, 9.56787109375, 9.979736328125, 10.3916015625, 10.803466796875, 11.21533203125, 11.627197265625, 12.0390625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 4.0, 6.0, 7.0, 7.0, 6.0, 11.0, 9.0, 17.0, 21.0, 23.0, 22.0, 30.0, 35.0, 47.0, 40.0, 60.0, 61.0, 73.0, 72.0, 72.0, 64.0, 65.0, 44.0, 35.0, 45.0, 25.0, 20.0, 22.0, 15.0, 9.0, 2.0, 4.0, 6.0, 0.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-37.76919174194336, -36.545223236083984, -35.32125473022461, -34.09728240966797, -32.873313903808594, -31.64934539794922, -30.425376892089844, -29.20140838623047, -27.97743797302246, -26.753469467163086, -25.529499053955078, -24.305530548095703, -23.081562042236328, -21.85759162902832, -20.633623123168945, -19.409652709960938, -18.185684204101562, -16.961715698242188, -15.73774528503418, -14.513776779174805, -13.289807319641113, -12.065837860107422, -10.841869354248047, -9.617899894714355, -8.393930435180664, -7.169960975646973, -5.9459919929504395, -4.722023010253906, -3.498053550720215, -2.2740840911865234, -1.0501151084899902, 0.17385387420654297, 1.3978271484375, 2.6217963695526123, 3.8457655906677246, 5.069734573364258, 6.293704032897949, 7.517673492431641, 8.741641998291016, 9.965611457824707, 11.189580917358398, 12.41355037689209, 13.637519836425781, 14.861488342285156, 16.08545684814453, 17.30942726135254, 18.533395767211914, 19.757366180419922, 20.981334686279297, 22.205303192138672, 23.42927360534668, 24.653242111206055, 25.877212524414062, 27.101181030273438, 28.325149536132812, 29.549118041992188, 30.773088455200195, 31.99705696105957, 33.22102737426758, 34.44499588012695, 35.66896438598633, 36.89293670654297, 38.116905212402344, 39.34087371826172, 40.564842224121094]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 7.0, 14.0, 13.0, 7.0, 16.0, 22.0, 24.0, 28.0, 28.0, 38.0, 25.0, 46.0, 34.0, 30.0, 34.0, 39.0, 40.0, 32.0, 59.0, 41.0, 46.0, 42.0, 56.0, 28.0, 23.0, 27.0, 28.0, 22.0, 26.0, 23.0, 12.0, 20.0, 11.0, 7.0, 16.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.850019454956055, -23.069915771484375, -22.289812088012695, -21.509708404541016, -20.729604721069336, -19.949501037597656, -19.169397354125977, -18.389293670654297, -17.609189987182617, -16.829086303710938, -16.048982620239258, -15.268878936767578, -14.488775253295898, -13.708671569824219, -12.928567886352539, -12.14846420288086, -11.36836051940918, -10.5882568359375, -9.80815315246582, -9.02804946899414, -8.247945785522461, -7.467842102050781, -6.687738418579102, -5.907634735107422, -5.127531051635742, -4.3474273681640625, -3.567323684692383, -2.787220001220703, -2.0071163177490234, -1.2270126342773438, -0.44690895080566406, 0.3331947326660156, 1.1132984161376953, 1.893402099609375, 2.6735057830810547, 3.4536094665527344, 4.233713150024414, 5.013816833496094, 5.793920516967773, 6.574024200439453, 7.354127883911133, 8.134231567382812, 8.914335250854492, 9.694438934326172, 10.474542617797852, 11.254646301269531, 12.034749984741211, 12.81485366821289, 13.59495735168457, 14.37506103515625, 15.15516471862793, 15.93526840209961, 16.71537208557129, 17.49547576904297, 18.27557945251465, 19.055683135986328, 19.835786819458008, 20.615890502929688, 21.395994186401367, 22.176097869873047, 22.956201553344727, 23.736305236816406, 24.516408920288086, 25.296512603759766, 26.076616287231445]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 5.0, 2.0, 2.0, 5.0, 16.0, 15.0, 18.0, 27.0, 48.0, 71.0, 92.0, 172.0, 187.0, 310.0, 471.0, 730.0, 1042.0, 1688.0, 2527.0, 3962.0, 6238.0, 9936.0, 16631.0, 27063.0, 47987.0, 87681.0, 164092.0, 247967.0, 189523.0, 103380.0, 55551.0, 31150.0, 18748.0, 11391.0, 7047.0, 4487.0, 2822.0, 1822.0, 1221.0, 835.0, 546.0, 305.0, 222.0, 172.0, 114.0, 84.0, 45.0, 35.0, 29.0, 17.0, 9.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.7578125, -2.66473388671875, -2.5716552734375, -2.47857666015625, -2.385498046875, -2.29241943359375, -2.1993408203125, -2.10626220703125, -2.01318359375, -1.92010498046875, -1.8270263671875, -1.73394775390625, -1.640869140625, -1.54779052734375, -1.4547119140625, -1.36163330078125, -1.2685546875, -1.17547607421875, -1.0823974609375, -0.98931884765625, -0.896240234375, -0.80316162109375, -0.7100830078125, -0.61700439453125, -0.52392578125, -0.43084716796875, -0.3377685546875, -0.24468994140625, -0.151611328125, -0.05853271484375, 0.0345458984375, 0.12762451171875, 0.220703125, 0.31378173828125, 0.4068603515625, 0.49993896484375, 0.593017578125, 0.68609619140625, 0.7791748046875, 0.87225341796875, 0.96533203125, 1.05841064453125, 1.1514892578125, 1.24456787109375, 1.337646484375, 1.43072509765625, 1.5238037109375, 1.61688232421875, 1.7099609375, 1.80303955078125, 1.8961181640625, 1.98919677734375, 2.082275390625, 2.17535400390625, 2.2684326171875, 2.36151123046875, 2.45458984375, 2.54766845703125, 2.6407470703125, 2.73382568359375, 2.826904296875, 2.91998291015625, 3.0130615234375, 3.10614013671875, 3.19921875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 3.0, 5.0, 5.0, 3.0, 9.0, 11.0, 13.0, 19.0, 19.0, 26.0, 19.0, 21.0, 38.0, 29.0, 41.0, 37.0, 40.0, 37.0, 37.0, 38.0, 48.0, 39.0, 42.0, 47.0, 45.0, 41.0, 40.0, 38.0, 29.0, 31.0, 20.0, 15.0, 25.0, 27.0, 9.0, 14.0, 16.0, 7.0, 4.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.265625, -26.386962890625, -25.50830078125, -24.629638671875, -23.7509765625, -22.872314453125, -21.99365234375, -21.114990234375, -20.236328125, -19.357666015625, -18.47900390625, -17.600341796875, -16.7216796875, -15.843017578125, -14.96435546875, -14.085693359375, -13.20703125, -12.328369140625, -11.44970703125, -10.571044921875, -9.6923828125, -8.813720703125, -7.93505859375, -7.056396484375, -6.177734375, -5.299072265625, -4.42041015625, -3.541748046875, -2.6630859375, -1.784423828125, -0.90576171875, -0.027099609375, 0.8515625, 1.730224609375, 2.60888671875, 3.487548828125, 4.3662109375, 5.244873046875, 6.12353515625, 7.002197265625, 7.880859375, 8.759521484375, 9.63818359375, 10.516845703125, 11.3955078125, 12.274169921875, 13.15283203125, 14.031494140625, 14.91015625, 15.788818359375, 16.66748046875, 17.546142578125, 18.4248046875, 19.303466796875, 20.18212890625, 21.060791015625, 21.939453125, 22.818115234375, 23.69677734375, 24.575439453125, 25.4541015625, 26.332763671875, 27.21142578125, 28.090087890625, 28.96875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 4.0, 2.0, 13.0, 15.0, 16.0, 27.0, 34.0, 49.0, 69.0, 81.0, 100.0, 166.0, 269.0, 403.0, 623.0, 966.0, 1618.0, 2895.0, 5513.0, 11826.0, 30968.0, 577676.0, 363714.0, 28020.0, 11184.0, 5266.0, 2646.0, 1563.0, 927.0, 608.0, 386.0, 269.0, 193.0, 125.0, 76.0, 65.0, 49.0, 41.0, 27.0, 21.0, 9.0, 6.0, 6.0, 4.0, 2.0, 6.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7183837890625, -8.436767578125, -8.1551513671875, -7.87353515625, -7.5919189453125, -7.310302734375, -7.0286865234375, -6.7470703125, -6.4654541015625, -6.183837890625, -5.9022216796875, -5.62060546875, -5.3389892578125, -5.057373046875, -4.7757568359375, -4.494140625, -4.2125244140625, -3.930908203125, -3.6492919921875, -3.36767578125, -3.0860595703125, -2.804443359375, -2.5228271484375, -2.2412109375, -1.9595947265625, -1.677978515625, -1.3963623046875, -1.11474609375, -0.8331298828125, -0.551513671875, -0.2698974609375, 0.01171875, 0.2933349609375, 0.574951171875, 0.8565673828125, 1.13818359375, 1.4197998046875, 1.701416015625, 1.9830322265625, 2.2646484375, 2.5462646484375, 2.827880859375, 3.1094970703125, 3.39111328125, 3.6727294921875, 3.954345703125, 4.2359619140625, 4.517578125, 4.7991943359375, 5.080810546875, 5.3624267578125, 5.64404296875, 5.9256591796875, 6.207275390625, 6.4888916015625, 6.7705078125, 7.0521240234375, 7.333740234375, 7.6153564453125, 7.89697265625, 8.1785888671875, 8.460205078125, 8.7418212890625, 9.0234375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 4.0, 8.0, 8.0, 12.0, 6.0, 15.0, 17.0, 25.0, 18.0, 16.0, 27.0, 21.0, 26.0, 34.0, 38.0, 28.0, 49.0, 46.0, 34.0, 33.0, 28.0, 30.0, 43.0, 33.0, 48.0, 45.0, 33.0, 28.0, 32.0, 20.0, 28.0, 16.0, 26.0, 16.0, 20.0, 16.0, 14.0, 11.0, 9.0, 6.0, 4.0, 5.0, 6.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0], "bins": [-15.1953125, -14.71826171875, -14.2412109375, -13.76416015625, -13.287109375, -12.81005859375, -12.3330078125, -11.85595703125, -11.37890625, -10.90185546875, -10.4248046875, -9.94775390625, -9.470703125, -8.99365234375, -8.5166015625, -8.03955078125, -7.5625, -7.08544921875, -6.6083984375, -6.13134765625, -5.654296875, -5.17724609375, -4.7001953125, -4.22314453125, -3.74609375, -3.26904296875, -2.7919921875, -2.31494140625, -1.837890625, -1.36083984375, -0.8837890625, -0.40673828125, 0.0703125, 0.54736328125, 1.0244140625, 1.50146484375, 1.978515625, 2.45556640625, 2.9326171875, 3.40966796875, 3.88671875, 4.36376953125, 4.8408203125, 5.31787109375, 5.794921875, 6.27197265625, 6.7490234375, 7.22607421875, 7.703125, 8.18017578125, 8.6572265625, 9.13427734375, 9.611328125, 10.08837890625, 10.5654296875, 11.04248046875, 11.51953125, 11.99658203125, 12.4736328125, 12.95068359375, 13.427734375, 13.90478515625, 14.3818359375, 14.85888671875, 15.3359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 10.0, 9.0, 13.0, 21.0, 19.0, 38.0, 37.0, 66.0, 91.0, 168.0, 257.0, 361.0, 556.0, 970.0, 1657.0, 3031.0, 5968.0, 12536.0, 30074.0, 852424.0, 98003.0, 21674.0, 9544.0, 4679.0, 2549.0, 1393.0, 848.0, 485.0, 305.0, 246.0, 156.0, 105.0, 84.0, 44.0, 30.0, 22.0, 19.0, 12.0, 6.0, 14.0, 9.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.70703125, -1.647796630859375, -1.58856201171875, -1.529327392578125, -1.4700927734375, -1.410858154296875, -1.35162353515625, -1.292388916015625, -1.233154296875, -1.173919677734375, -1.11468505859375, -1.055450439453125, -0.9962158203125, -0.936981201171875, -0.87774658203125, -0.818511962890625, -0.75927734375, -0.700042724609375, -0.64080810546875, -0.581573486328125, -0.5223388671875, -0.463104248046875, -0.40386962890625, -0.344635009765625, -0.285400390625, -0.226165771484375, -0.16693115234375, -0.107696533203125, -0.0484619140625, 0.010772705078125, 0.07000732421875, 0.129241943359375, 0.1884765625, 0.247711181640625, 0.30694580078125, 0.366180419921875, 0.4254150390625, 0.484649658203125, 0.54388427734375, 0.603118896484375, 0.662353515625, 0.721588134765625, 0.78082275390625, 0.840057373046875, 0.8992919921875, 0.958526611328125, 1.01776123046875, 1.076995849609375, 1.13623046875, 1.195465087890625, 1.25469970703125, 1.313934326171875, 1.3731689453125, 1.432403564453125, 1.49163818359375, 1.550872802734375, 1.610107421875, 1.669342041015625, 1.72857666015625, 1.787811279296875, 1.8470458984375, 1.906280517578125, 1.96551513671875, 2.024749755859375, 2.083984375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 9.0, 5.0, 15.0, 7.0, 7.0, 10.0, 13.0, 11.0, 19.0, 21.0, 22.0, 24.0, 24.0, 35.0, 33.0, 51.0, 43.0, 44.0, 33.0, 42.0, 44.0, 37.0, 49.0, 39.0, 47.0, 44.0, 33.0, 29.0, 34.0, 30.0, 23.0, 16.0, 18.0, 17.0, 14.0, 11.0, 13.0, 8.0, 8.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.124641418457031e-05, -3.997236490249634e-05, -3.869831562042236e-05, -3.742426633834839e-05, -3.6150217056274414e-05, -3.487616777420044e-05, -3.3602118492126465e-05, -3.232806921005249e-05, -3.1054019927978516e-05, -2.977997064590454e-05, -2.8505921363830566e-05, -2.7231872081756592e-05, -2.5957822799682617e-05, -2.4683773517608643e-05, -2.3409724235534668e-05, -2.2135674953460693e-05, -2.086162567138672e-05, -1.9587576389312744e-05, -1.831352710723877e-05, -1.7039477825164795e-05, -1.576542854309082e-05, -1.4491379261016846e-05, -1.3217329978942871e-05, -1.1943280696868896e-05, -1.0669231414794922e-05, -9.395182132720947e-06, -8.121132850646973e-06, -6.847083568572998e-06, -5.5730342864990234e-06, -4.298985004425049e-06, -3.0249357223510742e-06, -1.7508864402770996e-06, -4.76837158203125e-07, 7.972121238708496e-07, 2.0712614059448242e-06, 3.345310688018799e-06, 4.6193599700927734e-06, 5.893409252166748e-06, 7.167458534240723e-06, 8.441507816314697e-06, 9.715557098388672e-06, 1.0989606380462646e-05, 1.2263655662536621e-05, 1.3537704944610596e-05, 1.481175422668457e-05, 1.6085803508758545e-05, 1.735985279083252e-05, 1.8633902072906494e-05, 1.990795135498047e-05, 2.1182000637054443e-05, 2.2456049919128418e-05, 2.3730099201202393e-05, 2.5004148483276367e-05, 2.6278197765350342e-05, 2.7552247047424316e-05, 2.882629632949829e-05, 3.0100345611572266e-05, 3.137439489364624e-05, 3.2648444175720215e-05, 3.392249345779419e-05, 3.5196542739868164e-05, 3.647059202194214e-05, 3.774464130401611e-05, 3.901869058609009e-05, 4.029273986816406e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 16.0, 7.0, 23.0, 18.0, 39.0, 33.0, 54.0, 90.0, 118.0, 165.0, 279.0, 480.0, 758.0, 1350.0, 2316.0, 4181.0, 7953.0, 17135.0, 40675.0, 106960.0, 279559.0, 337846.0, 149766.0, 54384.0, 22399.0, 10065.0, 5118.0, 2692.0, 1574.0, 884.0, 565.0, 341.0, 230.0, 170.0, 81.0, 56.0, 50.0, 28.0, 19.0, 12.0, 12.0, 12.0, 7.0, 1.0, 3.0, 7.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1085968017578125, -1.067779541015625, -1.0269622802734375, -0.98614501953125, -0.9453277587890625, -0.904510498046875, -0.8636932373046875, -0.8228759765625, -0.7820587158203125, -0.741241455078125, -0.7004241943359375, -0.65960693359375, -0.6187896728515625, -0.577972412109375, -0.5371551513671875, -0.496337890625, -0.4555206298828125, -0.414703369140625, -0.3738861083984375, -0.33306884765625, -0.2922515869140625, -0.251434326171875, -0.2106170654296875, -0.1697998046875, -0.1289825439453125, -0.088165283203125, -0.0473480224609375, -0.00653076171875, 0.0342864990234375, 0.075103759765625, 0.1159210205078125, 0.15673828125, 0.1975555419921875, 0.238372802734375, 0.2791900634765625, 0.32000732421875, 0.3608245849609375, 0.401641845703125, 0.4424591064453125, 0.4832763671875, 0.5240936279296875, 0.564910888671875, 0.6057281494140625, 0.64654541015625, 0.6873626708984375, 0.728179931640625, 0.7689971923828125, 0.809814453125, 0.8506317138671875, 0.891448974609375, 0.9322662353515625, 0.97308349609375, 1.0139007568359375, 1.054718017578125, 1.0955352783203125, 1.1363525390625, 1.1771697998046875, 1.217987060546875, 1.2588043212890625, 1.29962158203125, 1.3404388427734375, 1.381256103515625, 1.4220733642578125, 1.462890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 18.0, 10.0, 9.0, 18.0, 30.0, 44.0, 41.0, 64.0, 82.0, 81.0, 120.0, 98.0, 93.0, 80.0, 64.0, 40.0, 27.0, 19.0, 16.0, 9.0, 10.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.343994140625, -0.33209991455078125, -0.3202056884765625, -0.30831146240234375, -0.296417236328125, -0.28452301025390625, -0.2726287841796875, -0.26073455810546875, -0.24884033203125, -0.23694610595703125, -0.2250518798828125, -0.21315765380859375, -0.201263427734375, -0.18936920166015625, -0.1774749755859375, -0.16558074951171875, -0.1536865234375, -0.14179229736328125, -0.1298980712890625, -0.11800384521484375, -0.106109619140625, -0.09421539306640625, -0.0823211669921875, -0.07042694091796875, -0.05853271484375, -0.04663848876953125, -0.0347442626953125, -0.02285003662109375, -0.010955810546875, 0.00093841552734375, 0.0128326416015625, 0.02472686767578125, 0.03662109375, 0.04851531982421875, 0.0604095458984375, 0.07230377197265625, 0.084197998046875, 0.09609222412109375, 0.1079864501953125, 0.11988067626953125, 0.13177490234375, 0.14366912841796875, 0.1555633544921875, 0.16745758056640625, 0.179351806640625, 0.19124603271484375, 0.2031402587890625, 0.21503448486328125, 0.2269287109375, 0.23882293701171875, 0.2507171630859375, 0.26261138916015625, 0.274505615234375, 0.28639984130859375, 0.2982940673828125, 0.31018829345703125, 0.32208251953125, 0.33397674560546875, 0.3458709716796875, 0.35776519775390625, 0.369659423828125, 0.38155364990234375, 0.3934478759765625, 0.40534210205078125, 0.417236328125]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 5.0, 5.0, 5.0, 5.0, 4.0, 9.0, 7.0, 10.0, 13.0, 12.0, 23.0, 24.0, 24.0, 30.0, 35.0, 46.0, 45.0, 63.0, 60.0, 74.0, 78.0, 69.0, 71.0, 60.0, 39.0, 36.0, 41.0, 23.0, 18.0, 21.0, 15.0, 7.0, 2.0, 7.0, 3.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.75826644897461, -36.52914047241211, -35.300018310546875, -34.070892333984375, -32.84177017211914, -31.61264419555664, -30.383520126342773, -29.154396057128906, -27.92527198791504, -26.696147918701172, -25.467023849487305, -24.237899780273438, -23.008773803710938, -21.779651641845703, -20.550525665283203, -19.321401596069336, -18.09227752685547, -16.8631534576416, -15.634029388427734, -14.40490436553955, -13.175780296325684, -11.946656227111816, -10.717531204223633, -9.488407135009766, -8.259283065795898, -7.030158996582031, -5.801034450531006, -4.5719099044799805, -3.3427858352661133, -2.113661766052246, -0.8845372200012207, 0.3445873260498047, 1.5737113952636719, 2.802835702896118, 4.0319600105285645, 5.26108455657959, 6.490208625793457, 7.719332695007324, 8.948457717895508, 10.177581787109375, 11.406705856323242, 12.63582992553711, 13.864953994750977, 15.09407901763916, 16.323204040527344, 17.552326202392578, 18.781452178955078, 20.010576248168945, 21.239700317382812, 22.46882438659668, 23.697948455810547, 24.927072525024414, 26.15619659423828, 27.38532257080078, 28.61444664001465, 29.843570709228516, 31.072694778442383, 32.30181884765625, 33.53094482421875, 34.760066986083984, 35.989192962646484, 37.21831512451172, 38.44744110107422, 39.67656707763672, 40.90568923950195]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 7.0, 10.0, 6.0, 14.0, 15.0, 8.0, 13.0, 19.0, 26.0, 29.0, 28.0, 35.0, 27.0, 41.0, 34.0, 33.0, 33.0, 40.0, 40.0, 31.0, 52.0, 48.0, 38.0, 53.0, 54.0, 27.0, 25.0, 30.0, 25.0, 22.0, 28.0, 25.0, 10.0, 19.0, 14.0, 6.0, 18.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.901533126831055, -23.12200164794922, -22.34246826171875, -21.562936782836914, -20.783405303955078, -20.003873825073242, -19.224342346191406, -18.444808959960938, -17.6652774810791, -16.885746002197266, -16.106212615966797, -15.326681137084961, -14.547149658203125, -13.767618179321289, -12.988085746765137, -12.208553314208984, -11.429021835327148, -10.649490356445312, -9.86995792388916, -9.090425491333008, -8.310894012451172, -7.531362056732178, -6.751830101013184, -5.9722981452941895, -5.192766189575195, -4.413234233856201, -3.633702278137207, -2.854170322418213, -2.0746383666992188, -1.2951064109802246, -0.5155744552612305, 0.26395750045776367, 1.0434913635253906, 1.8230233192443848, 2.602555274963379, 3.382087230682373, 4.161619186401367, 4.941151142120361, 5.7206830978393555, 6.50021505355835, 7.279747009277344, 8.05927848815918, 8.838810920715332, 9.618343353271484, 10.39787483215332, 11.177406311035156, 11.956938743591309, 12.736471176147461, 13.516002655029297, 14.295534133911133, 15.075066566467285, 15.854598999023438, 16.634130477905273, 17.41366195678711, 18.193195343017578, 18.972726821899414, 19.75225830078125, 20.531789779663086, 21.311321258544922, 22.09085464477539, 22.870386123657227, 23.649917602539062, 24.42945098876953, 25.208982467651367, 25.988513946533203]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 5.0, 15.0, 15.0, 17.0, 25.0, 48.0, 74.0, 92.0, 150.0, 180.0, 270.0, 427.0, 688.0, 899.0, 1488.0, 2285.0, 3644.0, 6324.0, 11511.0, 21795.0, 46987.0, 106550.0, 226691.0, 288613.0, 176094.0, 78541.0, 35062.0, 17067.0, 8954.0, 5138.0, 3197.0, 1901.0, 1254.0, 811.0, 552.0, 378.0, 242.0, 166.0, 110.0, 91.0, 59.0, 46.0, 25.0, 22.0, 18.0, 17.0, 8.0, 10.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-30.90625, -29.978515625, -29.05078125, -28.123046875, -27.1953125, -26.267578125, -25.33984375, -24.412109375, -23.484375, -22.556640625, -21.62890625, -20.701171875, -19.7734375, -18.845703125, -17.91796875, -16.990234375, -16.0625, -15.134765625, -14.20703125, -13.279296875, -12.3515625, -11.423828125, -10.49609375, -9.568359375, -8.640625, -7.712890625, -6.78515625, -5.857421875, -4.9296875, -4.001953125, -3.07421875, -2.146484375, -1.21875, -0.291015625, 0.63671875, 1.564453125, 2.4921875, 3.419921875, 4.34765625, 5.275390625, 6.203125, 7.130859375, 8.05859375, 8.986328125, 9.9140625, 10.841796875, 11.76953125, 12.697265625, 13.625, 14.552734375, 15.48046875, 16.408203125, 17.3359375, 18.263671875, 19.19140625, 20.119140625, 21.046875, 21.974609375, 22.90234375, 23.830078125, 24.7578125, 25.685546875, 26.61328125, 27.541015625, 28.46875]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 1.0, 9.0, 11.0, 7.0, 15.0, 16.0, 16.0, 20.0, 23.0, 31.0, 31.0, 37.0, 36.0, 36.0, 30.0, 36.0, 38.0, 35.0, 53.0, 38.0, 51.0, 40.0, 44.0, 35.0, 42.0, 44.0, 27.0, 29.0, 30.0, 13.0, 21.0, 25.0, 13.0, 14.0, 12.0, 8.0, 12.0, 8.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.453125, -24.611572265625, -23.77001953125, -22.928466796875, -22.0869140625, -21.245361328125, -20.40380859375, -19.562255859375, -18.720703125, -17.879150390625, -17.03759765625, -16.196044921875, -15.3544921875, -14.512939453125, -13.67138671875, -12.829833984375, -11.98828125, -11.146728515625, -10.30517578125, -9.463623046875, -8.6220703125, -7.780517578125, -6.93896484375, -6.097412109375, -5.255859375, -4.414306640625, -3.57275390625, -2.731201171875, -1.8896484375, -1.048095703125, -0.20654296875, 0.635009765625, 1.4765625, 2.318115234375, 3.15966796875, 4.001220703125, 4.8427734375, 5.684326171875, 6.52587890625, 7.367431640625, 8.208984375, 9.050537109375, 9.89208984375, 10.733642578125, 11.5751953125, 12.416748046875, 13.25830078125, 14.099853515625, 14.94140625, 15.782958984375, 16.62451171875, 17.466064453125, 18.3076171875, 19.149169921875, 19.99072265625, 20.832275390625, 21.673828125, 22.515380859375, 23.35693359375, 24.198486328125, 25.0400390625, 25.881591796875, 26.72314453125, 27.564697265625, 28.40625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 11.0, 18.0, 29.0, 27.0, 76.0, 70.0, 104.0, 143.0, 217.0, 312.0, 461.0, 724.0, 1038.0, 1600.0, 2566.0, 4069.0, 6605.0, 11026.0, 19321.0, 34911.0, 66876.0, 131048.0, 226771.0, 235848.0, 142381.0, 72394.0, 37831.0, 21025.0, 11945.0, 6914.0, 4258.0, 2736.0, 1749.0, 1138.0, 756.0, 473.0, 347.0, 225.0, 168.0, 105.0, 86.0, 47.0, 33.0, 24.0, 13.0, 13.0, 6.0, 5.0, 3.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.583984375, -25.63671875, -24.689453125, -23.7421875, -22.794921875, -21.84765625, -20.900390625, -19.953125, -19.005859375, -18.05859375, -17.111328125, -16.1640625, -15.216796875, -14.26953125, -13.322265625, -12.375, -11.427734375, -10.48046875, -9.533203125, -8.5859375, -7.638671875, -6.69140625, -5.744140625, -4.796875, -3.849609375, -2.90234375, -1.955078125, -1.0078125, -0.060546875, 0.88671875, 1.833984375, 2.78125, 3.728515625, 4.67578125, 5.623046875, 6.5703125, 7.517578125, 8.46484375, 9.412109375, 10.359375, 11.306640625, 12.25390625, 13.201171875, 14.1484375, 15.095703125, 16.04296875, 16.990234375, 17.9375, 18.884765625, 19.83203125, 20.779296875, 21.7265625, 22.673828125, 23.62109375, 24.568359375, 25.515625, 26.462890625, 27.41015625, 28.357421875, 29.3046875, 30.251953125, 31.19921875, 32.146484375, 33.09375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 0.0, 2.0, 4.0, 6.0, 11.0, 11.0, 12.0, 10.0, 12.0, 12.0, 13.0, 19.0, 17.0, 36.0, 21.0, 31.0, 32.0, 25.0, 32.0, 40.0, 57.0, 41.0, 46.0, 46.0, 50.0, 39.0, 42.0, 50.0, 35.0, 31.0, 32.0, 25.0, 32.0, 28.0, 20.0, 16.0, 18.0, 12.0, 6.0, 5.0, 5.0, 3.0, 8.0, 6.0, 0.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.47216796875, -16.8818359375, -16.29150390625, -15.701171875, -15.11083984375, -14.5205078125, -13.93017578125, -13.33984375, -12.74951171875, -12.1591796875, -11.56884765625, -10.978515625, -10.38818359375, -9.7978515625, -9.20751953125, -8.6171875, -8.02685546875, -7.4365234375, -6.84619140625, -6.255859375, -5.66552734375, -5.0751953125, -4.48486328125, -3.89453125, -3.30419921875, -2.7138671875, -2.12353515625, -1.533203125, -0.94287109375, -0.3525390625, 0.23779296875, 0.828125, 1.41845703125, 2.0087890625, 2.59912109375, 3.189453125, 3.77978515625, 4.3701171875, 4.96044921875, 5.55078125, 6.14111328125, 6.7314453125, 7.32177734375, 7.912109375, 8.50244140625, 9.0927734375, 9.68310546875, 10.2734375, 10.86376953125, 11.4541015625, 12.04443359375, 12.634765625, 13.22509765625, 13.8154296875, 14.40576171875, 14.99609375, 15.58642578125, 16.1767578125, 16.76708984375, 17.357421875, 17.94775390625, 18.5380859375, 19.12841796875, 19.71875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 7.0, 19.0, 17.0, 27.0, 19.0, 47.0, 40.0, 70.0, 75.0, 123.0, 144.0, 259.0, 354.0, 554.0, 907.0, 1564.0, 2750.0, 5166.0, 10560.0, 27279.0, 140375.0, 634687.0, 168647.0, 30732.0, 11302.0, 5573.0, 2853.0, 1633.0, 994.0, 563.0, 365.0, 237.0, 142.0, 126.0, 97.0, 64.0, 39.0, 40.0, 23.0, 24.0, 20.0, 10.0, 4.0, 6.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.875, -53.017578125, -51.16015625, -49.302734375, -47.4453125, -45.587890625, -43.73046875, -41.873046875, -40.015625, -38.158203125, -36.30078125, -34.443359375, -32.5859375, -30.728515625, -28.87109375, -27.013671875, -25.15625, -23.298828125, -21.44140625, -19.583984375, -17.7265625, -15.869140625, -14.01171875, -12.154296875, -10.296875, -8.439453125, -6.58203125, -4.724609375, -2.8671875, -1.009765625, 0.84765625, 2.705078125, 4.5625, 6.419921875, 8.27734375, 10.134765625, 11.9921875, 13.849609375, 15.70703125, 17.564453125, 19.421875, 21.279296875, 23.13671875, 24.994140625, 26.8515625, 28.708984375, 30.56640625, 32.423828125, 34.28125, 36.138671875, 37.99609375, 39.853515625, 41.7109375, 43.568359375, 45.42578125, 47.283203125, 49.140625, 50.998046875, 52.85546875, 54.712890625, 56.5703125, 58.427734375, 60.28515625, 62.142578125, 64.0]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 6.0, 27.0, 30.0, 57.0, 75.0, 148.0, 180.0, 137.0, 127.0, 68.0, 36.0, 18.0, 16.0, 9.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003170013427734375, -0.003047049045562744, -0.0029240846633911133, -0.0028011202812194824, -0.0026781558990478516, -0.0025551915168762207, -0.00243222713470459, -0.002309262752532959, -0.002186298370361328, -0.0020633339881896973, -0.0019403696060180664, -0.0018174052238464355, -0.0016944408416748047, -0.0015714764595031738, -0.001448512077331543, -0.0013255476951599121, -0.0012025833129882812, -0.0010796189308166504, -0.0009566545486450195, -0.0008336901664733887, -0.0007107257843017578, -0.000587761402130127, -0.0004647970199584961, -0.00034183263778686523, -0.00021886825561523438, -9.590387344360352e-05, 2.7060508728027344e-05, 0.0001500248908996582, 0.00027298927307128906, 0.0003959536552429199, 0.0005189180374145508, 0.0006418824195861816, 0.0007648468017578125, 0.0008878111839294434, 0.0010107755661010742, 0.001133739948272705, 0.001256704330444336, 0.0013796687126159668, 0.0015026330947875977, 0.0016255974769592285, 0.0017485618591308594, 0.0018715262413024902, 0.001994490623474121, 0.002117455005645752, 0.002240419387817383, 0.0023633837699890137, 0.0024863481521606445, 0.0026093125343322754, 0.0027322769165039062, 0.002855241298675537, 0.002978205680847168, 0.003101170063018799, 0.0032241344451904297, 0.0033470988273620605, 0.0034700632095336914, 0.0035930275917053223, 0.003715991973876953, 0.003838956356048584, 0.003961920738220215, 0.004084885120391846, 0.0042078495025634766, 0.004330813884735107, 0.004453778266906738, 0.004576742649078369, 0.00469970703125]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 11.0, 17.0, 13.0, 29.0, 34.0, 39.0, 58.0, 76.0, 89.0, 116.0, 182.0, 264.0, 428.0, 764.0, 1311.0, 2272.0, 4492.0, 10383.0, 34750.0, 399970.0, 528691.0, 41714.0, 11955.0, 4983.0, 2410.0, 1273.0, 766.0, 458.0, 294.0, 200.0, 119.0, 100.0, 82.0, 63.0, 35.0, 24.0, 27.0, 22.0, 5.0, 15.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-89.4375, -86.5576171875, -83.677734375, -80.7978515625, -77.91796875, -75.0380859375, -72.158203125, -69.2783203125, -66.3984375, -63.5185546875, -60.638671875, -57.7587890625, -54.87890625, -51.9990234375, -49.119140625, -46.2392578125, -43.359375, -40.4794921875, -37.599609375, -34.7197265625, -31.83984375, -28.9599609375, -26.080078125, -23.2001953125, -20.3203125, -17.4404296875, -14.560546875, -11.6806640625, -8.80078125, -5.9208984375, -3.041015625, -0.1611328125, 2.71875, 5.5986328125, 8.478515625, 11.3583984375, 14.23828125, 17.1181640625, 19.998046875, 22.8779296875, 25.7578125, 28.6376953125, 31.517578125, 34.3974609375, 37.27734375, 40.1572265625, 43.037109375, 45.9169921875, 48.796875, 51.6767578125, 54.556640625, 57.4365234375, 60.31640625, 63.1962890625, 66.076171875, 68.9560546875, 71.8359375, 74.7158203125, 77.595703125, 80.4755859375, 83.35546875, 86.2353515625, 89.115234375, 91.9951171875, 94.875]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 6.0, 21.0, 25.0, 56.0, 158.0, 223.0, 208.0, 138.0, 61.0, 26.0, 16.0, 10.0, 7.0, 7.0, 6.0, 6.0, 2.0, 4.0, 1.0, 1.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.921875, -17.361328125, -16.80078125, -16.240234375, -15.6796875, -15.119140625, -14.55859375, -13.998046875, -13.4375, -12.876953125, -12.31640625, -11.755859375, -11.1953125, -10.634765625, -10.07421875, -9.513671875, -8.953125, -8.392578125, -7.83203125, -7.271484375, -6.7109375, -6.150390625, -5.58984375, -5.029296875, -4.46875, -3.908203125, -3.34765625, -2.787109375, -2.2265625, -1.666015625, -1.10546875, -0.544921875, 0.015625, 0.576171875, 1.13671875, 1.697265625, 2.2578125, 2.818359375, 3.37890625, 3.939453125, 4.5, 5.060546875, 5.62109375, 6.181640625, 6.7421875, 7.302734375, 7.86328125, 8.423828125, 8.984375, 9.544921875, 10.10546875, 10.666015625, 11.2265625, 11.787109375, 12.34765625, 12.908203125, 13.46875, 14.029296875, 14.58984375, 15.150390625, 15.7109375, 16.271484375, 16.83203125, 17.392578125, 17.953125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 4.0, 12.0, 6.0, 8.0, 12.0, 7.0, 14.0, 13.0, 27.0, 29.0, 28.0, 38.0, 52.0, 49.0, 46.0, 43.0, 71.0, 68.0, 77.0, 71.0, 49.0, 47.0, 36.0, 40.0, 25.0, 26.0, 21.0, 9.0, 14.0, 7.0, 15.0, 9.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.413875579833984, -37.19951248168945, -35.98514938354492, -34.770782470703125, -33.556419372558594, -32.34205627441406, -31.12769317626953, -29.913328170776367, -28.698963165283203, -27.484600067138672, -26.270235061645508, -25.055871963500977, -23.841506958007812, -22.62714385986328, -21.41278076171875, -20.198415756225586, -18.984052658081055, -17.769689559936523, -16.55532455444336, -15.340961456298828, -14.126596450805664, -12.912233352661133, -11.697869300842285, -10.483505249023438, -9.26914119720459, -8.054777145385742, -6.8404130935668945, -5.626049518585205, -4.411685466766357, -3.1973214149475098, -1.9829578399658203, -0.7685937881469727, 0.445770263671875, 1.660134196281433, 2.874498128890991, 4.08886194229126, 5.303225994110107, 6.517590045928955, 7.7319536209106445, 8.946317672729492, 10.16068172454834, 11.375045776367188, 12.589409828186035, 13.803773880004883, 15.018136978149414, 16.232501983642578, 17.44686508178711, 18.66122817993164, 19.875593185424805, 21.089956283569336, 22.3043212890625, 23.51868438720703, 24.733049392700195, 25.947412490844727, 27.16177749633789, 28.376140594482422, 29.590503692626953, 30.804866790771484, 32.019229888916016, 33.23359680175781, 34.447959899902344, 35.662322998046875, 36.876686096191406, 38.09104919433594, 39.305416107177734]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 3.0, 11.0, 16.0, 11.0, 11.0, 9.0, 22.0, 18.0, 19.0, 22.0, 24.0, 24.0, 27.0, 33.0, 28.0, 36.0, 31.0, 46.0, 32.0, 35.0, 31.0, 34.0, 48.0, 30.0, 29.0, 31.0, 34.0, 46.0, 30.0, 28.0, 27.0, 26.0, 18.0, 25.0, 17.0, 22.0, 21.0, 7.0, 11.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.930965423583984, -25.060312271118164, -24.18965721130371, -23.31900405883789, -22.448348999023438, -21.577695846557617, -20.707042694091797, -19.836387634277344, -18.965734481811523, -18.095081329345703, -17.22442626953125, -16.35377311706543, -15.483119010925293, -14.612464904785156, -13.741811752319336, -12.8711576461792, -12.000503540039062, -11.129849433898926, -10.259195327758789, -9.388542175292969, -8.517888069152832, -7.647233963012695, -6.776580333709717, -5.905926704406738, -5.035272598266602, -4.164618492126465, -3.2939648628234863, -2.4233109951019287, -1.552657127380371, -0.6820030212402344, 0.18865060806274414, 1.0593042373657227, 1.9299564361572266, 2.800610303878784, 3.671264171600342, 4.54191780090332, 5.412571907043457, 6.283226013183594, 7.153879642486572, 8.02453327178955, 8.895187377929688, 9.765841484069824, 10.636495590209961, 11.507148742675781, 12.377802848815918, 13.248456954956055, 14.119110107421875, 14.989764213562012, 15.860418319702148, 16.73107147216797, 17.601726531982422, 18.472379684448242, 19.343032836914062, 20.213687896728516, 21.084341049194336, 21.954994201660156, 22.82564926147461, 23.69630241394043, 24.566957473754883, 25.437610626220703, 26.308265686035156, 27.178918838500977, 28.049571990966797, 28.92022705078125, 29.79088020324707]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 14.0, 8.0, 17.0, 26.0, 39.0, 67.0, 88.0, 119.0, 195.0, 282.0, 395.0, 598.0, 886.0, 1277.0, 1852.0, 2836.0, 4215.0, 6746.0, 11204.0, 20175.0, 41749.0, 105096.0, 325695.0, 999714.0, 1508764.0, 759186.0, 242719.0, 82462.0, 34348.0, 16797.0, 9582.0, 5794.0, 3779.0, 2394.0, 1588.0, 1072.0, 759.0, 489.0, 348.0, 286.0, 190.0, 126.0, 115.0, 60.0, 42.0, 38.0, 15.0, 22.0, 6.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0], "bins": [-55.0625, -53.361328125, -51.66015625, -49.958984375, -48.2578125, -46.556640625, -44.85546875, -43.154296875, -41.453125, -39.751953125, -38.05078125, -36.349609375, -34.6484375, -32.947265625, -31.24609375, -29.544921875, -27.84375, -26.142578125, -24.44140625, -22.740234375, -21.0390625, -19.337890625, -17.63671875, -15.935546875, -14.234375, -12.533203125, -10.83203125, -9.130859375, -7.4296875, -5.728515625, -4.02734375, -2.326171875, -0.625, 1.076171875, 2.77734375, 4.478515625, 6.1796875, 7.880859375, 9.58203125, 11.283203125, 12.984375, 14.685546875, 16.38671875, 18.087890625, 19.7890625, 21.490234375, 23.19140625, 24.892578125, 26.59375, 28.294921875, 29.99609375, 31.697265625, 33.3984375, 35.099609375, 36.80078125, 38.501953125, 40.203125, 41.904296875, 43.60546875, 45.306640625, 47.0078125, 48.708984375, 50.41015625, 52.111328125, 53.8125]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 11.0, 12.0, 8.0, 7.0, 15.0, 16.0, 22.0, 18.0, 14.0, 30.0, 25.0, 32.0, 33.0, 21.0, 26.0, 35.0, 32.0, 32.0, 40.0, 34.0, 41.0, 41.0, 35.0, 33.0, 34.0, 43.0, 36.0, 33.0, 27.0, 28.0, 27.0, 19.0, 24.0, 11.0, 17.0, 18.0, 20.0, 8.0, 6.0, 5.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.390625, -25.545654296875, -24.70068359375, -23.855712890625, -23.0107421875, -22.165771484375, -21.32080078125, -20.475830078125, -19.630859375, -18.785888671875, -17.94091796875, -17.095947265625, -16.2509765625, -15.406005859375, -14.56103515625, -13.716064453125, -12.87109375, -12.026123046875, -11.18115234375, -10.336181640625, -9.4912109375, -8.646240234375, -7.80126953125, -6.956298828125, -6.111328125, -5.266357421875, -4.42138671875, -3.576416015625, -2.7314453125, -1.886474609375, -1.04150390625, -0.196533203125, 0.6484375, 1.493408203125, 2.33837890625, 3.183349609375, 4.0283203125, 4.873291015625, 5.71826171875, 6.563232421875, 7.408203125, 8.253173828125, 9.09814453125, 9.943115234375, 10.7880859375, 11.633056640625, 12.47802734375, 13.322998046875, 14.16796875, 15.012939453125, 15.85791015625, 16.702880859375, 17.5478515625, 18.392822265625, 19.23779296875, 20.082763671875, 20.927734375, 21.772705078125, 22.61767578125, 23.462646484375, 24.3076171875, 25.152587890625, 25.99755859375, 26.842529296875, 27.6875]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 9.0, 7.0, 14.0, 22.0, 37.0, 48.0, 67.0, 122.0, 178.0, 256.0, 387.0, 582.0, 838.0, 1350.0, 1991.0, 3263.0, 5150.0, 8298.0, 14347.0, 25645.0, 48914.0, 104271.0, 255997.0, 724918.0, 1496337.0, 923300.0, 322646.0, 126247.0, 57541.0, 29641.0, 16458.0, 9456.0, 5833.0, 3523.0, 2265.0, 1472.0, 968.0, 636.0, 418.0, 255.0, 196.0, 141.0, 78.0, 51.0, 37.0, 24.0, 16.0, 11.0, 6.0, 8.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-69.625, -67.4228515625, -65.220703125, -63.0185546875, -60.81640625, -58.6142578125, -56.412109375, -54.2099609375, -52.0078125, -49.8056640625, -47.603515625, -45.4013671875, -43.19921875, -40.9970703125, -38.794921875, -36.5927734375, -34.390625, -32.1884765625, -29.986328125, -27.7841796875, -25.58203125, -23.3798828125, -21.177734375, -18.9755859375, -16.7734375, -14.5712890625, -12.369140625, -10.1669921875, -7.96484375, -5.7626953125, -3.560546875, -1.3583984375, 0.84375, 3.0458984375, 5.248046875, 7.4501953125, 9.65234375, 11.8544921875, 14.056640625, 16.2587890625, 18.4609375, 20.6630859375, 22.865234375, 25.0673828125, 27.26953125, 29.4716796875, 31.673828125, 33.8759765625, 36.078125, 38.2802734375, 40.482421875, 42.6845703125, 44.88671875, 47.0888671875, 49.291015625, 51.4931640625, 53.6953125, 55.8974609375, 58.099609375, 60.3017578125, 62.50390625, 64.7060546875, 66.908203125, 69.1103515625, 71.3125]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 11.0, 10.0, 17.0, 25.0, 16.0, 33.0, 26.0, 40.0, 44.0, 57.0, 80.0, 81.0, 120.0, 148.0, 182.0, 216.0, 231.0, 290.0, 313.0, 283.0, 306.0, 278.0, 241.0, 214.0, 184.0, 114.0, 109.0, 72.0, 61.0, 55.0, 35.0, 34.0, 32.0, 17.0, 17.0, 12.0, 14.0, 5.0, 9.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0], "bins": [-18.6875, -18.14306640625, -17.5986328125, -17.05419921875, -16.509765625, -15.96533203125, -15.4208984375, -14.87646484375, -14.33203125, -13.78759765625, -13.2431640625, -12.69873046875, -12.154296875, -11.60986328125, -11.0654296875, -10.52099609375, -9.9765625, -9.43212890625, -8.8876953125, -8.34326171875, -7.798828125, -7.25439453125, -6.7099609375, -6.16552734375, -5.62109375, -5.07666015625, -4.5322265625, -3.98779296875, -3.443359375, -2.89892578125, -2.3544921875, -1.81005859375, -1.265625, -0.72119140625, -0.1767578125, 0.36767578125, 0.912109375, 1.45654296875, 2.0009765625, 2.54541015625, 3.08984375, 3.63427734375, 4.1787109375, 4.72314453125, 5.267578125, 5.81201171875, 6.3564453125, 6.90087890625, 7.4453125, 7.98974609375, 8.5341796875, 9.07861328125, 9.623046875, 10.16748046875, 10.7119140625, 11.25634765625, 11.80078125, 12.34521484375, 12.8896484375, 13.43408203125, 13.978515625, 14.52294921875, 15.0673828125, 15.61181640625, 16.15625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 7.0, 9.0, 7.0, 13.0, 12.0, 17.0, 27.0, 23.0, 33.0, 51.0, 51.0, 88.0, 62.0, 88.0, 65.0, 73.0, 49.0, 70.0, 55.0, 32.0, 30.0, 29.0, 14.0, 19.0, 17.0, 13.0, 9.0, 7.0, 4.0, 4.0, 1.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-70.4071273803711, -68.22169494628906, -66.03626251220703, -63.850830078125, -61.66539764404297, -59.47996520996094, -57.29452896118164, -55.10909652709961, -52.92366409301758, -50.73823165893555, -48.552799224853516, -46.367366790771484, -44.18193054199219, -41.996498107910156, -39.811065673828125, -37.625633239746094, -35.44020080566406, -33.25476837158203, -31.0693359375, -28.883901596069336, -26.698469161987305, -24.513036727905273, -22.32760238647461, -20.142169952392578, -17.956737518310547, -15.771305084228516, -13.585871696472168, -11.40043830871582, -9.215005874633789, -7.029573440551758, -4.84414005279541, -2.6587066650390625, -0.47327423095703125, 1.7121586799621582, 3.8975915908813477, 6.083024501800537, 8.268457412719727, 10.453889846801758, 12.639323234558105, 14.824756622314453, 17.010189056396484, 19.195621490478516, 21.381053924560547, 23.56648826599121, 25.751920700073242, 27.937353134155273, 30.122787475585938, 32.30821990966797, 34.49365234375, 36.67908477783203, 38.86451721191406, 41.049949645996094, 43.235382080078125, 45.420814514160156, 47.60625076293945, 49.791683197021484, 51.977115631103516, 54.16254806518555, 56.34798049926758, 58.53341293334961, 60.718849182128906, 62.90428161621094, 65.08971405029297, 67.275146484375, 69.46057891845703]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 1.0, 5.0, 1.0, 7.0, 7.0, 6.0, 6.0, 6.0, 10.0, 10.0, 19.0, 20.0, 14.0, 14.0, 21.0, 21.0, 22.0, 31.0, 40.0, 30.0, 29.0, 27.0, 30.0, 32.0, 29.0, 33.0, 41.0, 32.0, 30.0, 36.0, 36.0, 29.0, 34.0, 30.0, 22.0, 24.0, 27.0, 25.0, 27.0, 16.0, 16.0, 15.0, 14.0, 15.0, 15.0, 6.0, 10.0, 5.0, 8.0, 3.0, 9.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0], "bins": [-34.23876190185547, -33.12650680541992, -32.014251708984375, -30.901994705200195, -29.78973960876465, -28.6774845123291, -27.565227508544922, -26.452972412109375, -25.340717315673828, -24.22846221923828, -23.116207122802734, -22.003950119018555, -20.891695022583008, -19.77943992614746, -18.66718292236328, -17.554927825927734, -16.442672729492188, -15.33041763305664, -14.218161582946777, -13.105905532836914, -11.993650436401367, -10.88139533996582, -9.769139289855957, -8.656883239746094, -7.544628143310547, -6.432372570037842, -5.320116996765137, -4.207861423492432, -3.0956058502197266, -1.9833502769470215, -0.8710947036743164, 0.24116086959838867, 1.3534126281738281, 2.465668201446533, 3.5779237747192383, 4.690179347991943, 5.802434921264648, 6.9146904945373535, 8.026946067810059, 9.139202117919922, 10.251457214355469, 11.363712310791016, 12.475968360900879, 13.588224411010742, 14.700479507446289, 15.812734603881836, 16.924991607666016, 18.037246704101562, 19.14950180053711, 20.261756896972656, 21.374011993408203, 22.486268997192383, 23.59852409362793, 24.710779190063477, 25.823036193847656, 26.935291290283203, 28.04754638671875, 29.159801483154297, 30.272056579589844, 31.384313583374023, 32.49656677246094, 33.60882568359375, 34.7210807800293, 35.833335876464844, 36.94559097290039]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 4.0, 5.0, 12.0, 18.0, 29.0, 49.0, 50.0, 68.0, 85.0, 165.0, 213.0, 263.0, 416.0, 606.0, 898.0, 1282.0, 1891.0, 2828.0, 4480.0, 6561.0, 10452.0, 16826.0, 27668.0, 47031.0, 84126.0, 155159.0, 240962.0, 192721.0, 105787.0, 57811.0, 33897.0, 20185.0, 12705.0, 7843.0, 5105.0, 3357.0, 2244.0, 1430.0, 1013.0, 696.0, 473.0, 331.0, 235.0, 168.0, 117.0, 84.0, 56.0, 45.0, 33.0, 29.0, 18.0, 5.0, 8.0, 5.0, 4.0, 1.0, 4.0, 2.0], "bins": [-5.09765625, -4.94171142578125, -4.7857666015625, -4.62982177734375, -4.473876953125, -4.31793212890625, -4.1619873046875, -4.00604248046875, -3.85009765625, -3.69415283203125, -3.5382080078125, -3.38226318359375, -3.226318359375, -3.07037353515625, -2.9144287109375, -2.75848388671875, -2.6025390625, -2.44659423828125, -2.2906494140625, -2.13470458984375, -1.978759765625, -1.82281494140625, -1.6668701171875, -1.51092529296875, -1.35498046875, -1.19903564453125, -1.0430908203125, -0.88714599609375, -0.731201171875, -0.57525634765625, -0.4193115234375, -0.26336669921875, -0.107421875, 0.04852294921875, 0.2044677734375, 0.36041259765625, 0.516357421875, 0.67230224609375, 0.8282470703125, 0.98419189453125, 1.14013671875, 1.29608154296875, 1.4520263671875, 1.60797119140625, 1.763916015625, 1.91986083984375, 2.0758056640625, 2.23175048828125, 2.3876953125, 2.54364013671875, 2.6995849609375, 2.85552978515625, 3.011474609375, 3.16741943359375, 3.3233642578125, 3.47930908203125, 3.63525390625, 3.79119873046875, 3.9471435546875, 4.10308837890625, 4.259033203125, 4.41497802734375, 4.5709228515625, 4.72686767578125, 4.8828125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 8.0, 4.0, 5.0, 9.0, 15.0, 11.0, 16.0, 17.0, 17.0, 15.0, 22.0, 29.0, 22.0, 26.0, 34.0, 29.0, 24.0, 35.0, 34.0, 43.0, 39.0, 36.0, 35.0, 34.0, 42.0, 32.0, 30.0, 29.0, 33.0, 29.0, 26.0, 27.0, 32.0, 17.0, 29.0, 13.0, 15.0, 11.0, 15.0, 13.0, 10.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-41.15625, -39.87451171875, -38.5927734375, -37.31103515625, -36.029296875, -34.74755859375, -33.4658203125, -32.18408203125, -30.90234375, -29.62060546875, -28.3388671875, -27.05712890625, -25.775390625, -24.49365234375, -23.2119140625, -21.93017578125, -20.6484375, -19.36669921875, -18.0849609375, -16.80322265625, -15.521484375, -14.23974609375, -12.9580078125, -11.67626953125, -10.39453125, -9.11279296875, -7.8310546875, -6.54931640625, -5.267578125, -3.98583984375, -2.7041015625, -1.42236328125, -0.140625, 1.14111328125, 2.4228515625, 3.70458984375, 4.986328125, 6.26806640625, 7.5498046875, 8.83154296875, 10.11328125, 11.39501953125, 12.6767578125, 13.95849609375, 15.240234375, 16.52197265625, 17.8037109375, 19.08544921875, 20.3671875, 21.64892578125, 22.9306640625, 24.21240234375, 25.494140625, 26.77587890625, 28.0576171875, 29.33935546875, 30.62109375, 31.90283203125, 33.1845703125, 34.46630859375, 35.748046875, 37.02978515625, 38.3115234375, 39.59326171875, 40.875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 7.0, 3.0, 5.0, 11.0, 7.0, 9.0, 23.0, 28.0, 30.0, 53.0, 86.0, 92.0, 143.0, 199.0, 317.0, 481.0, 704.0, 1251.0, 2194.0, 4058.0, 8462.0, 20184.0, 93323.0, 841833.0, 46066.0, 14730.0, 6436.0, 3186.0, 1690.0, 1007.0, 643.0, 389.0, 246.0, 180.0, 150.0, 77.0, 64.0, 53.0, 35.0, 23.0, 22.0, 11.0, 8.0, 10.0, 6.0, 7.0, 7.0, 1.0, 3.0, 6.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.48095703125, -15.0166015625, -14.55224609375, -14.087890625, -13.62353515625, -13.1591796875, -12.69482421875, -12.23046875, -11.76611328125, -11.3017578125, -10.83740234375, -10.373046875, -9.90869140625, -9.4443359375, -8.97998046875, -8.515625, -8.05126953125, -7.5869140625, -7.12255859375, -6.658203125, -6.19384765625, -5.7294921875, -5.26513671875, -4.80078125, -4.33642578125, -3.8720703125, -3.40771484375, -2.943359375, -2.47900390625, -2.0146484375, -1.55029296875, -1.0859375, -0.62158203125, -0.1572265625, 0.30712890625, 0.771484375, 1.23583984375, 1.7001953125, 2.16455078125, 2.62890625, 3.09326171875, 3.5576171875, 4.02197265625, 4.486328125, 4.95068359375, 5.4150390625, 5.87939453125, 6.34375, 6.80810546875, 7.2724609375, 7.73681640625, 8.201171875, 8.66552734375, 9.1298828125, 9.59423828125, 10.05859375, 10.52294921875, 10.9873046875, 11.45166015625, 11.916015625, 12.38037109375, 12.8447265625, 13.30908203125, 13.7734375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 5.0, 6.0, 2.0, 0.0, 7.0, 7.0, 15.0, 12.0, 14.0, 20.0, 20.0, 30.0, 19.0, 24.0, 26.0, 32.0, 33.0, 26.0, 38.0, 31.0, 37.0, 48.0, 35.0, 38.0, 41.0, 47.0, 33.0, 38.0, 27.0, 32.0, 23.0, 31.0, 26.0, 25.0, 26.0, 18.0, 23.0, 21.0, 7.0, 6.0, 15.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-26.03125, -25.25732421875, -24.4833984375, -23.70947265625, -22.935546875, -22.16162109375, -21.3876953125, -20.61376953125, -19.83984375, -19.06591796875, -18.2919921875, -17.51806640625, -16.744140625, -15.97021484375, -15.1962890625, -14.42236328125, -13.6484375, -12.87451171875, -12.1005859375, -11.32666015625, -10.552734375, -9.77880859375, -9.0048828125, -8.23095703125, -7.45703125, -6.68310546875, -5.9091796875, -5.13525390625, -4.361328125, -3.58740234375, -2.8134765625, -2.03955078125, -1.265625, -0.49169921875, 0.2822265625, 1.05615234375, 1.830078125, 2.60400390625, 3.3779296875, 4.15185546875, 4.92578125, 5.69970703125, 6.4736328125, 7.24755859375, 8.021484375, 8.79541015625, 9.5693359375, 10.34326171875, 11.1171875, 11.89111328125, 12.6650390625, 13.43896484375, 14.212890625, 14.98681640625, 15.7607421875, 16.53466796875, 17.30859375, 18.08251953125, 18.8564453125, 19.63037109375, 20.404296875, 21.17822265625, 21.9521484375, 22.72607421875, 23.5]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 7.0, 16.0, 16.0, 28.0, 34.0, 48.0, 79.0, 135.0, 196.0, 285.0, 486.0, 793.0, 1427.0, 2420.0, 4416.0, 8637.0, 18683.0, 56875.0, 887374.0, 36410.0, 14382.0, 7079.0, 3679.0, 1970.0, 1150.0, 701.0, 446.0, 264.0, 170.0, 112.0, 76.0, 47.0, 35.0, 22.0, 11.0, 11.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.54296875, -3.4427490234375, -3.342529296875, -3.2423095703125, -3.14208984375, -3.0418701171875, -2.941650390625, -2.8414306640625, -2.7412109375, -2.6409912109375, -2.540771484375, -2.4405517578125, -2.34033203125, -2.2401123046875, -2.139892578125, -2.0396728515625, -1.939453125, -1.8392333984375, -1.739013671875, -1.6387939453125, -1.53857421875, -1.4383544921875, -1.338134765625, -1.2379150390625, -1.1376953125, -1.0374755859375, -0.937255859375, -0.8370361328125, -0.73681640625, -0.6365966796875, -0.536376953125, -0.4361572265625, -0.3359375, -0.2357177734375, -0.135498046875, -0.0352783203125, 0.06494140625, 0.1651611328125, 0.265380859375, 0.3656005859375, 0.4658203125, 0.5660400390625, 0.666259765625, 0.7664794921875, 0.86669921875, 0.9669189453125, 1.067138671875, 1.1673583984375, 1.267578125, 1.3677978515625, 1.468017578125, 1.5682373046875, 1.66845703125, 1.7686767578125, 1.868896484375, 1.9691162109375, 2.0693359375, 2.1695556640625, 2.269775390625, 2.3699951171875, 2.47021484375, 2.5704345703125, 2.670654296875, 2.7708740234375, 2.87109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 4.0, 8.0, 14.0, 9.0, 10.0, 15.0, 20.0, 14.0, 21.0, 32.0, 33.0, 39.0, 54.0, 53.0, 47.0, 66.0, 45.0, 58.0, 57.0, 43.0, 56.0, 49.0, 33.0, 34.0, 16.0, 26.0, 23.0, 19.0, 30.0, 13.0, 15.0, 10.0, 3.0, 6.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.402896881103516e-05, -7.200520485639572e-05, -6.998144090175629e-05, -6.795767694711685e-05, -6.593391299247742e-05, -6.391014903783798e-05, -6.188638508319855e-05, -5.986262112855911e-05, -5.783885717391968e-05, -5.581509321928024e-05, -5.379132926464081e-05, -5.176756531000137e-05, -4.974380135536194e-05, -4.7720037400722504e-05, -4.569627344608307e-05, -4.3672509491443634e-05, -4.16487455368042e-05, -3.9624981582164764e-05, -3.760121762752533e-05, -3.5577453672885895e-05, -3.355368971824646e-05, -3.1529925763607025e-05, -2.950616180896759e-05, -2.7482397854328156e-05, -2.545863389968872e-05, -2.3434869945049286e-05, -2.141110599040985e-05, -1.9387342035770416e-05, -1.736357808113098e-05, -1.5339814126491547e-05, -1.3316050171852112e-05, -1.1292286217212677e-05, -9.268522262573242e-06, -7.244758307933807e-06, -5.2209943532943726e-06, -3.1972303986549377e-06, -1.173466444015503e-06, 8.502975106239319e-07, 2.8740614652633667e-06, 4.8978254199028015e-06, 6.921589374542236e-06, 8.945353329181671e-06, 1.0969117283821106e-05, 1.299288123846054e-05, 1.5016645193099976e-05, 1.704040914773941e-05, 1.9064173102378845e-05, 2.108793705701828e-05, 2.3111701011657715e-05, 2.513546496629715e-05, 2.7159228920936584e-05, 2.918299287557602e-05, 3.1206756830215454e-05, 3.323052078485489e-05, 3.5254284739494324e-05, 3.727804869413376e-05, 3.930181264877319e-05, 4.132557660341263e-05, 4.334934055805206e-05, 4.53731045126915e-05, 4.739686846733093e-05, 4.942063242197037e-05, 5.14443963766098e-05, 5.346816033124924e-05, 5.549192428588867e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 5.0, 12.0, 10.0, 13.0, 20.0, 24.0, 42.0, 55.0, 77.0, 131.0, 187.0, 273.0, 499.0, 957.0, 1660.0, 3252.0, 6556.0, 14167.0, 32235.0, 80992.0, 216781.0, 364448.0, 196803.0, 73689.0, 29706.0, 12999.0, 6142.0, 3057.0, 1512.0, 872.0, 467.0, 297.0, 212.0, 121.0, 71.0, 58.0, 39.0, 26.0, 28.0, 23.0, 9.0, 5.0, 7.0, 8.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.02734375, -1.956085205078125, -1.88482666015625, -1.813568115234375, -1.7423095703125, -1.671051025390625, -1.59979248046875, -1.528533935546875, -1.457275390625, -1.386016845703125, -1.31475830078125, -1.243499755859375, -1.1722412109375, -1.100982666015625, -1.02972412109375, -0.958465576171875, -0.88720703125, -0.815948486328125, -0.74468994140625, -0.673431396484375, -0.6021728515625, -0.530914306640625, -0.45965576171875, -0.388397216796875, -0.317138671875, -0.245880126953125, -0.17462158203125, -0.103363037109375, -0.0321044921875, 0.039154052734375, 0.11041259765625, 0.181671142578125, 0.2529296875, 0.324188232421875, 0.39544677734375, 0.466705322265625, 0.5379638671875, 0.609222412109375, 0.68048095703125, 0.751739501953125, 0.822998046875, 0.894256591796875, 0.96551513671875, 1.036773681640625, 1.1080322265625, 1.179290771484375, 1.25054931640625, 1.321807861328125, 1.39306640625, 1.464324951171875, 1.53558349609375, 1.606842041015625, 1.6781005859375, 1.749359130859375, 1.82061767578125, 1.891876220703125, 1.963134765625, 2.034393310546875, 2.10565185546875, 2.176910400390625, 2.2481689453125, 2.319427490234375, 2.39068603515625, 2.461944580078125, 2.533203125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 5.0, 5.0, 4.0, 4.0, 9.0, 13.0, 13.0, 13.0, 21.0, 19.0, 39.0, 56.0, 53.0, 53.0, 55.0, 65.0, 75.0, 75.0, 72.0, 65.0, 49.0, 56.0, 35.0, 26.0, 20.0, 20.0, 14.0, 9.0, 14.0, 9.0, 6.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42578125, -0.41241455078125, -0.3990478515625, -0.38568115234375, -0.372314453125, -0.35894775390625, -0.3455810546875, -0.33221435546875, -0.31884765625, -0.30548095703125, -0.2921142578125, -0.27874755859375, -0.265380859375, -0.25201416015625, -0.2386474609375, -0.22528076171875, -0.2119140625, -0.19854736328125, -0.1851806640625, -0.17181396484375, -0.158447265625, -0.14508056640625, -0.1317138671875, -0.11834716796875, -0.10498046875, -0.09161376953125, -0.0782470703125, -0.06488037109375, -0.051513671875, -0.03814697265625, -0.0247802734375, -0.01141357421875, 0.001953125, 0.01531982421875, 0.0286865234375, 0.04205322265625, 0.055419921875, 0.06878662109375, 0.0821533203125, 0.09552001953125, 0.10888671875, 0.12225341796875, 0.1356201171875, 0.14898681640625, 0.162353515625, 0.17572021484375, 0.1890869140625, 0.20245361328125, 0.2158203125, 0.22918701171875, 0.2425537109375, 0.25592041015625, 0.269287109375, 0.28265380859375, 0.2960205078125, 0.30938720703125, 0.32275390625, 0.33612060546875, 0.3494873046875, 0.36285400390625, 0.376220703125, 0.38958740234375, 0.4029541015625, 0.41632080078125, 0.4296875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 9.0, 15.0, 14.0, 25.0, 21.0, 30.0, 39.0, 50.0, 51.0, 88.0, 75.0, 77.0, 69.0, 59.0, 54.0, 63.0, 50.0, 32.0, 30.0, 27.0, 12.0, 17.0, 17.0, 11.0, 11.0, 6.0, 4.0, 2.0, 2.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-70.87083435058594, -68.71742248535156, -66.56400299072266, -64.41059112548828, -62.257171630859375, -60.103759765625, -57.95034408569336, -55.79692840576172, -53.64351272583008, -51.49009704589844, -49.3366813659668, -47.183265686035156, -45.02985382080078, -42.876434326171875, -40.7230224609375, -38.56960678100586, -36.41619110107422, -34.26277542114258, -32.10935974121094, -29.95594596862793, -27.80253028869629, -25.64911460876465, -23.49570083618164, -21.34228515625, -19.18886947631836, -17.03545379638672, -14.882039070129395, -12.72862434387207, -10.57520866394043, -8.421792984008789, -6.268378257751465, -4.114963531494141, -1.9615478515625, 0.19186735153198242, 2.345282554626465, 4.498697757720947, 6.65211296081543, 8.80552864074707, 10.958943367004395, 13.112358093261719, 15.26577377319336, 17.419189453125, 19.57260513305664, 21.72601890563965, 23.87943458557129, 26.03285026550293, 28.186264038085938, 30.339679718017578, 32.49309539794922, 34.64651107788086, 36.7999267578125, 38.95334243774414, 41.10675811767578, 43.260169982910156, 45.4135856628418, 47.56700134277344, 49.72041702270508, 51.87383270263672, 54.02724838256836, 56.1806640625, 58.334075927734375, 60.48749542236328, 62.640907287597656, 64.79432678222656, 66.94773864746094]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 6.0, 8.0, 7.0, 4.0, 6.0, 9.0, 10.0, 20.0, 18.0, 18.0, 13.0, 19.0, 21.0, 28.0, 27.0, 39.0, 27.0, 33.0, 24.0, 31.0, 31.0, 30.0, 35.0, 40.0, 33.0, 29.0, 33.0, 37.0, 32.0, 30.0, 29.0, 23.0, 26.0, 22.0, 28.0, 26.0, 17.0, 16.0, 17.0, 16.0, 14.0, 13.0, 9.0, 8.0, 6.0, 6.0, 6.0, 5.0, 9.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0], "bins": [-34.51490020751953, -33.399234771728516, -32.283573150634766, -31.167909622192383, -30.05224609375, -28.936582565307617, -27.820919036865234, -26.70525360107422, -25.58959197998047, -24.473928451538086, -23.358264923095703, -22.24260139465332, -21.126937866210938, -20.011274337768555, -18.895610809326172, -17.779945373535156, -16.664281845092773, -15.54861831665039, -14.432954788208008, -13.317291259765625, -12.201627731323242, -11.08596420288086, -9.97029972076416, -8.854636192321777, -7.7389726638793945, -6.623309135437012, -5.507645606994629, -4.391981601715088, -3.276318073272705, -2.1606545448303223, -1.0449905395507812, 0.07067298889160156, 1.1863365173339844, 2.302000045776367, 3.417663812637329, 4.533327579498291, 5.648991107940674, 6.764654636383057, 7.880318641662598, 8.99598217010498, 10.111645698547363, 11.227309226989746, 12.342972755432129, 13.458637237548828, 14.574300765991211, 15.689964294433594, 16.805627822875977, 17.92129135131836, 19.036954879760742, 20.152618408203125, 21.268281936645508, 22.38394546508789, 23.499608993530273, 24.615272521972656, 25.730937957763672, 26.846599578857422, 27.962265014648438, 29.07792854309082, 30.193592071533203, 31.309255599975586, 32.42491912841797, 33.540584564208984, 34.656246185302734, 35.77191162109375, 36.8875732421875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 19.0, 23.0, 35.0, 40.0, 65.0, 103.0, 178.0, 246.0, 331.0, 523.0, 705.0, 1118.0, 1544.0, 2344.0, 3437.0, 5042.0, 7219.0, 10720.0, 16189.0, 24038.0, 35149.0, 52827.0, 75827.0, 104697.0, 130984.0, 139377.0, 124804.0, 96653.0, 69314.0, 47108.0, 31912.0, 21256.0, 14152.0, 9925.0, 6499.0, 4417.0, 3199.0, 2061.0, 1426.0, 1020.0, 632.0, 466.0, 339.0, 199.0, 122.0, 106.0, 60.0, 35.0, 18.0, 20.0, 12.0, 12.0, 5.0, 4.0, 3.0, 0.0, 1.0], "bins": [-18.84375, -18.261474609375, -17.67919921875, -17.096923828125, -16.5146484375, -15.932373046875, -15.35009765625, -14.767822265625, -14.185546875, -13.603271484375, -13.02099609375, -12.438720703125, -11.8564453125, -11.274169921875, -10.69189453125, -10.109619140625, -9.52734375, -8.945068359375, -8.36279296875, -7.780517578125, -7.1982421875, -6.615966796875, -6.03369140625, -5.451416015625, -4.869140625, -4.286865234375, -3.70458984375, -3.122314453125, -2.5400390625, -1.957763671875, -1.37548828125, -0.793212890625, -0.2109375, 0.371337890625, 0.95361328125, 1.535888671875, 2.1181640625, 2.700439453125, 3.28271484375, 3.864990234375, 4.447265625, 5.029541015625, 5.61181640625, 6.194091796875, 6.7763671875, 7.358642578125, 7.94091796875, 8.523193359375, 9.10546875, 9.687744140625, 10.27001953125, 10.852294921875, 11.4345703125, 12.016845703125, 12.59912109375, 13.181396484375, 13.763671875, 14.345947265625, 14.92822265625, 15.510498046875, 16.0927734375, 16.675048828125, 17.25732421875, 17.839599609375, 18.421875]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 13.0, 16.0, 13.0, 18.0, 14.0, 19.0, 24.0, 21.0, 34.0, 36.0, 27.0, 28.0, 35.0, 43.0, 34.0, 44.0, 28.0, 43.0, 32.0, 38.0, 30.0, 32.0, 31.0, 31.0, 32.0, 31.0, 30.0, 17.0, 25.0, 28.0, 23.0, 12.0, 11.0, 16.0, 10.0, 11.0, 14.0, 1.0, 5.0, 6.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-40.90625, -39.64453125, -38.3828125, -37.12109375, -35.859375, -34.59765625, -33.3359375, -32.07421875, -30.8125, -29.55078125, -28.2890625, -27.02734375, -25.765625, -24.50390625, -23.2421875, -21.98046875, -20.71875, -19.45703125, -18.1953125, -16.93359375, -15.671875, -14.41015625, -13.1484375, -11.88671875, -10.625, -9.36328125, -8.1015625, -6.83984375, -5.578125, -4.31640625, -3.0546875, -1.79296875, -0.53125, 0.73046875, 1.9921875, 3.25390625, 4.515625, 5.77734375, 7.0390625, 8.30078125, 9.5625, 10.82421875, 12.0859375, 13.34765625, 14.609375, 15.87109375, 17.1328125, 18.39453125, 19.65625, 20.91796875, 22.1796875, 23.44140625, 24.703125, 25.96484375, 27.2265625, 28.48828125, 29.75, 31.01171875, 32.2734375, 33.53515625, 34.796875, 36.05859375, 37.3203125, 38.58203125, 39.84375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 12.0, 28.0, 38.0, 56.0, 73.0, 117.0, 170.0, 234.0, 400.0, 578.0, 905.0, 1344.0, 2154.0, 3348.0, 5228.0, 8525.0, 14022.0, 23929.0, 42335.0, 77557.0, 145391.0, 231862.0, 212088.0, 122684.0, 65908.0, 36234.0, 20519.0, 12178.0, 7522.0, 4662.0, 3015.0, 1892.0, 1253.0, 747.0, 510.0, 355.0, 245.0, 161.0, 77.0, 68.0, 34.0, 33.0, 22.0, 13.0, 5.0, 4.0, 5.0, 7.0, 1.0, 2.0], "bins": [-57.71875, -56.109375, -54.5, -52.890625, -51.28125, -49.671875, -48.0625, -46.453125, -44.84375, -43.234375, -41.625, -40.015625, -38.40625, -36.796875, -35.1875, -33.578125, -31.96875, -30.359375, -28.75, -27.140625, -25.53125, -23.921875, -22.3125, -20.703125, -19.09375, -17.484375, -15.875, -14.265625, -12.65625, -11.046875, -9.4375, -7.828125, -6.21875, -4.609375, -3.0, -1.390625, 0.21875, 1.828125, 3.4375, 5.046875, 6.65625, 8.265625, 9.875, 11.484375, 13.09375, 14.703125, 16.3125, 17.921875, 19.53125, 21.140625, 22.75, 24.359375, 25.96875, 27.578125, 29.1875, 30.796875, 32.40625, 34.015625, 35.625, 37.234375, 38.84375, 40.453125, 42.0625, 43.671875, 45.28125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 10.0, 11.0, 8.0, 7.0, 17.0, 15.0, 27.0, 20.0, 26.0, 28.0, 24.0, 34.0, 32.0, 32.0, 47.0, 47.0, 29.0, 34.0, 51.0, 42.0, 25.0, 41.0, 37.0, 42.0, 36.0, 32.0, 41.0, 31.0, 23.0, 22.0, 17.0, 11.0, 15.0, 14.0, 12.0, 10.0, 12.0, 4.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.703125, -27.80517578125, -26.9072265625, -26.00927734375, -25.111328125, -24.21337890625, -23.3154296875, -22.41748046875, -21.51953125, -20.62158203125, -19.7236328125, -18.82568359375, -17.927734375, -17.02978515625, -16.1318359375, -15.23388671875, -14.3359375, -13.43798828125, -12.5400390625, -11.64208984375, -10.744140625, -9.84619140625, -8.9482421875, -8.05029296875, -7.15234375, -6.25439453125, -5.3564453125, -4.45849609375, -3.560546875, -2.66259765625, -1.7646484375, -0.86669921875, 0.03125, 0.92919921875, 1.8271484375, 2.72509765625, 3.623046875, 4.52099609375, 5.4189453125, 6.31689453125, 7.21484375, 8.11279296875, 9.0107421875, 9.90869140625, 10.806640625, 11.70458984375, 12.6025390625, 13.50048828125, 14.3984375, 15.29638671875, 16.1943359375, 17.09228515625, 17.990234375, 18.88818359375, 19.7861328125, 20.68408203125, 21.58203125, 22.47998046875, 23.3779296875, 24.27587890625, 25.173828125, 26.07177734375, 26.9697265625, 27.86767578125, 28.765625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 8.0, 10.0, 16.0, 25.0, 38.0, 58.0, 81.0, 118.0, 149.0, 217.0, 314.0, 454.0, 615.0, 912.0, 1497.0, 2132.0, 3314.0, 5172.0, 8122.0, 12812.0, 20939.0, 35127.0, 59065.0, 98164.0, 152106.0, 188613.0, 166850.0, 114380.0, 69938.0, 41025.0, 24702.0, 14811.0, 9493.0, 5886.0, 3810.0, 2457.0, 1594.0, 1090.0, 777.0, 493.0, 347.0, 261.0, 195.0, 105.0, 86.0, 69.0, 35.0, 22.0, 14.0, 20.0, 10.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-17.25, -16.705078125, -16.16015625, -15.615234375, -15.0703125, -14.525390625, -13.98046875, -13.435546875, -12.890625, -12.345703125, -11.80078125, -11.255859375, -10.7109375, -10.166015625, -9.62109375, -9.076171875, -8.53125, -7.986328125, -7.44140625, -6.896484375, -6.3515625, -5.806640625, -5.26171875, -4.716796875, -4.171875, -3.626953125, -3.08203125, -2.537109375, -1.9921875, -1.447265625, -0.90234375, -0.357421875, 0.1875, 0.732421875, 1.27734375, 1.822265625, 2.3671875, 2.912109375, 3.45703125, 4.001953125, 4.546875, 5.091796875, 5.63671875, 6.181640625, 6.7265625, 7.271484375, 7.81640625, 8.361328125, 8.90625, 9.451171875, 9.99609375, 10.541015625, 11.0859375, 11.630859375, 12.17578125, 12.720703125, 13.265625, 13.810546875, 14.35546875, 14.900390625, 15.4453125, 15.990234375, 16.53515625, 17.080078125, 17.625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 7.0, 5.0, 6.0, 20.0, 20.0, 28.0, 37.0, 56.0, 81.0, 92.0, 98.0, 113.0, 103.0, 85.0, 70.0, 47.0, 36.0, 14.0, 25.0, 16.0, 12.0, 8.0, 4.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029048919677734375, -0.002795189619064331, -0.0026854872703552246, -0.002575784921646118, -0.0024660825729370117, -0.0023563802242279053, -0.002246677875518799, -0.0021369755268096924, -0.002027273178100586, -0.0019175708293914795, -0.001807868480682373, -0.0016981661319732666, -0.0015884637832641602, -0.0014787614345550537, -0.0013690590858459473, -0.0012593567371368408, -0.0011496543884277344, -0.001039952039718628, -0.0009302496910095215, -0.000820547342300415, -0.0007108449935913086, -0.0006011426448822021, -0.0004914402961730957, -0.00038173794746398926, -0.0002720355987548828, -0.00016233325004577637, -5.263090133666992e-05, 5.7071447372436523e-05, 0.00016677379608154297, 0.0002764761447906494, 0.00038617849349975586, 0.0004958808422088623, 0.0006055831909179688, 0.0007152855396270752, 0.0008249878883361816, 0.0009346902370452881, 0.0010443925857543945, 0.001154094934463501, 0.0012637972831726074, 0.0013734996318817139, 0.0014832019805908203, 0.0015929043292999268, 0.0017026066780090332, 0.0018123090267181396, 0.001922011375427246, 0.0020317137241363525, 0.002141416072845459, 0.0022511184215545654, 0.002360820770263672, 0.0024705231189727783, 0.0025802254676818848, 0.002689927816390991, 0.0027996301651000977, 0.002909332513809204, 0.0030190348625183105, 0.003128737211227417, 0.0032384395599365234, 0.00334814190864563, 0.0034578442573547363, 0.0035675466060638428, 0.0036772489547729492, 0.0037869513034820557, 0.003896653652191162, 0.0040063560009002686, 0.004116058349609375]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 11.0, 15.0, 21.0, 36.0, 41.0, 79.0, 129.0, 207.0, 395.0, 645.0, 1170.0, 2262.0, 4306.0, 8952.0, 19996.0, 47486.0, 114719.0, 243569.0, 298366.0, 174295.0, 74422.0, 30946.0, 13356.0, 6305.0, 3087.0, 1673.0, 890.0, 439.0, 281.0, 166.0, 105.0, 54.0, 43.0, 26.0, 14.0, 12.0, 9.0, 4.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.3125, -28.456787109375, -27.60107421875, -26.745361328125, -25.8896484375, -25.033935546875, -24.17822265625, -23.322509765625, -22.466796875, -21.611083984375, -20.75537109375, -19.899658203125, -19.0439453125, -18.188232421875, -17.33251953125, -16.476806640625, -15.62109375, -14.765380859375, -13.90966796875, -13.053955078125, -12.1982421875, -11.342529296875, -10.48681640625, -9.631103515625, -8.775390625, -7.919677734375, -7.06396484375, -6.208251953125, -5.3525390625, -4.496826171875, -3.64111328125, -2.785400390625, -1.9296875, -1.073974609375, -0.21826171875, 0.637451171875, 1.4931640625, 2.348876953125, 3.20458984375, 4.060302734375, 4.916015625, 5.771728515625, 6.62744140625, 7.483154296875, 8.3388671875, 9.194580078125, 10.05029296875, 10.906005859375, 11.76171875, 12.617431640625, 13.47314453125, 14.328857421875, 15.1845703125, 16.040283203125, 16.89599609375, 17.751708984375, 18.607421875, 19.463134765625, 20.31884765625, 21.174560546875, 22.0302734375, 22.885986328125, 23.74169921875, 24.597412109375, 25.453125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 7.0, 10.0, 20.0, 19.0, 22.0, 43.0, 40.0, 41.0, 50.0, 69.0, 65.0, 74.0, 54.0, 61.0, 52.0, 67.0, 48.0, 52.0, 52.0, 34.0, 27.0, 15.0, 17.0, 15.0, 14.0, 8.0, 2.0, 3.0, 5.0, 0.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.9066162109375, -4.723388671875, -4.5401611328125, -4.35693359375, -4.1737060546875, -3.990478515625, -3.8072509765625, -3.6240234375, -3.4407958984375, -3.257568359375, -3.0743408203125, -2.89111328125, -2.7078857421875, -2.524658203125, -2.3414306640625, -2.158203125, -1.9749755859375, -1.791748046875, -1.6085205078125, -1.42529296875, -1.2420654296875, -1.058837890625, -0.8756103515625, -0.6923828125, -0.5091552734375, -0.325927734375, -0.1427001953125, 0.04052734375, 0.2237548828125, 0.406982421875, 0.5902099609375, 0.7734375, 0.9566650390625, 1.139892578125, 1.3231201171875, 1.50634765625, 1.6895751953125, 1.872802734375, 2.0560302734375, 2.2392578125, 2.4224853515625, 2.605712890625, 2.7889404296875, 2.97216796875, 3.1553955078125, 3.338623046875, 3.5218505859375, 3.705078125, 3.8883056640625, 4.071533203125, 4.2547607421875, 4.43798828125, 4.6212158203125, 4.804443359375, 4.9876708984375, 5.1708984375, 5.3541259765625, 5.537353515625, 5.7205810546875, 5.90380859375, 6.0870361328125, 6.270263671875, 6.4534912109375, 6.63671875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 8.0, 6.0, 4.0, 6.0, 8.0, 10.0, 18.0, 29.0, 23.0, 27.0, 45.0, 56.0, 56.0, 61.0, 70.0, 60.0, 66.0, 59.0, 71.0, 54.0, 53.0, 34.0, 39.0, 29.0, 15.0, 20.0, 11.0, 15.0, 12.0, 8.0, 6.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-74.32234954833984, -72.0781478881836, -69.83393859863281, -67.58973693847656, -65.34552764892578, -63.10132598876953, -60.857120513916016, -58.6129150390625, -56.368709564208984, -54.12450408935547, -51.88029861450195, -49.63609313964844, -47.39189147949219, -45.147682189941406, -42.903480529785156, -40.65927505493164, -38.415069580078125, -36.17086410522461, -33.926658630371094, -31.68245506286621, -29.438249588012695, -27.19404411315918, -24.949840545654297, -22.70563507080078, -20.461429595947266, -18.21722412109375, -15.97301959991455, -13.728815078735352, -11.484609603881836, -9.24040412902832, -6.996199607849121, -4.751995086669922, -2.5077896118164062, -0.26358461380004883, 1.9806203842163086, 4.224825382232666, 6.469030380249023, 8.713235855102539, 10.957440376281738, 13.201644897460938, 15.445850372314453, 17.69005584716797, 19.934261322021484, 22.178464889526367, 24.422670364379883, 26.6668758392334, 28.91107940673828, 31.155284881591797, 33.39949035644531, 35.64369583129883, 37.887901306152344, 40.13210678100586, 42.376312255859375, 44.620513916015625, 46.86471939086914, 49.108924865722656, 51.35313034057617, 53.59733581542969, 55.8415412902832, 58.08574676513672, 60.32994842529297, 62.57415771484375, 64.818359375, 67.06256103515625, 69.30677032470703]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 5.0, 5.0, 10.0, 11.0, 13.0, 6.0, 16.0, 13.0, 13.0, 20.0, 20.0, 28.0, 27.0, 25.0, 40.0, 28.0, 29.0, 36.0, 37.0, 38.0, 41.0, 45.0, 31.0, 44.0, 32.0, 36.0, 35.0, 31.0, 25.0, 36.0, 22.0, 27.0, 23.0, 27.0, 21.0, 16.0, 17.0, 11.0, 11.0, 13.0, 4.0, 10.0, 2.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-54.58190155029297, -52.91526412963867, -51.248626708984375, -49.58198928833008, -47.91535186767578, -46.248714447021484, -44.58207702636719, -42.915443420410156, -41.248802185058594, -39.5821647644043, -37.91552734375, -36.2488899230957, -34.582252502441406, -32.91561508178711, -31.248979568481445, -29.58234214782715, -27.915706634521484, -26.249069213867188, -24.58243179321289, -22.915794372558594, -21.249156951904297, -19.58251953125, -17.915884017944336, -16.24924659729004, -14.582609176635742, -12.915971755981445, -11.249334335327148, -9.582697868347168, -7.916060447692871, -6.249423027038574, -4.582786560058594, -2.916149139404297, -1.2495155334472656, 0.41712164878845215, 2.08375883102417, 3.7503957748413086, 5.4170331954956055, 7.083670616149902, 8.750307083129883, 10.41694450378418, 12.083581924438477, 13.750219345092773, 15.41685676574707, 17.083492279052734, 18.75012969970703, 20.416767120361328, 22.083404541015625, 23.750041961669922, 25.41667938232422, 27.083316802978516, 28.749954223632812, 30.41659164428711, 32.083229064941406, 33.7498664855957, 35.41650390625, 37.08313751220703, 38.749778747558594, 40.41641616821289, 42.08305358886719, 43.749691009521484, 45.41632843017578, 47.08296585083008, 48.749603271484375, 50.416236877441406, 52.0828742980957]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 6.0, 7.0, 15.0, 7.0, 10.0, 13.0, 15.0, 19.0, 16.0, 26.0, 27.0, 35.0, 57.0, 69.0, 114.0, 145.0, 238.0, 462.0, 1241.0, 8440.0, 507017.0, 4212.0, 914.0, 376.0, 228.0, 139.0, 79.0, 69.0, 60.0, 25.0, 22.0, 21.0, 18.0, 21.0, 20.0, 16.0, 6.0, 10.0, 6.0, 6.0, 8.0, 7.0, 6.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1316.349609375, -1274.3819580078125, -1232.4141845703125, -1190.446533203125, -1148.4788818359375, -1106.51123046875, -1064.54345703125, -1022.5758056640625, -980.6080932617188, -938.640380859375, -896.6727294921875, -854.7050170898438, -812.7373046875, -770.7696533203125, -728.8019409179688, -686.834228515625, -644.8665771484375, -602.8988647460938, -560.9312133789062, -518.9635009765625, -476.9958190917969, -435.02813720703125, -393.0604248046875, -351.0927429199219, -309.12506103515625, -267.1573791503906, -225.18968200683594, -183.22198486328125, -141.25430297851562, -99.28662109375, -57.31892395019531, -15.351226806640625, 26.6163330078125, 68.58402252197266, 110.55171203613281, 152.5194091796875, 194.48709106445312, 236.45477294921875, 278.4224853515625, 320.3901672363281, 362.35784912109375, 404.3255310058594, 446.293212890625, 488.26092529296875, 530.2286376953125, 572.1962890625, 614.1640014648438, 656.1317138671875, 698.099365234375, 740.0670776367188, 782.0347290039062, 824.00244140625, 865.9700927734375, 907.9378051757812, 949.905517578125, 991.8731689453125, 1033.8408203125, 1075.8084716796875, 1117.7762451171875, 1159.743896484375, 1201.7115478515625, 1243.67919921875, 1285.64697265625, 1327.6146240234375, 1369.5823974609375]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 11.0, 9.0, 14.0, 8.0, 13.0, 14.0, 14.0, 20.0, 20.0, 25.0, 29.0, 23.0, 36.0, 25.0, 37.0, 33.0, 36.0, 40.0, 38.0, 44.0, 1064.0, 37.0, 33.0, 37.0, 36.0, 28.0, 30.0, 27.0, 27.0, 27.0, 23.0, 23.0, 21.0, 19.0, 17.0, 11.0, 12.0, 15.0, 6.0, 8.0, 4.0, 6.0, 8.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1710.0235595703125, -1658.3663330078125, -1606.709228515625, -1555.052001953125, -1503.3948974609375, -1451.7376708984375, -1400.08056640625, -1348.42333984375, -1296.7662353515625, -1245.1090087890625, -1193.451904296875, -1141.794677734375, -1090.1375732421875, -1038.4803466796875, -986.8232421875, -935.166015625, -883.5088500976562, -831.8516845703125, -780.1945190429688, -728.537353515625, -676.8801879882812, -625.2230224609375, -573.5657958984375, -521.90869140625, -470.2514953613281, -418.5943298339844, -366.9371643066406, -315.27996826171875, -263.622802734375, -211.96563720703125, -160.3084716796875, -108.65130615234375, -56.994140625, -5.336971282958984, 46.32019805908203, 97.97737121582031, 149.63453674316406, 201.29171752929688, 252.94888305664062, 304.6060485839844, 356.2632141113281, 407.9203796386719, 459.5775451660156, 511.2347412109375, 562.8919067382812, 614.549072265625, 666.2062377929688, 717.8634033203125, 769.5205688476562, 821.177734375, 872.8348999023438, 924.4920654296875, 976.1492309570312, 1027.806396484375, 1079.463623046875, 1131.1207275390625, 1182.7779541015625, 1234.4351806640625, 1286.09228515625, 1337.74951171875, 1389.4066162109375, 1441.0638427734375, 1492.720947265625, 1544.378173828125, 1596.0352783203125]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 3.0, 3.0, 8.0, 8.0, 9.0, 13.0, 15.0, 16.0, 21.0, 26.0, 40.0, 55.0, 67.0, 105.0, 156.0, 229.0, 386.0, 586.0, 908.0, 1159.0, 1701.0, 2873.0, 6642.0, 31185760.0, 38321.0, 7400.0, 5903.0, 763.0, 455.0, 241.0, 188.0, 98.0, 91.0, 60.0, 37.0, 31.0, 20.0, 19.0, 16.0, 11.0, 11.0, 4.0, 15.0, 5.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1258.243408203125, -1216.0384521484375, -1173.83349609375, -1131.62841796875, -1089.4234619140625, -1047.218505859375, -1005.0134887695312, -962.8084716796875, -920.603515625, -878.3985595703125, -836.1935424804688, -793.988525390625, -751.7835693359375, -709.57861328125, -667.3735961914062, -625.1685791015625, -582.963623046875, -540.7586669921875, -498.55364990234375, -456.3486633300781, -414.1436767578125, -371.9386901855469, -329.73370361328125, -287.5287170410156, -245.32373046875, -203.11874389648438, -160.91375732421875, -118.70877075195312, -76.5037841796875, -34.298797607421875, 7.90618896484375, 50.111175537109375, 92.3160400390625, 134.52102661132812, 176.72601318359375, 218.93099975585938, 261.135986328125, 303.3409729003906, 345.54595947265625, 387.7509460449219, 429.9559326171875, 472.1609191894531, 514.3659057617188, 556.5709228515625, 598.77587890625, 640.9808349609375, 683.1858520507812, 725.390869140625, 767.5958251953125, 809.80078125, 852.0057983398438, 894.2108154296875, 936.415771484375, 978.6207275390625, 1020.8257446289062, 1063.03076171875, 1105.2357177734375, 1147.440673828125, 1189.645751953125, 1231.8507080078125, 1274.0556640625, 1316.2606201171875, 1358.465576171875, 1400.670654296875, 1442.8756103515625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 12.0, 12.0, 16.0, 22.0, 28.0, 49.0, 56.0, 57.0, 83.0, 123.0, 95.0, 105.0, 78.0, 64.0, 52.0, 38.0, 21.0, 28.0, 17.0, 18.0, 4.0, 3.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1172.977783203125, -1138.875244140625, -1104.7725830078125, -1070.6700439453125, -1036.5673828125, -1002.46484375, -968.3623046875, -934.2597045898438, -900.1571044921875, -866.0545043945312, -831.951904296875, -797.849365234375, -763.7467651367188, -729.6441650390625, -695.5416259765625, -661.4390258789062, -627.33642578125, -593.2338256835938, -559.1312255859375, -525.0286865234375, -490.92608642578125, -456.823486328125, -422.7209167480469, -388.61834716796875, -354.5157470703125, -320.41314697265625, -286.3105773925781, -252.20799255371094, -218.10540771484375, -184.00282287597656, -149.90023803710938, -115.79765319824219, -81.6949462890625, -47.59236145019531, -13.489776611328125, 20.612808227539062, 54.71539306640625, 88.81797790527344, 122.92056274414062, 157.0231475830078, 191.125732421875, 225.2283172607422, 259.3309020996094, 293.4334716796875, 327.53607177734375, 361.638671875, 395.7412414550781, 429.84381103515625, 463.9464111328125, 498.04901123046875, 532.151611328125, 566.254150390625, 600.3567504882812, 634.4593505859375, 668.5618896484375, 702.6644897460938, 736.76708984375, 770.8696899414062, 804.9722900390625, 839.0748291015625, 873.1774291992188, 907.280029296875, 941.382568359375, 975.4851684570312, 1009.5877685546875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 12.0, 8.0, 14.0, 15.0, 20.0, 18.0, 15.0, 20.0, 36.0, 32.0, 39.0, 45.0, 51.0, 67.0, 81.0, 77.0, 58.0, 61.0, 45.0, 49.0, 38.0, 23.0, 22.0, 35.0, 23.0, 23.0, 9.0, 11.0, 8.0, 12.0, 3.0, 5.0, 5.0, 3.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-867.371826171875, -841.8292846679688, -816.2867431640625, -790.7442626953125, -765.2017211914062, -739.6591796875, -714.1166381835938, -688.5740966796875, -663.0316162109375, -637.4890747070312, -611.946533203125, -586.404052734375, -560.8615112304688, -535.3189697265625, -509.77642822265625, -484.23388671875, -458.69134521484375, -433.1488037109375, -407.6062927246094, -382.0637512207031, -356.521240234375, -330.97869873046875, -305.4361572265625, -279.89361572265625, -254.35110473632812, -228.80857849121094, -203.26605224609375, -177.7235107421875, -152.1809844970703, -126.63845825195312, -101.09591674804688, -75.55339050292969, -50.01092529296875, -24.468395233154297, 1.0741348266601562, 26.616668701171875, 52.15919494628906, 77.70172119140625, 103.2442626953125, 128.7867889404297, 154.32931518554688, 179.87184143066406, 205.41436767578125, 230.9569091796875, 256.49945068359375, 282.0419616699219, 307.5845031738281, 333.12701416015625, 358.6695556640625, 384.21209716796875, 409.7546081542969, 435.2971496582031, 460.83966064453125, 486.3822021484375, 511.92474365234375, 537.46728515625, 563.009765625, 588.5523071289062, 614.0948486328125, 639.6373291015625, 665.1798706054688, 690.722412109375, 716.2649536132812, 741.8074951171875, 767.3500366210938]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 5.0, 9.0, 10.0, 20.0, 36.0, 60.0, 89.0, 116.0, 173.0, 324.0, 515.0, 960.0, 1676.0, 2979.0, 5460.0, 10053.0, 19106.0, 37253.0, 74229.0, 153144.0, 328141.0, 729805.0, 1548753.0, 681803.0, 304070.0, 146010.0, 71621.0, 36034.0, 18652.0, 9895.0, 5348.0, 3039.0, 1897.0, 1109.0, 674.0, 425.0, 257.0, 172.0, 130.0, 88.0, 47.0, 41.0, 19.0, 11.0, 9.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.90625, -13.434326171875, -12.96240234375, -12.490478515625, -12.0185546875, -11.546630859375, -11.07470703125, -10.602783203125, -10.130859375, -9.658935546875, -9.18701171875, -8.715087890625, -8.2431640625, -7.771240234375, -7.29931640625, -6.827392578125, -6.35546875, -5.883544921875, -5.41162109375, -4.939697265625, -4.4677734375, -3.995849609375, -3.52392578125, -3.052001953125, -2.580078125, -2.108154296875, -1.63623046875, -1.164306640625, -0.6923828125, -0.220458984375, 0.25146484375, 0.723388671875, 1.1953125, 1.667236328125, 2.13916015625, 2.611083984375, 3.0830078125, 3.554931640625, 4.02685546875, 4.498779296875, 4.970703125, 5.442626953125, 5.91455078125, 6.386474609375, 6.8583984375, 7.330322265625, 7.80224609375, 8.274169921875, 8.74609375, 9.218017578125, 9.68994140625, 10.161865234375, 10.6337890625, 11.105712890625, 11.57763671875, 12.049560546875, 12.521484375, 12.993408203125, 13.46533203125, 13.937255859375, 14.4091796875, 14.881103515625, 15.35302734375, 15.824951171875, 16.296875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 9.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 12.0, 17.0, 22.0, 26.0, 35.0, 42.0, 27.0, 44.0, 49.0, 52.0, 62.0, 55.0, 51.0, 61.0, 46.0, 53.0, 38.0, 41.0, 33.0, 37.0, 30.0, 22.0, 24.0, 19.0, 21.0, 14.0, 9.0, 11.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94873046875, -0.9117202758789062, -0.8747100830078125, -0.8376998901367188, -0.800689697265625, -0.7636795043945312, -0.7266693115234375, -0.6896591186523438, -0.65264892578125, -0.6156387329101562, -0.5786285400390625, -0.5416183471679688, -0.504608154296875, -0.46759796142578125, -0.4305877685546875, -0.39357757568359375, -0.3565673828125, -0.31955718994140625, -0.2825469970703125, -0.24553680419921875, -0.208526611328125, -0.17151641845703125, -0.1345062255859375, -0.09749603271484375, -0.06048583984375, -0.02347564697265625, 0.0135345458984375, 0.05054473876953125, 0.087554931640625, 0.12456512451171875, 0.1615753173828125, 0.19858551025390625, 0.235595703125, 0.27260589599609375, 0.3096160888671875, 0.34662628173828125, 0.383636474609375, 0.42064666748046875, 0.4576568603515625, 0.49466705322265625, 0.53167724609375, 0.5686874389648438, 0.6056976318359375, 0.6427078247070312, 0.679718017578125, 0.7167282104492188, 0.7537384033203125, 0.7907485961914062, 0.8277587890625, 0.8647689819335938, 0.9017791748046875, 0.9387893676757812, 0.975799560546875, 1.0128097534179688, 1.0498199462890625, 1.0868301391601562, 1.12384033203125, 1.1608505249023438, 1.1978607177734375, 1.2348709106445312, 1.271881103515625, 1.3088912963867188, 1.3459014892578125, 1.3829116821289062, 1.419921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 12.0, 10.0, 20.0, 33.0, 58.0, 72.0, 129.0, 224.0, 399.0, 764.0, 1557.0, 3416.0, 8156.0, 21616.0, 62998.0, 209395.0, 736860.0, 1911919.0, 874176.0, 248262.0, 73324.0, 24396.0, 9117.0, 3685.0, 1742.0, 836.0, 454.0, 240.0, 132.0, 95.0, 56.0, 24.0, 23.0, 23.0, 14.0, 8.0, 6.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.1328125, -14.6031494140625, -14.073486328125, -13.5438232421875, -13.01416015625, -12.4844970703125, -11.954833984375, -11.4251708984375, -10.8955078125, -10.3658447265625, -9.836181640625, -9.3065185546875, -8.77685546875, -8.2471923828125, -7.717529296875, -7.1878662109375, -6.658203125, -6.1285400390625, -5.598876953125, -5.0692138671875, -4.53955078125, -4.0098876953125, -3.480224609375, -2.9505615234375, -2.4208984375, -1.8912353515625, -1.361572265625, -0.8319091796875, -0.30224609375, 0.2274169921875, 0.757080078125, 1.2867431640625, 1.81640625, 2.3460693359375, 2.875732421875, 3.4053955078125, 3.93505859375, 4.4647216796875, 4.994384765625, 5.5240478515625, 6.0537109375, 6.5833740234375, 7.113037109375, 7.6427001953125, 8.17236328125, 8.7020263671875, 9.231689453125, 9.7613525390625, 10.291015625, 10.8206787109375, 11.350341796875, 11.8800048828125, 12.40966796875, 12.9393310546875, 13.468994140625, 13.9986572265625, 14.5283203125, 15.0579833984375, 15.587646484375, 16.1173095703125, 16.64697265625, 17.1766357421875, 17.706298828125, 18.2359619140625, 18.765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 6.0, 7.0, 12.0, 16.0, 16.0, 35.0, 32.0, 40.0, 51.0, 51.0, 61.0, 71.0, 95.0, 133.0, 130.0, 174.0, 186.0, 189.0, 219.0, 239.0, 297.0, 287.0, 248.0, 218.0, 175.0, 179.0, 156.0, 132.0, 130.0, 106.0, 77.0, 66.0, 54.0, 39.0, 26.0, 23.0, 21.0, 12.0, 11.0, 10.0, 9.0, 7.0, 4.0, 4.0, 5.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.20703125, -3.106719970703125, -3.00640869140625, -2.906097412109375, -2.8057861328125, -2.705474853515625, -2.60516357421875, -2.504852294921875, -2.404541015625, -2.304229736328125, -2.20391845703125, -2.103607177734375, -2.0032958984375, -1.902984619140625, -1.80267333984375, -1.702362060546875, -1.60205078125, -1.501739501953125, -1.40142822265625, -1.301116943359375, -1.2008056640625, -1.100494384765625, -1.00018310546875, -0.899871826171875, -0.799560546875, -0.699249267578125, -0.59893798828125, -0.498626708984375, -0.3983154296875, -0.298004150390625, -0.19769287109375, -0.097381591796875, 0.0029296875, 0.103240966796875, 0.20355224609375, 0.303863525390625, 0.4041748046875, 0.504486083984375, 0.60479736328125, 0.705108642578125, 0.805419921875, 0.905731201171875, 1.00604248046875, 1.106353759765625, 1.2066650390625, 1.306976318359375, 1.40728759765625, 1.507598876953125, 1.60791015625, 1.708221435546875, 1.80853271484375, 1.908843994140625, 2.0091552734375, 2.109466552734375, 2.20977783203125, 2.310089111328125, 2.410400390625, 2.510711669921875, 2.61102294921875, 2.711334228515625, 2.8116455078125, 2.911956787109375, 3.01226806640625, 3.112579345703125, 3.212890625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 7.0, 11.0, 24.0, 23.0, 35.0, 30.0, 43.0, 68.0, 83.0, 79.0, 68.0, 93.0, 62.0, 69.0, 76.0, 41.0, 37.0, 38.0, 26.0, 18.0, 16.0, 4.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.671653747558594, -42.30682373046875, -40.94199752807617, -39.57716751098633, -38.21234130859375, -36.847511291503906, -35.48268508911133, -34.117855072021484, -32.753028869628906, -31.388200759887695, -30.023372650146484, -28.658544540405273, -27.293716430664062, -25.92888832092285, -24.56406021118164, -23.199230194091797, -21.834402084350586, -20.469573974609375, -19.104745864868164, -17.739917755126953, -16.375089645385742, -15.010261535644531, -13.645432472229004, -12.280604362487793, -10.915776252746582, -9.550948143005371, -8.18612003326416, -6.821291446685791, -5.45646333694458, -4.091635227203369, -2.726806640625, -1.361978530883789, 0.002849578857421875, 1.3676778078079224, 2.732506036758423, 4.097334384918213, 5.462162494659424, 6.826990604400635, 8.191819190979004, 9.556647300720215, 10.921475410461426, 12.286303520202637, 13.651131629943848, 15.015960693359375, 16.380788803100586, 17.745616912841797, 19.110445022583008, 20.47527313232422, 21.84010124206543, 23.20492935180664, 24.56975746154785, 25.934585571289062, 27.299413681030273, 28.664241790771484, 30.029071807861328, 31.393898010253906, 32.75872802734375, 34.123558044433594, 35.48838424682617, 36.853214263916016, 38.218040466308594, 39.58287048339844, 40.947696685791016, 42.31252670288086, 43.67735290527344]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 8.0, 9.0, 18.0, 13.0, 19.0, 13.0, 26.0, 31.0, 23.0, 28.0, 24.0, 46.0, 53.0, 41.0, 57.0, 58.0, 55.0, 52.0, 45.0, 46.0, 51.0, 44.0, 43.0, 34.0, 29.0, 23.0, 33.0, 15.0, 14.0, 9.0, 9.0, 8.0, 3.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.58348846435547, -27.757017135620117, -26.930545806884766, -26.104074478149414, -25.277603149414062, -24.451133728027344, -23.62466049194336, -22.79819107055664, -21.97171974182129, -21.145248413085938, -20.318777084350586, -19.492305755615234, -18.665834426879883, -17.83936309814453, -17.012893676757812, -16.18642234802246, -15.359950065612793, -14.533478736877441, -13.70700740814209, -12.880537033081055, -12.054065704345703, -11.227594375610352, -10.401123046875, -9.574651718139648, -8.748180389404297, -7.921709060668945, -7.095238208770752, -6.2687668800354, -5.442296028137207, -4.6158246994018555, -3.789353370666504, -2.9628825187683105, -2.136411666870117, -1.3099405765533447, -0.4834693670272827, 0.3430018424987793, 1.1694729328155518, 1.9959440231323242, 2.822415351867676, 3.648886203765869, 4.475357532501221, 5.301828861236572, 6.128299713134766, 6.954771041870117, 7.781242370605469, 8.60771369934082, 9.434185028076172, 10.260655403137207, 11.087126731872559, 11.91359806060791, 12.740069389343262, 13.566539764404297, 14.393011093139648, 15.219482421875, 16.04595375061035, 16.872425079345703, 17.698896408081055, 18.525367736816406, 19.351839065551758, 20.17831039428711, 21.00478172302246, 21.831253051757812, 22.65772247314453, 23.484193801879883, 24.310665130615234]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 8.0, 9.0, 9.0, 13.0, 26.0, 43.0, 70.0, 80.0, 123.0, 197.0, 337.0, 548.0, 878.0, 1579.0, 2674.0, 4755.0, 8568.0, 15444.0, 29273.0, 59094.0, 124417.0, 253679.0, 271902.0, 138659.0, 65132.0, 32592.0, 17018.0, 9063.0, 5112.0, 2959.0, 1705.0, 958.0, 582.0, 372.0, 229.0, 154.0, 96.0, 54.0, 42.0, 28.0, 28.0, 15.0, 12.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.40625, -9.121826171875, -8.83740234375, -8.552978515625, -8.2685546875, -7.984130859375, -7.69970703125, -7.415283203125, -7.130859375, -6.846435546875, -6.56201171875, -6.277587890625, -5.9931640625, -5.708740234375, -5.42431640625, -5.139892578125, -4.85546875, -4.571044921875, -4.28662109375, -4.002197265625, -3.7177734375, -3.433349609375, -3.14892578125, -2.864501953125, -2.580078125, -2.295654296875, -2.01123046875, -1.726806640625, -1.4423828125, -1.157958984375, -0.87353515625, -0.589111328125, -0.3046875, -0.020263671875, 0.26416015625, 0.548583984375, 0.8330078125, 1.117431640625, 1.40185546875, 1.686279296875, 1.970703125, 2.255126953125, 2.53955078125, 2.823974609375, 3.1083984375, 3.392822265625, 3.67724609375, 3.961669921875, 4.24609375, 4.530517578125, 4.81494140625, 5.099365234375, 5.3837890625, 5.668212890625, 5.95263671875, 6.237060546875, 6.521484375, 6.805908203125, 7.09033203125, 7.374755859375, 7.6591796875, 7.943603515625, 8.22802734375, 8.512451171875, 8.796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 3.0, 18.0, 14.0, 9.0, 22.0, 25.0, 27.0, 36.0, 16.0, 57.0, 42.0, 38.0, 49.0, 51.0, 42.0, 39.0, 55.0, 56.0, 41.0, 40.0, 39.0, 43.0, 25.0, 32.0, 28.0, 26.0, 24.0, 21.0, 16.0, 12.0, 15.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.029296875, -0.9892578125, -0.94921875, -0.9091796875, -0.869140625, -0.8291015625, -0.7890625, -0.7490234375, -0.708984375, -0.6689453125, -0.62890625, -0.5888671875, -0.548828125, -0.5087890625, -0.46875, -0.4287109375, -0.388671875, -0.3486328125, -0.30859375, -0.2685546875, -0.228515625, -0.1884765625, -0.1484375, -0.1083984375, -0.068359375, -0.0283203125, 0.01171875, 0.0517578125, 0.091796875, 0.1318359375, 0.171875, 0.2119140625, 0.251953125, 0.2919921875, 0.33203125, 0.3720703125, 0.412109375, 0.4521484375, 0.4921875, 0.5322265625, 0.572265625, 0.6123046875, 0.65234375, 0.6923828125, 0.732421875, 0.7724609375, 0.8125, 0.8525390625, 0.892578125, 0.9326171875, 0.97265625, 1.0126953125, 1.052734375, 1.0927734375, 1.1328125, 1.1728515625, 1.212890625, 1.2529296875, 1.29296875, 1.3330078125, 1.373046875, 1.4130859375, 1.453125, 1.4931640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 7.0, 5.0, 14.0, 9.0, 23.0, 28.0, 58.0, 104.0, 203.0, 426.0, 1176.0, 3421.0, 14486.0, 125327.0, 798334.0, 88196.0, 11737.0, 3123.0, 1012.0, 421.0, 189.0, 93.0, 50.0, 37.0, 25.0, 11.0, 14.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.7431640625, -19.048828125, -18.3544921875, -17.66015625, -16.9658203125, -16.271484375, -15.5771484375, -14.8828125, -14.1884765625, -13.494140625, -12.7998046875, -12.10546875, -11.4111328125, -10.716796875, -10.0224609375, -9.328125, -8.6337890625, -7.939453125, -7.2451171875, -6.55078125, -5.8564453125, -5.162109375, -4.4677734375, -3.7734375, -3.0791015625, -2.384765625, -1.6904296875, -0.99609375, -0.3017578125, 0.392578125, 1.0869140625, 1.78125, 2.4755859375, 3.169921875, 3.8642578125, 4.55859375, 5.2529296875, 5.947265625, 6.6416015625, 7.3359375, 8.0302734375, 8.724609375, 9.4189453125, 10.11328125, 10.8076171875, 11.501953125, 12.1962890625, 12.890625, 13.5849609375, 14.279296875, 14.9736328125, 15.66796875, 16.3623046875, 17.056640625, 17.7509765625, 18.4453125, 19.1396484375, 19.833984375, 20.5283203125, 21.22265625, 21.9169921875, 22.611328125, 23.3056640625, 24.0]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 5.0, 17.0, 17.0, 11.0, 9.0, 10.0, 22.0, 24.0, 23.0, 28.0, 29.0, 31.0, 32.0, 44.0, 31.0, 56.0, 46.0, 41.0, 42.0, 34.0, 52.0, 42.0, 47.0, 39.0, 26.0, 42.0, 30.0, 26.0, 23.0, 18.0, 15.0, 16.0, 16.0, 12.0, 11.0, 5.0, 3.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.90234375, -7.69012451171875, -7.4779052734375, -7.26568603515625, -7.053466796875, -6.84124755859375, -6.6290283203125, -6.41680908203125, -6.20458984375, -5.99237060546875, -5.7801513671875, -5.56793212890625, -5.355712890625, -5.14349365234375, -4.9312744140625, -4.71905517578125, -4.5068359375, -4.29461669921875, -4.0823974609375, -3.87017822265625, -3.657958984375, -3.44573974609375, -3.2335205078125, -3.02130126953125, -2.80908203125, -2.59686279296875, -2.3846435546875, -2.17242431640625, -1.960205078125, -1.74798583984375, -1.5357666015625, -1.32354736328125, -1.111328125, -0.89910888671875, -0.6868896484375, -0.47467041015625, -0.262451171875, -0.05023193359375, 0.1619873046875, 0.37420654296875, 0.58642578125, 0.79864501953125, 1.0108642578125, 1.22308349609375, 1.435302734375, 1.64752197265625, 1.8597412109375, 2.07196044921875, 2.2841796875, 2.49639892578125, 2.7086181640625, 2.92083740234375, 3.133056640625, 3.34527587890625, 3.5574951171875, 3.76971435546875, 3.98193359375, 4.19415283203125, 4.4063720703125, 4.61859130859375, 4.830810546875, 5.04302978515625, 5.2552490234375, 5.46746826171875, 5.6796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 9.0, 8.0, 12.0, 20.0, 23.0, 37.0, 54.0, 100.0, 135.0, 255.0, 472.0, 871.0, 1887.0, 4158.0, 13197.0, 81822.0, 832189.0, 90905.0, 14046.0, 4444.0, 1832.0, 879.0, 475.0, 270.0, 158.0, 97.0, 54.0, 51.0, 30.0, 17.0, 14.0, 5.0, 9.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-32.875, -31.949462890625, -31.02392578125, -30.098388671875, -29.1728515625, -28.247314453125, -27.32177734375, -26.396240234375, -25.470703125, -24.545166015625, -23.61962890625, -22.694091796875, -21.7685546875, -20.843017578125, -19.91748046875, -18.991943359375, -18.06640625, -17.140869140625, -16.21533203125, -15.289794921875, -14.3642578125, -13.438720703125, -12.51318359375, -11.587646484375, -10.662109375, -9.736572265625, -8.81103515625, -7.885498046875, -6.9599609375, -6.034423828125, -5.10888671875, -4.183349609375, -3.2578125, -2.332275390625, -1.40673828125, -0.481201171875, 0.4443359375, 1.369873046875, 2.29541015625, 3.220947265625, 4.146484375, 5.072021484375, 5.99755859375, 6.923095703125, 7.8486328125, 8.774169921875, 9.69970703125, 10.625244140625, 11.55078125, 12.476318359375, 13.40185546875, 14.327392578125, 15.2529296875, 16.178466796875, 17.10400390625, 18.029541015625, 18.955078125, 19.880615234375, 20.80615234375, 21.731689453125, 22.6572265625, 23.582763671875, 24.50830078125, 25.433837890625, 26.359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 14.0, 16.0, 32.0, 50.0, 92.0, 144.0, 185.0, 174.0, 111.0, 72.0, 29.0, 30.0, 18.0, 10.0, 5.0, 3.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00171661376953125, -0.0016687065362930298, -0.0016207993030548096, -0.0015728920698165894, -0.0015249848365783691, -0.001477077603340149, -0.0014291703701019287, -0.0013812631368637085, -0.0013333559036254883, -0.001285448670387268, -0.0012375414371490479, -0.0011896342039108276, -0.0011417269706726074, -0.0010938197374343872, -0.001045912504196167, -0.0009980052709579468, -0.0009500980377197266, -0.0009021908044815063, -0.0008542835712432861, -0.0008063763380050659, -0.0007584691047668457, -0.0007105618715286255, -0.0006626546382904053, -0.0006147474050521851, -0.0005668401718139648, -0.0005189329385757446, -0.0004710257053375244, -0.0004231184720993042, -0.000375211238861084, -0.00032730400562286377, -0.00027939677238464355, -0.00023148953914642334, -0.00018358230590820312, -0.0001356750726699829, -8.77678394317627e-05, -3.986060619354248e-05, 8.046627044677734e-06, 5.595386028289795e-05, 0.00010386109352111816, 0.00015176832675933838, 0.0001996755599975586, 0.0002475827932357788, 0.000295490026473999, 0.00034339725971221924, 0.00039130449295043945, 0.00043921172618865967, 0.0004871189594268799, 0.0005350261926651001, 0.0005829334259033203, 0.0006308406591415405, 0.0006787478923797607, 0.000726655125617981, 0.0007745623588562012, 0.0008224695920944214, 0.0008703768253326416, 0.0009182840585708618, 0.000966191291809082, 0.0010140985250473022, 0.0010620057582855225, 0.0011099129915237427, 0.0011578202247619629, 0.001205727458000183, 0.0012536346912384033, 0.0013015419244766235, 0.0013494491577148438]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 6.0, 6.0, 12.0, 13.0, 16.0, 25.0, 37.0, 53.0, 68.0, 101.0, 142.0, 224.0, 382.0, 670.0, 1079.0, 1974.0, 3863.0, 9334.0, 26877.0, 128329.0, 638010.0, 182225.0, 34135.0, 10863.0, 4525.0, 2347.0, 1230.0, 744.0, 444.0, 264.0, 175.0, 100.0, 82.0, 58.0, 45.0, 31.0, 12.0, 13.0, 10.0, 8.0, 5.0, 3.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.609375, -17.03369140625, -16.4580078125, -15.88232421875, -15.306640625, -14.73095703125, -14.1552734375, -13.57958984375, -13.00390625, -12.42822265625, -11.8525390625, -11.27685546875, -10.701171875, -10.12548828125, -9.5498046875, -8.97412109375, -8.3984375, -7.82275390625, -7.2470703125, -6.67138671875, -6.095703125, -5.52001953125, -4.9443359375, -4.36865234375, -3.79296875, -3.21728515625, -2.6416015625, -2.06591796875, -1.490234375, -0.91455078125, -0.3388671875, 0.23681640625, 0.8125, 1.38818359375, 1.9638671875, 2.53955078125, 3.115234375, 3.69091796875, 4.2666015625, 4.84228515625, 5.41796875, 5.99365234375, 6.5693359375, 7.14501953125, 7.720703125, 8.29638671875, 8.8720703125, 9.44775390625, 10.0234375, 10.59912109375, 11.1748046875, 11.75048828125, 12.326171875, 12.90185546875, 13.4775390625, 14.05322265625, 14.62890625, 15.20458984375, 15.7802734375, 16.35595703125, 16.931640625, 17.50732421875, 18.0830078125, 18.65869140625, 19.234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 3.0, 4.0, 5.0, 7.0, 12.0, 12.0, 12.0, 11.0, 17.0, 10.0, 33.0, 21.0, 34.0, 40.0, 48.0, 50.0, 40.0, 63.0, 81.0, 75.0, 64.0, 55.0, 41.0, 43.0, 33.0, 32.0, 23.0, 25.0, 24.0, 16.0, 9.0, 8.0, 14.0, 5.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.90234375, -6.69805908203125, -6.4937744140625, -6.28948974609375, -6.085205078125, -5.88092041015625, -5.6766357421875, -5.47235107421875, -5.26806640625, -5.06378173828125, -4.8594970703125, -4.65521240234375, -4.450927734375, -4.24664306640625, -4.0423583984375, -3.83807373046875, -3.6337890625, -3.42950439453125, -3.2252197265625, -3.02093505859375, -2.816650390625, -2.61236572265625, -2.4080810546875, -2.20379638671875, -1.99951171875, -1.79522705078125, -1.5909423828125, -1.38665771484375, -1.182373046875, -0.97808837890625, -0.7738037109375, -0.56951904296875, -0.365234375, -0.16094970703125, 0.0433349609375, 0.24761962890625, 0.451904296875, 0.65618896484375, 0.8604736328125, 1.06475830078125, 1.26904296875, 1.47332763671875, 1.6776123046875, 1.88189697265625, 2.086181640625, 2.29046630859375, 2.4947509765625, 2.69903564453125, 2.9033203125, 3.10760498046875, 3.3118896484375, 3.51617431640625, 3.720458984375, 3.92474365234375, 4.1290283203125, 4.33331298828125, 4.53759765625, 4.74188232421875, 4.9461669921875, 5.15045166015625, 5.354736328125, 5.55902099609375, 5.7633056640625, 5.96759033203125, 6.171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 9.0, 22.0, 39.0, 59.0, 170.0, 279.0, 202.0, 97.0, 63.0, 19.0, 14.0, 7.0, 8.0, 6.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.50115966796875, -127.12567901611328, -121.75019836425781, -116.37471771240234, -110.99923706054688, -105.6237564086914, -100.24827575683594, -94.87279510498047, -89.497314453125, -84.12183380126953, -78.74635314941406, -73.3708724975586, -67.99539184570312, -62.619911193847656, -57.24443054199219, -51.86894989013672, -46.49346923828125, -41.11798858642578, -35.74250793457031, -30.367027282714844, -24.991546630859375, -19.616065979003906, -14.240585327148438, -8.865104675292969, -3.4896240234375, 1.8858566284179688, 7.2613372802734375, 12.636817932128906, 18.012298583984375, 23.387779235839844, 28.763259887695312, 34.13874053955078, 39.51420593261719, 44.889686584472656, 50.265167236328125, 55.640647888183594, 61.01612854003906, 66.39160919189453, 71.76708984375, 77.14257049560547, 82.51805114746094, 87.8935317993164, 93.26901245117188, 98.64449310302734, 104.01997375488281, 109.39545440673828, 114.77093505859375, 120.14641571044922, 125.52189636230469, 130.89736938476562, 136.27285766601562, 141.64834594726562, 147.02381896972656, 152.3992919921875, 157.7747802734375, 163.1502685546875, 168.52574157714844, 173.90121459960938, 179.27670288085938, 184.65219116210938, 190.0276641845703, 195.40313720703125, 200.77862548828125, 206.15411376953125, 211.5295867919922]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 5.0, 0.0, 1.0, 6.0, 5.0, 8.0, 5.0, 13.0, 14.0, 35.0, 22.0, 56.0, 75.0, 84.0, 113.0, 106.0, 113.0, 105.0, 69.0, 46.0, 23.0, 18.0, 18.0, 11.0, 9.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.6932373046875, -106.21023559570312, -102.72723388671875, -99.24423217773438, -95.76123046875, -92.27822875976562, -88.79522705078125, -85.31222534179688, -81.8292236328125, -78.34622192382812, -74.86322021484375, -71.38021850585938, -67.897216796875, -64.41421508789062, -60.93121337890625, -57.448211669921875, -53.965213775634766, -50.48221206665039, -46.999210357666016, -43.51620864868164, -40.033206939697266, -36.550209045410156, -33.06720733642578, -29.584203720092773, -26.1012020111084, -22.618200302124023, -19.13519859313965, -15.65219783782959, -12.169196128845215, -8.686195373535156, -5.203193664550781, -1.7201919555664062, 1.7628097534179688, 5.245811462402344, 8.728813171386719, 12.211813926696777, 15.694815635681152, 19.17781639099121, 22.660818099975586, 26.14381980895996, 29.626821517944336, 33.10982131958008, 36.59282302856445, 40.07582473754883, 43.5588264465332, 47.04182815551758, 50.52482986450195, 54.00783157348633, 57.4908332824707, 60.97383499145508, 64.45683288574219, 67.93983459472656, 71.42283630371094, 74.90583801269531, 78.38883972167969, 81.87184143066406, 85.35484313964844, 88.83784484863281, 92.32084655761719, 95.80384826660156, 99.28684997558594, 102.76985168457031, 106.25285339355469, 109.73585510253906, 113.21885681152344]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 5.0, 1.0, 1.0, 2.0, 9.0, 5.0, 7.0, 7.0, 12.0, 26.0, 36.0, 54.0, 77.0, 103.0, 171.0, 225.0, 388.0, 621.0, 1100.0, 1871.0, 3333.0, 6032.0, 11274.0, 22223.0, 45411.0, 98439.0, 251389.0, 2897844.0, 557003.0, 160107.0, 68347.0, 32295.0, 16365.0, 8605.0, 4607.0, 2563.0, 1481.0, 861.0, 535.0, 315.0, 183.0, 131.0, 68.0, 43.0, 43.0, 22.0, 14.0, 9.0, 12.0, 5.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.4375, -25.60546875, -24.7734375, -23.94140625, -23.109375, -22.27734375, -21.4453125, -20.61328125, -19.78125, -18.94921875, -18.1171875, -17.28515625, -16.453125, -15.62109375, -14.7890625, -13.95703125, -13.125, -12.29296875, -11.4609375, -10.62890625, -9.796875, -8.96484375, -8.1328125, -7.30078125, -6.46875, -5.63671875, -4.8046875, -3.97265625, -3.140625, -2.30859375, -1.4765625, -0.64453125, 0.1875, 1.01953125, 1.8515625, 2.68359375, 3.515625, 4.34765625, 5.1796875, 6.01171875, 6.84375, 7.67578125, 8.5078125, 9.33984375, 10.171875, 11.00390625, 11.8359375, 12.66796875, 13.5, 14.33203125, 15.1640625, 15.99609375, 16.828125, 17.66015625, 18.4921875, 19.32421875, 20.15625, 20.98828125, 21.8203125, 22.65234375, 23.484375, 24.31640625, 25.1484375, 25.98046875, 26.8125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 5.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 3.0, 8.0, 12.0, 13.0, 21.0, 18.0, 23.0, 31.0, 28.0, 49.0, 37.0, 40.0, 40.0, 45.0, 40.0, 45.0, 49.0, 39.0, 52.0, 43.0, 40.0, 42.0, 37.0, 32.0, 26.0, 34.0, 24.0, 18.0, 24.0, 18.0, 11.0, 10.0, 9.0, 3.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.0431060791015625, -1.002227783203125, -0.9613494873046875, -0.92047119140625, -0.8795928955078125, -0.838714599609375, -0.7978363037109375, -0.7569580078125, -0.7160797119140625, -0.675201416015625, -0.6343231201171875, -0.59344482421875, -0.5525665283203125, -0.511688232421875, -0.4708099365234375, -0.429931640625, -0.3890533447265625, -0.348175048828125, -0.3072967529296875, -0.26641845703125, -0.2255401611328125, -0.184661865234375, -0.1437835693359375, -0.1029052734375, -0.0620269775390625, -0.021148681640625, 0.0197296142578125, 0.06060791015625, 0.1014862060546875, 0.142364501953125, 0.1832427978515625, 0.22412109375, 0.2649993896484375, 0.305877685546875, 0.3467559814453125, 0.38763427734375, 0.4285125732421875, 0.469390869140625, 0.5102691650390625, 0.5511474609375, 0.5920257568359375, 0.632904052734375, 0.6737823486328125, 0.71466064453125, 0.7555389404296875, 0.796417236328125, 0.8372955322265625, 0.878173828125, 0.9190521240234375, 0.959930419921875, 1.0008087158203125, 1.04168701171875, 1.0825653076171875, 1.123443603515625, 1.1643218994140625, 1.2052001953125, 1.2460784912109375, 1.286956787109375, 1.3278350830078125, 1.36871337890625, 1.4095916748046875, 1.450469970703125, 1.4913482666015625, 1.5322265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 14.0, 32.0, 37.0, 78.0, 116.0, 159.0, 325.0, 554.0, 937.0, 1692.0, 3193.0, 6070.0, 11932.0, 24366.0, 51920.0, 117248.0, 305546.0, 2567640.0, 729879.0, 211002.0, 85382.0, 38308.0, 18374.0, 9099.0, 4680.0, 2504.0, 1346.0, 717.0, 414.0, 264.0, 159.0, 89.0, 69.0, 44.0, 37.0, 12.0, 8.0, 9.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-30.109375, -29.268798828125, -28.42822265625, -27.587646484375, -26.7470703125, -25.906494140625, -25.06591796875, -24.225341796875, -23.384765625, -22.544189453125, -21.70361328125, -20.863037109375, -20.0224609375, -19.181884765625, -18.34130859375, -17.500732421875, -16.66015625, -15.819580078125, -14.97900390625, -14.138427734375, -13.2978515625, -12.457275390625, -11.61669921875, -10.776123046875, -9.935546875, -9.094970703125, -8.25439453125, -7.413818359375, -6.5732421875, -5.732666015625, -4.89208984375, -4.051513671875, -3.2109375, -2.370361328125, -1.52978515625, -0.689208984375, 0.1513671875, 0.991943359375, 1.83251953125, 2.673095703125, 3.513671875, 4.354248046875, 5.19482421875, 6.035400390625, 6.8759765625, 7.716552734375, 8.55712890625, 9.397705078125, 10.23828125, 11.078857421875, 11.91943359375, 12.760009765625, 13.6005859375, 14.441162109375, 15.28173828125, 16.122314453125, 16.962890625, 17.803466796875, 18.64404296875, 19.484619140625, 20.3251953125, 21.165771484375, 22.00634765625, 22.846923828125, 23.6875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 2.0, 8.0, 4.0, 12.0, 7.0, 18.0, 21.0, 23.0, 28.0, 24.0, 39.0, 36.0, 53.0, 66.0, 69.0, 103.0, 94.0, 127.0, 183.0, 251.0, 1179.0, 669.0, 227.0, 179.0, 124.0, 97.0, 101.0, 53.0, 61.0, 47.0, 31.0, 25.0, 21.0, 20.0, 14.0, 10.0, 9.0, 10.0, 6.0, 7.0, 6.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.900390625, -3.778350830078125, -3.65631103515625, -3.534271240234375, -3.4122314453125, -3.290191650390625, -3.16815185546875, -3.046112060546875, -2.924072265625, -2.802032470703125, -2.67999267578125, -2.557952880859375, -2.4359130859375, -2.313873291015625, -2.19183349609375, -2.069793701171875, -1.94775390625, -1.825714111328125, -1.70367431640625, -1.581634521484375, -1.4595947265625, -1.337554931640625, -1.21551513671875, -1.093475341796875, -0.971435546875, -0.849395751953125, -0.72735595703125, -0.605316162109375, -0.4832763671875, -0.361236572265625, -0.23919677734375, -0.117156982421875, 0.0048828125, 0.126922607421875, 0.24896240234375, 0.371002197265625, 0.4930419921875, 0.615081787109375, 0.73712158203125, 0.859161376953125, 0.981201171875, 1.103240966796875, 1.22528076171875, 1.347320556640625, 1.4693603515625, 1.591400146484375, 1.71343994140625, 1.835479736328125, 1.95751953125, 2.079559326171875, 2.20159912109375, 2.323638916015625, 2.4456787109375, 2.567718505859375, 2.68975830078125, 2.811798095703125, 2.933837890625, 3.055877685546875, 3.17791748046875, 3.299957275390625, 3.4219970703125, 3.544036865234375, 3.66607666015625, 3.788116455078125, 3.91015625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 15.0, 16.0, 49.0, 103.0, 233.0, 308.0, 164.0, 57.0, 33.0, 17.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.35238647460938, -143.69107055664062, -140.0297393798828, -136.36842346191406, -132.7071075439453, -129.0457763671875, -125.38446044921875, -121.72314453125, -118.06182098388672, -114.40049743652344, -110.73918151855469, -107.0778579711914, -103.41653442382812, -99.75521850585938, -96.0938949584961, -92.43257141113281, -88.77125549316406, -85.10993194580078, -81.44861602783203, -77.78729248046875, -74.1259765625, -70.46465301513672, -66.80332946777344, -63.14200973510742, -59.480690002441406, -55.81937026977539, -52.158050537109375, -48.496726989746094, -44.83540725708008, -41.17408752441406, -37.51276397705078, -33.851444244384766, -30.19012451171875, -26.528804779052734, -22.867483139038086, -19.206161499023438, -15.544841766357422, -11.883522033691406, -8.222200393676758, -4.560878753662109, -0.8995590209960938, 2.7617616653442383, 6.42308235168457, 10.084403038024902, 13.745723724365234, 17.40704345703125, 21.0683650970459, 24.729686737060547, 28.391006469726562, 32.05232620239258, 35.713645935058594, 39.374969482421875, 43.03628921508789, 46.697608947753906, 50.35893249511719, 54.0202522277832, 57.68157196044922, 61.342891693115234, 65.00421142578125, 68.66553497314453, 72.32685852050781, 75.98817443847656, 79.64949798583984, 83.31082153320312, 86.97213745117188]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 9.0, 14.0, 9.0, 11.0, 17.0, 26.0, 23.0, 21.0, 31.0, 29.0, 31.0, 35.0, 26.0, 33.0, 38.0, 42.0, 53.0, 50.0, 48.0, 39.0, 41.0, 41.0, 39.0, 34.0, 25.0, 39.0, 23.0, 32.0, 19.0, 19.0, 19.0, 14.0, 16.0, 10.0, 5.0, 11.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.749717712402344, -20.097631454467773, -19.445545196533203, -18.793460845947266, -18.141374588012695, -17.489288330078125, -16.837202072143555, -16.185115814208984, -15.53303050994873, -14.88094425201416, -14.228858947753906, -13.576772689819336, -12.924686431884766, -12.272601127624512, -11.620514869689941, -10.968429565429688, -10.316343307495117, -9.664257049560547, -9.012171745300293, -8.360085487365723, -7.7079997062683105, -7.055913925170898, -6.403827667236328, -5.751741886138916, -5.099656105041504, -4.447570323944092, -3.7954843044281006, -3.1433982849121094, -2.4913125038146973, -1.8392267227172852, -1.187140703201294, -0.5350546836853027, 0.11703109741210938, 0.769116997718811, 1.4212028980255127, 2.073288917541504, 2.725374698638916, 3.377460479736328, 4.029546737670898, 4.6816325187683105, 5.333718299865723, 5.985804080963135, 6.637889862060547, 7.289976119995117, 7.942061901092529, 8.594147682189941, 9.246233940124512, 9.898319244384766, 10.550405502319336, 11.202491760253906, 11.85457706451416, 12.50666332244873, 13.158748626708984, 13.810834884643555, 14.462921142578125, 15.115007400512695, 15.76709270477295, 16.419178009033203, 17.071264266967773, 17.723350524902344, 18.375436782836914, 19.027523040771484, 19.679607391357422, 20.331693649291992, 20.983779907226562]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 3.0, 7.0, 17.0, 26.0, 48.0, 97.0, 116.0, 221.0, 356.0, 659.0, 1310.0, 2679.0, 5832.0, 13206.0, 37836.0, 156792.0, 598796.0, 165816.0, 39557.0, 13580.0, 5921.0, 2751.0, 1322.0, 688.0, 384.0, 197.0, 112.0, 84.0, 37.0, 27.0, 14.0, 13.0, 10.0, 7.0, 5.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.546875, -29.57763671875, -28.6083984375, -27.63916015625, -26.669921875, -25.70068359375, -24.7314453125, -23.76220703125, -22.79296875, -21.82373046875, -20.8544921875, -19.88525390625, -18.916015625, -17.94677734375, -16.9775390625, -16.00830078125, -15.0390625, -14.06982421875, -13.1005859375, -12.13134765625, -11.162109375, -10.19287109375, -9.2236328125, -8.25439453125, -7.28515625, -6.31591796875, -5.3466796875, -4.37744140625, -3.408203125, -2.43896484375, -1.4697265625, -0.50048828125, 0.46875, 1.43798828125, 2.4072265625, 3.37646484375, 4.345703125, 5.31494140625, 6.2841796875, 7.25341796875, 8.22265625, 9.19189453125, 10.1611328125, 11.13037109375, 12.099609375, 13.06884765625, 14.0380859375, 15.00732421875, 15.9765625, 16.94580078125, 17.9150390625, 18.88427734375, 19.853515625, 20.82275390625, 21.7919921875, 22.76123046875, 23.73046875, 24.69970703125, 25.6689453125, 26.63818359375, 27.607421875, 28.57666015625, 29.5458984375, 30.51513671875, 31.484375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 7.0, 13.0, 14.0, 16.0, 22.0, 21.0, 25.0, 33.0, 35.0, 39.0, 38.0, 50.0, 60.0, 41.0, 57.0, 52.0, 51.0, 45.0, 50.0, 39.0, 37.0, 28.0, 37.0, 23.0, 27.0, 24.0, 22.0, 12.0, 16.0, 9.0, 9.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4560546875, -1.4074554443359375, -1.358856201171875, -1.3102569580078125, -1.26165771484375, -1.2130584716796875, -1.164459228515625, -1.1158599853515625, -1.0672607421875, -1.0186614990234375, -0.970062255859375, -0.9214630126953125, -0.87286376953125, -0.8242645263671875, -0.775665283203125, -0.7270660400390625, -0.678466796875, -0.6298675537109375, -0.581268310546875, -0.5326690673828125, -0.48406982421875, -0.4354705810546875, -0.386871337890625, -0.3382720947265625, -0.2896728515625, -0.2410736083984375, -0.192474365234375, -0.1438751220703125, -0.09527587890625, -0.0466766357421875, 0.001922607421875, 0.0505218505859375, 0.09912109375, 0.1477203369140625, 0.196319580078125, 0.2449188232421875, 0.29351806640625, 0.3421173095703125, 0.390716552734375, 0.4393157958984375, 0.4879150390625, 0.5365142822265625, 0.585113525390625, 0.6337127685546875, 0.68231201171875, 0.7309112548828125, 0.779510498046875, 0.8281097412109375, 0.876708984375, 0.9253082275390625, 0.973907470703125, 1.0225067138671875, 1.07110595703125, 1.1197052001953125, 1.168304443359375, 1.2169036865234375, 1.2655029296875, 1.3141021728515625, 1.362701416015625, 1.4113006591796875, 1.45989990234375, 1.5084991455078125, 1.557098388671875, 1.6056976318359375, 1.654296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 1.0, 6.0, 10.0, 8.0, 7.0, 4.0, 5.0, 16.0, 18.0, 25.0, 85.0, 518.0, 6175.0, 504592.0, 530167.0, 6124.0, 571.0, 94.0, 24.0, 12.0, 8.0, 7.0, 5.0, 10.0, 5.0, 2.0, 5.0, 1.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-88.875, -86.3359375, -83.796875, -81.2578125, -78.71875, -76.1796875, -73.640625, -71.1015625, -68.5625, -66.0234375, -63.484375, -60.9453125, -58.40625, -55.8671875, -53.328125, -50.7890625, -48.25, -45.7109375, -43.171875, -40.6328125, -38.09375, -35.5546875, -33.015625, -30.4765625, -27.9375, -25.3984375, -22.859375, -20.3203125, -17.78125, -15.2421875, -12.703125, -10.1640625, -7.625, -5.0859375, -2.546875, -0.0078125, 2.53125, 5.0703125, 7.609375, 10.1484375, 12.6875, 15.2265625, 17.765625, 20.3046875, 22.84375, 25.3828125, 27.921875, 30.4609375, 33.0, 35.5390625, 38.078125, 40.6171875, 43.15625, 45.6953125, 48.234375, 50.7734375, 53.3125, 55.8515625, 58.390625, 60.9296875, 63.46875, 66.0078125, 68.546875, 71.0859375, 73.625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 5.0, 7.0, 7.0, 6.0, 13.0, 15.0, 15.0, 28.0, 22.0, 34.0, 36.0, 35.0, 45.0, 36.0, 51.0, 43.0, 53.0, 46.0, 64.0, 41.0, 45.0, 41.0, 38.0, 43.0, 31.0, 24.0, 30.0, 32.0, 19.0, 30.0, 8.0, 9.0, 2.0, 15.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.0859375, -7.85125732421875, -7.6165771484375, -7.38189697265625, -7.147216796875, -6.91253662109375, -6.6778564453125, -6.44317626953125, -6.20849609375, -5.97381591796875, -5.7391357421875, -5.50445556640625, -5.269775390625, -5.03509521484375, -4.8004150390625, -4.56573486328125, -4.3310546875, -4.09637451171875, -3.8616943359375, -3.62701416015625, -3.392333984375, -3.15765380859375, -2.9229736328125, -2.68829345703125, -2.45361328125, -2.21893310546875, -1.9842529296875, -1.74957275390625, -1.514892578125, -1.28021240234375, -1.0455322265625, -0.81085205078125, -0.576171875, -0.34149169921875, -0.1068115234375, 0.12786865234375, 0.362548828125, 0.59722900390625, 0.8319091796875, 1.06658935546875, 1.30126953125, 1.53594970703125, 1.7706298828125, 2.00531005859375, 2.239990234375, 2.47467041015625, 2.7093505859375, 2.94403076171875, 3.1787109375, 3.41339111328125, 3.6480712890625, 3.88275146484375, 4.117431640625, 4.35211181640625, 4.5867919921875, 4.82147216796875, 5.05615234375, 5.29083251953125, 5.5255126953125, 5.76019287109375, 5.994873046875, 6.22955322265625, 6.4642333984375, 6.69891357421875, 6.93359375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 3.0, 8.0, 7.0, 7.0, 13.0, 23.0, 38.0, 97.0, 411.0, 8557.0, 1036484.0, 2566.0, 214.0, 47.0, 18.0, 13.0, 6.0, 14.0, 4.0, 3.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.5, -253.50390625, -243.5078125, -233.51171875, -223.515625, -213.51953125, -203.5234375, -193.52734375, -183.53125, -173.53515625, -163.5390625, -153.54296875, -143.546875, -133.55078125, -123.5546875, -113.55859375, -103.5625, -93.56640625, -83.5703125, -73.57421875, -63.578125, -53.58203125, -43.5859375, -33.58984375, -23.59375, -13.59765625, -3.6015625, 6.39453125, 16.390625, 26.38671875, 36.3828125, 46.37890625, 56.375, 66.37109375, 76.3671875, 86.36328125, 96.359375, 106.35546875, 116.3515625, 126.34765625, 136.34375, 146.33984375, 156.3359375, 166.33203125, 176.328125, 186.32421875, 196.3203125, 206.31640625, 216.3125, 226.30859375, 236.3046875, 246.30078125, 256.296875, 266.29296875, 276.2890625, 286.28515625, 296.28125, 306.27734375, 316.2734375, 326.26953125, 336.265625, 346.26171875, 356.2578125, 366.25390625, 376.25]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 12.0, 23.0, 37.0, 85.0, 228.0, 307.0, 177.0, 51.0, 23.0, 22.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0027446746826171875, -0.0026622116565704346, -0.0025797486305236816, -0.0024972856044769287, -0.0024148225784301758, -0.002332359552383423, -0.00224989652633667, -0.002167433500289917, -0.002084970474243164, -0.002002507448196411, -0.0019200444221496582, -0.0018375813961029053, -0.0017551183700561523, -0.0016726553440093994, -0.0015901923179626465, -0.0015077292919158936, -0.0014252662658691406, -0.0013428032398223877, -0.0012603402137756348, -0.0011778771877288818, -0.001095414161682129, -0.001012951135635376, -0.000930488109588623, -0.0008480250835418701, -0.0007655620574951172, -0.0006830990314483643, -0.0006006360054016113, -0.0005181729793548584, -0.00043570995330810547, -0.00035324692726135254, -0.0002707839012145996, -0.00018832087516784668, -0.00010585784912109375, -2.339482307434082e-05, 5.906820297241211e-05, 0.00014153122901916504, 0.00022399425506591797, 0.0003064572811126709, 0.00038892030715942383, 0.00047138333320617676, 0.0005538463592529297, 0.0006363093852996826, 0.0007187724113464355, 0.0008012354373931885, 0.0008836984634399414, 0.0009661614894866943, 0.0010486245155334473, 0.0011310875415802002, 0.0012135505676269531, 0.001296013593673706, 0.001378476619720459, 0.001460939645767212, 0.0015434026718139648, 0.0016258656978607178, 0.0017083287239074707, 0.0017907917499542236, 0.0018732547760009766, 0.0019557178020477295, 0.0020381808280944824, 0.0021206438541412354, 0.0022031068801879883, 0.002285569906234741, 0.002368032932281494, 0.002450495958328247, 0.002532958984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 6.0, 10.0, 13.0, 21.0, 36.0, 30.0, 45.0, 73.0, 102.0, 121.0, 187.0, 299.0, 422.0, 715.0, 1145.0, 2038.0, 3965.0, 8651.0, 26799.0, 350725.0, 600414.0, 32561.0, 9792.0, 4355.0, 2355.0, 1277.0, 795.0, 499.0, 344.0, 226.0, 148.0, 99.0, 76.0, 52.0, 38.0, 34.0, 21.0, 15.0, 12.0, 6.0, 4.0, 2.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-72.625, -70.359375, -68.09375, -65.828125, -63.5625, -61.296875, -59.03125, -56.765625, -54.5, -52.234375, -49.96875, -47.703125, -45.4375, -43.171875, -40.90625, -38.640625, -36.375, -34.109375, -31.84375, -29.578125, -27.3125, -25.046875, -22.78125, -20.515625, -18.25, -15.984375, -13.71875, -11.453125, -9.1875, -6.921875, -4.65625, -2.390625, -0.125, 2.140625, 4.40625, 6.671875, 8.9375, 11.203125, 13.46875, 15.734375, 18.0, 20.265625, 22.53125, 24.796875, 27.0625, 29.328125, 31.59375, 33.859375, 36.125, 38.390625, 40.65625, 42.921875, 45.1875, 47.453125, 49.71875, 51.984375, 54.25, 56.515625, 58.78125, 61.046875, 63.3125, 65.578125, 67.84375, 70.109375, 72.375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 5.0, 7.0, 3.0, 6.0, 14.0, 20.0, 30.0, 85.0, 334.0, 285.0, 86.0, 44.0, 22.0, 16.0, 6.0, 11.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.46875, -53.787109375, -52.10546875, -50.423828125, -48.7421875, -47.060546875, -45.37890625, -43.697265625, -42.015625, -40.333984375, -38.65234375, -36.970703125, -35.2890625, -33.607421875, -31.92578125, -30.244140625, -28.5625, -26.880859375, -25.19921875, -23.517578125, -21.8359375, -20.154296875, -18.47265625, -16.791015625, -15.109375, -13.427734375, -11.74609375, -10.064453125, -8.3828125, -6.701171875, -5.01953125, -3.337890625, -1.65625, 0.025390625, 1.70703125, 3.388671875, 5.0703125, 6.751953125, 8.43359375, 10.115234375, 11.796875, 13.478515625, 15.16015625, 16.841796875, 18.5234375, 20.205078125, 21.88671875, 23.568359375, 25.25, 26.931640625, 28.61328125, 30.294921875, 31.9765625, 33.658203125, 35.33984375, 37.021484375, 38.703125, 40.384765625, 42.06640625, 43.748046875, 45.4296875, 47.111328125, 48.79296875, 50.474609375, 52.15625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 6.0, 6.0, 11.0, 15.0, 39.0, 60.0, 129.0, 192.0, 223.0, 165.0, 78.0, 34.0, 19.0, 9.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.8294219970703, -245.4001007080078, -238.9707794189453, -232.54147338867188, -226.11215209960938, -219.68283081054688, -213.25350952148438, -206.82418823242188, -200.39488220214844, -193.96556091308594, -187.53623962402344, -181.10693359375, -174.6776123046875, -168.248291015625, -161.8189697265625, -155.3896484375, -148.9603271484375, -142.531005859375, -136.1016845703125, -129.67237854003906, -123.24305725097656, -116.81373596191406, -110.38441467285156, -103.9551010131836, -97.52578735351562, -91.09646606445312, -84.66715240478516, -78.23783111572266, -71.80851745605469, -65.37919616699219, -58.94987869262695, -52.52056121826172, -46.09124755859375, -39.661930084228516, -33.23261260986328, -26.803293228149414, -20.37397575378418, -13.944656372070312, -7.515338897705078, -1.0860214233398438, 5.343296051025391, 11.772613525390625, 18.20193099975586, 24.631250381469727, 31.06056785583496, 37.48988723754883, 43.91920471191406, 50.3485221862793, 56.77783966064453, 63.207157135009766, 69.636474609375, 76.0657958984375, 82.49510955810547, 88.92443084716797, 95.35374450683594, 101.78306579589844, 108.21238708496094, 114.64170837402344, 121.0710220336914, 127.5003433227539, 133.92965698242188, 140.35897827148438, 146.78829956054688, 153.21762084960938, 159.6469268798828]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 2.0, 6.0, 3.0, 14.0, 14.0, 23.0, 25.0, 39.0, 29.0, 45.0, 68.0, 63.0, 78.0, 79.0, 82.0, 64.0, 64.0, 50.0, 58.0, 40.0, 35.0, 26.0, 27.0, 16.0, 18.0, 10.0, 8.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.31697082519531, -88.5999526977539, -85.8829345703125, -83.16592407226562, -80.44890594482422, -77.73188781738281, -75.0148696899414, -72.2978515625, -69.58084106445312, -66.86382293701172, -64.14680480957031, -61.42979049682617, -58.71277618408203, -55.995758056640625, -53.27873992919922, -50.56172180175781, -47.844703674316406, -45.127685546875, -42.41067123413086, -39.69365310668945, -36.97663879394531, -34.259620666503906, -31.5426025390625, -28.825586318969727, -26.108570098876953, -23.39155387878418, -20.674537658691406, -17.95751953125, -15.240503311157227, -12.523487091064453, -9.806468963623047, -7.089452743530273, -4.372444152832031, -1.6554274559020996, 1.061589241027832, 3.778606414794922, 6.495622634887695, 9.212638854980469, 11.929656982421875, 14.646673202514648, 17.363689422607422, 20.080705642700195, 22.79772186279297, 25.514739990234375, 28.23175621032715, 30.948772430419922, 33.66579055786133, 36.38280487060547, 39.099822998046875, 41.81684112548828, 44.53385543823242, 47.25087356567383, 49.96788787841797, 52.684906005859375, 55.40192413330078, 58.11894226074219, 60.83595657348633, 63.552974700927734, 66.26998901367188, 68.98700714111328, 71.70402526855469, 74.42103576660156, 77.1380615234375, 79.85507202148438, 82.57209014892578]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 5.0, 9.0, 9.0, 9.0, 17.0, 17.0, 20.0, 23.0, 19.0, 46.0, 75.0, 104.0, 233.0, 467.0, 1098.0, 2985.0, 10091.0, 43231.0, 366132.0, 3662927.0, 81666.0, 17531.0, 4920.0, 1559.0, 571.0, 253.0, 102.0, 61.0, 23.0, 20.0, 7.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-91.125, -88.53515625, -85.9453125, -83.35546875, -80.765625, -78.17578125, -75.5859375, -72.99609375, -70.40625, -67.81640625, -65.2265625, -62.63671875, -60.046875, -57.45703125, -54.8671875, -52.27734375, -49.6875, -47.09765625, -44.5078125, -41.91796875, -39.328125, -36.73828125, -34.1484375, -31.55859375, -28.96875, -26.37890625, -23.7890625, -21.19921875, -18.609375, -16.01953125, -13.4296875, -10.83984375, -8.25, -5.66015625, -3.0703125, -0.48046875, 2.109375, 4.69921875, 7.2890625, 9.87890625, 12.46875, 15.05859375, 17.6484375, 20.23828125, 22.828125, 25.41796875, 28.0078125, 30.59765625, 33.1875, 35.77734375, 38.3671875, 40.95703125, 43.546875, 46.13671875, 48.7265625, 51.31640625, 53.90625, 56.49609375, 59.0859375, 61.67578125, 64.265625, 66.85546875, 69.4453125, 72.03515625, 74.625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 2.0, 5.0, 8.0, 9.0, 10.0, 12.0, 13.0, 19.0, 13.0, 18.0, 31.0, 29.0, 25.0, 32.0, 36.0, 43.0, 43.0, 49.0, 53.0, 65.0, 37.0, 48.0, 40.0, 39.0, 43.0, 49.0, 32.0, 22.0, 24.0, 21.0, 28.0, 16.0, 18.0, 14.0, 12.0, 10.0, 8.0, 2.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5107421875, -1.4616851806640625, -1.412628173828125, -1.3635711669921875, -1.31451416015625, -1.2654571533203125, -1.216400146484375, -1.1673431396484375, -1.1182861328125, -1.0692291259765625, -1.020172119140625, -0.9711151123046875, -0.92205810546875, -0.8730010986328125, -0.823944091796875, -0.7748870849609375, -0.725830078125, -0.6767730712890625, -0.627716064453125, -0.5786590576171875, -0.52960205078125, -0.4805450439453125, -0.431488037109375, -0.3824310302734375, -0.3333740234375, -0.2843170166015625, -0.235260009765625, -0.1862030029296875, -0.13714599609375, -0.0880889892578125, -0.039031982421875, 0.0100250244140625, 0.05908203125, 0.1081390380859375, 0.157196044921875, 0.2062530517578125, 0.25531005859375, 0.3043670654296875, 0.353424072265625, 0.4024810791015625, 0.4515380859375, 0.5005950927734375, 0.549652099609375, 0.5987091064453125, 0.64776611328125, 0.6968231201171875, 0.745880126953125, 0.7949371337890625, 0.843994140625, 0.8930511474609375, 0.942108154296875, 0.9911651611328125, 1.04022216796875, 1.0892791748046875, 1.138336181640625, 1.1873931884765625, 1.2364501953125, 1.2855072021484375, 1.334564208984375, 1.3836212158203125, 1.43267822265625, 1.4817352294921875, 1.530792236328125, 1.5798492431640625, 1.62890625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 12.0, 13.0, 5.0, 9.0, 18.0, 16.0, 29.0, 31.0, 52.0, 57.0, 70.0, 98.0, 189.0, 464.0, 1390.0, 6299.0, 34380.0, 293247.0, 3686047.0, 144937.0, 20668.0, 4131.0, 1101.0, 370.0, 177.0, 113.0, 80.0, 72.0, 46.0, 26.0, 30.0, 25.0, 15.0, 8.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-111.5625, -108.576171875, -105.58984375, -102.603515625, -99.6171875, -96.630859375, -93.64453125, -90.658203125, -87.671875, -84.685546875, -81.69921875, -78.712890625, -75.7265625, -72.740234375, -69.75390625, -66.767578125, -63.78125, -60.794921875, -57.80859375, -54.822265625, -51.8359375, -48.849609375, -45.86328125, -42.876953125, -39.890625, -36.904296875, -33.91796875, -30.931640625, -27.9453125, -24.958984375, -21.97265625, -18.986328125, -16.0, -13.013671875, -10.02734375, -7.041015625, -4.0546875, -1.068359375, 1.91796875, 4.904296875, 7.890625, 10.876953125, 13.86328125, 16.849609375, 19.8359375, 22.822265625, 25.80859375, 28.794921875, 31.78125, 34.767578125, 37.75390625, 40.740234375, 43.7265625, 46.712890625, 49.69921875, 52.685546875, 55.671875, 58.658203125, 61.64453125, 64.630859375, 67.6171875, 70.603515625, 73.58984375, 76.576171875, 79.5625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 15.0, 18.0, 23.0, 20.0, 16.0, 33.0, 55.0, 62.0, 85.0, 123.0, 174.0, 291.0, 1979.0, 458.0, 197.0, 129.0, 81.0, 83.0, 48.0, 42.0, 33.0, 22.0, 26.0, 15.0, 3.0, 9.0, 6.0, 6.0, 5.0, 1.0, 4.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.81561279296875, -4.6038818359375, -4.39215087890625, -4.180419921875, -3.96868896484375, -3.7569580078125, -3.54522705078125, -3.33349609375, -3.12176513671875, -2.9100341796875, -2.69830322265625, -2.486572265625, -2.27484130859375, -2.0631103515625, -1.85137939453125, -1.6396484375, -1.42791748046875, -1.2161865234375, -1.00445556640625, -0.792724609375, -0.58099365234375, -0.3692626953125, -0.15753173828125, 0.05419921875, 0.26593017578125, 0.4776611328125, 0.68939208984375, 0.901123046875, 1.11285400390625, 1.3245849609375, 1.53631591796875, 1.748046875, 1.95977783203125, 2.1715087890625, 2.38323974609375, 2.594970703125, 2.80670166015625, 3.0184326171875, 3.23016357421875, 3.44189453125, 3.65362548828125, 3.8653564453125, 4.07708740234375, 4.288818359375, 4.50054931640625, 4.7122802734375, 4.92401123046875, 5.1357421875, 5.34747314453125, 5.5592041015625, 5.77093505859375, 5.982666015625, 6.19439697265625, 6.4061279296875, 6.61785888671875, 6.82958984375, 7.04132080078125, 7.2530517578125, 7.46478271484375, 7.676513671875, 7.88824462890625, 8.0999755859375, 8.31170654296875, 8.5234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 4.0, 3.0, 5.0, 10.0, 11.0, 13.0, 19.0, 39.0, 41.0, 43.0, 53.0, 49.0, 76.0, 72.0, 93.0, 87.0, 57.0, 66.0, 50.0, 28.0, 44.0, 33.0, 17.0, 11.0, 13.0, 12.0, 11.0, 10.0, 5.0, 2.0, 7.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.3068962097168, -37.19454574584961, -36.08219528198242, -34.96984100341797, -33.85749053955078, -32.745140075683594, -31.632789611816406, -30.52043914794922, -29.40808868408203, -28.295738220214844, -27.183385848999023, -26.071035385131836, -24.95868492126465, -23.846332550048828, -22.73398208618164, -21.621631622314453, -20.509279251098633, -19.396928787231445, -18.284576416015625, -17.172225952148438, -16.05987548828125, -14.947524070739746, -13.835172653198242, -12.722822189331055, -11.61047077178955, -10.498119354248047, -9.38576889038086, -8.273417472839355, -7.16106653213501, -6.048715591430664, -4.93636417388916, -3.8240132331848145, -2.7116622924804688, -1.5993112325668335, -0.48696017265319824, 0.6253910064697266, 1.7377419471740723, 2.850092887878418, 3.962444305419922, 5.074795246124268, 6.187146186828613, 7.299497127532959, 8.411848068237305, 9.524199485778809, 10.636550903320312, 11.7489013671875, 12.861252784729004, 13.973604202270508, 15.085954666137695, 16.198305130004883, 17.310657501220703, 18.42300796508789, 19.535358428955078, 20.647708892822266, 21.760061264038086, 22.872411727905273, 23.984764099121094, 25.09711456298828, 26.2094669342041, 27.32181739807129, 28.434167861938477, 29.546520233154297, 30.658870697021484, 31.771221160888672, 32.88357162475586]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 7.0, 5.0, 13.0, 16.0, 11.0, 15.0, 20.0, 25.0, 16.0, 33.0, 31.0, 35.0, 36.0, 39.0, 55.0, 51.0, 52.0, 44.0, 46.0, 44.0, 43.0, 36.0, 40.0, 36.0, 39.0, 34.0, 22.0, 23.0, 23.0, 15.0, 14.0, 13.0, 15.0, 7.0, 6.0, 4.0, 9.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-23.09457778930664, -22.35789680480957, -21.6212158203125, -20.88453483581543, -20.14785385131836, -19.41117286682129, -18.67449188232422, -17.93781089782715, -17.201129913330078, -16.464448928833008, -15.727767944335938, -14.991086959838867, -14.254405975341797, -13.517724990844727, -12.781044006347656, -12.044363021850586, -11.307682991027832, -10.571002006530762, -9.834321022033691, -9.097640037536621, -8.36095905303955, -7.6242780685424805, -6.887597560882568, -6.150916576385498, -5.414235591888428, -4.677554607391357, -3.940873622894287, -3.204192876815796, -2.4675118923187256, -1.7308309078216553, -0.9941501617431641, -0.25746917724609375, 0.47921180725097656, 1.2158927917480469, 1.9525736570358276, 2.6892545223236084, 3.4259355068206787, 4.162616729736328, 4.89929723739624, 5.6359782218933105, 6.372659206390381, 7.109340190887451, 7.8460211753845215, 8.582701683044434, 9.319382667541504, 10.056063652038574, 10.792744636535645, 11.529425621032715, 12.266106605529785, 13.002787590026855, 13.739468574523926, 14.476149559020996, 15.212830543518066, 15.949511528015137, 16.68619155883789, 17.42287254333496, 18.15955352783203, 18.8962345123291, 19.632915496826172, 20.369596481323242, 21.106277465820312, 21.842958450317383, 22.579639434814453, 23.316320419311523, 24.053001403808594]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 11.0, 13.0, 27.0, 27.0, 26.0, 57.0, 88.0, 104.0, 183.0, 275.0, 386.0, 605.0, 851.0, 1407.0, 2148.0, 3147.0, 5010.0, 7632.0, 12007.0, 18424.0, 29073.0, 45012.0, 68944.0, 101980.0, 140043.0, 162709.0, 141744.0, 105102.0, 71208.0, 46465.0, 29636.0, 19213.0, 12401.0, 7819.0, 5131.0, 3392.0, 2132.0, 1420.0, 887.0, 630.0, 412.0, 275.0, 162.0, 117.0, 83.0, 61.0, 26.0, 24.0, 13.0, 7.0, 4.0, 2.0, 5.0, 0.0, 3.0, 2.0, 2.0], "bins": [-11.6484375, -11.2904052734375, -10.932373046875, -10.5743408203125, -10.21630859375, -9.8582763671875, -9.500244140625, -9.1422119140625, -8.7841796875, -8.4261474609375, -8.068115234375, -7.7100830078125, -7.35205078125, -6.9940185546875, -6.635986328125, -6.2779541015625, -5.919921875, -5.5618896484375, -5.203857421875, -4.8458251953125, -4.48779296875, -4.1297607421875, -3.771728515625, -3.4136962890625, -3.0556640625, -2.6976318359375, -2.339599609375, -1.9815673828125, -1.62353515625, -1.2655029296875, -0.907470703125, -0.5494384765625, -0.19140625, 0.1666259765625, 0.524658203125, 0.8826904296875, 1.24072265625, 1.5987548828125, 1.956787109375, 2.3148193359375, 2.6728515625, 3.0308837890625, 3.388916015625, 3.7469482421875, 4.10498046875, 4.4630126953125, 4.821044921875, 5.1790771484375, 5.537109375, 5.8951416015625, 6.253173828125, 6.6112060546875, 6.96923828125, 7.3272705078125, 7.685302734375, 8.0433349609375, 8.4013671875, 8.7593994140625, 9.117431640625, 9.4754638671875, 9.83349609375, 10.1915283203125, 10.549560546875, 10.9075927734375, 11.265625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 6.0, 9.0, 9.0, 10.0, 10.0, 16.0, 25.0, 28.0, 22.0, 27.0, 33.0, 34.0, 31.0, 35.0, 40.0, 32.0, 42.0, 47.0, 39.0, 44.0, 46.0, 43.0, 40.0, 40.0, 36.0, 26.0, 33.0, 19.0, 22.0, 20.0, 17.0, 16.0, 27.0, 13.0, 16.0, 6.0, 4.0, 5.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4189453125, -1.372589111328125, -1.32623291015625, -1.279876708984375, -1.2335205078125, -1.187164306640625, -1.14080810546875, -1.094451904296875, -1.048095703125, -1.001739501953125, -0.95538330078125, -0.909027099609375, -0.8626708984375, -0.816314697265625, -0.76995849609375, -0.723602294921875, -0.67724609375, -0.630889892578125, -0.58453369140625, -0.538177490234375, -0.4918212890625, -0.445465087890625, -0.39910888671875, -0.352752685546875, -0.306396484375, -0.260040283203125, -0.21368408203125, -0.167327880859375, -0.1209716796875, -0.074615478515625, -0.02825927734375, 0.018096923828125, 0.064453125, 0.110809326171875, 0.15716552734375, 0.203521728515625, 0.2498779296875, 0.296234130859375, 0.34259033203125, 0.388946533203125, 0.435302734375, 0.481658935546875, 0.52801513671875, 0.574371337890625, 0.6207275390625, 0.667083740234375, 0.71343994140625, 0.759796142578125, 0.80615234375, 0.852508544921875, 0.89886474609375, 0.945220947265625, 0.9915771484375, 1.037933349609375, 1.08428955078125, 1.130645751953125, 1.177001953125, 1.223358154296875, 1.26971435546875, 1.316070556640625, 1.3624267578125, 1.408782958984375, 1.45513916015625, 1.501495361328125, 1.5478515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 2.0, 8.0, 11.0, 20.0, 36.0, 48.0, 69.0, 125.0, 138.0, 203.0, 332.0, 503.0, 825.0, 1425.0, 2582.0, 4872.0, 9856.0, 20941.0, 46899.0, 104443.0, 214224.0, 290205.0, 186438.0, 87955.0, 39616.0, 17902.0, 8665.0, 4380.0, 2353.0, 1286.0, 764.0, 512.0, 289.0, 185.0, 150.0, 86.0, 67.0, 28.0, 26.0, 19.0, 15.0, 8.0, 14.0, 4.0, 3.0, 6.0, 5.0, 1.0, 0.0, 3.0], "bins": [-22.5, -21.8642578125, -21.228515625, -20.5927734375, -19.95703125, -19.3212890625, -18.685546875, -18.0498046875, -17.4140625, -16.7783203125, -16.142578125, -15.5068359375, -14.87109375, -14.2353515625, -13.599609375, -12.9638671875, -12.328125, -11.6923828125, -11.056640625, -10.4208984375, -9.78515625, -9.1494140625, -8.513671875, -7.8779296875, -7.2421875, -6.6064453125, -5.970703125, -5.3349609375, -4.69921875, -4.0634765625, -3.427734375, -2.7919921875, -2.15625, -1.5205078125, -0.884765625, -0.2490234375, 0.38671875, 1.0224609375, 1.658203125, 2.2939453125, 2.9296875, 3.5654296875, 4.201171875, 4.8369140625, 5.47265625, 6.1083984375, 6.744140625, 7.3798828125, 8.015625, 8.6513671875, 9.287109375, 9.9228515625, 10.55859375, 11.1943359375, 11.830078125, 12.4658203125, 13.1015625, 13.7373046875, 14.373046875, 15.0087890625, 15.64453125, 16.2802734375, 16.916015625, 17.5517578125, 18.1875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 2.0, 7.0, 8.0, 8.0, 11.0, 12.0, 16.0, 22.0, 19.0, 27.0, 27.0, 31.0, 31.0, 39.0, 37.0, 47.0, 43.0, 49.0, 36.0, 46.0, 47.0, 48.0, 43.0, 42.0, 35.0, 35.0, 22.0, 34.0, 36.0, 32.0, 29.0, 12.0, 13.0, 11.0, 3.0, 10.0, 9.0, 10.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5906982421875, -9.282958984375, -8.9752197265625, -8.66748046875, -8.3597412109375, -8.052001953125, -7.7442626953125, -7.4365234375, -7.1287841796875, -6.821044921875, -6.5133056640625, -6.20556640625, -5.8978271484375, -5.590087890625, -5.2823486328125, -4.974609375, -4.6668701171875, -4.359130859375, -4.0513916015625, -3.74365234375, -3.4359130859375, -3.128173828125, -2.8204345703125, -2.5126953125, -2.2049560546875, -1.897216796875, -1.5894775390625, -1.28173828125, -0.9739990234375, -0.666259765625, -0.3585205078125, -0.05078125, 0.2569580078125, 0.564697265625, 0.8724365234375, 1.18017578125, 1.4879150390625, 1.795654296875, 2.1033935546875, 2.4111328125, 2.7188720703125, 3.026611328125, 3.3343505859375, 3.64208984375, 3.9498291015625, 4.257568359375, 4.5653076171875, 4.873046875, 5.1807861328125, 5.488525390625, 5.7962646484375, 6.10400390625, 6.4117431640625, 6.719482421875, 7.0272216796875, 7.3349609375, 7.6427001953125, 7.950439453125, 8.2581787109375, 8.56591796875, 8.8736572265625, 9.181396484375, 9.4891357421875, 9.796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 11.0, 10.0, 21.0, 38.0, 32.0, 58.0, 85.0, 125.0, 184.0, 310.0, 529.0, 900.0, 1679.0, 3293.0, 7191.0, 16946.0, 44905.0, 128895.0, 319091.0, 319119.0, 128698.0, 44447.0, 17339.0, 7318.0, 3344.0, 1716.0, 883.0, 493.0, 311.0, 186.0, 116.0, 71.0, 72.0, 35.0, 23.0, 16.0, 13.0, 11.0, 7.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.6875, -17.134765625, -16.58203125, -16.029296875, -15.4765625, -14.923828125, -14.37109375, -13.818359375, -13.265625, -12.712890625, -12.16015625, -11.607421875, -11.0546875, -10.501953125, -9.94921875, -9.396484375, -8.84375, -8.291015625, -7.73828125, -7.185546875, -6.6328125, -6.080078125, -5.52734375, -4.974609375, -4.421875, -3.869140625, -3.31640625, -2.763671875, -2.2109375, -1.658203125, -1.10546875, -0.552734375, 0.0, 0.552734375, 1.10546875, 1.658203125, 2.2109375, 2.763671875, 3.31640625, 3.869140625, 4.421875, 4.974609375, 5.52734375, 6.080078125, 6.6328125, 7.185546875, 7.73828125, 8.291015625, 8.84375, 9.396484375, 9.94921875, 10.501953125, 11.0546875, 11.607421875, 12.16015625, 12.712890625, 13.265625, 13.818359375, 14.37109375, 14.923828125, 15.4765625, 16.029296875, 16.58203125, 17.134765625, 17.6875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 6.0, 9.0, 7.0, 7.0, 10.0, 18.0, 10.0, 19.0, 23.0, 43.0, 40.0, 74.0, 102.0, 129.0, 101.0, 109.0, 74.0, 51.0, 49.0, 32.0, 26.0, 14.0, 15.0, 9.0, 7.0, 1.0, 3.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025787353515625, -0.002490013837814331, -0.002401292324066162, -0.002312570810317993, -0.0022238492965698242, -0.0021351277828216553, -0.0020464062690734863, -0.0019576847553253174, -0.0018689632415771484, -0.0017802417278289795, -0.0016915202140808105, -0.0016027987003326416, -0.0015140771865844727, -0.0014253556728363037, -0.0013366341590881348, -0.0012479126453399658, -0.0011591911315917969, -0.001070469617843628, -0.000981748104095459, -0.00089302659034729, -0.0008043050765991211, -0.0007155835628509521, -0.0006268620491027832, -0.0005381405353546143, -0.0004494190216064453, -0.00036069750785827637, -0.0002719759941101074, -0.00018325448036193848, -9.453296661376953e-05, -5.811452865600586e-06, 8.291006088256836e-05, 0.0001716315746307373, 0.00026035308837890625, 0.0003490746021270752, 0.00043779611587524414, 0.0005265176296234131, 0.000615239143371582, 0.000703960657119751, 0.0007926821708679199, 0.0008814036846160889, 0.0009701251983642578, 0.0010588467121124268, 0.0011475682258605957, 0.0012362897396087646, 0.0013250112533569336, 0.0014137327671051025, 0.0015024542808532715, 0.0015911757946014404, 0.0016798973083496094, 0.0017686188220977783, 0.0018573403358459473, 0.0019460618495941162, 0.002034783363342285, 0.002123504877090454, 0.002212226390838623, 0.002300947904586792, 0.002389669418334961, 0.00247839093208313, 0.002567112445831299, 0.0026558339595794678, 0.0027445554733276367, 0.0028332769870758057, 0.0029219985008239746, 0.0030107200145721436, 0.0030994415283203125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 8.0, 14.0, 17.0, 19.0, 29.0, 30.0, 41.0, 61.0, 78.0, 114.0, 147.0, 266.0, 402.0, 544.0, 889.0, 1483.0, 2378.0, 4647.0, 9698.0, 23271.0, 68475.0, 236615.0, 425570.0, 183334.0, 53429.0, 18977.0, 8070.0, 3968.0, 2286.0, 1359.0, 769.0, 484.0, 294.0, 240.0, 168.0, 106.0, 64.0, 50.0, 51.0, 28.0, 21.0, 10.0, 10.0, 8.0, 7.0, 5.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.984375, -19.326904296875, -18.66943359375, -18.011962890625, -17.3544921875, -16.697021484375, -16.03955078125, -15.382080078125, -14.724609375, -14.067138671875, -13.40966796875, -12.752197265625, -12.0947265625, -11.437255859375, -10.77978515625, -10.122314453125, -9.46484375, -8.807373046875, -8.14990234375, -7.492431640625, -6.8349609375, -6.177490234375, -5.52001953125, -4.862548828125, -4.205078125, -3.547607421875, -2.89013671875, -2.232666015625, -1.5751953125, -0.917724609375, -0.26025390625, 0.397216796875, 1.0546875, 1.712158203125, 2.36962890625, 3.027099609375, 3.6845703125, 4.342041015625, 4.99951171875, 5.656982421875, 6.314453125, 6.971923828125, 7.62939453125, 8.286865234375, 8.9443359375, 9.601806640625, 10.25927734375, 10.916748046875, 11.57421875, 12.231689453125, 12.88916015625, 13.546630859375, 14.2041015625, 14.861572265625, 15.51904296875, 16.176513671875, 16.833984375, 17.491455078125, 18.14892578125, 18.806396484375, 19.4638671875, 20.121337890625, 20.77880859375, 21.436279296875, 22.09375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 9.0, 6.0, 13.0, 16.0, 20.0, 19.0, 30.0, 27.0, 38.0, 64.0, 54.0, 78.0, 60.0, 67.0, 88.0, 73.0, 60.0, 55.0, 48.0, 37.0, 31.0, 22.0, 21.0, 16.0, 9.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5390625, -8.2318115234375, -7.924560546875, -7.6173095703125, -7.31005859375, -7.0028076171875, -6.695556640625, -6.3883056640625, -6.0810546875, -5.7738037109375, -5.466552734375, -5.1593017578125, -4.85205078125, -4.5447998046875, -4.237548828125, -3.9302978515625, -3.623046875, -3.3157958984375, -3.008544921875, -2.7012939453125, -2.39404296875, -2.0867919921875, -1.779541015625, -1.4722900390625, -1.1650390625, -0.8577880859375, -0.550537109375, -0.2432861328125, 0.06396484375, 0.3712158203125, 0.678466796875, 0.9857177734375, 1.29296875, 1.6002197265625, 1.907470703125, 2.2147216796875, 2.52197265625, 2.8292236328125, 3.136474609375, 3.4437255859375, 3.7509765625, 4.0582275390625, 4.365478515625, 4.6727294921875, 4.97998046875, 5.2872314453125, 5.594482421875, 5.9017333984375, 6.208984375, 6.5162353515625, 6.823486328125, 7.1307373046875, 7.43798828125, 7.7452392578125, 8.052490234375, 8.3597412109375, 8.6669921875, 8.9742431640625, 9.281494140625, 9.5887451171875, 9.89599609375, 10.2032470703125, 10.510498046875, 10.8177490234375, 11.125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 10.0, 8.0, 10.0, 17.0, 25.0, 31.0, 51.0, 84.0, 79.0, 108.0, 122.0, 112.0, 98.0, 74.0, 48.0, 36.0, 30.0, 15.0, 13.0, 7.0, 4.0, 3.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.39254760742188, -139.79901123046875, -135.20547485351562, -130.6119384765625, -126.01839447021484, -121.42485809326172, -116.83131408691406, -112.23777770996094, -107.64424133300781, -103.05070495605469, -98.45716857910156, -93.8636245727539, -89.27008819580078, -84.67655181884766, -80.0830078125, -75.48947143554688, -70.89593505859375, -66.30239868164062, -61.708858489990234, -57.115318298339844, -52.52178192138672, -47.928245544433594, -43.3347053527832, -38.74116516113281, -34.14762878417969, -29.55409049987793, -24.960552215576172, -20.367013931274414, -15.773475646972656, -11.179937362670898, -6.586399078369141, -1.99285888671875, 2.600677490234375, 7.194215774536133, 11.78775405883789, 16.38129234313965, 20.974830627441406, 25.568368911743164, 30.161907196044922, 34.75544738769531, 39.34898376464844, 43.94252014160156, 48.53606033325195, 53.129600524902344, 57.72313690185547, 62.316673278808594, 66.91021728515625, 71.50375366210938, 76.0972900390625, 80.69082641601562, 85.28436279296875, 89.8779067993164, 94.47144317626953, 99.06497955322266, 103.65852355957031, 108.25205993652344, 112.84559631347656, 117.43913269042969, 122.03266906738281, 126.62621307373047, 131.21975708007812, 135.81329345703125, 140.40682983398438, 145.0003662109375, 149.59390258789062]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 10.0, 16.0, 11.0, 18.0, 25.0, 23.0, 27.0, 38.0, 35.0, 38.0, 59.0, 47.0, 48.0, 45.0, 47.0, 59.0, 58.0, 54.0, 47.0, 55.0, 31.0, 34.0, 35.0, 27.0, 25.0, 20.0, 14.0, 17.0, 9.0, 8.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.48682403564453, -53.96778106689453, -51.44873809814453, -48.92969512939453, -46.4106559753418, -43.8916130065918, -41.3725700378418, -38.85353088378906, -36.33448791503906, -33.81544494628906, -31.296403884887695, -28.777360916137695, -26.258319854736328, -23.739276885986328, -21.220233917236328, -18.70119285583496, -16.182147979736328, -13.663105964660645, -11.144063949584961, -8.625020980834961, -6.105978965759277, -3.5869369506835938, -1.0678939819335938, 1.4511470794677734, 3.9701900482177734, 6.489232063293457, 9.00827407836914, 11.52731704711914, 14.046359062194824, 16.565401077270508, 19.084444046020508, 21.603485107421875, 24.122528076171875, 26.641571044921875, 29.160612106323242, 31.679655075073242, 34.19869613647461, 36.71773910522461, 39.23678207397461, 41.755821228027344, 44.274864196777344, 46.793907165527344, 49.312950134277344, 51.831993103027344, 54.35103225708008, 56.87007522583008, 59.38911819458008, 61.90815734863281, 64.42720031738281, 66.94624328613281, 69.46528625488281, 71.98432922363281, 74.50337219238281, 77.02241516113281, 79.54145812988281, 82.06049346923828, 84.57954406738281, 87.09858703613281, 89.61763000488281, 92.13667297363281, 94.65571594238281, 97.17475891113281, 99.69380187988281, 102.21283721923828, 104.73188018798828]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 11.0, 15.0, 20.0, 34.0, 44.0, 59.0, 100.0, 239.0, 807.0, 3312.0, 16488.0, 107179.0, 3776436.0, 251306.0, 30063.0, 5822.0, 1465.0, 456.0, 179.0, 86.0, 37.0, 26.0, 25.0, 13.0, 16.0, 12.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-118.875, -115.6337890625, -112.392578125, -109.1513671875, -105.91015625, -102.6689453125, -99.427734375, -96.1865234375, -92.9453125, -89.7041015625, -86.462890625, -83.2216796875, -79.98046875, -76.7392578125, -73.498046875, -70.2568359375, -67.015625, -63.7744140625, -60.533203125, -57.2919921875, -54.05078125, -50.8095703125, -47.568359375, -44.3271484375, -41.0859375, -37.8447265625, -34.603515625, -31.3623046875, -28.12109375, -24.8798828125, -21.638671875, -18.3974609375, -15.15625, -11.9150390625, -8.673828125, -5.4326171875, -2.19140625, 1.0498046875, 4.291015625, 7.5322265625, 10.7734375, 14.0146484375, 17.255859375, 20.4970703125, 23.73828125, 26.9794921875, 30.220703125, 33.4619140625, 36.703125, 39.9443359375, 43.185546875, 46.4267578125, 49.66796875, 52.9091796875, 56.150390625, 59.3916015625, 62.6328125, 65.8740234375, 69.115234375, 72.3564453125, 75.59765625, 78.8388671875, 82.080078125, 85.3212890625, 88.5625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 7.0, 8.0, 15.0, 16.0, 29.0, 25.0, 36.0, 36.0, 31.0, 37.0, 44.0, 49.0, 58.0, 58.0, 73.0, 62.0, 44.0, 52.0, 56.0, 49.0, 35.0, 32.0, 28.0, 36.0, 17.0, 17.0, 14.0, 6.0, 5.0, 11.0, 4.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.818359375, -2.7413330078125, -2.664306640625, -2.5872802734375, -2.51025390625, -2.4332275390625, -2.356201171875, -2.2791748046875, -2.2021484375, -2.1251220703125, -2.048095703125, -1.9710693359375, -1.89404296875, -1.8170166015625, -1.739990234375, -1.6629638671875, -1.5859375, -1.5089111328125, -1.431884765625, -1.3548583984375, -1.27783203125, -1.2008056640625, -1.123779296875, -1.0467529296875, -0.9697265625, -0.8927001953125, -0.815673828125, -0.7386474609375, -0.66162109375, -0.5845947265625, -0.507568359375, -0.4305419921875, -0.353515625, -0.2764892578125, -0.199462890625, -0.1224365234375, -0.04541015625, 0.0316162109375, 0.108642578125, 0.1856689453125, 0.2626953125, 0.3397216796875, 0.416748046875, 0.4937744140625, 0.57080078125, 0.6478271484375, 0.724853515625, 0.8018798828125, 0.87890625, 0.9559326171875, 1.032958984375, 1.1099853515625, 1.18701171875, 1.2640380859375, 1.341064453125, 1.4180908203125, 1.4951171875, 1.5721435546875, 1.649169921875, 1.7261962890625, 1.80322265625, 1.8802490234375, 1.957275390625, 2.0343017578125, 2.111328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 16.0, 24.0, 43.0, 63.0, 160.0, 406.0, 1387.0, 5798.0, 29734.0, 217038.0, 3617014.0, 277750.0, 35670.0, 6740.0, 1556.0, 448.0, 166.0, 83.0, 51.0, 30.0, 29.0, 11.0, 15.0, 5.0, 6.0, 6.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.9375, -114.0537109375, -111.169921875, -108.2861328125, -105.40234375, -102.5185546875, -99.634765625, -96.7509765625, -93.8671875, -90.9833984375, -88.099609375, -85.2158203125, -82.33203125, -79.4482421875, -76.564453125, -73.6806640625, -70.796875, -67.9130859375, -65.029296875, -62.1455078125, -59.26171875, -56.3779296875, -53.494140625, -50.6103515625, -47.7265625, -44.8427734375, -41.958984375, -39.0751953125, -36.19140625, -33.3076171875, -30.423828125, -27.5400390625, -24.65625, -21.7724609375, -18.888671875, -16.0048828125, -13.12109375, -10.2373046875, -7.353515625, -4.4697265625, -1.5859375, 1.2978515625, 4.181640625, 7.0654296875, 9.94921875, 12.8330078125, 15.716796875, 18.6005859375, 21.484375, 24.3681640625, 27.251953125, 30.1357421875, 33.01953125, 35.9033203125, 38.787109375, 41.6708984375, 44.5546875, 47.4384765625, 50.322265625, 53.2060546875, 56.08984375, 58.9736328125, 61.857421875, 64.7412109375, 67.625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 8.0, 8.0, 8.0, 21.0, 12.0, 19.0, 30.0, 38.0, 30.0, 39.0, 85.0, 122.0, 170.0, 293.0, 822.0, 1391.0, 322.0, 174.0, 124.0, 94.0, 51.0, 55.0, 30.0, 33.0, 27.0, 22.0, 7.0, 8.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.68988037109375, -6.4227294921875, -6.15557861328125, -5.888427734375, -5.62127685546875, -5.3541259765625, -5.08697509765625, -4.81982421875, -4.55267333984375, -4.2855224609375, -4.01837158203125, -3.751220703125, -3.48406982421875, -3.2169189453125, -2.94976806640625, -2.6826171875, -2.41546630859375, -2.1483154296875, -1.88116455078125, -1.614013671875, -1.34686279296875, -1.0797119140625, -0.81256103515625, -0.54541015625, -0.27825927734375, -0.0111083984375, 0.25604248046875, 0.523193359375, 0.79034423828125, 1.0574951171875, 1.32464599609375, 1.591796875, 1.85894775390625, 2.1260986328125, 2.39324951171875, 2.660400390625, 2.92755126953125, 3.1947021484375, 3.46185302734375, 3.72900390625, 3.99615478515625, 4.2633056640625, 4.53045654296875, 4.797607421875, 5.06475830078125, 5.3319091796875, 5.59906005859375, 5.8662109375, 6.13336181640625, 6.4005126953125, 6.66766357421875, 6.934814453125, 7.20196533203125, 7.4691162109375, 7.73626708984375, 8.00341796875, 8.27056884765625, 8.5377197265625, 8.80487060546875, 9.072021484375, 9.33917236328125, 9.6063232421875, 9.87347412109375, 10.140625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 5.0, 10.0, 8.0, 32.0, 44.0, 77.0, 116.0, 151.0, 212.0, 144.0, 89.0, 49.0, 27.0, 21.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.19717407226562, -110.63522338867188, -107.07328033447266, -103.5113296508789, -99.94937896728516, -96.38743591308594, -92.82548522949219, -89.26353454589844, -85.70158386230469, -82.13963317871094, -78.57769012451172, -75.01573944091797, -71.45378875732422, -67.891845703125, -64.32989501953125, -60.7679443359375, -57.20600128173828, -53.6440544128418, -50.08210372924805, -46.52015686035156, -42.95820617675781, -39.39625930786133, -35.834312438964844, -32.272361755371094, -28.71041488647461, -25.148466110229492, -21.586517333984375, -18.02457046508789, -14.462621688842773, -10.900672912597656, -7.338726043701172, -3.7767772674560547, -0.2148284912109375, 3.3471198081970215, 6.9090681076049805, 10.471015930175781, 14.032964706420898, 17.594913482666016, 21.1568603515625, 24.718809127807617, 28.280757904052734, 31.84270668029785, 35.40465545654297, 38.96660232543945, 42.52854919433594, 46.09049987792969, 49.65244674682617, 53.214393615722656, 56.776344299316406, 60.33829116821289, 63.90024185180664, 67.46218872070312, 71.02413940429688, 74.58609008789062, 78.14803314208984, 81.7099838256836, 85.27192687988281, 88.83387756347656, 92.39582061767578, 95.95777130126953, 99.51972198486328, 103.0816650390625, 106.64361572265625, 110.20556640625, 113.76751708984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 6.0, 6.0, 10.0, 19.0, 17.0, 15.0, 22.0, 28.0, 28.0, 35.0, 29.0, 31.0, 41.0, 48.0, 46.0, 44.0, 57.0, 54.0, 41.0, 39.0, 42.0, 34.0, 44.0, 44.0, 39.0, 28.0, 26.0, 25.0, 26.0, 13.0, 9.0, 13.0, 14.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.62100601196289, -32.501705169677734, -31.382408142089844, -30.26310920715332, -29.143810272216797, -28.02450942993164, -26.905210494995117, -25.785911560058594, -24.66661262512207, -23.547313690185547, -22.428014755249023, -21.3087158203125, -20.189414978027344, -19.070117950439453, -17.950817108154297, -16.831518173217773, -15.71221923828125, -14.592920303344727, -13.473621368408203, -12.354321479797363, -11.23502254486084, -10.115723609924316, -8.996423721313477, -7.877124786376953, -6.75782585144043, -5.638526916503906, -4.519227504730225, -3.399928331375122, -2.2806291580200195, -1.161330223083496, -0.04203081130981445, 1.0772686004638672, 2.196563720703125, 3.3158628940582275, 4.43516206741333, 5.554461479187012, 6.673760414123535, 7.793059349060059, 8.912359237670898, 10.031658172607422, 11.150957107543945, 12.270256042480469, 13.389554977416992, 14.508854866027832, 15.628153800964355, 16.747451782226562, 17.86675262451172, 18.986051559448242, 20.105350494384766, 21.22464942932129, 22.343948364257812, 23.463247299194336, 24.58254623413086, 25.701847076416016, 26.82114601135254, 27.940444946289062, 29.059743881225586, 30.17904281616211, 31.298341751098633, 32.417640686035156, 33.53694152832031, 34.6562385559082, 35.77553939819336, 36.89483642578125, 38.014137268066406]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 5.0, 4.0, 9.0, 19.0, 13.0, 27.0, 18.0, 37.0, 51.0, 68.0, 147.0, 275.0, 437.0, 911.0, 1964.0, 4861.0, 12901.0, 39852.0, 126906.0, 373849.0, 325894.0, 107290.0, 33880.0, 11401.0, 4141.0, 1764.0, 810.0, 409.0, 247.0, 122.0, 76.0, 49.0, 37.0, 22.0, 17.0, 9.0, 7.0, 10.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-32.15625, -31.1796875, -30.203125, -29.2265625, -28.25, -27.2734375, -26.296875, -25.3203125, -24.34375, -23.3671875, -22.390625, -21.4140625, -20.4375, -19.4609375, -18.484375, -17.5078125, -16.53125, -15.5546875, -14.578125, -13.6015625, -12.625, -11.6484375, -10.671875, -9.6953125, -8.71875, -7.7421875, -6.765625, -5.7890625, -4.8125, -3.8359375, -2.859375, -1.8828125, -0.90625, 0.0703125, 1.046875, 2.0234375, 3.0, 3.9765625, 4.953125, 5.9296875, 6.90625, 7.8828125, 8.859375, 9.8359375, 10.8125, 11.7890625, 12.765625, 13.7421875, 14.71875, 15.6953125, 16.671875, 17.6484375, 18.625, 19.6015625, 20.578125, 21.5546875, 22.53125, 23.5078125, 24.484375, 25.4609375, 26.4375, 27.4140625, 28.390625, 29.3671875, 30.34375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 9.0, 15.0, 15.0, 18.0, 26.0, 41.0, 57.0, 57.0, 65.0, 76.0, 87.0, 101.0, 84.0, 68.0, 63.0, 62.0, 45.0, 36.0, 26.0, 15.0, 11.0, 10.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.080230712890625, -3.95733642578125, -3.834442138671875, -3.7115478515625, -3.588653564453125, -3.46575927734375, -3.342864990234375, -3.219970703125, -3.097076416015625, -2.97418212890625, -2.851287841796875, -2.7283935546875, -2.605499267578125, -2.48260498046875, -2.359710693359375, -2.23681640625, -2.113922119140625, -1.99102783203125, -1.868133544921875, -1.7452392578125, -1.622344970703125, -1.49945068359375, -1.376556396484375, -1.253662109375, -1.130767822265625, -1.00787353515625, -0.884979248046875, -0.7620849609375, -0.639190673828125, -0.51629638671875, -0.393402099609375, -0.2705078125, -0.147613525390625, -0.02471923828125, 0.098175048828125, 0.2210693359375, 0.343963623046875, 0.46685791015625, 0.589752197265625, 0.712646484375, 0.835540771484375, 0.95843505859375, 1.081329345703125, 1.2042236328125, 1.327117919921875, 1.45001220703125, 1.572906494140625, 1.69580078125, 1.818695068359375, 1.94158935546875, 2.064483642578125, 2.1873779296875, 2.310272216796875, 2.43316650390625, 2.556060791015625, 2.678955078125, 2.801849365234375, 2.92474365234375, 3.047637939453125, 3.1705322265625, 3.293426513671875, 3.41632080078125, 3.539215087890625, 3.662109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 8.0, 9.0, 11.0, 15.0, 25.0, 36.0, 53.0, 70.0, 100.0, 191.0, 271.0, 422.0, 757.0, 1656.0, 3490.0, 9226.0, 26804.0, 90307.0, 338525.0, 413021.0, 112209.0, 32567.0, 10656.0, 4064.0, 1835.0, 891.0, 515.0, 301.0, 172.0, 122.0, 75.0, 55.0, 34.0, 12.0, 21.0, 9.0, 5.0, 5.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-37.5625, -36.521484375, -35.48046875, -34.439453125, -33.3984375, -32.357421875, -31.31640625, -30.275390625, -29.234375, -28.193359375, -27.15234375, -26.111328125, -25.0703125, -24.029296875, -22.98828125, -21.947265625, -20.90625, -19.865234375, -18.82421875, -17.783203125, -16.7421875, -15.701171875, -14.66015625, -13.619140625, -12.578125, -11.537109375, -10.49609375, -9.455078125, -8.4140625, -7.373046875, -6.33203125, -5.291015625, -4.25, -3.208984375, -2.16796875, -1.126953125, -0.0859375, 0.955078125, 1.99609375, 3.037109375, 4.078125, 5.119140625, 6.16015625, 7.201171875, 8.2421875, 9.283203125, 10.32421875, 11.365234375, 12.40625, 13.447265625, 14.48828125, 15.529296875, 16.5703125, 17.611328125, 18.65234375, 19.693359375, 20.734375, 21.775390625, 22.81640625, 23.857421875, 24.8984375, 25.939453125, 26.98046875, 28.021484375, 29.0625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 9.0, 7.0, 13.0, 7.0, 19.0, 15.0, 21.0, 22.0, 21.0, 32.0, 29.0, 46.0, 42.0, 46.0, 54.0, 57.0, 62.0, 50.0, 52.0, 44.0, 59.0, 46.0, 40.0, 28.0, 33.0, 27.0, 22.0, 16.0, 27.0, 21.0, 13.0, 7.0, 9.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.34375, -11.8310546875, -11.318359375, -10.8056640625, -10.29296875, -9.7802734375, -9.267578125, -8.7548828125, -8.2421875, -7.7294921875, -7.216796875, -6.7041015625, -6.19140625, -5.6787109375, -5.166015625, -4.6533203125, -4.140625, -3.6279296875, -3.115234375, -2.6025390625, -2.08984375, -1.5771484375, -1.064453125, -0.5517578125, -0.0390625, 0.4736328125, 0.986328125, 1.4990234375, 2.01171875, 2.5244140625, 3.037109375, 3.5498046875, 4.0625, 4.5751953125, 5.087890625, 5.6005859375, 6.11328125, 6.6259765625, 7.138671875, 7.6513671875, 8.1640625, 8.6767578125, 9.189453125, 9.7021484375, 10.21484375, 10.7275390625, 11.240234375, 11.7529296875, 12.265625, 12.7783203125, 13.291015625, 13.8037109375, 14.31640625, 14.8291015625, 15.341796875, 15.8544921875, 16.3671875, 16.8798828125, 17.392578125, 17.9052734375, 18.41796875, 18.9306640625, 19.443359375, 19.9560546875, 20.46875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 6.0, 17.0, 36.0, 34.0, 53.0, 98.0, 149.0, 284.0, 497.0, 962.0, 1905.0, 4344.0, 11947.0, 51447.0, 419526.0, 477117.0, 58020.0, 13212.0, 4687.0, 2022.0, 936.0, 530.0, 279.0, 170.0, 90.0, 54.0, 30.0, 19.0, 24.0, 10.0, 4.0, 10.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-36.71875, -35.670654296875, -34.62255859375, -33.574462890625, -32.5263671875, -31.478271484375, -30.43017578125, -29.382080078125, -28.333984375, -27.285888671875, -26.23779296875, -25.189697265625, -24.1416015625, -23.093505859375, -22.04541015625, -20.997314453125, -19.94921875, -18.901123046875, -17.85302734375, -16.804931640625, -15.7568359375, -14.708740234375, -13.66064453125, -12.612548828125, -11.564453125, -10.516357421875, -9.46826171875, -8.420166015625, -7.3720703125, -6.323974609375, -5.27587890625, -4.227783203125, -3.1796875, -2.131591796875, -1.08349609375, -0.035400390625, 1.0126953125, 2.060791015625, 3.10888671875, 4.156982421875, 5.205078125, 6.253173828125, 7.30126953125, 8.349365234375, 9.3974609375, 10.445556640625, 11.49365234375, 12.541748046875, 13.58984375, 14.637939453125, 15.68603515625, 16.734130859375, 17.7822265625, 18.830322265625, 19.87841796875, 20.926513671875, 21.974609375, 23.022705078125, 24.07080078125, 25.118896484375, 26.1669921875, 27.215087890625, 28.26318359375, 29.311279296875, 30.359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 2.0, 17.0, 25.0, 68.0, 174.0, 309.0, 215.0, 84.0, 53.0, 18.0, 11.0, 8.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00970458984375, -0.009477376937866211, -0.009250164031982422, -0.009022951126098633, -0.008795738220214844, -0.008568525314331055, -0.008341312408447266, -0.008114099502563477, -0.007886886596679688, -0.0076596736907958984, -0.007432460784912109, -0.00720524787902832, -0.006978034973144531, -0.006750822067260742, -0.006523609161376953, -0.006296396255493164, -0.006069183349609375, -0.005841970443725586, -0.005614757537841797, -0.005387544631958008, -0.005160331726074219, -0.00493311882019043, -0.004705905914306641, -0.0044786930084228516, -0.0042514801025390625, -0.0040242671966552734, -0.0037970542907714844, -0.0035698413848876953, -0.0033426284790039062, -0.003115415573120117, -0.002888202667236328, -0.002660989761352539, -0.00243377685546875, -0.002206563949584961, -0.001979351043701172, -0.0017521381378173828, -0.0015249252319335938, -0.0012977123260498047, -0.0010704994201660156, -0.0008432865142822266, -0.0006160736083984375, -0.00038886070251464844, -0.00016164779663085938, 6.556510925292969e-05, 0.00029277801513671875, 0.0005199909210205078, 0.0007472038269042969, 0.0009744167327880859, 0.001201629638671875, 0.001428842544555664, 0.0016560554504394531, 0.0018832683563232422, 0.0021104812622070312, 0.0023376941680908203, 0.0025649070739746094, 0.0027921199798583984, 0.0030193328857421875, 0.0032465457916259766, 0.0034737586975097656, 0.0037009716033935547, 0.003928184509277344, 0.004155397415161133, 0.004382610321044922, 0.004609823226928711, 0.0048370361328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 8.0, 7.0, 16.0, 13.0, 23.0, 39.0, 58.0, 54.0, 124.0, 175.0, 295.0, 468.0, 769.0, 1392.0, 2870.0, 6549.0, 17591.0, 70880.0, 507869.0, 363691.0, 50922.0, 14052.0, 5340.0, 2393.0, 1259.0, 624.0, 395.0, 237.0, 136.0, 77.0, 59.0, 40.0, 28.0, 22.0, 20.0, 13.0, 12.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-32.03125, -30.9228515625, -29.814453125, -28.7060546875, -27.59765625, -26.4892578125, -25.380859375, -24.2724609375, -23.1640625, -22.0556640625, -20.947265625, -19.8388671875, -18.73046875, -17.6220703125, -16.513671875, -15.4052734375, -14.296875, -13.1884765625, -12.080078125, -10.9716796875, -9.86328125, -8.7548828125, -7.646484375, -6.5380859375, -5.4296875, -4.3212890625, -3.212890625, -2.1044921875, -0.99609375, 0.1123046875, 1.220703125, 2.3291015625, 3.4375, 4.5458984375, 5.654296875, 6.7626953125, 7.87109375, 8.9794921875, 10.087890625, 11.1962890625, 12.3046875, 13.4130859375, 14.521484375, 15.6298828125, 16.73828125, 17.8466796875, 18.955078125, 20.0634765625, 21.171875, 22.2802734375, 23.388671875, 24.4970703125, 25.60546875, 26.7138671875, 27.822265625, 28.9306640625, 30.0390625, 31.1474609375, 32.255859375, 33.3642578125, 34.47265625, 35.5810546875, 36.689453125, 37.7978515625, 38.90625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 2.0, 5.0, 6.0, 10.0, 17.0, 12.0, 19.0, 38.0, 43.0, 58.0, 94.0, 136.0, 127.0, 121.0, 114.0, 56.0, 33.0, 25.0, 21.0, 16.0, 14.0, 4.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.110595703125, -19.48681640625, -18.863037109375, -18.2392578125, -17.615478515625, -16.99169921875, -16.367919921875, -15.744140625, -15.120361328125, -14.49658203125, -13.872802734375, -13.2490234375, -12.625244140625, -12.00146484375, -11.377685546875, -10.75390625, -10.130126953125, -9.50634765625, -8.882568359375, -8.2587890625, -7.635009765625, -7.01123046875, -6.387451171875, -5.763671875, -5.139892578125, -4.51611328125, -3.892333984375, -3.2685546875, -2.644775390625, -2.02099609375, -1.397216796875, -0.7734375, -0.149658203125, 0.47412109375, 1.097900390625, 1.7216796875, 2.345458984375, 2.96923828125, 3.593017578125, 4.216796875, 4.840576171875, 5.46435546875, 6.088134765625, 6.7119140625, 7.335693359375, 7.95947265625, 8.583251953125, 9.20703125, 9.830810546875, 10.45458984375, 11.078369140625, 11.7021484375, 12.325927734375, 12.94970703125, 13.573486328125, 14.197265625, 14.821044921875, 15.44482421875, 16.068603515625, 16.6923828125, 17.316162109375, 17.93994140625, 18.563720703125, 19.1875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 9.0, 20.0, 69.0, 105.0, 213.0, 238.0, 187.0, 85.0, 34.0, 16.0, 4.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-286.85784912109375, -275.50750732421875, -264.1571350097656, -252.80679321289062, -241.45645141601562, -230.10609436035156, -218.7557373046875, -207.4053955078125, -196.05503845214844, -184.70468139648438, -173.35433959960938, -162.0039825439453, -150.65362548828125, -139.30328369140625, -127.95292663574219, -116.60257720947266, -105.25222778320312, -93.9018783569336, -82.55152893066406, -71.201171875, -59.85082244873047, -48.50047302246094, -37.150115966796875, -25.799766540527344, -14.449417114257812, -3.0990657806396484, 8.251285552978516, 19.601638793945312, 30.951988220214844, 42.302337646484375, 53.65269470214844, 65.00304412841797, 76.3533935546875, 87.70374298095703, 99.05409240722656, 110.40444946289062, 121.75479888916016, 133.1051483154297, 144.45550537109375, 155.80584716796875, 167.1562042236328, 178.50656127929688, 189.85690307617188, 201.20726013183594, 212.5576171875, 223.907958984375, 235.25831604003906, 246.60867309570312, 257.9590148925781, 269.3093566894531, 280.65972900390625, 292.01007080078125, 303.36041259765625, 314.71075439453125, 326.0611267089844, 337.4114685058594, 348.7618408203125, 360.1121826171875, 371.4625549316406, 382.8128967285156, 394.1632385253906, 405.51361083984375, 416.86395263671875, 428.21429443359375, 439.56463623046875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 8.0, 5.0, 7.0, 10.0, 17.0, 20.0, 29.0, 23.0, 26.0, 45.0, 37.0, 43.0, 44.0, 34.0, 68.0, 51.0, 66.0, 50.0, 54.0, 38.0, 44.0, 40.0, 51.0, 32.0, 31.0, 30.0, 23.0, 20.0, 12.0, 10.0, 5.0, 7.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.79647827148438, -115.7995376586914, -111.8025894165039, -107.80564880371094, -103.80870819091797, -99.811767578125, -95.8148193359375, -91.81787872314453, -87.82093811035156, -83.8239974975586, -79.8270492553711, -75.83010864257812, -71.83316802978516, -67.83622741699219, -63.83927917480469, -59.84233856201172, -55.84539031982422, -51.848445892333984, -47.851505279541016, -43.85456085205078, -39.85762023925781, -35.86067581176758, -31.863731384277344, -27.866788864135742, -23.86984634399414, -19.87290382385254, -15.875960350036621, -11.879016876220703, -7.882074356079102, -3.8851318359375, 0.11181259155273438, 4.108755111694336, 8.105697631835938, 12.102640151977539, 16.09958267211914, 20.096527099609375, 24.093469619750977, 28.090412139892578, 32.08735656738281, 36.08429718017578, 40.081241607666016, 44.07818603515625, 48.07512664794922, 52.07207107543945, 56.06901550292969, 60.065956115722656, 64.06289672851562, 68.05984497070312, 72.0567855834961, 76.05372619628906, 80.05067443847656, 84.04761505126953, 88.0445556640625, 92.04150390625, 96.03844451904297, 100.03538513183594, 104.03233337402344, 108.0292739868164, 112.0262222290039, 116.02316284179688, 120.02010345458984, 124.01704406738281, 128.0139923095703, 132.0109405517578, 136.00787353515625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 13.0, 15.0, 28.0, 43.0, 78.0, 230.0, 600.0, 1878.0, 7606.0, 44257.0, 3272968.0, 821891.0, 35696.0, 6314.0, 1649.0, 519.0, 226.0, 111.0, 63.0, 37.0, 18.0, 19.0, 8.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.625, -67.7939453125, -64.962890625, -62.1318359375, -59.30078125, -56.4697265625, -53.638671875, -50.8076171875, -47.9765625, -45.1455078125, -42.314453125, -39.4833984375, -36.65234375, -33.8212890625, -30.990234375, -28.1591796875, -25.328125, -22.4970703125, -19.666015625, -16.8349609375, -14.00390625, -11.1728515625, -8.341796875, -5.5107421875, -2.6796875, 0.1513671875, 2.982421875, 5.8134765625, 8.64453125, 11.4755859375, 14.306640625, 17.1376953125, 19.96875, 22.7998046875, 25.630859375, 28.4619140625, 31.29296875, 34.1240234375, 36.955078125, 39.7861328125, 42.6171875, 45.4482421875, 48.279296875, 51.1103515625, 53.94140625, 56.7724609375, 59.603515625, 62.4345703125, 65.265625, 68.0966796875, 70.927734375, 73.7587890625, 76.58984375, 79.4208984375, 82.251953125, 85.0830078125, 87.9140625, 90.7451171875, 93.576171875, 96.4072265625, 99.23828125, 102.0693359375, 104.900390625, 107.7314453125, 110.5625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 5.0, 4.0, 7.0, 14.0, 9.0, 19.0, 15.0, 31.0, 27.0, 38.0, 37.0, 46.0, 48.0, 61.0, 53.0, 70.0, 63.0, 62.0, 54.0, 58.0, 51.0, 44.0, 31.0, 33.0, 30.0, 21.0, 15.0, 9.0, 11.0, 5.0, 12.0, 3.0, 3.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.15057373046875, -3.0491943359375, -2.94781494140625, -2.846435546875, -2.74505615234375, -2.6436767578125, -2.54229736328125, -2.44091796875, -2.33953857421875, -2.2381591796875, -2.13677978515625, -2.035400390625, -1.93402099609375, -1.8326416015625, -1.73126220703125, -1.6298828125, -1.52850341796875, -1.4271240234375, -1.32574462890625, -1.224365234375, -1.12298583984375, -1.0216064453125, -0.92022705078125, -0.81884765625, -0.71746826171875, -0.6160888671875, -0.51470947265625, -0.413330078125, -0.31195068359375, -0.2105712890625, -0.10919189453125, -0.0078125, 0.09356689453125, 0.1949462890625, 0.29632568359375, 0.397705078125, 0.49908447265625, 0.6004638671875, 0.70184326171875, 0.80322265625, 0.90460205078125, 1.0059814453125, 1.10736083984375, 1.208740234375, 1.31011962890625, 1.4114990234375, 1.51287841796875, 1.6142578125, 1.71563720703125, 1.8170166015625, 1.91839599609375, 2.019775390625, 2.12115478515625, 2.2225341796875, 2.32391357421875, 2.42529296875, 2.52667236328125, 2.6280517578125, 2.72943115234375, 2.830810546875, 2.93218994140625, 3.0335693359375, 3.13494873046875, 3.236328125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 11.0, 5.0, 6.0, 19.0, 31.0, 31.0, 53.0, 80.0, 129.0, 215.0, 352.0, 531.0, 986.0, 1882.0, 3436.0, 6770.0, 15153.0, 36428.0, 101548.0, 406668.0, 3095974.0, 364709.0, 95448.0, 34534.0, 14695.0, 6934.0, 3371.0, 1787.0, 966.0, 609.0, 351.0, 208.0, 131.0, 74.0, 45.0, 32.0, 24.0, 16.0, 14.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.25, -32.193359375, -31.13671875, -30.080078125, -29.0234375, -27.966796875, -26.91015625, -25.853515625, -24.796875, -23.740234375, -22.68359375, -21.626953125, -20.5703125, -19.513671875, -18.45703125, -17.400390625, -16.34375, -15.287109375, -14.23046875, -13.173828125, -12.1171875, -11.060546875, -10.00390625, -8.947265625, -7.890625, -6.833984375, -5.77734375, -4.720703125, -3.6640625, -2.607421875, -1.55078125, -0.494140625, 0.5625, 1.619140625, 2.67578125, 3.732421875, 4.7890625, 5.845703125, 6.90234375, 7.958984375, 9.015625, 10.072265625, 11.12890625, 12.185546875, 13.2421875, 14.298828125, 15.35546875, 16.412109375, 17.46875, 18.525390625, 19.58203125, 20.638671875, 21.6953125, 22.751953125, 23.80859375, 24.865234375, 25.921875, 26.978515625, 28.03515625, 29.091796875, 30.1484375, 31.205078125, 32.26171875, 33.318359375, 34.375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 7.0, 6.0, 7.0, 6.0, 9.0, 11.0, 14.0, 19.0, 23.0, 38.0, 36.0, 46.0, 56.0, 64.0, 111.0, 183.0, 273.0, 622.0, 1337.0, 430.0, 203.0, 145.0, 90.0, 72.0, 42.0, 41.0, 33.0, 30.0, 24.0, 24.0, 14.0, 13.0, 6.0, 8.0, 9.0, 6.0, 1.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.95703125, -6.73419189453125, -6.5113525390625, -6.28851318359375, -6.065673828125, -5.84283447265625, -5.6199951171875, -5.39715576171875, -5.17431640625, -4.95147705078125, -4.7286376953125, -4.50579833984375, -4.282958984375, -4.06011962890625, -3.8372802734375, -3.61444091796875, -3.3916015625, -3.16876220703125, -2.9459228515625, -2.72308349609375, -2.500244140625, -2.27740478515625, -2.0545654296875, -1.83172607421875, -1.60888671875, -1.38604736328125, -1.1632080078125, -0.94036865234375, -0.717529296875, -0.49468994140625, -0.2718505859375, -0.04901123046875, 0.173828125, 0.39666748046875, 0.6195068359375, 0.84234619140625, 1.065185546875, 1.28802490234375, 1.5108642578125, 1.73370361328125, 1.95654296875, 2.17938232421875, 2.4022216796875, 2.62506103515625, 2.847900390625, 3.07073974609375, 3.2935791015625, 3.51641845703125, 3.7392578125, 3.96209716796875, 4.1849365234375, 4.40777587890625, 4.630615234375, 4.85345458984375, 5.0762939453125, 5.29913330078125, 5.52197265625, 5.74481201171875, 5.9676513671875, 6.19049072265625, 6.413330078125, 6.63616943359375, 6.8590087890625, 7.08184814453125, 7.3046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 7.0, 14.0, 21.0, 42.0, 74.0, 101.0, 154.0, 152.0, 151.0, 113.0, 65.0, 50.0, 25.0, 12.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.99539184570312, -88.19281005859375, -85.3902359008789, -82.58765411376953, -79.78507995605469, -76.98249816894531, -74.17991638183594, -71.3773422241211, -68.57476806640625, -65.77218627929688, -62.96961212158203, -60.167030334472656, -57.36445617675781, -54.56187438964844, -51.75929641723633, -48.95671844482422, -46.154136657714844, -43.351558685302734, -40.548980712890625, -37.74639892578125, -34.943824768066406, -32.14124298095703, -29.338665008544922, -26.536087036132812, -23.733509063720703, -20.930931091308594, -18.128353118896484, -15.325773239135742, -12.523195266723633, -9.720617294311523, -6.918037414550781, -4.115459442138672, -1.3128814697265625, 1.489696979522705, 4.292275428771973, 7.094854354858398, 9.897432327270508, 12.700010299682617, 15.50259017944336, 18.30516815185547, 21.107746124267578, 23.910324096679688, 26.712902069091797, 29.51548194885254, 32.31806182861328, 35.120635986328125, 37.9232177734375, 40.72579574584961, 43.52837371826172, 46.33095169067383, 49.13352966308594, 51.93611145019531, 54.738685607910156, 57.54126739501953, 60.34384536743164, 63.14642333984375, 65.94900512695312, 68.7515869140625, 71.55416107177734, 74.35674285888672, 77.15931701660156, 79.96189880371094, 82.76448059082031, 85.56705474853516, 88.36962890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 8.0, 8.0, 5.0, 11.0, 10.0, 24.0, 17.0, 27.0, 25.0, 31.0, 32.0, 28.0, 36.0, 46.0, 50.0, 48.0, 44.0, 44.0, 46.0, 59.0, 49.0, 44.0, 41.0, 34.0, 35.0, 37.0, 29.0, 27.0, 22.0, 15.0, 14.0, 9.0, 11.0, 9.0, 4.0, 9.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.064754486083984, -29.007160186767578, -27.949567794799805, -26.89197540283203, -25.834381103515625, -24.77678680419922, -23.719194412231445, -22.661602020263672, -21.604007720947266, -20.54641342163086, -19.488821029663086, -18.431228637695312, -17.373634338378906, -16.3160400390625, -15.258447647094727, -14.200854301452637, -13.143260955810547, -12.085667610168457, -11.028074264526367, -9.970480918884277, -8.912887573242188, -7.855294227600098, -6.797700881958008, -5.740107536315918, -4.682514190673828, -3.6249208450317383, -2.5673274993896484, -1.5097341537475586, -0.45214080810546875, 0.6054525375366211, 1.663045883178711, 2.720639228820801, 3.778228759765625, 4.835822105407715, 5.893415451049805, 6.9510087966918945, 8.008602142333984, 9.066195487976074, 10.123788833618164, 11.181382179260254, 12.238975524902344, 13.296568870544434, 14.354162216186523, 15.411755561828613, 16.469348907470703, 17.52694320678711, 18.584535598754883, 19.642127990722656, 20.699722290039062, 21.75731658935547, 22.814908981323242, 23.872501373291016, 24.930095672607422, 25.987689971923828, 27.0452823638916, 28.102874755859375, 29.16046905517578, 30.218063354492188, 31.27565574645996, 32.333248138427734, 33.39084243774414, 34.44843673706055, 35.50602722167969, 36.563621520996094, 37.6212158203125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 2.0, 11.0, 8.0, 13.0, 22.0, 30.0, 32.0, 39.0, 73.0, 119.0, 172.0, 219.0, 360.0, 595.0, 1027.0, 1896.0, 3733.0, 7884.0, 17781.0, 41341.0, 101300.0, 231960.0, 327225.0, 179791.0, 75092.0, 31258.0, 13550.0, 6243.0, 2963.0, 1516.0, 852.0, 478.0, 296.0, 214.0, 121.0, 95.0, 68.0, 48.0, 36.0, 26.0, 16.0, 13.0, 11.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.609375, -18.94091796875, -18.2724609375, -17.60400390625, -16.935546875, -16.26708984375, -15.5986328125, -14.93017578125, -14.26171875, -13.59326171875, -12.9248046875, -12.25634765625, -11.587890625, -10.91943359375, -10.2509765625, -9.58251953125, -8.9140625, -8.24560546875, -7.5771484375, -6.90869140625, -6.240234375, -5.57177734375, -4.9033203125, -4.23486328125, -3.56640625, -2.89794921875, -2.2294921875, -1.56103515625, -0.892578125, -0.22412109375, 0.4443359375, 1.11279296875, 1.78125, 2.44970703125, 3.1181640625, 3.78662109375, 4.455078125, 5.12353515625, 5.7919921875, 6.46044921875, 7.12890625, 7.79736328125, 8.4658203125, 9.13427734375, 9.802734375, 10.47119140625, 11.1396484375, 11.80810546875, 12.4765625, 13.14501953125, 13.8134765625, 14.48193359375, 15.150390625, 15.81884765625, 16.4873046875, 17.15576171875, 17.82421875, 18.49267578125, 19.1611328125, 19.82958984375, 20.498046875, 21.16650390625, 21.8349609375, 22.50341796875, 23.171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 12.0, 11.0, 17.0, 22.0, 22.0, 19.0, 37.0, 32.0, 55.0, 60.0, 75.0, 76.0, 81.0, 75.0, 77.0, 60.0, 68.0, 51.0, 40.0, 27.0, 20.0, 24.0, 9.0, 10.0, 4.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.90625, -3.7745361328125, -3.642822265625, -3.5111083984375, -3.37939453125, -3.2476806640625, -3.115966796875, -2.9842529296875, -2.8525390625, -2.7208251953125, -2.589111328125, -2.4573974609375, -2.32568359375, -2.1939697265625, -2.062255859375, -1.9305419921875, -1.798828125, -1.6671142578125, -1.535400390625, -1.4036865234375, -1.27197265625, -1.1402587890625, -1.008544921875, -0.8768310546875, -0.7451171875, -0.6134033203125, -0.481689453125, -0.3499755859375, -0.21826171875, -0.0865478515625, 0.045166015625, 0.1768798828125, 0.30859375, 0.4403076171875, 0.572021484375, 0.7037353515625, 0.83544921875, 0.9671630859375, 1.098876953125, 1.2305908203125, 1.3623046875, 1.4940185546875, 1.625732421875, 1.7574462890625, 1.88916015625, 2.0208740234375, 2.152587890625, 2.2843017578125, 2.416015625, 2.5477294921875, 2.679443359375, 2.8111572265625, 2.94287109375, 3.0745849609375, 3.206298828125, 3.3380126953125, 3.4697265625, 3.6014404296875, 3.733154296875, 3.8648681640625, 3.99658203125, 4.1282958984375, 4.260009765625, 4.3917236328125, 4.5234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 8.0, 16.0, 11.0, 10.0, 24.0, 31.0, 36.0, 50.0, 95.0, 115.0, 163.0, 235.0, 384.0, 583.0, 981.0, 1692.0, 3258.0, 6507.0, 14645.0, 33847.0, 80254.0, 180389.0, 300287.0, 229978.0, 110049.0, 46871.0, 19862.0, 8606.0, 4084.0, 2161.0, 1148.0, 746.0, 472.0, 282.0, 196.0, 134.0, 108.0, 77.0, 42.0, 33.0, 29.0, 16.0, 19.0, 11.0, 4.0, 3.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.039794921875, -15.51708984375, -14.994384765625, -14.4716796875, -13.948974609375, -13.42626953125, -12.903564453125, -12.380859375, -11.858154296875, -11.33544921875, -10.812744140625, -10.2900390625, -9.767333984375, -9.24462890625, -8.721923828125, -8.19921875, -7.676513671875, -7.15380859375, -6.631103515625, -6.1083984375, -5.585693359375, -5.06298828125, -4.540283203125, -4.017578125, -3.494873046875, -2.97216796875, -2.449462890625, -1.9267578125, -1.404052734375, -0.88134765625, -0.358642578125, 0.1640625, 0.686767578125, 1.20947265625, 1.732177734375, 2.2548828125, 2.777587890625, 3.30029296875, 3.822998046875, 4.345703125, 4.868408203125, 5.39111328125, 5.913818359375, 6.4365234375, 6.959228515625, 7.48193359375, 8.004638671875, 8.52734375, 9.050048828125, 9.57275390625, 10.095458984375, 10.6181640625, 11.140869140625, 11.66357421875, 12.186279296875, 12.708984375, 13.231689453125, 13.75439453125, 14.277099609375, 14.7998046875, 15.322509765625, 15.84521484375, 16.367919921875, 16.890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 7.0, 10.0, 9.0, 14.0, 14.0, 21.0, 27.0, 29.0, 23.0, 41.0, 34.0, 34.0, 43.0, 48.0, 48.0, 44.0, 59.0, 43.0, 57.0, 62.0, 49.0, 42.0, 38.0, 33.0, 33.0, 22.0, 16.0, 27.0, 17.0, 13.0, 8.0, 7.0, 5.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.640625, -13.166259765625, -12.69189453125, -12.217529296875, -11.7431640625, -11.268798828125, -10.79443359375, -10.320068359375, -9.845703125, -9.371337890625, -8.89697265625, -8.422607421875, -7.9482421875, -7.473876953125, -6.99951171875, -6.525146484375, -6.05078125, -5.576416015625, -5.10205078125, -4.627685546875, -4.1533203125, -3.678955078125, -3.20458984375, -2.730224609375, -2.255859375, -1.781494140625, -1.30712890625, -0.832763671875, -0.3583984375, 0.115966796875, 0.59033203125, 1.064697265625, 1.5390625, 2.013427734375, 2.48779296875, 2.962158203125, 3.4365234375, 3.910888671875, 4.38525390625, 4.859619140625, 5.333984375, 5.808349609375, 6.28271484375, 6.757080078125, 7.2314453125, 7.705810546875, 8.18017578125, 8.654541015625, 9.12890625, 9.603271484375, 10.07763671875, 10.552001953125, 11.0263671875, 11.500732421875, 11.97509765625, 12.449462890625, 12.923828125, 13.398193359375, 13.87255859375, 14.346923828125, 14.8212890625, 15.295654296875, 15.77001953125, 16.244384765625, 16.71875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 13.0, 16.0, 18.0, 34.0, 57.0, 87.0, 144.0, 275.0, 581.0, 1271.0, 3245.0, 9930.0, 40480.0, 224007.0, 550457.0, 172289.0, 32179.0, 8320.0, 2890.0, 1094.0, 523.0, 254.0, 147.0, 82.0, 45.0, 39.0, 19.0, 17.0, 7.0, 7.0, 8.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.046142578125, -13.58447265625, -13.122802734375, -12.6611328125, -12.199462890625, -11.73779296875, -11.276123046875, -10.814453125, -10.352783203125, -9.89111328125, -9.429443359375, -8.9677734375, -8.506103515625, -8.04443359375, -7.582763671875, -7.12109375, -6.659423828125, -6.19775390625, -5.736083984375, -5.2744140625, -4.812744140625, -4.35107421875, -3.889404296875, -3.427734375, -2.966064453125, -2.50439453125, -2.042724609375, -1.5810546875, -1.119384765625, -0.65771484375, -0.196044921875, 0.265625, 0.727294921875, 1.18896484375, 1.650634765625, 2.1123046875, 2.573974609375, 3.03564453125, 3.497314453125, 3.958984375, 4.420654296875, 4.88232421875, 5.343994140625, 5.8056640625, 6.267333984375, 6.72900390625, 7.190673828125, 7.65234375, 8.114013671875, 8.57568359375, 9.037353515625, 9.4990234375, 9.960693359375, 10.42236328125, 10.884033203125, 11.345703125, 11.807373046875, 12.26904296875, 12.730712890625, 13.1923828125, 13.654052734375, 14.11572265625, 14.577392578125, 15.0390625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 7.0, 5.0, 6.0, 20.0, 28.0, 38.0, 49.0, 44.0, 64.0, 88.0, 94.0, 111.0, 97.0, 74.0, 58.0, 45.0, 36.0, 27.0, 25.0, 27.0, 9.0, 11.0, 4.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016641616821289062, -0.001610592007637024, -0.0015570223331451416, -0.0015034526586532593, -0.001449882984161377, -0.0013963133096694946, -0.0013427436351776123, -0.00128917396068573, -0.0012356042861938477, -0.0011820346117019653, -0.001128464937210083, -0.0010748952627182007, -0.0010213255882263184, -0.000967755913734436, -0.0009141862392425537, -0.0008606165647506714, -0.0008070468902587891, -0.0007534772157669067, -0.0006999075412750244, -0.0006463378667831421, -0.0005927681922912598, -0.0005391985177993774, -0.0004856288433074951, -0.0004320591688156128, -0.00037848949432373047, -0.00032491981983184814, -0.0002713501453399658, -0.0002177804708480835, -0.00016421079635620117, -0.00011064112186431885, -5.7071447372436523e-05, -3.5017728805541992e-06, 5.0067901611328125e-05, 0.00010363757610321045, 0.00015720725059509277, 0.0002107769250869751, 0.0002643465995788574, 0.00031791627407073975, 0.00037148594856262207, 0.0004250556230545044, 0.0004786252975463867, 0.000532194972038269, 0.0005857646465301514, 0.0006393343210220337, 0.000692903995513916, 0.0007464736700057983, 0.0008000433444976807, 0.000853613018989563, 0.0009071826934814453, 0.0009607523679733276, 0.00101432204246521, 0.0010678917169570923, 0.0011214613914489746, 0.001175031065940857, 0.0012286007404327393, 0.0012821704149246216, 0.001335740089416504, 0.0013893097639083862, 0.0014428794384002686, 0.0014964491128921509, 0.0015500187873840332, 0.0016035884618759155, 0.0016571581363677979, 0.0017107278108596802, 0.0017642974853515625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 15.0, 20.0, 17.0, 26.0, 31.0, 84.0, 92.0, 161.0, 261.0, 414.0, 702.0, 1211.0, 2203.0, 4489.0, 10704.0, 32470.0, 133760.0, 464620.0, 297539.0, 66883.0, 18666.0, 6909.0, 3185.0, 1618.0, 970.0, 556.0, 347.0, 204.0, 109.0, 82.0, 62.0, 36.0, 39.0, 24.0, 9.0, 4.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1796875, -12.7513427734375, -12.322998046875, -11.8946533203125, -11.46630859375, -11.0379638671875, -10.609619140625, -10.1812744140625, -9.7529296875, -9.3245849609375, -8.896240234375, -8.4678955078125, -8.03955078125, -7.6112060546875, -7.182861328125, -6.7545166015625, -6.326171875, -5.8978271484375, -5.469482421875, -5.0411376953125, -4.61279296875, -4.1844482421875, -3.756103515625, -3.3277587890625, -2.8994140625, -2.4710693359375, -2.042724609375, -1.6143798828125, -1.18603515625, -0.7576904296875, -0.329345703125, 0.0989990234375, 0.52734375, 0.9556884765625, 1.384033203125, 1.8123779296875, 2.24072265625, 2.6690673828125, 3.097412109375, 3.5257568359375, 3.9541015625, 4.3824462890625, 4.810791015625, 5.2391357421875, 5.66748046875, 6.0958251953125, 6.524169921875, 6.9525146484375, 7.380859375, 7.8092041015625, 8.237548828125, 8.6658935546875, 9.09423828125, 9.5225830078125, 9.950927734375, 10.3792724609375, 10.8076171875, 11.2359619140625, 11.664306640625, 12.0926513671875, 12.52099609375, 12.9493408203125, 13.377685546875, 13.8060302734375, 14.234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 9.0, 10.0, 11.0, 22.0, 26.0, 28.0, 39.0, 53.0, 58.0, 91.0, 84.0, 70.0, 84.0, 70.0, 68.0, 56.0, 43.0, 31.0, 34.0, 24.0, 24.0, 9.0, 10.0, 9.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.2734375, -8.02020263671875, -7.7669677734375, -7.51373291015625, -7.260498046875, -7.00726318359375, -6.7540283203125, -6.50079345703125, -6.24755859375, -5.99432373046875, -5.7410888671875, -5.48785400390625, -5.234619140625, -4.98138427734375, -4.7281494140625, -4.47491455078125, -4.2216796875, -3.96844482421875, -3.7152099609375, -3.46197509765625, -3.208740234375, -2.95550537109375, -2.7022705078125, -2.44903564453125, -2.19580078125, -1.94256591796875, -1.6893310546875, -1.43609619140625, -1.182861328125, -0.92962646484375, -0.6763916015625, -0.42315673828125, -0.169921875, 0.08331298828125, 0.3365478515625, 0.58978271484375, 0.843017578125, 1.09625244140625, 1.3494873046875, 1.60272216796875, 1.85595703125, 2.10919189453125, 2.3624267578125, 2.61566162109375, 2.868896484375, 3.12213134765625, 3.3753662109375, 3.62860107421875, 3.8818359375, 4.13507080078125, 4.3883056640625, 4.64154052734375, 4.894775390625, 5.14801025390625, 5.4012451171875, 5.65447998046875, 5.90771484375, 6.16094970703125, 6.4141845703125, 6.66741943359375, 6.920654296875, 7.17388916015625, 7.4271240234375, 7.68035888671875, 7.93359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 11.0, 11.0, 16.0, 37.0, 65.0, 82.0, 131.0, 134.0, 136.0, 133.0, 83.0, 61.0, 35.0, 24.0, 17.0, 7.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-231.2439422607422, -225.8752899169922, -220.50665283203125, -215.13800048828125, -209.76934814453125, -204.40069580078125, -199.03204345703125, -193.6634063720703, -188.2947540283203, -182.9261016845703, -177.55746459960938, -172.18881225585938, -166.82015991210938, -161.45150756835938, -156.08285522460938, -150.71421813964844, -145.34556579589844, -139.97691345214844, -134.6082763671875, -129.2396240234375, -123.8709716796875, -118.5023193359375, -113.13367462158203, -107.76502990722656, -102.39637756347656, -97.02772521972656, -91.6590805053711, -86.29043579101562, -80.92178344726562, -75.55313110351562, -70.18448638916016, -64.81584167480469, -59.44718933105469, -54.07854080200195, -48.70989227294922, -43.341243743896484, -37.97259521484375, -32.603946685791016, -27.23529815673828, -21.866649627685547, -16.498001098632812, -11.129352569580078, -5.760704040527344, -0.3920555114746094, 4.976593017578125, 10.34524154663086, 15.713890075683594, 21.082538604736328, 26.451187133789062, 31.819835662841797, 37.18848419189453, 42.557132720947266, 47.92578125, 53.294429779052734, 58.66307830810547, 64.03172302246094, 69.40037536621094, 74.76902770996094, 80.1376724243164, 85.50631713867188, 90.87496948242188, 96.24362182617188, 101.61226654052734, 106.98091125488281, 112.34956359863281]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 6.0, 9.0, 7.0, 15.0, 11.0, 22.0, 26.0, 32.0, 39.0, 36.0, 46.0, 45.0, 59.0, 69.0, 55.0, 61.0, 48.0, 51.0, 57.0, 48.0, 40.0, 34.0, 40.0, 31.0, 25.0, 22.0, 19.0, 13.0, 12.0, 10.0, 5.0, 1.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-124.23015594482422, -120.9374771118164, -117.6447982788086, -114.35211944580078, -111.05944061279297, -107.76676177978516, -104.47407531738281, -101.181396484375, -97.88871765136719, -94.59603881835938, -91.30335998535156, -88.01068115234375, -84.71800231933594, -81.42532348632812, -78.13264465332031, -74.8399658203125, -71.54728698730469, -68.25460815429688, -64.96192932128906, -61.66925048828125, -58.37657165527344, -55.083892822265625, -51.79121017456055, -48.498531341552734, -45.20585250854492, -41.91317367553711, -38.6204948425293, -35.32781219482422, -32.035133361816406, -28.742456436157227, -25.44977569580078, -22.15709686279297, -18.864425659179688, -15.571746826171875, -12.279067039489746, -8.986387252807617, -5.693708419799805, -2.401029586791992, 0.8916511535644531, 4.184329986572266, 7.477008819580078, 10.76968765258789, 14.06236743927002, 17.35504722595215, 20.64772605895996, 23.940404891967773, 27.23308563232422, 30.52576446533203, 33.818443298339844, 37.111122131347656, 40.40380096435547, 43.69647979736328, 46.989158630371094, 50.281837463378906, 53.574520111083984, 56.8671989440918, 60.15987777709961, 63.45255661010742, 66.7452392578125, 70.03791809082031, 73.33059692382812, 76.62327575683594, 79.91595458984375, 83.20863342285156, 86.50131225585938]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 7.0, 8.0, 10.0, 28.0, 19.0, 30.0, 49.0, 77.0, 106.0, 169.0, 343.0, 583.0, 1349.0, 3243.0, 9946.0, 40609.0, 420549.0, 3616919.0, 76118.0, 15792.0, 4705.0, 1756.0, 798.0, 409.0, 220.0, 132.0, 87.0, 49.0, 44.0, 26.0, 24.0, 20.0, 15.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-53.21875, -51.61474609375, -50.0107421875, -48.40673828125, -46.802734375, -45.19873046875, -43.5947265625, -41.99072265625, -40.38671875, -38.78271484375, -37.1787109375, -35.57470703125, -33.970703125, -32.36669921875, -30.7626953125, -29.15869140625, -27.5546875, -25.95068359375, -24.3466796875, -22.74267578125, -21.138671875, -19.53466796875, -17.9306640625, -16.32666015625, -14.72265625, -13.11865234375, -11.5146484375, -9.91064453125, -8.306640625, -6.70263671875, -5.0986328125, -3.49462890625, -1.890625, -0.28662109375, 1.3173828125, 2.92138671875, 4.525390625, 6.12939453125, 7.7333984375, 9.33740234375, 10.94140625, 12.54541015625, 14.1494140625, 15.75341796875, 17.357421875, 18.96142578125, 20.5654296875, 22.16943359375, 23.7734375, 25.37744140625, 26.9814453125, 28.58544921875, 30.189453125, 31.79345703125, 33.3974609375, 35.00146484375, 36.60546875, 38.20947265625, 39.8134765625, 41.41748046875, 43.021484375, 44.62548828125, 46.2294921875, 47.83349609375, 49.4375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 10.0, 9.0, 12.0, 13.0, 18.0, 25.0, 25.0, 23.0, 35.0, 57.0, 55.0, 66.0, 53.0, 71.0, 66.0, 72.0, 76.0, 46.0, 72.0, 45.0, 29.0, 26.0, 29.0, 13.0, 7.0, 14.0, 3.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.482421875, -3.366790771484375, -3.25115966796875, -3.135528564453125, -3.0198974609375, -2.904266357421875, -2.78863525390625, -2.673004150390625, -2.557373046875, -2.441741943359375, -2.32611083984375, -2.210479736328125, -2.0948486328125, -1.979217529296875, -1.86358642578125, -1.747955322265625, -1.63232421875, -1.516693115234375, -1.40106201171875, -1.285430908203125, -1.1697998046875, -1.054168701171875, -0.93853759765625, -0.822906494140625, -0.707275390625, -0.591644287109375, -0.47601318359375, -0.360382080078125, -0.2447509765625, -0.129119873046875, -0.01348876953125, 0.102142333984375, 0.2177734375, 0.333404541015625, 0.44903564453125, 0.564666748046875, 0.6802978515625, 0.795928955078125, 0.91156005859375, 1.027191162109375, 1.142822265625, 1.258453369140625, 1.37408447265625, 1.489715576171875, 1.6053466796875, 1.720977783203125, 1.83660888671875, 1.952239990234375, 2.06787109375, 2.183502197265625, 2.29913330078125, 2.414764404296875, 2.5303955078125, 2.646026611328125, 2.76165771484375, 2.877288818359375, 2.992919921875, 3.108551025390625, 3.22418212890625, 3.339813232421875, 3.4554443359375, 3.571075439453125, 3.68670654296875, 3.802337646484375, 3.91796875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 6.0, 3.0, 6.0, 12.0, 17.0, 14.0, 29.0, 33.0, 67.0, 82.0, 108.0, 204.0, 307.0, 523.0, 933.0, 1670.0, 3203.0, 7082.0, 18120.0, 55877.0, 235414.0, 3165374.0, 562807.0, 95182.0, 28066.0, 10040.0, 4168.0, 2118.0, 1047.0, 654.0, 398.0, 241.0, 152.0, 81.0, 60.0, 43.0, 29.0, 34.0, 23.0, 15.0, 6.0, 14.0, 7.0, 9.0, 3.0, 3.0, 2.0], "bins": [-34.46875, -33.578369140625, -32.68798828125, -31.797607421875, -30.9072265625, -30.016845703125, -29.12646484375, -28.236083984375, -27.345703125, -26.455322265625, -25.56494140625, -24.674560546875, -23.7841796875, -22.893798828125, -22.00341796875, -21.113037109375, -20.22265625, -19.332275390625, -18.44189453125, -17.551513671875, -16.6611328125, -15.770751953125, -14.88037109375, -13.989990234375, -13.099609375, -12.209228515625, -11.31884765625, -10.428466796875, -9.5380859375, -8.647705078125, -7.75732421875, -6.866943359375, -5.9765625, -5.086181640625, -4.19580078125, -3.305419921875, -2.4150390625, -1.524658203125, -0.63427734375, 0.256103515625, 1.146484375, 2.036865234375, 2.92724609375, 3.817626953125, 4.7080078125, 5.598388671875, 6.48876953125, 7.379150390625, 8.26953125, 9.159912109375, 10.05029296875, 10.940673828125, 11.8310546875, 12.721435546875, 13.61181640625, 14.502197265625, 15.392578125, 16.282958984375, 17.17333984375, 18.063720703125, 18.9541015625, 19.844482421875, 20.73486328125, 21.625244140625, 22.515625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 8.0, 10.0, 15.0, 18.0, 23.0, 46.0, 45.0, 60.0, 109.0, 129.0, 224.0, 408.0, 1477.0, 679.0, 274.0, 176.0, 112.0, 66.0, 47.0, 34.0, 26.0, 17.0, 14.0, 9.0, 10.0, 10.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.05859375, -6.84283447265625, -6.6270751953125, -6.41131591796875, -6.195556640625, -5.97979736328125, -5.7640380859375, -5.54827880859375, -5.33251953125, -5.11676025390625, -4.9010009765625, -4.68524169921875, -4.469482421875, -4.25372314453125, -4.0379638671875, -3.82220458984375, -3.6064453125, -3.39068603515625, -3.1749267578125, -2.95916748046875, -2.743408203125, -2.52764892578125, -2.3118896484375, -2.09613037109375, -1.88037109375, -1.66461181640625, -1.4488525390625, -1.23309326171875, -1.017333984375, -0.80157470703125, -0.5858154296875, -0.37005615234375, -0.154296875, 0.06146240234375, 0.2772216796875, 0.49298095703125, 0.708740234375, 0.92449951171875, 1.1402587890625, 1.35601806640625, 1.57177734375, 1.78753662109375, 2.0032958984375, 2.21905517578125, 2.434814453125, 2.65057373046875, 2.8663330078125, 3.08209228515625, 3.2978515625, 3.51361083984375, 3.7293701171875, 3.94512939453125, 4.160888671875, 4.37664794921875, 4.5924072265625, 4.80816650390625, 5.02392578125, 5.23968505859375, 5.4554443359375, 5.67120361328125, 5.886962890625, 6.10272216796875, 6.3184814453125, 6.53424072265625, 6.75]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 8.0, 11.0, 18.0, 25.0, 49.0, 83.0, 115.0, 168.0, 155.0, 136.0, 88.0, 76.0, 36.0, 23.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.60932540893555, -40.41290283203125, -38.21647644042969, -36.02005386352539, -33.823631286621094, -31.627206802368164, -29.430782318115234, -27.234359741210938, -25.037935256958008, -22.841510772705078, -20.64508819580078, -18.44866371154785, -16.252239227294922, -14.055816650390625, -11.859392166137695, -9.662968635559082, -7.466545104980469, -5.2701215744018555, -3.073697566986084, -0.8772735595703125, 1.3191499710083008, 3.515573501586914, 5.711997985839844, 7.908421516418457, 10.10484504699707, 12.301268577575684, 14.497692108154297, 16.694116592407227, 18.890541076660156, 21.086963653564453, 23.283388137817383, 25.479812622070312, 27.676231384277344, 29.872655868530273, 32.0690803527832, 34.2655029296875, 36.4619255065918, 38.658348083496094, 40.854774475097656, 43.05119705200195, 45.24761962890625, 47.44404220581055, 49.64046859741211, 51.836891174316406, 54.0333137512207, 56.229736328125, 58.42616271972656, 60.62258529663086, 62.81901168823242, 65.01543426513672, 67.21186065673828, 69.40827941894531, 71.60470581054688, 73.80113220214844, 75.99755859375, 78.19397735595703, 80.3904037475586, 82.58683013916016, 84.78324890136719, 86.97967529296875, 89.17610168457031, 91.37252044677734, 93.5689468383789, 95.76537322998047, 97.9617919921875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 9.0, 9.0, 7.0, 8.0, 10.0, 23.0, 16.0, 13.0, 25.0, 30.0, 31.0, 30.0, 23.0, 36.0, 41.0, 42.0, 41.0, 33.0, 42.0, 57.0, 49.0, 49.0, 39.0, 29.0, 33.0, 40.0, 34.0, 34.0, 17.0, 33.0, 19.0, 13.0, 13.0, 18.0, 7.0, 10.0, 12.0, 10.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-24.85400390625, -24.11969757080078, -23.38538932800293, -22.65108299255371, -21.91677474975586, -21.18246841430664, -20.448162078857422, -19.71385383605957, -18.97954750061035, -18.245241165161133, -17.51093292236328, -16.776626586914062, -16.04231834411621, -15.308012008666992, -14.573704719543457, -13.839397430419922, -13.105090141296387, -12.370782852172852, -11.636475563049316, -10.902168273925781, -10.167861938476562, -9.433554649353027, -8.699247360229492, -7.964940547943115, -7.23063325881958, -6.496325969696045, -5.762019157409668, -5.027711868286133, -4.293404579162598, -3.5590977668762207, -2.8247904777526855, -2.0904836654663086, -1.3561763763427734, -0.6218692660331726, 0.11243784427642822, 0.8467450141906738, 1.5810520648956299, 2.315359115600586, 3.049666404724121, 3.783973217010498, 4.518280506134033, 5.252587795257568, 5.986894607543945, 6.7212018966674805, 7.455509185791016, 8.189815521240234, 8.924123764038086, 9.658430099487305, 10.39273738861084, 11.127044677734375, 11.86135196685791, 12.595659255981445, 13.329965591430664, 14.0642728805542, 14.798580169677734, 15.532886505126953, 16.267194747924805, 17.001501083374023, 17.735809326171875, 18.470115661621094, 19.204423904418945, 19.938730239868164, 20.673038482666016, 21.407344818115234, 22.141651153564453]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 14.0, 15.0, 10.0, 26.0, 31.0, 35.0, 67.0, 61.0, 118.0, 211.0, 319.0, 512.0, 977.0, 1855.0, 3951.0, 9469.0, 25275.0, 74204.0, 227009.0, 412822.0, 192014.0, 62129.0, 21788.0, 8218.0, 3551.0, 1646.0, 845.0, 502.0, 302.0, 193.0, 137.0, 74.0, 58.0, 41.0, 24.0, 17.0, 13.0, 5.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.062255859375, -20.26513671875, -19.468017578125, -18.6708984375, -17.873779296875, -17.07666015625, -16.279541015625, -15.482421875, -14.685302734375, -13.88818359375, -13.091064453125, -12.2939453125, -11.496826171875, -10.69970703125, -9.902587890625, -9.10546875, -8.308349609375, -7.51123046875, -6.714111328125, -5.9169921875, -5.119873046875, -4.32275390625, -3.525634765625, -2.728515625, -1.931396484375, -1.13427734375, -0.337158203125, 0.4599609375, 1.257080078125, 2.05419921875, 2.851318359375, 3.6484375, 4.445556640625, 5.24267578125, 6.039794921875, 6.8369140625, 7.634033203125, 8.43115234375, 9.228271484375, 10.025390625, 10.822509765625, 11.61962890625, 12.416748046875, 13.2138671875, 14.010986328125, 14.80810546875, 15.605224609375, 16.40234375, 17.199462890625, 17.99658203125, 18.793701171875, 19.5908203125, 20.387939453125, 21.18505859375, 21.982177734375, 22.779296875, 23.576416015625, 24.37353515625, 25.170654296875, 25.9677734375, 26.764892578125, 27.56201171875, 28.359130859375, 29.15625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 20.0, 12.0, 15.0, 21.0, 32.0, 28.0, 33.0, 43.0, 51.0, 55.0, 54.0, 56.0, 64.0, 57.0, 66.0, 54.0, 57.0, 59.0, 41.0, 45.0, 28.0, 23.0, 10.0, 11.0, 7.0, 10.0, 7.0, 3.0, 2.0, 3.0, 5.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.23828125, -3.12921142578125, -3.0201416015625, -2.91107177734375, -2.802001953125, -2.69293212890625, -2.5838623046875, -2.47479248046875, -2.36572265625, -2.25665283203125, -2.1475830078125, -2.03851318359375, -1.929443359375, -1.82037353515625, -1.7113037109375, -1.60223388671875, -1.4931640625, -1.38409423828125, -1.2750244140625, -1.16595458984375, -1.056884765625, -0.94781494140625, -0.8387451171875, -0.72967529296875, -0.62060546875, -0.51153564453125, -0.4024658203125, -0.29339599609375, -0.184326171875, -0.07525634765625, 0.0338134765625, 0.14288330078125, 0.251953125, 0.36102294921875, 0.4700927734375, 0.57916259765625, 0.688232421875, 0.79730224609375, 0.9063720703125, 1.01544189453125, 1.12451171875, 1.23358154296875, 1.3426513671875, 1.45172119140625, 1.560791015625, 1.66986083984375, 1.7789306640625, 1.88800048828125, 1.9970703125, 2.10614013671875, 2.2152099609375, 2.32427978515625, 2.433349609375, 2.54241943359375, 2.6514892578125, 2.76055908203125, 2.86962890625, 2.97869873046875, 3.0877685546875, 3.19683837890625, 3.305908203125, 3.41497802734375, 3.5240478515625, 3.63311767578125, 3.7421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 15.0, 17.0, 9.0, 30.0, 35.0, 49.0, 77.0, 113.0, 144.0, 229.0, 332.0, 558.0, 942.0, 1698.0, 3144.0, 6540.0, 14856.0, 35924.0, 88962.0, 204667.0, 319750.0, 211072.0, 92381.0, 37334.0, 15427.0, 6771.0, 3195.0, 1716.0, 903.0, 539.0, 347.0, 258.0, 168.0, 107.0, 68.0, 38.0, 51.0, 29.0, 14.0, 8.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.625, -16.1290283203125, -15.633056640625, -15.1370849609375, -14.64111328125, -14.1451416015625, -13.649169921875, -13.1531982421875, -12.6572265625, -12.1612548828125, -11.665283203125, -11.1693115234375, -10.67333984375, -10.1773681640625, -9.681396484375, -9.1854248046875, -8.689453125, -8.1934814453125, -7.697509765625, -7.2015380859375, -6.70556640625, -6.2095947265625, -5.713623046875, -5.2176513671875, -4.7216796875, -4.2257080078125, -3.729736328125, -3.2337646484375, -2.73779296875, -2.2418212890625, -1.745849609375, -1.2498779296875, -0.75390625, -0.2579345703125, 0.238037109375, 0.7340087890625, 1.22998046875, 1.7259521484375, 2.221923828125, 2.7178955078125, 3.2138671875, 3.7098388671875, 4.205810546875, 4.7017822265625, 5.19775390625, 5.6937255859375, 6.189697265625, 6.6856689453125, 7.181640625, 7.6776123046875, 8.173583984375, 8.6695556640625, 9.16552734375, 9.6614990234375, 10.157470703125, 10.6534423828125, 11.1494140625, 11.6453857421875, 12.141357421875, 12.6373291015625, 13.13330078125, 13.6292724609375, 14.125244140625, 14.6212158203125, 15.1171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 6.0, 14.0, 12.0, 18.0, 16.0, 17.0, 16.0, 38.0, 29.0, 39.0, 37.0, 30.0, 40.0, 37.0, 39.0, 42.0, 50.0, 51.0, 44.0, 49.0, 32.0, 53.0, 32.0, 42.0, 39.0, 34.0, 23.0, 25.0, 14.0, 13.0, 10.0, 5.0, 8.0, 6.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.20458984375, -11.7763671875, -11.34814453125, -10.919921875, -10.49169921875, -10.0634765625, -9.63525390625, -9.20703125, -8.77880859375, -8.3505859375, -7.92236328125, -7.494140625, -7.06591796875, -6.6376953125, -6.20947265625, -5.78125, -5.35302734375, -4.9248046875, -4.49658203125, -4.068359375, -3.64013671875, -3.2119140625, -2.78369140625, -2.35546875, -1.92724609375, -1.4990234375, -1.07080078125, -0.642578125, -0.21435546875, 0.2138671875, 0.64208984375, 1.0703125, 1.49853515625, 1.9267578125, 2.35498046875, 2.783203125, 3.21142578125, 3.6396484375, 4.06787109375, 4.49609375, 4.92431640625, 5.3525390625, 5.78076171875, 6.208984375, 6.63720703125, 7.0654296875, 7.49365234375, 7.921875, 8.35009765625, 8.7783203125, 9.20654296875, 9.634765625, 10.06298828125, 10.4912109375, 10.91943359375, 11.34765625, 11.77587890625, 12.2041015625, 12.63232421875, 13.060546875, 13.48876953125, 13.9169921875, 14.34521484375, 14.7734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 4.0, 14.0, 11.0, 15.0, 26.0, 36.0, 60.0, 125.0, 183.0, 327.0, 547.0, 997.0, 2197.0, 5262.0, 14460.0, 50433.0, 218781.0, 502503.0, 187145.0, 43990.0, 12635.0, 4474.0, 2075.0, 984.0, 520.0, 287.0, 173.0, 94.0, 76.0, 48.0, 13.0, 14.0, 18.0, 10.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.6484375, -12.28125, -11.9140625, -11.546875, -11.1796875, -10.8125, -10.4453125, -10.078125, -9.7109375, -9.34375, -8.9765625, -8.609375, -8.2421875, -7.875, -7.5078125, -7.140625, -6.7734375, -6.40625, -6.0390625, -5.671875, -5.3046875, -4.9375, -4.5703125, -4.203125, -3.8359375, -3.46875, -3.1015625, -2.734375, -2.3671875, -2.0, -1.6328125, -1.265625, -0.8984375, -0.53125, -0.1640625, 0.203125, 0.5703125, 0.9375, 1.3046875, 1.671875, 2.0390625, 2.40625, 2.7734375, 3.140625, 3.5078125, 3.875, 4.2421875, 4.609375, 4.9765625, 5.34375, 5.7109375, 6.078125, 6.4453125, 6.8125, 7.1796875, 7.546875, 7.9140625, 8.28125, 8.6484375, 9.015625, 9.3828125, 9.75, 10.1171875, 10.484375, 10.8515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 16.0, 32.0, 38.0, 57.0, 117.0, 153.0, 216.0, 147.0, 86.0, 40.0, 29.0, 18.0, 15.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003940582275390625, -0.0038427412509918213, -0.0037449002265930176, -0.003647059202194214, -0.00354921817779541, -0.0034513771533966064, -0.0033535361289978027, -0.003255695104598999, -0.0031578540802001953, -0.0030600130558013916, -0.002962172031402588, -0.002864331007003784, -0.0027664899826049805, -0.0026686489582061768, -0.002570807933807373, -0.0024729669094085693, -0.0023751258850097656, -0.002277284860610962, -0.002179443836212158, -0.0020816028118133545, -0.0019837617874145508, -0.001885920763015747, -0.0017880797386169434, -0.0016902387142181396, -0.001592397689819336, -0.0014945566654205322, -0.0013967156410217285, -0.0012988746166229248, -0.001201033592224121, -0.0011031925678253174, -0.0010053515434265137, -0.00090751051902771, -0.0008096694946289062, -0.0007118284702301025, -0.0006139874458312988, -0.0005161464214324951, -0.0004183053970336914, -0.0003204643726348877, -0.00022262334823608398, -0.00012478232383728027, -2.6941299438476562e-05, 7.089972496032715e-05, 0.00016874074935913086, 0.00026658177375793457, 0.0003644227981567383, 0.000462263822555542, 0.0005601048469543457, 0.0006579458713531494, 0.0007557868957519531, 0.0008536279201507568, 0.0009514689445495605, 0.0010493099689483643, 0.001147150993347168, 0.0012449920177459717, 0.0013428330421447754, 0.001440674066543579, 0.0015385150909423828, 0.0016363561153411865, 0.0017341971397399902, 0.001832038164138794, 0.0019298791885375977, 0.0020277202129364014, 0.002125561237335205, 0.002223402261734009, 0.0023212432861328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 5.0, 5.0, 6.0, 11.0, 19.0, 16.0, 23.0, 37.0, 56.0, 59.0, 99.0, 143.0, 263.0, 331.0, 603.0, 952.0, 1755.0, 3125.0, 6457.0, 14097.0, 33191.0, 89177.0, 263816.0, 381670.0, 156523.0, 54574.0, 21856.0, 9630.0, 4574.0, 2285.0, 1199.0, 720.0, 443.0, 274.0, 156.0, 126.0, 88.0, 60.0, 41.0, 23.0, 19.0, 15.0, 11.0, 8.0, 4.0, 4.0, 2.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.0887451171875, -7.802490234375, -7.5162353515625, -7.22998046875, -6.9437255859375, -6.657470703125, -6.3712158203125, -6.0849609375, -5.7987060546875, -5.512451171875, -5.2261962890625, -4.93994140625, -4.6536865234375, -4.367431640625, -4.0811767578125, -3.794921875, -3.5086669921875, -3.222412109375, -2.9361572265625, -2.64990234375, -2.3636474609375, -2.077392578125, -1.7911376953125, -1.5048828125, -1.2186279296875, -0.932373046875, -0.6461181640625, -0.35986328125, -0.0736083984375, 0.212646484375, 0.4989013671875, 0.78515625, 1.0714111328125, 1.357666015625, 1.6439208984375, 1.93017578125, 2.2164306640625, 2.502685546875, 2.7889404296875, 3.0751953125, 3.3614501953125, 3.647705078125, 3.9339599609375, 4.22021484375, 4.5064697265625, 4.792724609375, 5.0789794921875, 5.365234375, 5.6514892578125, 5.937744140625, 6.2239990234375, 6.51025390625, 6.7965087890625, 7.082763671875, 7.3690185546875, 7.6552734375, 7.9415283203125, 8.227783203125, 8.5140380859375, 8.80029296875, 9.0865478515625, 9.372802734375, 9.6590576171875, 9.9453125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 3.0, 7.0, 2.0, 9.0, 9.0, 14.0, 12.0, 15.0, 24.0, 22.0, 38.0, 47.0, 62.0, 62.0, 60.0, 62.0, 47.0, 64.0, 59.0, 47.0, 56.0, 42.0, 54.0, 28.0, 36.0, 28.0, 10.0, 18.0, 6.0, 11.0, 15.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6171875, -5.43585205078125, -5.2545166015625, -5.07318115234375, -4.891845703125, -4.71051025390625, -4.5291748046875, -4.34783935546875, -4.16650390625, -3.98516845703125, -3.8038330078125, -3.62249755859375, -3.441162109375, -3.25982666015625, -3.0784912109375, -2.89715576171875, -2.7158203125, -2.53448486328125, -2.3531494140625, -2.17181396484375, -1.990478515625, -1.80914306640625, -1.6278076171875, -1.44647216796875, -1.26513671875, -1.08380126953125, -0.9024658203125, -0.72113037109375, -0.539794921875, -0.35845947265625, -0.1771240234375, 0.00421142578125, 0.185546875, 0.36688232421875, 0.5482177734375, 0.72955322265625, 0.910888671875, 1.09222412109375, 1.2735595703125, 1.45489501953125, 1.63623046875, 1.81756591796875, 1.9989013671875, 2.18023681640625, 2.361572265625, 2.54290771484375, 2.7242431640625, 2.90557861328125, 3.0869140625, 3.26824951171875, 3.4495849609375, 3.63092041015625, 3.812255859375, 3.99359130859375, 4.1749267578125, 4.35626220703125, 4.53759765625, 4.71893310546875, 4.9002685546875, 5.08160400390625, 5.262939453125, 5.44427490234375, 5.6256103515625, 5.80694580078125, 5.98828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 10.0, 6.0, 13.0, 30.0, 21.0, 46.0, 79.0, 67.0, 96.0, 130.0, 111.0, 103.0, 83.0, 60.0, 43.0, 28.0, 28.0, 16.0, 14.0, 5.0, 10.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.42857360839844, -100.54557800292969, -96.66259002685547, -92.77959442138672, -88.8966064453125, -85.01361083984375, -81.13062286376953, -77.24762725830078, -73.36463928222656, -69.48164367675781, -65.5986557006836, -61.71566390991211, -57.832672119140625, -53.949676513671875, -50.066688537597656, -46.183692932128906, -42.30070114135742, -38.41770935058594, -34.53471755981445, -30.65172576904297, -26.768733978271484, -22.885740280151367, -19.002748489379883, -15.119756698608398, -11.236764907836914, -7.35377311706543, -3.470780849456787, 0.41221141815185547, 4.29520320892334, 8.17819595336914, 12.061187744140625, 15.94417953491211, 19.827171325683594, 23.710163116455078, 27.593154907226562, 31.476146697998047, 35.35913848876953, 39.24213409423828, 43.1251220703125, 47.00811767578125, 50.89110565185547, 54.77409744262695, 58.65708923339844, 62.54008102416992, 66.4230728149414, 70.30606842041016, 74.18905639648438, 78.07205200195312, 81.95504760742188, 85.83804321289062, 89.72103118896484, 93.6040267944336, 97.48701477050781, 101.37001037597656, 105.25299835205078, 109.13599395751953, 113.01898193359375, 116.9019775390625, 120.78496551513672, 124.66796112060547, 128.5509490966797, 132.43394470214844, 136.3169403076172, 140.19992065429688, 144.08291625976562]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 9.0, 6.0, 10.0, 11.0, 22.0, 23.0, 27.0, 35.0, 28.0, 47.0, 41.0, 41.0, 44.0, 46.0, 67.0, 53.0, 65.0, 39.0, 45.0, 35.0, 36.0, 41.0, 36.0, 34.0, 38.0, 20.0, 24.0, 8.0, 19.0, 18.0, 5.0, 5.0, 7.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.70628356933594, -91.90457153320312, -89.10285949707031, -86.3011474609375, -83.49942779541016, -80.69771575927734, -77.89600372314453, -75.09429168701172, -72.2925796508789, -69.4908676147461, -66.68915557861328, -63.8874397277832, -61.08572769165039, -58.28401184082031, -55.4822998046875, -52.68058776855469, -49.87887191772461, -47.0771598815918, -44.27544403076172, -41.473731994628906, -38.672019958496094, -35.87030792236328, -33.0685920715332, -30.26688003540039, -27.465166091918945, -24.6634521484375, -21.861740112304688, -19.060026168823242, -16.258312225341797, -13.456600189208984, -10.654886245727539, -7.853174209594727, -5.051460266113281, -2.2497470378875732, 0.5519661903381348, 3.353679656982422, 6.155392646789551, 8.95710563659668, 11.758819580078125, 14.560531616210938, 17.362245559692383, 20.163959503173828, 22.96567153930664, 25.767385482788086, 28.56909942626953, 31.370811462402344, 34.172523498535156, 36.97423553466797, 39.77595138549805, 42.57766342163086, 45.37937927246094, 48.18109130859375, 50.98280334472656, 53.784515380859375, 56.58623123168945, 59.387943267822266, 62.189659118652344, 64.99137115478516, 67.79308319091797, 70.59480285644531, 73.39651489257812, 76.19822692871094, 78.99993896484375, 81.80165100097656, 84.60336303710938]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 8.0, 13.0, 13.0, 23.0, 37.0, 50.0, 84.0, 120.0, 225.0, 478.0, 829.0, 1867.0, 4123.0, 11698.0, 41955.0, 256906.0, 3605847.0, 214454.0, 37875.0, 10545.0, 3802.0, 1596.0, 739.0, 376.0, 213.0, 137.0, 88.0, 55.0, 44.0, 27.0, 15.0, 11.0, 8.0, 4.0, 1.0, 2.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.59375, -30.2470703125, -28.900390625, -27.5537109375, -26.20703125, -24.8603515625, -23.513671875, -22.1669921875, -20.8203125, -19.4736328125, -18.126953125, -16.7802734375, -15.43359375, -14.0869140625, -12.740234375, -11.3935546875, -10.046875, -8.7001953125, -7.353515625, -6.0068359375, -4.66015625, -3.3134765625, -1.966796875, -0.6201171875, 0.7265625, 2.0732421875, 3.419921875, 4.7666015625, 6.11328125, 7.4599609375, 8.806640625, 10.1533203125, 11.5, 12.8466796875, 14.193359375, 15.5400390625, 16.88671875, 18.2333984375, 19.580078125, 20.9267578125, 22.2734375, 23.6201171875, 24.966796875, 26.3134765625, 27.66015625, 29.0068359375, 30.353515625, 31.7001953125, 33.046875, 34.3935546875, 35.740234375, 37.0869140625, 38.43359375, 39.7802734375, 41.126953125, 42.4736328125, 43.8203125, 45.1669921875, 46.513671875, 47.8603515625, 49.20703125, 50.5537109375, 51.900390625, 53.2470703125, 54.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 6.0, 8.0, 3.0, 8.0, 9.0, 14.0, 14.0, 17.0, 25.0, 32.0, 26.0, 46.0, 50.0, 47.0, 65.0, 47.0, 49.0, 48.0, 63.0, 55.0, 61.0, 57.0, 51.0, 42.0, 33.0, 34.0, 23.0, 15.0, 15.0, 9.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.8248291015625, -2.721923828125, -2.6190185546875, -2.51611328125, -2.4132080078125, -2.310302734375, -2.2073974609375, -2.1044921875, -2.0015869140625, -1.898681640625, -1.7957763671875, -1.69287109375, -1.5899658203125, -1.487060546875, -1.3841552734375, -1.28125, -1.1783447265625, -1.075439453125, -0.9725341796875, -0.86962890625, -0.7667236328125, -0.663818359375, -0.5609130859375, -0.4580078125, -0.3551025390625, -0.252197265625, -0.1492919921875, -0.04638671875, 0.0565185546875, 0.159423828125, 0.2623291015625, 0.365234375, 0.4681396484375, 0.571044921875, 0.6739501953125, 0.77685546875, 0.8797607421875, 0.982666015625, 1.0855712890625, 1.1884765625, 1.2913818359375, 1.394287109375, 1.4971923828125, 1.60009765625, 1.7030029296875, 1.805908203125, 1.9088134765625, 2.01171875, 2.1146240234375, 2.217529296875, 2.3204345703125, 2.42333984375, 2.5262451171875, 2.629150390625, 2.7320556640625, 2.8349609375, 2.9378662109375, 3.040771484375, 3.1436767578125, 3.24658203125, 3.3494873046875, 3.452392578125, 3.5552978515625, 3.658203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 6.0, 16.0, 23.0, 34.0, 44.0, 43.0, 83.0, 104.0, 179.0, 264.0, 391.0, 682.0, 1138.0, 2079.0, 3952.0, 9093.0, 26972.0, 112297.0, 957635.0, 2841035.0, 177482.0, 38206.0, 11849.0, 4952.0, 2357.0, 1280.0, 744.0, 482.0, 278.0, 190.0, 108.0, 81.0, 51.0, 43.0, 33.0, 20.0, 16.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.0625, -29.06494140625, -28.0673828125, -27.06982421875, -26.072265625, -25.07470703125, -24.0771484375, -23.07958984375, -22.08203125, -21.08447265625, -20.0869140625, -19.08935546875, -18.091796875, -17.09423828125, -16.0966796875, -15.09912109375, -14.1015625, -13.10400390625, -12.1064453125, -11.10888671875, -10.111328125, -9.11376953125, -8.1162109375, -7.11865234375, -6.12109375, -5.12353515625, -4.1259765625, -3.12841796875, -2.130859375, -1.13330078125, -0.1357421875, 0.86181640625, 1.859375, 2.85693359375, 3.8544921875, 4.85205078125, 5.849609375, 6.84716796875, 7.8447265625, 8.84228515625, 9.83984375, 10.83740234375, 11.8349609375, 12.83251953125, 13.830078125, 14.82763671875, 15.8251953125, 16.82275390625, 17.8203125, 18.81787109375, 19.8154296875, 20.81298828125, 21.810546875, 22.80810546875, 23.8056640625, 24.80322265625, 25.80078125, 26.79833984375, 27.7958984375, 28.79345703125, 29.791015625, 30.78857421875, 31.7861328125, 32.78369140625, 33.78125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 4.0, 10.0, 10.0, 24.0, 37.0, 78.0, 93.0, 149.0, 255.0, 568.0, 1530.0, 617.0, 291.0, 115.0, 99.0, 68.0, 40.0, 21.0, 17.0, 13.0, 9.0, 7.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.0523681640625, -10.635986328125, -10.2196044921875, -9.80322265625, -9.3868408203125, -8.970458984375, -8.5540771484375, -8.1376953125, -7.7213134765625, -7.304931640625, -6.8885498046875, -6.47216796875, -6.0557861328125, -5.639404296875, -5.2230224609375, -4.806640625, -4.3902587890625, -3.973876953125, -3.5574951171875, -3.14111328125, -2.7247314453125, -2.308349609375, -1.8919677734375, -1.4755859375, -1.0592041015625, -0.642822265625, -0.2264404296875, 0.18994140625, 0.6063232421875, 1.022705078125, 1.4390869140625, 1.85546875, 2.2718505859375, 2.688232421875, 3.1046142578125, 3.52099609375, 3.9373779296875, 4.353759765625, 4.7701416015625, 5.1865234375, 5.6029052734375, 6.019287109375, 6.4356689453125, 6.85205078125, 7.2684326171875, 7.684814453125, 8.1011962890625, 8.517578125, 8.9339599609375, 9.350341796875, 9.7667236328125, 10.18310546875, 10.5994873046875, 11.015869140625, 11.4322509765625, 11.8486328125, 12.2650146484375, 12.681396484375, 13.0977783203125, 13.51416015625, 13.9305419921875, 14.346923828125, 14.7633056640625, 15.1796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 22.0, 42.0, 87.0, 100.0, 161.0, 176.0, 160.0, 111.0, 56.0, 28.0, 20.0, 12.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.69322967529297, -86.62968444824219, -82.5661392211914, -78.50259399414062, -74.43904113769531, -70.37550354003906, -66.31195068359375, -62.24840545654297, -58.18486022949219, -54.121315002441406, -50.057769775390625, -45.99422073364258, -41.9306755065918, -37.867130279541016, -33.80358123779297, -29.740036010742188, -25.676490783691406, -21.612945556640625, -17.54939842224121, -13.485852241516113, -9.422306060791016, -5.358760833740234, -1.2952136993408203, 2.7683334350585938, 6.831878662109375, 10.895424842834473, 14.95897102355957, 19.022518157958984, 23.086063385009766, 27.149608612060547, 31.21315574645996, 35.276702880859375, 39.340240478515625, 43.403785705566406, 47.46733093261719, 51.530879974365234, 55.594425201416016, 59.6579704284668, 63.721519470214844, 67.78506469726562, 71.8486099243164, 75.91215515136719, 79.97570037841797, 84.03924560546875, 88.10279846191406, 92.16633605957031, 96.22988891601562, 100.2934341430664, 104.35697937011719, 108.42052459716797, 112.48406982421875, 116.54761505126953, 120.61116027832031, 124.67471313476562, 128.73825073242188, 132.8018035888672, 136.8653564453125, 140.9289093017578, 144.99244689941406, 149.05599975585938, 153.11953735351562, 157.18309020996094, 161.2466278076172, 165.3101806640625, 169.37371826171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 10.0, 7.0, 15.0, 21.0, 18.0, 31.0, 29.0, 45.0, 48.0, 53.0, 74.0, 56.0, 68.0, 54.0, 74.0, 66.0, 63.0, 45.0, 50.0, 37.0, 40.0, 20.0, 18.0, 14.0, 8.0, 11.0, 9.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.470516204833984, -36.8317985534668, -35.19308090209961, -33.55436325073242, -31.915645599365234, -30.276927947998047, -28.638208389282227, -26.99949073791504, -25.36077308654785, -23.722055435180664, -22.083337783813477, -20.444618225097656, -18.80590057373047, -17.16718292236328, -15.528465270996094, -13.889747619628906, -12.251029968261719, -10.612312316894531, -8.973594665527344, -7.33487606048584, -5.696158409118652, -4.057440757751465, -2.418722152709961, -0.7800045013427734, 0.8587131500244141, 2.4974310398101807, 4.136148929595947, 5.774867057800293, 7.4135847091674805, 9.052302360534668, 10.691020965576172, 12.32973861694336, 13.968452453613281, 15.607170104980469, 17.245887756347656, 18.884605407714844, 20.52332305908203, 22.16204071044922, 23.80076026916504, 25.439477920532227, 27.078195571899414, 28.7169132232666, 30.35563087463379, 31.99435043334961, 33.6330680847168, 35.271785736083984, 36.91050338745117, 38.54922103881836, 40.18793869018555, 41.826656341552734, 43.46537399291992, 45.10409164428711, 46.7428092956543, 48.381526947021484, 50.02024841308594, 51.658966064453125, 53.29768371582031, 54.9364013671875, 56.57511901855469, 58.213836669921875, 59.85255432128906, 61.49127197265625, 63.12998962402344, 64.76870727539062, 66.40742492675781]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 6.0, 8.0, 13.0, 14.0, 31.0, 45.0, 62.0, 73.0, 99.0, 149.0, 223.0, 396.0, 696.0, 1249.0, 2948.0, 9513.0, 40446.0, 240671.0, 624414.0, 97952.0, 20070.0, 5197.0, 1916.0, 885.0, 524.0, 335.0, 202.0, 123.0, 92.0, 54.0, 30.0, 37.0, 27.0, 16.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-43.6875, -42.33349609375, -40.9794921875, -39.62548828125, -38.271484375, -36.91748046875, -35.5634765625, -34.20947265625, -32.85546875, -31.50146484375, -30.1474609375, -28.79345703125, -27.439453125, -26.08544921875, -24.7314453125, -23.37744140625, -22.0234375, -20.66943359375, -19.3154296875, -17.96142578125, -16.607421875, -15.25341796875, -13.8994140625, -12.54541015625, -11.19140625, -9.83740234375, -8.4833984375, -7.12939453125, -5.775390625, -4.42138671875, -3.0673828125, -1.71337890625, -0.359375, 0.99462890625, 2.3486328125, 3.70263671875, 5.056640625, 6.41064453125, 7.7646484375, 9.11865234375, 10.47265625, 11.82666015625, 13.1806640625, 14.53466796875, 15.888671875, 17.24267578125, 18.5966796875, 19.95068359375, 21.3046875, 22.65869140625, 24.0126953125, 25.36669921875, 26.720703125, 28.07470703125, 29.4287109375, 30.78271484375, 32.13671875, 33.49072265625, 34.8447265625, 36.19873046875, 37.552734375, 38.90673828125, 40.2607421875, 41.61474609375, 42.96875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 9.0, 9.0, 9.0, 19.0, 19.0, 23.0, 37.0, 54.0, 62.0, 74.0, 72.0, 84.0, 82.0, 67.0, 72.0, 96.0, 69.0, 49.0, 25.0, 19.0, 18.0, 9.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.927734375, -3.778350830078125, -3.62896728515625, -3.479583740234375, -3.3302001953125, -3.180816650390625, -3.03143310546875, -2.882049560546875, -2.732666015625, -2.583282470703125, -2.43389892578125, -2.284515380859375, -2.1351318359375, -1.985748291015625, -1.83636474609375, -1.686981201171875, -1.53759765625, -1.388214111328125, -1.23883056640625, -1.089447021484375, -0.9400634765625, -0.790679931640625, -0.64129638671875, -0.491912841796875, -0.342529296875, -0.193145751953125, -0.04376220703125, 0.105621337890625, 0.2550048828125, 0.404388427734375, 0.55377197265625, 0.703155517578125, 0.8525390625, 1.001922607421875, 1.15130615234375, 1.300689697265625, 1.4500732421875, 1.599456787109375, 1.74884033203125, 1.898223876953125, 2.047607421875, 2.196990966796875, 2.34637451171875, 2.495758056640625, 2.6451416015625, 2.794525146484375, 2.94390869140625, 3.093292236328125, 3.24267578125, 3.392059326171875, 3.54144287109375, 3.690826416015625, 3.8402099609375, 3.989593505859375, 4.13897705078125, 4.288360595703125, 4.437744140625, 4.587127685546875, 4.73651123046875, 4.885894775390625, 5.0352783203125, 5.184661865234375, 5.33404541015625, 5.483428955078125, 5.6328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 12.0, 22.0, 31.0, 46.0, 74.0, 92.0, 166.0, 348.0, 605.0, 1058.0, 2166.0, 4467.0, 10422.0, 25024.0, 63619.0, 175256.0, 437876.0, 204709.0, 72686.0, 28054.0, 11378.0, 5034.0, 2471.0, 1218.0, 678.0, 378.0, 248.0, 129.0, 110.0, 60.0, 30.0, 28.0, 16.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5, -13.992431640625, -13.48486328125, -12.977294921875, -12.4697265625, -11.962158203125, -11.45458984375, -10.947021484375, -10.439453125, -9.931884765625, -9.42431640625, -8.916748046875, -8.4091796875, -7.901611328125, -7.39404296875, -6.886474609375, -6.37890625, -5.871337890625, -5.36376953125, -4.856201171875, -4.3486328125, -3.841064453125, -3.33349609375, -2.825927734375, -2.318359375, -1.810791015625, -1.30322265625, -0.795654296875, -0.2880859375, 0.219482421875, 0.72705078125, 1.234619140625, 1.7421875, 2.249755859375, 2.75732421875, 3.264892578125, 3.7724609375, 4.280029296875, 4.78759765625, 5.295166015625, 5.802734375, 6.310302734375, 6.81787109375, 7.325439453125, 7.8330078125, 8.340576171875, 8.84814453125, 9.355712890625, 9.86328125, 10.370849609375, 10.87841796875, 11.385986328125, 11.8935546875, 12.401123046875, 12.90869140625, 13.416259765625, 13.923828125, 14.431396484375, 14.93896484375, 15.446533203125, 15.9541015625, 16.461669921875, 16.96923828125, 17.476806640625, 17.984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 4.0, 6.0, 2.0, 9.0, 12.0, 14.0, 21.0, 19.0, 21.0, 23.0, 26.0, 32.0, 48.0, 33.0, 40.0, 42.0, 55.0, 44.0, 50.0, 46.0, 52.0, 45.0, 42.0, 46.0, 42.0, 34.0, 26.0, 27.0, 19.0, 18.0, 17.0, 17.0, 8.0, 13.0, 14.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.234375, -13.8353271484375, -13.436279296875, -13.0372314453125, -12.63818359375, -12.2391357421875, -11.840087890625, -11.4410400390625, -11.0419921875, -10.6429443359375, -10.243896484375, -9.8448486328125, -9.44580078125, -9.0467529296875, -8.647705078125, -8.2486572265625, -7.849609375, -7.4505615234375, -7.051513671875, -6.6524658203125, -6.25341796875, -5.8543701171875, -5.455322265625, -5.0562744140625, -4.6572265625, -4.2581787109375, -3.859130859375, -3.4600830078125, -3.06103515625, -2.6619873046875, -2.262939453125, -1.8638916015625, -1.46484375, -1.0657958984375, -0.666748046875, -0.2677001953125, 0.13134765625, 0.5303955078125, 0.929443359375, 1.3284912109375, 1.7275390625, 2.1265869140625, 2.525634765625, 2.9246826171875, 3.32373046875, 3.7227783203125, 4.121826171875, 4.5208740234375, 4.919921875, 5.3189697265625, 5.718017578125, 6.1170654296875, 6.51611328125, 6.9151611328125, 7.314208984375, 7.7132568359375, 8.1123046875, 8.5113525390625, 8.910400390625, 9.3094482421875, 9.70849609375, 10.1075439453125, 10.506591796875, 10.9056396484375, 11.3046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 7.0, 22.0, 22.0, 24.0, 32.0, 46.0, 78.0, 134.0, 222.0, 361.0, 703.0, 1408.0, 3065.0, 7207.0, 19558.0, 60754.0, 209607.0, 467572.0, 191198.0, 55820.0, 18208.0, 6670.0, 2850.0, 1304.0, 699.0, 349.0, 208.0, 131.0, 80.0, 58.0, 36.0, 20.0, 28.0, 14.0, 9.0, 12.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.625, -9.319091796875, -9.01318359375, -8.707275390625, -8.4013671875, -8.095458984375, -7.78955078125, -7.483642578125, -7.177734375, -6.871826171875, -6.56591796875, -6.260009765625, -5.9541015625, -5.648193359375, -5.34228515625, -5.036376953125, -4.73046875, -4.424560546875, -4.11865234375, -3.812744140625, -3.5068359375, -3.200927734375, -2.89501953125, -2.589111328125, -2.283203125, -1.977294921875, -1.67138671875, -1.365478515625, -1.0595703125, -0.753662109375, -0.44775390625, -0.141845703125, 0.1640625, 0.469970703125, 0.77587890625, 1.081787109375, 1.3876953125, 1.693603515625, 1.99951171875, 2.305419921875, 2.611328125, 2.917236328125, 3.22314453125, 3.529052734375, 3.8349609375, 4.140869140625, 4.44677734375, 4.752685546875, 5.05859375, 5.364501953125, 5.67041015625, 5.976318359375, 6.2822265625, 6.588134765625, 6.89404296875, 7.199951171875, 7.505859375, 7.811767578125, 8.11767578125, 8.423583984375, 8.7294921875, 9.035400390625, 9.34130859375, 9.647216796875, 9.953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 1.0, 4.0, 3.0, 7.0, 9.0, 6.0, 12.0, 22.0, 27.0, 34.0, 57.0, 105.0, 217.0, 189.0, 93.0, 69.0, 39.0, 20.0, 15.0, 14.0, 9.0, 9.0, 9.0, 8.0, 3.0, 5.0, 6.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00218963623046875, -0.0021186470985412598, -0.0020476579666137695, -0.0019766688346862793, -0.001905679702758789, -0.0018346905708312988, -0.0017637014389038086, -0.0016927123069763184, -0.0016217231750488281, -0.0015507340431213379, -0.0014797449111938477, -0.0014087557792663574, -0.0013377666473388672, -0.001266777515411377, -0.0011957883834838867, -0.0011247992515563965, -0.0010538101196289062, -0.000982820987701416, -0.0009118318557739258, -0.0008408427238464355, -0.0007698535919189453, -0.0006988644599914551, -0.0006278753280639648, -0.0005568861961364746, -0.0004858970642089844, -0.00041490793228149414, -0.0003439188003540039, -0.00027292966842651367, -0.00020194053649902344, -0.0001309514045715332, -5.996227264404297e-05, 1.1026859283447266e-05, 8.20159912109375e-05, 0.00015300512313842773, 0.00022399425506591797, 0.0002949833869934082, 0.00036597251892089844, 0.00043696165084838867, 0.0005079507827758789, 0.0005789399147033691, 0.0006499290466308594, 0.0007209181785583496, 0.0007919073104858398, 0.0008628964424133301, 0.0009338855743408203, 0.0010048747062683105, 0.0010758638381958008, 0.001146852970123291, 0.0012178421020507812, 0.0012888312339782715, 0.0013598203659057617, 0.001430809497833252, 0.0015017986297607422, 0.0015727877616882324, 0.0016437768936157227, 0.0017147660255432129, 0.0017857551574707031, 0.0018567442893981934, 0.0019277334213256836, 0.001998722553253174, 0.002069711685180664, 0.0021407008171081543, 0.0022116899490356445, 0.0022826790809631348, 0.002353668212890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 7.0, 13.0, 21.0, 26.0, 33.0, 43.0, 77.0, 116.0, 169.0, 281.0, 460.0, 826.0, 1360.0, 2726.0, 5629.0, 12424.0, 30644.0, 86585.0, 269878.0, 405870.0, 146975.0, 49203.0, 18838.0, 8024.0, 3844.0, 1859.0, 1040.0, 627.0, 337.0, 228.0, 129.0, 82.0, 55.0, 37.0, 27.0, 16.0, 13.0, 6.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.609130859375, -8.30419921875, -7.999267578125, -7.6943359375, -7.389404296875, -7.08447265625, -6.779541015625, -6.474609375, -6.169677734375, -5.86474609375, -5.559814453125, -5.2548828125, -4.949951171875, -4.64501953125, -4.340087890625, -4.03515625, -3.730224609375, -3.42529296875, -3.120361328125, -2.8154296875, -2.510498046875, -2.20556640625, -1.900634765625, -1.595703125, -1.290771484375, -0.98583984375, -0.680908203125, -0.3759765625, -0.071044921875, 0.23388671875, 0.538818359375, 0.84375, 1.148681640625, 1.45361328125, 1.758544921875, 2.0634765625, 2.368408203125, 2.67333984375, 2.978271484375, 3.283203125, 3.588134765625, 3.89306640625, 4.197998046875, 4.5029296875, 4.807861328125, 5.11279296875, 5.417724609375, 5.72265625, 6.027587890625, 6.33251953125, 6.637451171875, 6.9423828125, 7.247314453125, 7.55224609375, 7.857177734375, 8.162109375, 8.467041015625, 8.77197265625, 9.076904296875, 9.3818359375, 9.686767578125, 9.99169921875, 10.296630859375, 10.6015625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 12.0, 5.0, 11.0, 0.0, 20.0, 29.0, 21.0, 42.0, 38.0, 61.0, 61.0, 86.0, 110.0, 94.0, 67.0, 67.0, 48.0, 53.0, 35.0, 38.0, 12.0, 19.0, 10.0, 14.0, 7.0, 9.0, 6.0, 4.0, 5.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5859375, -8.33489990234375, -8.0838623046875, -7.83282470703125, -7.581787109375, -7.33074951171875, -7.0797119140625, -6.82867431640625, -6.57763671875, -6.32659912109375, -6.0755615234375, -5.82452392578125, -5.573486328125, -5.32244873046875, -5.0714111328125, -4.82037353515625, -4.5693359375, -4.31829833984375, -4.0672607421875, -3.81622314453125, -3.565185546875, -3.31414794921875, -3.0631103515625, -2.81207275390625, -2.56103515625, -2.30999755859375, -2.0589599609375, -1.80792236328125, -1.556884765625, -1.30584716796875, -1.0548095703125, -0.80377197265625, -0.552734375, -0.30169677734375, -0.0506591796875, 0.20037841796875, 0.451416015625, 0.70245361328125, 0.9534912109375, 1.20452880859375, 1.45556640625, 1.70660400390625, 1.9576416015625, 2.20867919921875, 2.459716796875, 2.71075439453125, 2.9617919921875, 3.21282958984375, 3.4638671875, 3.71490478515625, 3.9659423828125, 4.21697998046875, 4.468017578125, 4.71905517578125, 4.9700927734375, 5.22113037109375, 5.47216796875, 5.72320556640625, 5.9742431640625, 6.22528076171875, 6.476318359375, 6.72735595703125, 6.9783935546875, 7.22943115234375, 7.48046875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 5.0, 4.0, 14.0, 22.0, 25.0, 24.0, 37.0, 52.0, 73.0, 65.0, 79.0, 82.0, 89.0, 97.0, 85.0, 63.0, 42.0, 50.0, 24.0, 15.0, 16.0, 11.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-121.91217803955078, -118.98638153076172, -116.06058502197266, -113.1347885131836, -110.208984375, -107.28318786621094, -104.35739135742188, -101.43159484863281, -98.50579833984375, -95.58000183105469, -92.65420532226562, -89.72840881347656, -86.8026123046875, -83.8768081665039, -80.95101165771484, -78.02521514892578, -75.09941864013672, -72.17362213134766, -69.2478256225586, -66.32202911376953, -63.3962287902832, -60.47043228149414, -57.54463195800781, -54.61883544921875, -51.69303894042969, -48.767242431640625, -45.84144592285156, -42.915645599365234, -39.98984909057617, -37.06405258178711, -34.13825225830078, -31.21245574951172, -28.286659240722656, -25.360862731933594, -22.4350643157959, -19.509265899658203, -16.58346939086914, -13.657671928405762, -10.731874465942383, -7.8060760498046875, -4.880279541015625, -1.954482078552246, 0.9713153839111328, 3.8971128463745117, 6.822910308837891, 9.74870777130127, 12.674505233764648, 15.600303649902344, 18.526100158691406, 21.45189666748047, 24.377695083618164, 27.30349349975586, 30.229290008544922, 33.155086517333984, 36.08088684082031, 39.006683349609375, 41.93247985839844, 44.8582763671875, 47.78407287597656, 50.70987319946289, 53.63566970825195, 56.561466217041016, 59.487266540527344, 62.413063049316406, 65.33885955810547]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 5.0, 13.0, 10.0, 14.0, 12.0, 7.0, 20.0, 19.0, 27.0, 33.0, 29.0, 33.0, 28.0, 34.0, 41.0, 42.0, 40.0, 49.0, 41.0, 48.0, 42.0, 36.0, 47.0, 44.0, 42.0, 39.0, 29.0, 31.0, 18.0, 20.0, 17.0, 14.0, 14.0, 9.0, 13.0, 3.0, 7.0, 7.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.07814407348633, -59.915199279785156, -57.75225830078125, -55.589317321777344, -53.42637252807617, -51.263427734375, -49.100486755371094, -46.93754577636719, -44.774600982666016, -42.611656188964844, -40.44871520996094, -38.28577423095703, -36.12282943725586, -33.95988464355469, -31.79694366455078, -29.634000778198242, -27.471057891845703, -25.308115005493164, -23.145172119140625, -20.982229232788086, -18.819286346435547, -16.656343460083008, -14.493400573730469, -12.33045768737793, -10.16751480102539, -8.004571914672852, -5.8416290283203125, -3.6786861419677734, -1.5157432556152344, 0.6471996307373047, 2.8101425170898438, 4.973085403442383, 7.1360321044921875, 9.298974990844727, 11.461917877197266, 13.624860763549805, 15.787803649902344, 17.950746536254883, 20.113689422607422, 22.27663230895996, 24.4395751953125, 26.60251808166504, 28.765460968017578, 30.928403854370117, 33.091346740722656, 35.25428771972656, 37.417232513427734, 39.580177307128906, 41.74311828613281, 43.90605926513672, 46.06900405883789, 48.23194885253906, 50.39488983154297, 52.557830810546875, 54.72077560424805, 56.88372039794922, 59.046661376953125, 61.20960235595703, 63.3725471496582, 65.53549194335938, 67.69843292236328, 69.86137390136719, 72.02432250976562, 74.18726348876953, 76.35020446777344]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 6.0, 10.0, 14.0, 19.0, 29.0, 55.0, 86.0, 188.0, 394.0, 919.0, 2499.0, 10342.0, 90305.0, 3923961.0, 146844.0, 13552.0, 3060.0, 1075.0, 443.0, 195.0, 98.0, 62.0, 37.0, 35.0, 15.0, 13.0, 7.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.4375, -61.2177734375, -58.998046875, -56.7783203125, -54.55859375, -52.3388671875, -50.119140625, -47.8994140625, -45.6796875, -43.4599609375, -41.240234375, -39.0205078125, -36.80078125, -34.5810546875, -32.361328125, -30.1416015625, -27.921875, -25.7021484375, -23.482421875, -21.2626953125, -19.04296875, -16.8232421875, -14.603515625, -12.3837890625, -10.1640625, -7.9443359375, -5.724609375, -3.5048828125, -1.28515625, 0.9345703125, 3.154296875, 5.3740234375, 7.59375, 9.8134765625, 12.033203125, 14.2529296875, 16.47265625, 18.6923828125, 20.912109375, 23.1318359375, 25.3515625, 27.5712890625, 29.791015625, 32.0107421875, 34.23046875, 36.4501953125, 38.669921875, 40.8896484375, 43.109375, 45.3291015625, 47.548828125, 49.7685546875, 51.98828125, 54.2080078125, 56.427734375, 58.6474609375, 60.8671875, 63.0869140625, 65.306640625, 67.5263671875, 69.74609375, 71.9658203125, 74.185546875, 76.4052734375, 78.625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 8.0, 9.0, 14.0, 28.0, 23.0, 43.0, 60.0, 57.0, 70.0, 75.0, 84.0, 65.0, 77.0, 89.0, 55.0, 75.0, 44.0, 33.0, 32.0, 13.0, 19.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.947265625, -3.797149658203125, -3.64703369140625, -3.496917724609375, -3.3468017578125, -3.196685791015625, -3.04656982421875, -2.896453857421875, -2.746337890625, -2.596221923828125, -2.44610595703125, -2.295989990234375, -2.1458740234375, -1.995758056640625, -1.84564208984375, -1.695526123046875, -1.54541015625, -1.395294189453125, -1.24517822265625, -1.095062255859375, -0.9449462890625, -0.794830322265625, -0.64471435546875, -0.494598388671875, -0.344482421875, -0.194366455078125, -0.04425048828125, 0.105865478515625, 0.2559814453125, 0.406097412109375, 0.55621337890625, 0.706329345703125, 0.8564453125, 1.006561279296875, 1.15667724609375, 1.306793212890625, 1.4569091796875, 1.607025146484375, 1.75714111328125, 1.907257080078125, 2.057373046875, 2.207489013671875, 2.35760498046875, 2.507720947265625, 2.6578369140625, 2.807952880859375, 2.95806884765625, 3.108184814453125, 3.25830078125, 3.408416748046875, 3.55853271484375, 3.708648681640625, 3.8587646484375, 4.008880615234375, 4.15899658203125, 4.309112548828125, 4.459228515625, 4.609344482421875, 4.75946044921875, 4.909576416015625, 5.0596923828125, 5.209808349609375, 5.35992431640625, 5.510040283203125, 5.66015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 9.0, 6.0, 1.0, 9.0, 11.0, 13.0, 18.0, 30.0, 51.0, 108.0, 139.0, 244.0, 460.0, 829.0, 1502.0, 2965.0, 6468.0, 14231.0, 34343.0, 96087.0, 354668.0, 2919654.0, 557128.0, 129751.0, 43361.0, 17335.0, 7448.0, 3544.0, 1704.0, 911.0, 487.0, 290.0, 172.0, 85.0, 54.0, 52.0, 29.0, 19.0, 15.0, 12.0, 12.0, 8.0, 2.0, 5.0, 5.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.484375, -17.880859375, -17.27734375, -16.673828125, -16.0703125, -15.466796875, -14.86328125, -14.259765625, -13.65625, -13.052734375, -12.44921875, -11.845703125, -11.2421875, -10.638671875, -10.03515625, -9.431640625, -8.828125, -8.224609375, -7.62109375, -7.017578125, -6.4140625, -5.810546875, -5.20703125, -4.603515625, -4.0, -3.396484375, -2.79296875, -2.189453125, -1.5859375, -0.982421875, -0.37890625, 0.224609375, 0.828125, 1.431640625, 2.03515625, 2.638671875, 3.2421875, 3.845703125, 4.44921875, 5.052734375, 5.65625, 6.259765625, 6.86328125, 7.466796875, 8.0703125, 8.673828125, 9.27734375, 9.880859375, 10.484375, 11.087890625, 11.69140625, 12.294921875, 12.8984375, 13.501953125, 14.10546875, 14.708984375, 15.3125, 15.916015625, 16.51953125, 17.123046875, 17.7265625, 18.330078125, 18.93359375, 19.537109375, 20.140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 7.0, 4.0, 7.0, 5.0, 5.0, 11.0, 16.0, 15.0, 33.0, 25.0, 40.0, 45.0, 74.0, 94.0, 146.0, 214.0, 334.0, 973.0, 955.0, 363.0, 221.0, 129.0, 76.0, 85.0, 54.0, 30.0, 32.0, 20.0, 12.0, 18.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21484375, -5.99285888671875, -5.7708740234375, -5.54888916015625, -5.326904296875, -5.10491943359375, -4.8829345703125, -4.66094970703125, -4.43896484375, -4.21697998046875, -3.9949951171875, -3.77301025390625, -3.551025390625, -3.32904052734375, -3.1070556640625, -2.88507080078125, -2.6630859375, -2.44110107421875, -2.2191162109375, -1.99713134765625, -1.775146484375, -1.55316162109375, -1.3311767578125, -1.10919189453125, -0.88720703125, -0.66522216796875, -0.4432373046875, -0.22125244140625, 0.000732421875, 0.22271728515625, 0.4447021484375, 0.66668701171875, 0.888671875, 1.11065673828125, 1.3326416015625, 1.55462646484375, 1.776611328125, 1.99859619140625, 2.2205810546875, 2.44256591796875, 2.66455078125, 2.88653564453125, 3.1085205078125, 3.33050537109375, 3.552490234375, 3.77447509765625, 3.9964599609375, 4.21844482421875, 4.4404296875, 4.66241455078125, 4.8843994140625, 5.10638427734375, 5.328369140625, 5.55035400390625, 5.7723388671875, 5.99432373046875, 6.21630859375, 6.43829345703125, 6.6602783203125, 6.88226318359375, 7.104248046875, 7.32623291015625, 7.5482177734375, 7.77020263671875, 7.9921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 11.0, 10.0, 14.0, 20.0, 23.0, 30.0, 29.0, 31.0, 62.0, 68.0, 63.0, 74.0, 65.0, 70.0, 60.0, 64.0, 52.0, 37.0, 56.0, 39.0, 24.0, 24.0, 15.0, 10.0, 5.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.740596771240234, -33.64863204956055, -32.55666732788086, -31.464702606201172, -30.372739791870117, -29.28077507019043, -28.188810348510742, -27.096845626831055, -26.0048828125, -24.912918090820312, -23.820953369140625, -22.728988647460938, -21.637025833129883, -20.545061111450195, -19.453096389770508, -18.36113166809082, -17.269166946411133, -16.177202224731445, -15.085238456726074, -13.993273735046387, -12.901309967041016, -11.809345245361328, -10.71738052368164, -9.625415802001953, -8.533452033996582, -7.441487789154053, -6.349523544311523, -5.257558822631836, -4.165594577789307, -3.0736303329467773, -1.9816656112670898, -0.8897013664245605, 0.20226287841796875, 1.2942272424697876, 2.3861916065216064, 3.478156089782715, 4.570120334625244, 5.662084579467773, 6.754049301147461, 7.84601354598999, 8.93797779083252, 10.029942512512207, 11.121906280517578, 12.213871002197266, 13.305835723876953, 14.397799491882324, 15.489764213562012, 16.581727981567383, 17.67369270324707, 18.765657424926758, 19.857622146606445, 20.9495849609375, 22.041549682617188, 23.133514404296875, 24.225479125976562, 25.31744384765625, 26.409408569335938, 27.501373291015625, 28.593338012695312, 29.685302734375, 30.777265548706055, 31.869230270385742, 32.96119689941406, 34.053157806396484, 35.14512252807617]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 3.0, 4.0, 5.0, 7.0, 6.0, 11.0, 7.0, 14.0, 11.0, 17.0, 17.0, 17.0, 15.0, 23.0, 24.0, 21.0, 34.0, 31.0, 33.0, 37.0, 33.0, 28.0, 28.0, 45.0, 52.0, 47.0, 51.0, 40.0, 33.0, 31.0, 41.0, 27.0, 24.0, 30.0, 26.0, 23.0, 18.0, 16.0, 16.0, 15.0, 10.0, 7.0, 10.0, 5.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-25.82083511352539, -25.055906295776367, -24.290977478027344, -23.52604866027832, -22.761119842529297, -21.996191024780273, -21.23126220703125, -20.46633529663086, -19.701404571533203, -18.93647575378418, -18.171546936035156, -17.406618118286133, -16.64168930053711, -15.876760482788086, -15.111832618713379, -14.346903800964355, -13.581975936889648, -12.817047119140625, -12.052118301391602, -11.287189483642578, -10.522260665893555, -9.757331848144531, -8.992403984069824, -8.2274751663208, -7.462546348571777, -6.697617530822754, -5.9326887130737305, -5.167760372161865, -4.402831554412842, -3.6379027366638184, -2.872974395751953, -2.1080455780029297, -1.3431148529052734, -0.5781861543655396, 0.18674254417419434, 0.9516711235046387, 1.716599941253662, 2.4815287590026855, 3.246457099914551, 4.011385917663574, 4.776314735412598, 5.541243553161621, 6.3061723709106445, 7.07110071182251, 7.836029529571533, 8.600957870483398, 9.365886688232422, 10.130815505981445, 10.895744323730469, 11.660673141479492, 12.425601959228516, 13.190530776977539, 13.955459594726562, 14.720388412475586, 15.485316276550293, 16.250244140625, 17.015174865722656, 17.78010368347168, 18.545032501220703, 19.309961318969727, 20.07489013671875, 20.839818954467773, 21.604747772216797, 22.369674682617188, 23.13460350036621]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 5.0, 16.0, 23.0, 38.0, 52.0, 70.0, 100.0, 150.0, 210.0, 387.0, 608.0, 976.0, 2231.0, 5479.0, 17089.0, 64309.0, 274426.0, 512067.0, 123463.0, 31019.0, 9267.0, 3179.0, 1450.0, 697.0, 441.0, 233.0, 151.0, 121.0, 84.0, 54.0, 30.0, 34.0, 19.0, 14.0, 15.0, 12.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.53125, -36.40185546875, -35.2724609375, -34.14306640625, -33.013671875, -31.88427734375, -30.7548828125, -29.62548828125, -28.49609375, -27.36669921875, -26.2373046875, -25.10791015625, -23.978515625, -22.84912109375, -21.7197265625, -20.59033203125, -19.4609375, -18.33154296875, -17.2021484375, -16.07275390625, -14.943359375, -13.81396484375, -12.6845703125, -11.55517578125, -10.42578125, -9.29638671875, -8.1669921875, -7.03759765625, -5.908203125, -4.77880859375, -3.6494140625, -2.52001953125, -1.390625, -0.26123046875, 0.8681640625, 1.99755859375, 3.126953125, 4.25634765625, 5.3857421875, 6.51513671875, 7.64453125, 8.77392578125, 9.9033203125, 11.03271484375, 12.162109375, 13.29150390625, 14.4208984375, 15.55029296875, 16.6796875, 17.80908203125, 18.9384765625, 20.06787109375, 21.197265625, 22.32666015625, 23.4560546875, 24.58544921875, 25.71484375, 26.84423828125, 27.9736328125, 29.10302734375, 30.232421875, 31.36181640625, 32.4912109375, 33.62060546875, 34.75]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 7.0, 9.0, 17.0, 22.0, 20.0, 45.0, 39.0, 49.0, 75.0, 66.0, 62.0, 88.0, 73.0, 75.0, 91.0, 54.0, 50.0, 37.0, 30.0, 32.0, 20.0, 11.0, 11.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.814453125, -3.667327880859375, -3.52020263671875, -3.373077392578125, -3.2259521484375, -3.078826904296875, -2.93170166015625, -2.784576416015625, -2.637451171875, -2.490325927734375, -2.34320068359375, -2.196075439453125, -2.0489501953125, -1.901824951171875, -1.75469970703125, -1.607574462890625, -1.46044921875, -1.313323974609375, -1.16619873046875, -1.019073486328125, -0.8719482421875, -0.724822998046875, -0.57769775390625, -0.430572509765625, -0.283447265625, -0.136322021484375, 0.01080322265625, 0.157928466796875, 0.3050537109375, 0.452178955078125, 0.59930419921875, 0.746429443359375, 0.8935546875, 1.040679931640625, 1.18780517578125, 1.334930419921875, 1.4820556640625, 1.629180908203125, 1.77630615234375, 1.923431396484375, 2.070556640625, 2.217681884765625, 2.36480712890625, 2.511932373046875, 2.6590576171875, 2.806182861328125, 2.95330810546875, 3.100433349609375, 3.24755859375, 3.394683837890625, 3.54180908203125, 3.688934326171875, 3.8360595703125, 3.983184814453125, 4.13031005859375, 4.277435302734375, 4.424560546875, 4.571685791015625, 4.71881103515625, 4.865936279296875, 5.0130615234375, 5.160186767578125, 5.30731201171875, 5.454437255859375, 5.6015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 9.0, 7.0, 16.0, 14.0, 32.0, 27.0, 64.0, 87.0, 108.0, 152.0, 208.0, 291.0, 432.0, 717.0, 1380.0, 2750.0, 6611.0, 18114.0, 53849.0, 160858.0, 419193.0, 253211.0, 84226.0, 28214.0, 9876.0, 3766.0, 1726.0, 949.0, 523.0, 350.0, 223.0, 153.0, 112.0, 68.0, 56.0, 40.0, 29.0, 28.0, 15.0, 15.0, 10.0, 7.0, 10.0, 10.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.125, -15.563232421875, -15.00146484375, -14.439697265625, -13.8779296875, -13.316162109375, -12.75439453125, -12.192626953125, -11.630859375, -11.069091796875, -10.50732421875, -9.945556640625, -9.3837890625, -8.822021484375, -8.26025390625, -7.698486328125, -7.13671875, -6.574951171875, -6.01318359375, -5.451416015625, -4.8896484375, -4.327880859375, -3.76611328125, -3.204345703125, -2.642578125, -2.080810546875, -1.51904296875, -0.957275390625, -0.3955078125, 0.166259765625, 0.72802734375, 1.289794921875, 1.8515625, 2.413330078125, 2.97509765625, 3.536865234375, 4.0986328125, 4.660400390625, 5.22216796875, 5.783935546875, 6.345703125, 6.907470703125, 7.46923828125, 8.031005859375, 8.5927734375, 9.154541015625, 9.71630859375, 10.278076171875, 10.83984375, 11.401611328125, 11.96337890625, 12.525146484375, 13.0869140625, 13.648681640625, 14.21044921875, 14.772216796875, 15.333984375, 15.895751953125, 16.45751953125, 17.019287109375, 17.5810546875, 18.142822265625, 18.70458984375, 19.266357421875, 19.828125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 3.0, 12.0, 9.0, 13.0, 14.0, 14.0, 17.0, 23.0, 30.0, 31.0, 37.0, 41.0, 33.0, 40.0, 46.0, 49.0, 47.0, 54.0, 41.0, 49.0, 44.0, 51.0, 38.0, 41.0, 32.0, 28.0, 29.0, 24.0, 27.0, 18.0, 10.0, 10.0, 6.0, 5.0, 4.0, 6.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-15.0078125, -14.5946044921875, -14.181396484375, -13.7681884765625, -13.35498046875, -12.9417724609375, -12.528564453125, -12.1153564453125, -11.7021484375, -11.2889404296875, -10.875732421875, -10.4625244140625, -10.04931640625, -9.6361083984375, -9.222900390625, -8.8096923828125, -8.396484375, -7.9832763671875, -7.570068359375, -7.1568603515625, -6.74365234375, -6.3304443359375, -5.917236328125, -5.5040283203125, -5.0908203125, -4.6776123046875, -4.264404296875, -3.8511962890625, -3.43798828125, -3.0247802734375, -2.611572265625, -2.1983642578125, -1.78515625, -1.3719482421875, -0.958740234375, -0.5455322265625, -0.13232421875, 0.2808837890625, 0.694091796875, 1.1072998046875, 1.5205078125, 1.9337158203125, 2.346923828125, 2.7601318359375, 3.17333984375, 3.5865478515625, 3.999755859375, 4.4129638671875, 4.826171875, 5.2393798828125, 5.652587890625, 6.0657958984375, 6.47900390625, 6.8922119140625, 7.305419921875, 7.7186279296875, 8.1318359375, 8.5450439453125, 8.958251953125, 9.3714599609375, 9.78466796875, 10.1978759765625, 10.611083984375, 11.0242919921875, 11.4375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 8.0, 19.0, 19.0, 45.0, 51.0, 72.0, 139.0, 188.0, 275.0, 463.0, 798.0, 1322.0, 2358.0, 4624.0, 9339.0, 21325.0, 55845.0, 169465.0, 438565.0, 223832.0, 70203.0, 26217.0, 11244.0, 5481.0, 2800.0, 1544.0, 885.0, 502.0, 314.0, 188.0, 135.0, 93.0, 61.0, 46.0, 18.0, 17.0, 17.0, 10.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-10.4921875, -10.20562744140625, -9.9190673828125, -9.63250732421875, -9.345947265625, -9.05938720703125, -8.7728271484375, -8.48626708984375, -8.19970703125, -7.91314697265625, -7.6265869140625, -7.34002685546875, -7.053466796875, -6.76690673828125, -6.4803466796875, -6.19378662109375, -5.9072265625, -5.62066650390625, -5.3341064453125, -5.04754638671875, -4.760986328125, -4.47442626953125, -4.1878662109375, -3.90130615234375, -3.61474609375, -3.32818603515625, -3.0416259765625, -2.75506591796875, -2.468505859375, -2.18194580078125, -1.8953857421875, -1.60882568359375, -1.322265625, -1.03570556640625, -0.7491455078125, -0.46258544921875, -0.176025390625, 0.11053466796875, 0.3970947265625, 0.68365478515625, 0.97021484375, 1.25677490234375, 1.5433349609375, 1.82989501953125, 2.116455078125, 2.40301513671875, 2.6895751953125, 2.97613525390625, 3.2626953125, 3.54925537109375, 3.8358154296875, 4.12237548828125, 4.408935546875, 4.69549560546875, 4.9820556640625, 5.26861572265625, 5.55517578125, 5.84173583984375, 6.1282958984375, 6.41485595703125, 6.701416015625, 6.98797607421875, 7.2745361328125, 7.56109619140625, 7.84765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 11.0, 6.0, 16.0, 16.0, 36.0, 30.0, 59.0, 100.0, 156.0, 200.0, 109.0, 80.0, 44.0, 36.0, 23.0, 23.0, 12.0, 10.0, 10.0, 5.0, 8.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0035457611083984375, -0.00346393883228302, -0.0033821165561676025, -0.003300294280052185, -0.0032184720039367676, -0.00313664972782135, -0.0030548274517059326, -0.002973005175590515, -0.0028911828994750977, -0.00280936062335968, -0.0027275383472442627, -0.002645716071128845, -0.0025638937950134277, -0.0024820715188980103, -0.0024002492427825928, -0.0023184269666671753, -0.002236604690551758, -0.0021547824144363403, -0.002072960138320923, -0.0019911378622055054, -0.0019093155860900879, -0.0018274933099746704, -0.001745671033859253, -0.0016638487577438354, -0.001582026481628418, -0.0015002042055130005, -0.001418381929397583, -0.0013365596532821655, -0.001254737377166748, -0.0011729151010513306, -0.001091092824935913, -0.0010092705488204956, -0.0009274482727050781, -0.0008456259965896606, -0.0007638037204742432, -0.0006819814443588257, -0.0006001591682434082, -0.0005183368921279907, -0.00043651461601257324, -0.00035469233989715576, -0.0002728700637817383, -0.0001910477876663208, -0.00010922551155090332, -2.740323543548584e-05, 5.441904067993164e-05, 0.00013624131679534912, 0.0002180635929107666, 0.0002998858690261841, 0.00038170814514160156, 0.00046353042125701904, 0.0005453526973724365, 0.000627174973487854, 0.0007089972496032715, 0.000790819525718689, 0.0008726418018341064, 0.0009544640779495239, 0.0010362863540649414, 0.0011181086301803589, 0.0011999309062957764, 0.0012817531824111938, 0.0013635754585266113, 0.0014453977346420288, 0.0015272200107574463, 0.0016090422868728638, 0.0016908645629882812]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 9.0, 9.0, 14.0, 12.0, 28.0, 30.0, 72.0, 106.0, 155.0, 280.0, 578.0, 1080.0, 2430.0, 6134.0, 17869.0, 74289.0, 516158.0, 353187.0, 53199.0, 13841.0, 4940.0, 2068.0, 927.0, 473.0, 215.0, 170.0, 91.0, 65.0, 32.0, 29.0, 12.0, 11.0, 10.0, 10.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.239990234375, -15.71435546875, -15.188720703125, -14.6630859375, -14.137451171875, -13.61181640625, -13.086181640625, -12.560546875, -12.034912109375, -11.50927734375, -10.983642578125, -10.4580078125, -9.932373046875, -9.40673828125, -8.881103515625, -8.35546875, -7.829833984375, -7.30419921875, -6.778564453125, -6.2529296875, -5.727294921875, -5.20166015625, -4.676025390625, -4.150390625, -3.624755859375, -3.09912109375, -2.573486328125, -2.0478515625, -1.522216796875, -0.99658203125, -0.470947265625, 0.0546875, 0.580322265625, 1.10595703125, 1.631591796875, 2.1572265625, 2.682861328125, 3.20849609375, 3.734130859375, 4.259765625, 4.785400390625, 5.31103515625, 5.836669921875, 6.3623046875, 6.887939453125, 7.41357421875, 7.939208984375, 8.46484375, 8.990478515625, 9.51611328125, 10.041748046875, 10.5673828125, 11.093017578125, 11.61865234375, 12.144287109375, 12.669921875, 13.195556640625, 13.72119140625, 14.246826171875, 14.7724609375, 15.298095703125, 15.82373046875, 16.349365234375, 16.875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 10.0, 2.0, 8.0, 18.0, 18.0, 38.0, 47.0, 56.0, 78.0, 135.0, 133.0, 141.0, 87.0, 38.0, 38.0, 31.0, 32.0, 26.0, 17.0, 9.0, 9.0, 6.0, 6.0, 1.0, 6.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.421875, -11.0615234375, -10.701171875, -10.3408203125, -9.98046875, -9.6201171875, -9.259765625, -8.8994140625, -8.5390625, -8.1787109375, -7.818359375, -7.4580078125, -7.09765625, -6.7373046875, -6.376953125, -6.0166015625, -5.65625, -5.2958984375, -4.935546875, -4.5751953125, -4.21484375, -3.8544921875, -3.494140625, -3.1337890625, -2.7734375, -2.4130859375, -2.052734375, -1.6923828125, -1.33203125, -0.9716796875, -0.611328125, -0.2509765625, 0.109375, 0.4697265625, 0.830078125, 1.1904296875, 1.55078125, 1.9111328125, 2.271484375, 2.6318359375, 2.9921875, 3.3525390625, 3.712890625, 4.0732421875, 4.43359375, 4.7939453125, 5.154296875, 5.5146484375, 5.875, 6.2353515625, 6.595703125, 6.9560546875, 7.31640625, 7.6767578125, 8.037109375, 8.3974609375, 8.7578125, 9.1181640625, 9.478515625, 9.8388671875, 10.19921875, 10.5595703125, 10.919921875, 11.2802734375, 11.640625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 17.0, 21.0, 31.0, 46.0, 65.0, 88.0, 118.0, 88.0, 110.0, 110.0, 78.0, 75.0, 41.0, 41.0, 20.0, 16.0, 9.0, 9.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-86.82144165039062, -82.77363586425781, -78.72583770751953, -74.67803192138672, -70.63023376464844, -66.58242797851562, -62.53462219238281, -58.486820220947266, -54.43901824951172, -50.39121627807617, -46.343414306640625, -42.29560852050781, -38.247806549072266, -34.20000457763672, -30.15220069885254, -26.10439682006836, -22.056594848632812, -18.008792877197266, -13.960988998413086, -9.913186073303223, -5.865383148193359, -1.8175811767578125, 2.230222702026367, 6.278026580810547, 10.325828552246094, 14.373631477355957, 18.42143440246582, 22.46923828125, 26.517040252685547, 30.564842224121094, 34.612648010253906, 38.66044998168945, 42.70826721191406, 46.75606918334961, 50.803871154785156, 54.85167694091797, 58.899478912353516, 62.94728088378906, 66.99508666992188, 71.04289245605469, 75.09069061279297, 79.13849639892578, 83.18629455566406, 87.23410034179688, 91.28190612792969, 95.32970428466797, 99.37751007080078, 103.42530822753906, 107.47311401367188, 111.52091979980469, 115.56871795654297, 119.61652374267578, 123.66432189941406, 127.71212768554688, 131.7599334716797, 135.8077392578125, 139.85552978515625, 143.90333557128906, 147.95114135742188, 151.99893188476562, 156.04673767089844, 160.09454345703125, 164.14234924316406, 168.19015502929688, 172.2379608154297]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 5.0, 5.0, 9.0, 12.0, 10.0, 17.0, 12.0, 25.0, 23.0, 23.0, 28.0, 36.0, 25.0, 33.0, 34.0, 54.0, 40.0, 38.0, 49.0, 43.0, 40.0, 42.0, 52.0, 37.0, 37.0, 33.0, 37.0, 25.0, 26.0, 16.0, 28.0, 12.0, 13.0, 8.0, 7.0, 12.0, 11.0, 11.0, 6.0, 4.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-69.34349822998047, -67.10753631591797, -64.87157440185547, -62.6356086730957, -60.39964294433594, -58.16368103027344, -55.92771911621094, -53.69175720214844, -51.45579147338867, -49.21982955932617, -46.983863830566406, -44.747901916503906, -42.511940002441406, -40.27597427368164, -38.04001235961914, -35.804046630859375, -33.568084716796875, -31.332120895385742, -29.09615707397461, -26.86019515991211, -24.624231338500977, -22.388267517089844, -20.152305603027344, -17.91634178161621, -15.680377960205078, -13.444414138793945, -11.208451271057129, -8.972488403320312, -6.73652458190918, -4.500560760498047, -2.2645978927612305, -0.028635025024414062, 2.20733642578125, 4.443299770355225, 6.679263114929199, 8.915225982666016, 11.151189804077148, 13.387153625488281, 15.623116493225098, 17.859079360961914, 20.095043182373047, 22.33100700378418, 24.566970825195312, 26.802932739257812, 29.038896560668945, 31.274860382080078, 33.51082229614258, 35.746788024902344, 37.982749938964844, 40.218711853027344, 42.45467758178711, 44.69063949584961, 46.926605224609375, 49.162567138671875, 51.398529052734375, 53.634490966796875, 55.87045669555664, 58.10641860961914, 60.342384338378906, 62.578346252441406, 64.8143081665039, 67.05027770996094, 69.28623962402344, 71.52220153808594, 73.75816345214844]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 10.0, 8.0, 20.0, 17.0, 36.0, 45.0, 50.0, 82.0, 142.0, 251.0, 403.0, 792.0, 1613.0, 4024.0, 12781.0, 58090.0, 693228.0, 3288624.0, 104866.0, 19376.0, 5401.0, 2075.0, 988.0, 482.0, 300.0, 182.0, 109.0, 92.0, 56.0, 31.0, 26.0, 24.0, 13.0, 7.0, 4.0, 12.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.875, -45.26708984375, -43.6591796875, -42.05126953125, -40.443359375, -38.83544921875, -37.2275390625, -35.61962890625, -34.01171875, -32.40380859375, -30.7958984375, -29.18798828125, -27.580078125, -25.97216796875, -24.3642578125, -22.75634765625, -21.1484375, -19.54052734375, -17.9326171875, -16.32470703125, -14.716796875, -13.10888671875, -11.5009765625, -9.89306640625, -8.28515625, -6.67724609375, -5.0693359375, -3.46142578125, -1.853515625, -0.24560546875, 1.3623046875, 2.97021484375, 4.578125, 6.18603515625, 7.7939453125, 9.40185546875, 11.009765625, 12.61767578125, 14.2255859375, 15.83349609375, 17.44140625, 19.04931640625, 20.6572265625, 22.26513671875, 23.873046875, 25.48095703125, 27.0888671875, 28.69677734375, 30.3046875, 31.91259765625, 33.5205078125, 35.12841796875, 36.736328125, 38.34423828125, 39.9521484375, 41.56005859375, 43.16796875, 44.77587890625, 46.3837890625, 47.99169921875, 49.599609375, 51.20751953125, 52.8154296875, 54.42333984375, 56.03125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 9.0, 9.0, 18.0, 19.0, 23.0, 39.0, 35.0, 41.0, 68.0, 61.0, 58.0, 67.0, 87.0, 88.0, 68.0, 58.0, 54.0, 46.0, 42.0, 32.0, 28.0, 16.0, 9.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7109375, -3.56500244140625, -3.4190673828125, -3.27313232421875, -3.127197265625, -2.98126220703125, -2.8353271484375, -2.68939208984375, -2.54345703125, -2.39752197265625, -2.2515869140625, -2.10565185546875, -1.959716796875, -1.81378173828125, -1.6678466796875, -1.52191162109375, -1.3759765625, -1.23004150390625, -1.0841064453125, -0.93817138671875, -0.792236328125, -0.64630126953125, -0.5003662109375, -0.35443115234375, -0.20849609375, -0.06256103515625, 0.0833740234375, 0.22930908203125, 0.375244140625, 0.52117919921875, 0.6671142578125, 0.81304931640625, 0.958984375, 1.10491943359375, 1.2508544921875, 1.39678955078125, 1.542724609375, 1.68865966796875, 1.8345947265625, 1.98052978515625, 2.12646484375, 2.27239990234375, 2.4183349609375, 2.56427001953125, 2.710205078125, 2.85614013671875, 3.0020751953125, 3.14801025390625, 3.2939453125, 3.43988037109375, 3.5858154296875, 3.73175048828125, 3.877685546875, 4.02362060546875, 4.1695556640625, 4.31549072265625, 4.46142578125, 4.60736083984375, 4.7532958984375, 4.89923095703125, 5.045166015625, 5.19110107421875, 5.3370361328125, 5.48297119140625, 5.62890625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 12.0, 15.0, 17.0, 20.0, 33.0, 55.0, 64.0, 97.0, 132.0, 183.0, 328.0, 491.0, 824.0, 1577.0, 3028.0, 6619.0, 15752.0, 40614.0, 122523.0, 485074.0, 2759445.0, 547136.0, 135096.0, 44139.0, 16875.0, 6949.0, 3215.0, 1657.0, 883.0, 495.0, 313.0, 191.0, 98.0, 77.0, 80.0, 51.0, 39.0, 20.0, 17.0, 16.0, 13.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.53125, -17.8818359375, -17.232421875, -16.5830078125, -15.93359375, -15.2841796875, -14.634765625, -13.9853515625, -13.3359375, -12.6865234375, -12.037109375, -11.3876953125, -10.73828125, -10.0888671875, -9.439453125, -8.7900390625, -8.140625, -7.4912109375, -6.841796875, -6.1923828125, -5.54296875, -4.8935546875, -4.244140625, -3.5947265625, -2.9453125, -2.2958984375, -1.646484375, -0.9970703125, -0.34765625, 0.3017578125, 0.951171875, 1.6005859375, 2.25, 2.8994140625, 3.548828125, 4.1982421875, 4.84765625, 5.4970703125, 6.146484375, 6.7958984375, 7.4453125, 8.0947265625, 8.744140625, 9.3935546875, 10.04296875, 10.6923828125, 11.341796875, 11.9912109375, 12.640625, 13.2900390625, 13.939453125, 14.5888671875, 15.23828125, 15.8876953125, 16.537109375, 17.1865234375, 17.8359375, 18.4853515625, 19.134765625, 19.7841796875, 20.43359375, 21.0830078125, 21.732421875, 22.3818359375, 23.03125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 3.0, 4.0, 12.0, 4.0, 11.0, 16.0, 5.0, 15.0, 33.0, 54.0, 77.0, 67.0, 103.0, 156.0, 217.0, 371.0, 718.0, 912.0, 410.0, 236.0, 148.0, 116.0, 93.0, 84.0, 59.0, 35.0, 25.0, 20.0, 8.0, 13.0, 10.0, 7.0, 12.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8267822265625, -8.552001953125, -8.2772216796875, -8.00244140625, -7.7276611328125, -7.452880859375, -7.1781005859375, -6.9033203125, -6.6285400390625, -6.353759765625, -6.0789794921875, -5.80419921875, -5.5294189453125, -5.254638671875, -4.9798583984375, -4.705078125, -4.4302978515625, -4.155517578125, -3.8807373046875, -3.60595703125, -3.3311767578125, -3.056396484375, -2.7816162109375, -2.5068359375, -2.2320556640625, -1.957275390625, -1.6824951171875, -1.40771484375, -1.1329345703125, -0.858154296875, -0.5833740234375, -0.30859375, -0.0338134765625, 0.240966796875, 0.5157470703125, 0.79052734375, 1.0653076171875, 1.340087890625, 1.6148681640625, 1.8896484375, 2.1644287109375, 2.439208984375, 2.7139892578125, 2.98876953125, 3.2635498046875, 3.538330078125, 3.8131103515625, 4.087890625, 4.3626708984375, 4.637451171875, 4.9122314453125, 5.18701171875, 5.4617919921875, 5.736572265625, 6.0113525390625, 6.2861328125, 6.5609130859375, 6.835693359375, 7.1104736328125, 7.38525390625, 7.6600341796875, 7.934814453125, 8.2095947265625, 8.484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 15.0, 16.0, 27.0, 44.0, 55.0, 69.0, 97.0, 110.0, 115.0, 107.0, 102.0, 64.0, 68.0, 36.0, 28.0, 15.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.09645080566406, -39.640724182128906, -37.184993743896484, -34.72926712036133, -32.273536682128906, -29.81781005859375, -27.362083435058594, -24.906354904174805, -22.450626373291016, -19.994897842407227, -17.539169311523438, -15.083442687988281, -12.627714157104492, -10.171985626220703, -7.7162580490112305, -5.260530471801758, -2.8048019409179688, -0.3490738868713379, 2.106654167175293, 4.562382221221924, 7.018110275268555, 9.473838806152344, 11.929566383361816, 14.385293960571289, 16.841022491455078, 19.296751022338867, 21.752479553222656, 24.208206176757812, 26.6639347076416, 29.11966323852539, 31.575389862060547, 34.03112030029297, 36.486854553222656, 38.94258117675781, 41.398311614990234, 43.85403823852539, 46.30976867675781, 48.76549530029297, 51.221221923828125, 53.67694854736328, 56.1326789855957, 58.58840560913086, 61.04413604736328, 63.49986267089844, 65.9555892944336, 68.41131591796875, 70.86705017089844, 73.3227767944336, 75.77850341796875, 78.2342300415039, 80.68995666503906, 83.14569091796875, 85.6014175415039, 88.05714416503906, 90.51287078857422, 92.96859741210938, 95.42433166503906, 97.88005828857422, 100.33578491210938, 102.79151916503906, 105.24724578857422, 107.70297241210938, 110.15869903564453, 112.61442565917969, 115.07015228271484]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 1.0, 3.0, 7.0, 4.0, 11.0, 9.0, 13.0, 5.0, 20.0, 19.0, 12.0, 22.0, 19.0, 27.0, 22.0, 28.0, 40.0, 24.0, 38.0, 38.0, 40.0, 59.0, 37.0, 39.0, 37.0, 35.0, 35.0, 41.0, 25.0, 48.0, 32.0, 27.0, 21.0, 25.0, 23.0, 21.0, 12.0, 18.0, 9.0, 10.0, 11.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-36.86450958251953, -35.78415298461914, -34.70379638671875, -33.62343978881836, -32.54308319091797, -31.462726593017578, -30.382369995117188, -29.302013397216797, -28.221656799316406, -27.141300201416016, -26.060943603515625, -24.980587005615234, -23.900230407714844, -22.819873809814453, -21.739517211914062, -20.659160614013672, -19.57880210876465, -18.498445510864258, -17.418088912963867, -16.337732315063477, -15.257375717163086, -14.177019119262695, -13.096661567687988, -12.016304969787598, -10.935948371887207, -9.855591773986816, -8.775235176086426, -7.694878101348877, -6.614521503448486, -5.534164905548096, -4.453807830810547, -3.3734512329101562, -2.2930946350097656, -1.2127379179000854, -0.13238120079040527, 0.9479756355285645, 2.028332233428955, 3.1086888313293457, 4.1890459060668945, 5.269402503967285, 6.349759101867676, 7.430115699768066, 8.510472297668457, 9.590829849243164, 10.671186447143555, 11.751543045043945, 12.831899642944336, 13.912256240844727, 14.992612838745117, 16.072969436645508, 17.1533260345459, 18.23368263244629, 19.31403923034668, 20.39439582824707, 21.474754333496094, 22.555110931396484, 23.635467529296875, 24.715824127197266, 25.796180725097656, 26.876537322998047, 27.956893920898438, 29.037250518798828, 30.11760711669922, 31.19796371459961, 32.2783203125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 2.0, 7.0, 4.0, 11.0, 19.0, 14.0, 24.0, 36.0, 49.0, 66.0, 99.0, 149.0, 267.0, 448.0, 801.0, 1730.0, 4334.0, 12917.0, 47895.0, 249577.0, 611681.0, 85983.0, 21190.0, 6407.0, 2378.0, 1073.0, 495.0, 298.0, 206.0, 124.0, 95.0, 62.0, 27.0, 19.0, 17.0, 20.0, 9.0, 9.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.78125, -33.50244140625, -32.2236328125, -30.94482421875, -29.666015625, -28.38720703125, -27.1083984375, -25.82958984375, -24.55078125, -23.27197265625, -21.9931640625, -20.71435546875, -19.435546875, -18.15673828125, -16.8779296875, -15.59912109375, -14.3203125, -13.04150390625, -11.7626953125, -10.48388671875, -9.205078125, -7.92626953125, -6.6474609375, -5.36865234375, -4.08984375, -2.81103515625, -1.5322265625, -0.25341796875, 1.025390625, 2.30419921875, 3.5830078125, 4.86181640625, 6.140625, 7.41943359375, 8.6982421875, 9.97705078125, 11.255859375, 12.53466796875, 13.8134765625, 15.09228515625, 16.37109375, 17.64990234375, 18.9287109375, 20.20751953125, 21.486328125, 22.76513671875, 24.0439453125, 25.32275390625, 26.6015625, 27.88037109375, 29.1591796875, 30.43798828125, 31.716796875, 32.99560546875, 34.2744140625, 35.55322265625, 36.83203125, 38.11083984375, 39.3896484375, 40.66845703125, 41.947265625, 43.22607421875, 44.5048828125, 45.78369140625, 47.0625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 11.0, 11.0, 23.0, 30.0, 34.0, 40.0, 46.0, 57.0, 67.0, 55.0, 80.0, 73.0, 70.0, 61.0, 60.0, 64.0, 42.0, 34.0, 33.0, 25.0, 15.0, 12.0, 12.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8828125, -3.73492431640625, -3.5870361328125, -3.43914794921875, -3.291259765625, -3.14337158203125, -2.9954833984375, -2.84759521484375, -2.69970703125, -2.55181884765625, -2.4039306640625, -2.25604248046875, -2.108154296875, -1.96026611328125, -1.8123779296875, -1.66448974609375, -1.5166015625, -1.36871337890625, -1.2208251953125, -1.07293701171875, -0.925048828125, -0.77716064453125, -0.6292724609375, -0.48138427734375, -0.33349609375, -0.18560791015625, -0.0377197265625, 0.11016845703125, 0.258056640625, 0.40594482421875, 0.5538330078125, 0.70172119140625, 0.849609375, 0.99749755859375, 1.1453857421875, 1.29327392578125, 1.441162109375, 1.58905029296875, 1.7369384765625, 1.88482666015625, 2.03271484375, 2.18060302734375, 2.3284912109375, 2.47637939453125, 2.624267578125, 2.77215576171875, 2.9200439453125, 3.06793212890625, 3.2158203125, 3.36370849609375, 3.5115966796875, 3.65948486328125, 3.807373046875, 3.95526123046875, 4.1031494140625, 4.25103759765625, 4.39892578125, 4.54681396484375, 4.6947021484375, 4.84259033203125, 4.990478515625, 5.13836669921875, 5.2862548828125, 5.43414306640625, 5.58203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 12.0, 18.0, 18.0, 17.0, 27.0, 33.0, 49.0, 70.0, 92.0, 103.0, 188.0, 270.0, 437.0, 673.0, 1287.0, 2789.0, 6259.0, 16609.0, 48792.0, 179258.0, 592170.0, 135553.0, 39565.0, 13645.0, 5301.0, 2352.0, 1094.0, 643.0, 372.0, 264.0, 169.0, 101.0, 77.0, 64.0, 46.0, 33.0, 23.0, 16.0, 16.0, 10.0, 10.0, 7.0, 8.0, 4.0, 3.0, 3.0, 5.0, 0.0, 0.0, 3.0], "bins": [-24.21875, -23.514892578125, -22.81103515625, -22.107177734375, -21.4033203125, -20.699462890625, -19.99560546875, -19.291748046875, -18.587890625, -17.884033203125, -17.18017578125, -16.476318359375, -15.7724609375, -15.068603515625, -14.36474609375, -13.660888671875, -12.95703125, -12.253173828125, -11.54931640625, -10.845458984375, -10.1416015625, -9.437744140625, -8.73388671875, -8.030029296875, -7.326171875, -6.622314453125, -5.91845703125, -5.214599609375, -4.5107421875, -3.806884765625, -3.10302734375, -2.399169921875, -1.6953125, -0.991455078125, -0.28759765625, 0.416259765625, 1.1201171875, 1.823974609375, 2.52783203125, 3.231689453125, 3.935546875, 4.639404296875, 5.34326171875, 6.047119140625, 6.7509765625, 7.454833984375, 8.15869140625, 8.862548828125, 9.56640625, 10.270263671875, 10.97412109375, 11.677978515625, 12.3818359375, 13.085693359375, 13.78955078125, 14.493408203125, 15.197265625, 15.901123046875, 16.60498046875, 17.308837890625, 18.0126953125, 18.716552734375, 19.42041015625, 20.124267578125, 20.828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 4.0, 3.0, 1.0, 0.0, 2.0, 3.0, 8.0, 4.0, 3.0, 8.0, 14.0, 10.0, 8.0, 13.0, 18.0, 28.0, 17.0, 29.0, 24.0, 32.0, 47.0, 47.0, 52.0, 52.0, 44.0, 43.0, 70.0, 45.0, 42.0, 52.0, 39.0, 39.0, 36.0, 38.0, 24.0, 27.0, 16.0, 12.0, 8.0, 13.0, 6.0, 7.0, 10.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.0625, -13.59326171875, -13.1240234375, -12.65478515625, -12.185546875, -11.71630859375, -11.2470703125, -10.77783203125, -10.30859375, -9.83935546875, -9.3701171875, -8.90087890625, -8.431640625, -7.96240234375, -7.4931640625, -7.02392578125, -6.5546875, -6.08544921875, -5.6162109375, -5.14697265625, -4.677734375, -4.20849609375, -3.7392578125, -3.27001953125, -2.80078125, -2.33154296875, -1.8623046875, -1.39306640625, -0.923828125, -0.45458984375, 0.0146484375, 0.48388671875, 0.953125, 1.42236328125, 1.8916015625, 2.36083984375, 2.830078125, 3.29931640625, 3.7685546875, 4.23779296875, 4.70703125, 5.17626953125, 5.6455078125, 6.11474609375, 6.583984375, 7.05322265625, 7.5224609375, 7.99169921875, 8.4609375, 8.93017578125, 9.3994140625, 9.86865234375, 10.337890625, 10.80712890625, 11.2763671875, 11.74560546875, 12.21484375, 12.68408203125, 13.1533203125, 13.62255859375, 14.091796875, 14.56103515625, 15.0302734375, 15.49951171875, 15.96875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 12.0, 23.0, 34.0, 69.0, 83.0, 147.0, 297.0, 538.0, 1159.0, 2617.0, 7237.0, 28088.0, 276255.0, 664487.0, 50452.0, 10524.0, 3567.0, 1516.0, 639.0, 347.0, 180.0, 103.0, 66.0, 34.0, 27.0, 15.0, 10.0, 5.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.551025390625, -18.96142578125, -18.371826171875, -17.7822265625, -17.192626953125, -16.60302734375, -16.013427734375, -15.423828125, -14.834228515625, -14.24462890625, -13.655029296875, -13.0654296875, -12.475830078125, -11.88623046875, -11.296630859375, -10.70703125, -10.117431640625, -9.52783203125, -8.938232421875, -8.3486328125, -7.759033203125, -7.16943359375, -6.579833984375, -5.990234375, -5.400634765625, -4.81103515625, -4.221435546875, -3.6318359375, -3.042236328125, -2.45263671875, -1.863037109375, -1.2734375, -0.683837890625, -0.09423828125, 0.495361328125, 1.0849609375, 1.674560546875, 2.26416015625, 2.853759765625, 3.443359375, 4.032958984375, 4.62255859375, 5.212158203125, 5.8017578125, 6.391357421875, 6.98095703125, 7.570556640625, 8.16015625, 8.749755859375, 9.33935546875, 9.928955078125, 10.5185546875, 11.108154296875, 11.69775390625, 12.287353515625, 12.876953125, 13.466552734375, 14.05615234375, 14.645751953125, 15.2353515625, 15.824951171875, 16.41455078125, 17.004150390625, 17.59375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 6.0, 3.0, 9.0, 2.0, 10.0, 13.0, 14.0, 30.0, 25.0, 56.0, 192.0, 404.0, 95.0, 53.0, 30.0, 16.0, 13.0, 7.0, 6.0, 10.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003871917724609375, -0.003744184970855713, -0.0036164522171020508, -0.0034887194633483887, -0.0033609867095947266, -0.0032332539558410645, -0.0031055212020874023, -0.0029777884483337402, -0.002850055694580078, -0.002722322940826416, -0.002594590187072754, -0.002466857433319092, -0.0023391246795654297, -0.0022113919258117676, -0.0020836591720581055, -0.0019559264183044434, -0.0018281936645507812, -0.0017004609107971191, -0.001572728157043457, -0.001444995403289795, -0.0013172626495361328, -0.0011895298957824707, -0.0010617971420288086, -0.0009340643882751465, -0.0008063316345214844, -0.0006785988807678223, -0.0005508661270141602, -0.00042313337326049805, -0.00029540061950683594, -0.00016766786575317383, -3.993511199951172e-05, 8.779764175415039e-05, 0.0002155303955078125, 0.0003432631492614746, 0.0004709959030151367, 0.0005987286567687988, 0.0007264614105224609, 0.000854194164276123, 0.0009819269180297852, 0.0011096596717834473, 0.0012373924255371094, 0.0013651251792907715, 0.0014928579330444336, 0.0016205906867980957, 0.0017483234405517578, 0.00187605619430542, 0.002003788948059082, 0.002131521701812744, 0.0022592544555664062, 0.0023869872093200684, 0.0025147199630737305, 0.0026424527168273926, 0.0027701854705810547, 0.002897918224334717, 0.003025650978088379, 0.003153383731842041, 0.003281116485595703, 0.0034088492393493652, 0.0035365819931030273, 0.0036643147468566895, 0.0037920475006103516, 0.003919780254364014, 0.004047513008117676, 0.004175245761871338, 0.004302978515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 4.0, 9.0, 14.0, 15.0, 39.0, 48.0, 78.0, 140.0, 262.0, 497.0, 1052.0, 2495.0, 6685.0, 23058.0, 139208.0, 739591.0, 105835.0, 19318.0, 5829.0, 2292.0, 956.0, 458.0, 242.0, 154.0, 79.0, 66.0, 25.0, 30.0, 18.0, 13.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.4381103515625, -14.930908203125, -14.4237060546875, -13.91650390625, -13.4093017578125, -12.902099609375, -12.3948974609375, -11.8876953125, -11.3804931640625, -10.873291015625, -10.3660888671875, -9.85888671875, -9.3516845703125, -8.844482421875, -8.3372802734375, -7.830078125, -7.3228759765625, -6.815673828125, -6.3084716796875, -5.80126953125, -5.2940673828125, -4.786865234375, -4.2796630859375, -3.7724609375, -3.2652587890625, -2.758056640625, -2.2508544921875, -1.74365234375, -1.2364501953125, -0.729248046875, -0.2220458984375, 0.28515625, 0.7923583984375, 1.299560546875, 1.8067626953125, 2.31396484375, 2.8211669921875, 3.328369140625, 3.8355712890625, 4.3427734375, 4.8499755859375, 5.357177734375, 5.8643798828125, 6.37158203125, 6.8787841796875, 7.385986328125, 7.8931884765625, 8.400390625, 8.9075927734375, 9.414794921875, 9.9219970703125, 10.42919921875, 10.9364013671875, 11.443603515625, 11.9508056640625, 12.4580078125, 12.9652099609375, 13.472412109375, 13.9796142578125, 14.48681640625, 14.9940185546875, 15.501220703125, 16.0084228515625, 16.515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 5.0, 10.0, 10.0, 12.0, 15.0, 18.0, 27.0, 30.0, 45.0, 49.0, 88.0, 131.0, 155.0, 112.0, 65.0, 48.0, 38.0, 22.0, 25.0, 19.0, 15.0, 13.0, 10.0, 4.0, 5.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.2882080078125, -7.029541015625, -6.7708740234375, -6.51220703125, -6.2535400390625, -5.994873046875, -5.7362060546875, -5.4775390625, -5.2188720703125, -4.960205078125, -4.7015380859375, -4.44287109375, -4.1842041015625, -3.925537109375, -3.6668701171875, -3.408203125, -3.1495361328125, -2.890869140625, -2.6322021484375, -2.37353515625, -2.1148681640625, -1.856201171875, -1.5975341796875, -1.3388671875, -1.0802001953125, -0.821533203125, -0.5628662109375, -0.30419921875, -0.0455322265625, 0.213134765625, 0.4718017578125, 0.73046875, 0.9891357421875, 1.247802734375, 1.5064697265625, 1.76513671875, 2.0238037109375, 2.282470703125, 2.5411376953125, 2.7998046875, 3.0584716796875, 3.317138671875, 3.5758056640625, 3.83447265625, 4.0931396484375, 4.351806640625, 4.6104736328125, 4.869140625, 5.1278076171875, 5.386474609375, 5.6451416015625, 5.90380859375, 6.1624755859375, 6.421142578125, 6.6798095703125, 6.9384765625, 7.1971435546875, 7.455810546875, 7.7144775390625, 7.97314453125, 8.2318115234375, 8.490478515625, 8.7491455078125, 9.0078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 13.0, 15.0, 37.0, 49.0, 83.0, 98.0, 129.0, 139.0, 124.0, 92.0, 88.0, 52.0, 27.0, 12.0, 12.0, 9.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-182.28448486328125, -177.17799377441406, -172.07150268554688, -166.9650115966797, -161.8585205078125, -156.75204467773438, -151.6455535888672, -146.5390625, -141.4325714111328, -136.32608032226562, -131.21958923339844, -126.11310577392578, -121.0066146850586, -115.9001235961914, -110.79364013671875, -105.68714904785156, -100.58065795898438, -95.47416687011719, -90.36767578125, -85.26119232177734, -80.15470123291016, -75.04821014404297, -69.94172668457031, -64.83523559570312, -59.72874450683594, -54.62225341796875, -49.51576614379883, -44.409278869628906, -39.30278778076172, -34.19629669189453, -29.08980941772461, -23.983322143554688, -18.8768310546875, -13.770341873168945, -8.66385269165039, -3.557363510131836, 1.5491256713867188, 6.655614852905273, 11.762104034423828, 16.86859130859375, 21.975082397460938, 27.081571578979492, 32.18806076049805, 37.29454803466797, 42.401039123535156, 47.507530212402344, 52.614017486572266, 57.72050476074219, 62.826995849609375, 67.93348693847656, 73.03997802734375, 78.1464614868164, 83.2529525756836, 88.35944366455078, 93.46592712402344, 98.57241821289062, 103.67890930175781, 108.785400390625, 113.89189147949219, 118.99837493896484, 124.10486602783203, 129.2113494873047, 134.31784057617188, 139.42433166503906, 144.53082275390625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 7.0, 9.0, 12.0, 13.0, 15.0, 23.0, 23.0, 30.0, 39.0, 36.0, 35.0, 41.0, 60.0, 43.0, 50.0, 52.0, 42.0, 51.0, 47.0, 55.0, 48.0, 41.0, 37.0, 34.0, 35.0, 28.0, 13.0, 14.0, 12.0, 14.0, 6.0, 5.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.5390625, -71.9871597290039, -69.43525695800781, -66.88335418701172, -64.33145141601562, -61.779544830322266, -59.22764205932617, -56.67573547363281, -54.12383270263672, -51.571929931640625, -49.02002716064453, -46.46812438964844, -43.91621780395508, -41.364315032958984, -38.81241226196289, -36.26050567626953, -33.7086067199707, -31.15670394897461, -28.604799270629883, -26.05289649963379, -23.500991821289062, -20.94908905029297, -18.397186279296875, -15.845281600952148, -13.293378829956055, -10.741475105285645, -8.189571380615234, -5.637668609619141, -3.0857648849487305, -0.5338611602783203, 2.0180416107177734, 4.5699462890625, 7.121849060058594, 9.673752784729004, 12.225656509399414, 14.777559280395508, 17.329463958740234, 19.881366729736328, 22.433269500732422, 24.98517417907715, 27.537076950073242, 30.088979721069336, 32.64088439941406, 35.192787170410156, 37.74468994140625, 40.296592712402344, 42.84849548339844, 45.4004020690918, 47.95230484008789, 50.504207611083984, 53.05611038208008, 55.60801696777344, 58.15991973876953, 60.711822509765625, 63.26372528076172, 65.81562805175781, 68.3675308227539, 70.91943359375, 73.4713363647461, 76.02323913574219, 78.57514190673828, 81.12704467773438, 83.678955078125, 86.2308578491211, 88.78276062011719]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 0.0, 8.0, 8.0, 8.0, 17.0, 26.0, 36.0, 59.0, 67.0, 76.0, 136.0, 232.0, 389.0, 673.0, 1218.0, 2600.0, 6269.0, 18867.0, 79751.0, 1438621.0, 2527643.0, 85388.0, 19923.0, 6576.0, 2636.0, 1234.0, 644.0, 388.0, 224.0, 176.0, 103.0, 87.0, 40.0, 32.0, 19.0, 22.0, 24.0, 15.0, 13.0, 10.0, 8.0, 4.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.21875, -40.65625, -39.09375, -37.53125, -35.96875, -34.40625, -32.84375, -31.28125, -29.71875, -28.15625, -26.59375, -25.03125, -23.46875, -21.90625, -20.34375, -18.78125, -17.21875, -15.65625, -14.09375, -12.53125, -10.96875, -9.40625, -7.84375, -6.28125, -4.71875, -3.15625, -1.59375, -0.03125, 1.53125, 3.09375, 4.65625, 6.21875, 7.78125, 9.34375, 10.90625, 12.46875, 14.03125, 15.59375, 17.15625, 18.71875, 20.28125, 21.84375, 23.40625, 24.96875, 26.53125, 28.09375, 29.65625, 31.21875, 32.78125, 34.34375, 35.90625, 37.46875, 39.03125, 40.59375, 42.15625, 43.71875, 45.28125, 46.84375, 48.40625, 49.96875, 51.53125, 53.09375, 54.65625, 56.21875, 57.78125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 13.0, 10.0, 9.0, 14.0, 22.0, 25.0, 26.0, 33.0, 53.0, 52.0, 71.0, 67.0, 78.0, 56.0, 59.0, 63.0, 55.0, 66.0, 47.0, 31.0, 32.0, 37.0, 19.0, 10.0, 12.0, 12.0, 9.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.87890625, -3.7327880859375, -3.586669921875, -3.4405517578125, -3.29443359375, -3.1483154296875, -3.002197265625, -2.8560791015625, -2.7099609375, -2.5638427734375, -2.417724609375, -2.2716064453125, -2.12548828125, -1.9793701171875, -1.833251953125, -1.6871337890625, -1.541015625, -1.3948974609375, -1.248779296875, -1.1026611328125, -0.95654296875, -0.8104248046875, -0.664306640625, -0.5181884765625, -0.3720703125, -0.2259521484375, -0.079833984375, 0.0662841796875, 0.21240234375, 0.3585205078125, 0.504638671875, 0.6507568359375, 0.796875, 0.9429931640625, 1.089111328125, 1.2352294921875, 1.38134765625, 1.5274658203125, 1.673583984375, 1.8197021484375, 1.9658203125, 2.1119384765625, 2.258056640625, 2.4041748046875, 2.55029296875, 2.6964111328125, 2.842529296875, 2.9886474609375, 3.134765625, 3.2808837890625, 3.427001953125, 3.5731201171875, 3.71923828125, 3.8653564453125, 4.011474609375, 4.1575927734375, 4.3037109375, 4.4498291015625, 4.595947265625, 4.7420654296875, 4.88818359375, 5.0343017578125, 5.180419921875, 5.3265380859375, 5.47265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 15.0, 10.0, 15.0, 22.0, 28.0, 37.0, 45.0, 72.0, 97.0, 137.0, 218.0, 323.0, 580.0, 985.0, 1999.0, 4274.0, 10250.0, 28516.0, 98824.0, 572743.0, 3127254.0, 256603.0, 58717.0, 18453.0, 7160.0, 3110.0, 1556.0, 815.0, 460.0, 300.0, 199.0, 122.0, 95.0, 61.0, 49.0, 31.0, 36.0, 16.0, 20.0, 8.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-32.96875, -32.034912109375, -31.10107421875, -30.167236328125, -29.2333984375, -28.299560546875, -27.36572265625, -26.431884765625, -25.498046875, -24.564208984375, -23.63037109375, -22.696533203125, -21.7626953125, -20.828857421875, -19.89501953125, -18.961181640625, -18.02734375, -17.093505859375, -16.15966796875, -15.225830078125, -14.2919921875, -13.358154296875, -12.42431640625, -11.490478515625, -10.556640625, -9.622802734375, -8.68896484375, -7.755126953125, -6.8212890625, -5.887451171875, -4.95361328125, -4.019775390625, -3.0859375, -2.152099609375, -1.21826171875, -0.284423828125, 0.6494140625, 1.583251953125, 2.51708984375, 3.450927734375, 4.384765625, 5.318603515625, 6.25244140625, 7.186279296875, 8.1201171875, 9.053955078125, 9.98779296875, 10.921630859375, 11.85546875, 12.789306640625, 13.72314453125, 14.656982421875, 15.5908203125, 16.524658203125, 17.45849609375, 18.392333984375, 19.326171875, 20.260009765625, 21.19384765625, 22.127685546875, 23.0615234375, 23.995361328125, 24.92919921875, 25.863037109375, 26.796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 13.0, 12.0, 17.0, 28.0, 35.0, 53.0, 85.0, 157.0, 255.0, 667.0, 1688.0, 475.0, 221.0, 142.0, 59.0, 50.0, 43.0, 18.0, 15.0, 10.0, 10.0, 6.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.1328125, -12.6851806640625, -12.237548828125, -11.7899169921875, -11.34228515625, -10.8946533203125, -10.447021484375, -9.9993896484375, -9.5517578125, -9.1041259765625, -8.656494140625, -8.2088623046875, -7.76123046875, -7.3135986328125, -6.865966796875, -6.4183349609375, -5.970703125, -5.5230712890625, -5.075439453125, -4.6278076171875, -4.18017578125, -3.7325439453125, -3.284912109375, -2.8372802734375, -2.3896484375, -1.9420166015625, -1.494384765625, -1.0467529296875, -0.59912109375, -0.1514892578125, 0.296142578125, 0.7437744140625, 1.19140625, 1.6390380859375, 2.086669921875, 2.5343017578125, 2.98193359375, 3.4295654296875, 3.877197265625, 4.3248291015625, 4.7724609375, 5.2200927734375, 5.667724609375, 6.1153564453125, 6.56298828125, 7.0106201171875, 7.458251953125, 7.9058837890625, 8.353515625, 8.8011474609375, 9.248779296875, 9.6964111328125, 10.14404296875, 10.5916748046875, 11.039306640625, 11.4869384765625, 11.9345703125, 12.3822021484375, 12.829833984375, 13.2774658203125, 13.72509765625, 14.1727294921875, 14.620361328125, 15.0679931640625, 15.515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 7.0, 14.0, 12.0, 19.0, 23.0, 34.0, 41.0, 60.0, 53.0, 64.0, 78.0, 71.0, 63.0, 79.0, 74.0, 72.0, 63.0, 39.0, 24.0, 25.0, 28.0, 14.0, 10.0, 10.0, 9.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.64527130126953, -57.903038024902344, -56.16080093383789, -54.4185676574707, -52.676334381103516, -50.93409729003906, -49.191864013671875, -47.44963073730469, -45.7073974609375, -43.96516418457031, -42.22292709350586, -40.48069381713867, -38.738460540771484, -36.99622344970703, -35.253990173339844, -33.511756896972656, -31.769519805908203, -30.027284622192383, -28.285051345825195, -26.542816162109375, -24.800582885742188, -23.058347702026367, -21.316112518310547, -19.57387924194336, -17.83164405822754, -16.08940887451172, -14.347175598144531, -12.604940414428711, -10.862706184387207, -9.120471954345703, -7.378236770629883, -5.636002540588379, -3.893768310546875, -2.151533842086792, -0.409299373626709, 1.3329353332519531, 3.075169563293457, 4.817403793334961, 6.559638977050781, 8.301873207092285, 10.044107437133789, 11.786341667175293, 13.528575897216797, 15.270811080932617, 17.013046264648438, 18.755279541015625, 20.497514724731445, 22.239749908447266, 23.981983184814453, 25.724218368530273, 27.46645164489746, 29.20868682861328, 30.95092010498047, 32.693153381347656, 34.43539047241211, 36.1776237487793, 37.91986083984375, 39.66209411621094, 41.40433120727539, 43.14656448364258, 44.888797760009766, 46.63103485107422, 48.373268127441406, 50.115501403808594, 51.85773468017578]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 11.0, 6.0, 8.0, 11.0, 10.0, 21.0, 25.0, 22.0, 20.0, 25.0, 28.0, 30.0, 38.0, 37.0, 37.0, 42.0, 46.0, 52.0, 49.0, 65.0, 32.0, 32.0, 44.0, 29.0, 43.0, 45.0, 22.0, 20.0, 22.0, 14.0, 9.0, 27.0, 10.0, 16.0, 9.0, 3.0, 14.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-44.61924743652344, -43.451416015625, -42.2835807800293, -41.11574935913086, -39.94791793823242, -38.780086517333984, -37.61225128173828, -36.444419860839844, -35.276588439941406, -34.10875701904297, -32.940921783447266, -31.773090362548828, -30.60525894165039, -29.43742561340332, -28.26959228515625, -27.101760864257812, -25.933927536010742, -24.766094207763672, -23.598262786865234, -22.430429458618164, -21.262598037719727, -20.094764709472656, -18.92693328857422, -17.75909996032715, -16.591266632080078, -15.423434257507324, -14.25560188293457, -13.0877685546875, -11.919937133789062, -10.752103805541992, -9.584271430969238, -8.416439056396484, -7.248607635498047, -6.080775260925293, -4.912942886352539, -3.745110034942627, -2.577277660369873, -1.4094452857971191, -0.24161243438720703, 0.9262199401855469, 2.094052314758301, 3.2618846893310547, 4.429717063903809, 5.597549915313721, 6.765382289886475, 7.9332146644592285, 9.10104751586914, 10.268879890441895, 11.436712265014648, 12.604544639587402, 13.772377014160156, 14.940210342407227, 16.108041763305664, 17.275875091552734, 18.443706512451172, 19.611539840698242, 20.779373168945312, 21.947206497192383, 23.11503791809082, 24.28287124633789, 25.450702667236328, 26.6185359954834, 27.78636932373047, 28.954200744628906, 30.122032165527344]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 8.0, 27.0, 33.0, 69.0, 103.0, 152.0, 292.0, 524.0, 1142.0, 3309.0, 11657.0, 46062.0, 277091.0, 605986.0, 75936.0, 18063.0, 4984.0, 1616.0, 714.0, 312.0, 182.0, 117.0, 74.0, 40.0, 21.0, 10.0, 8.0, 8.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.90625, -37.572265625, -36.23828125, -34.904296875, -33.5703125, -32.236328125, -30.90234375, -29.568359375, -28.234375, -26.900390625, -25.56640625, -24.232421875, -22.8984375, -21.564453125, -20.23046875, -18.896484375, -17.5625, -16.228515625, -14.89453125, -13.560546875, -12.2265625, -10.892578125, -9.55859375, -8.224609375, -6.890625, -5.556640625, -4.22265625, -2.888671875, -1.5546875, -0.220703125, 1.11328125, 2.447265625, 3.78125, 5.115234375, 6.44921875, 7.783203125, 9.1171875, 10.451171875, 11.78515625, 13.119140625, 14.453125, 15.787109375, 17.12109375, 18.455078125, 19.7890625, 21.123046875, 22.45703125, 23.791015625, 25.125, 26.458984375, 27.79296875, 29.126953125, 30.4609375, 31.794921875, 33.12890625, 34.462890625, 35.796875, 37.130859375, 38.46484375, 39.798828125, 41.1328125, 42.466796875, 43.80078125, 45.134765625, 46.46875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 5.0, 1.0, 5.0, 2.0, 7.0, 9.0, 9.0, 9.0, 11.0, 18.0, 26.0, 32.0, 39.0, 30.0, 52.0, 44.0, 60.0, 60.0, 59.0, 55.0, 70.0, 66.0, 51.0, 54.0, 43.0, 43.0, 29.0, 32.0, 16.0, 17.0, 19.0, 9.0, 9.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.234375, -4.0853271484375, -3.936279296875, -3.7872314453125, -3.63818359375, -3.4891357421875, -3.340087890625, -3.1910400390625, -3.0419921875, -2.8929443359375, -2.743896484375, -2.5948486328125, -2.44580078125, -2.2967529296875, -2.147705078125, -1.9986572265625, -1.849609375, -1.7005615234375, -1.551513671875, -1.4024658203125, -1.25341796875, -1.1043701171875, -0.955322265625, -0.8062744140625, -0.6572265625, -0.5081787109375, -0.359130859375, -0.2100830078125, -0.06103515625, 0.0880126953125, 0.237060546875, 0.3861083984375, 0.53515625, 0.6842041015625, 0.833251953125, 0.9822998046875, 1.13134765625, 1.2803955078125, 1.429443359375, 1.5784912109375, 1.7275390625, 1.8765869140625, 2.025634765625, 2.1746826171875, 2.32373046875, 2.4727783203125, 2.621826171875, 2.7708740234375, 2.919921875, 3.0689697265625, 3.218017578125, 3.3670654296875, 3.51611328125, 3.6651611328125, 3.814208984375, 3.9632568359375, 4.1123046875, 4.2613525390625, 4.410400390625, 4.5594482421875, 4.70849609375, 4.8575439453125, 5.006591796875, 5.1556396484375, 5.3046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 9.0, 4.0, 11.0, 16.0, 34.0, 42.0, 48.0, 70.0, 101.0, 154.0, 276.0, 487.0, 932.0, 1885.0, 4038.0, 8427.0, 18989.0, 44008.0, 134254.0, 585514.0, 161083.0, 49274.0, 21072.0, 9213.0, 4310.0, 1998.0, 984.0, 519.0, 300.0, 156.0, 94.0, 66.0, 48.0, 28.0, 21.0, 14.0, 19.0, 11.0, 9.0, 7.0, 7.0, 2.0, 10.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.875, -20.2529296875, -19.630859375, -19.0087890625, -18.38671875, -17.7646484375, -17.142578125, -16.5205078125, -15.8984375, -15.2763671875, -14.654296875, -14.0322265625, -13.41015625, -12.7880859375, -12.166015625, -11.5439453125, -10.921875, -10.2998046875, -9.677734375, -9.0556640625, -8.43359375, -7.8115234375, -7.189453125, -6.5673828125, -5.9453125, -5.3232421875, -4.701171875, -4.0791015625, -3.45703125, -2.8349609375, -2.212890625, -1.5908203125, -0.96875, -0.3466796875, 0.275390625, 0.8974609375, 1.51953125, 2.1416015625, 2.763671875, 3.3857421875, 4.0078125, 4.6298828125, 5.251953125, 5.8740234375, 6.49609375, 7.1181640625, 7.740234375, 8.3623046875, 8.984375, 9.6064453125, 10.228515625, 10.8505859375, 11.47265625, 12.0947265625, 12.716796875, 13.3388671875, 13.9609375, 14.5830078125, 15.205078125, 15.8271484375, 16.44921875, 17.0712890625, 17.693359375, 18.3154296875, 18.9375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 8.0, 9.0, 9.0, 11.0, 14.0, 21.0, 37.0, 34.0, 32.0, 43.0, 57.0, 48.0, 68.0, 54.0, 50.0, 77.0, 53.0, 56.0, 50.0, 46.0, 39.0, 47.0, 26.0, 21.0, 18.0, 13.0, 10.0, 12.0, 10.0, 6.0, 3.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.578125, -20.94140625, -20.3046875, -19.66796875, -19.03125, -18.39453125, -17.7578125, -17.12109375, -16.484375, -15.84765625, -15.2109375, -14.57421875, -13.9375, -13.30078125, -12.6640625, -12.02734375, -11.390625, -10.75390625, -10.1171875, -9.48046875, -8.84375, -8.20703125, -7.5703125, -6.93359375, -6.296875, -5.66015625, -5.0234375, -4.38671875, -3.75, -3.11328125, -2.4765625, -1.83984375, -1.203125, -0.56640625, 0.0703125, 0.70703125, 1.34375, 1.98046875, 2.6171875, 3.25390625, 3.890625, 4.52734375, 5.1640625, 5.80078125, 6.4375, 7.07421875, 7.7109375, 8.34765625, 8.984375, 9.62109375, 10.2578125, 10.89453125, 11.53125, 12.16796875, 12.8046875, 13.44140625, 14.078125, 14.71484375, 15.3515625, 15.98828125, 16.625, 17.26171875, 17.8984375, 18.53515625, 19.171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 11.0, 20.0, 32.0, 56.0, 101.0, 164.0, 375.0, 987.0, 3425.0, 14918.0, 90390.0, 778624.0, 133444.0, 19738.0, 4100.0, 1241.0, 452.0, 210.0, 90.0, 61.0, 45.0, 18.0, 5.0, 8.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-22.21875, -21.6844482421875, -21.150146484375, -20.6158447265625, -20.08154296875, -19.5472412109375, -19.012939453125, -18.4786376953125, -17.9443359375, -17.4100341796875, -16.875732421875, -16.3414306640625, -15.80712890625, -15.2728271484375, -14.738525390625, -14.2042236328125, -13.669921875, -13.1356201171875, -12.601318359375, -12.0670166015625, -11.53271484375, -10.9984130859375, -10.464111328125, -9.9298095703125, -9.3955078125, -8.8612060546875, -8.326904296875, -7.7926025390625, -7.25830078125, -6.7239990234375, -6.189697265625, -5.6553955078125, -5.12109375, -4.5867919921875, -4.052490234375, -3.5181884765625, -2.98388671875, -2.4495849609375, -1.915283203125, -1.3809814453125, -0.8466796875, -0.3123779296875, 0.221923828125, 0.7562255859375, 1.29052734375, 1.8248291015625, 2.359130859375, 2.8934326171875, 3.427734375, 3.9620361328125, 4.496337890625, 5.0306396484375, 5.56494140625, 6.0992431640625, 6.633544921875, 7.1678466796875, 7.7021484375, 8.2364501953125, 8.770751953125, 9.3050537109375, 9.83935546875, 10.3736572265625, 10.907958984375, 11.4422607421875, 11.9765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 10.0, 17.0, 26.0, 28.0, 65.0, 270.0, 404.0, 82.0, 29.0, 20.0, 13.0, 8.0, 9.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0039520263671875, -0.0038326382637023926, -0.003713250160217285, -0.0035938620567321777, -0.0034744739532470703, -0.003355085849761963, -0.0032356977462768555, -0.003116309642791748, -0.0029969215393066406, -0.002877533435821533, -0.0027581453323364258, -0.0026387572288513184, -0.002519369125366211, -0.0023999810218811035, -0.002280592918395996, -0.0021612048149108887, -0.0020418167114257812, -0.0019224286079406738, -0.0018030405044555664, -0.001683652400970459, -0.0015642642974853516, -0.0014448761940002441, -0.0013254880905151367, -0.0012060999870300293, -0.0010867118835449219, -0.0009673237800598145, -0.000847935676574707, -0.0007285475730895996, -0.0006091594696044922, -0.0004897713661193848, -0.00037038326263427734, -0.0002509951591491699, -0.0001316070556640625, -1.2218952178955078e-05, 0.00010716915130615234, 0.00022655725479125977, 0.0003459453582763672, 0.0004653334617614746, 0.000584721565246582, 0.0007041096687316895, 0.0008234977722167969, 0.0009428858757019043, 0.0010622739791870117, 0.0011816620826721191, 0.0013010501861572266, 0.001420438289642334, 0.0015398263931274414, 0.0016592144966125488, 0.0017786026000976562, 0.0018979907035827637, 0.002017378807067871, 0.0021367669105529785, 0.002256155014038086, 0.0023755431175231934, 0.0024949312210083008, 0.002614319324493408, 0.0027337074279785156, 0.002853095531463623, 0.0029724836349487305, 0.003091871738433838, 0.0032112598419189453, 0.0033306479454040527, 0.00345003604888916, 0.0035694241523742676, 0.003688812255859375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 11.0, 9.0, 15.0, 9.0, 28.0, 57.0, 64.0, 112.0, 197.0, 355.0, 691.0, 1564.0, 3879.0, 12159.0, 51466.0, 531144.0, 387039.0, 42911.0, 10478.0, 3499.0, 1451.0, 638.0, 325.0, 153.0, 102.0, 63.0, 47.0, 35.0, 17.0, 9.0, 11.0, 9.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.171875, -11.641357421875, -11.11083984375, -10.580322265625, -10.0498046875, -9.519287109375, -8.98876953125, -8.458251953125, -7.927734375, -7.397216796875, -6.86669921875, -6.336181640625, -5.8056640625, -5.275146484375, -4.74462890625, -4.214111328125, -3.68359375, -3.153076171875, -2.62255859375, -2.092041015625, -1.5615234375, -1.031005859375, -0.50048828125, 0.030029296875, 0.560546875, 1.091064453125, 1.62158203125, 2.152099609375, 2.6826171875, 3.213134765625, 3.74365234375, 4.274169921875, 4.8046875, 5.335205078125, 5.86572265625, 6.396240234375, 6.9267578125, 7.457275390625, 7.98779296875, 8.518310546875, 9.048828125, 9.579345703125, 10.10986328125, 10.640380859375, 11.1708984375, 11.701416015625, 12.23193359375, 12.762451171875, 13.29296875, 13.823486328125, 14.35400390625, 14.884521484375, 15.4150390625, 15.945556640625, 16.47607421875, 17.006591796875, 17.537109375, 18.067626953125, 18.59814453125, 19.128662109375, 19.6591796875, 20.189697265625, 20.72021484375, 21.250732421875, 21.78125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 10.0, 4.0, 19.0, 16.0, 27.0, 38.0, 51.0, 122.0, 193.0, 207.0, 107.0, 64.0, 47.0, 25.0, 15.0, 10.0, 12.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.3046875, -10.8538818359375, -10.403076171875, -9.9522705078125, -9.50146484375, -9.0506591796875, -8.599853515625, -8.1490478515625, -7.6982421875, -7.2474365234375, -6.796630859375, -6.3458251953125, -5.89501953125, -5.4442138671875, -4.993408203125, -4.5426025390625, -4.091796875, -3.6409912109375, -3.190185546875, -2.7393798828125, -2.28857421875, -1.8377685546875, -1.386962890625, -0.9361572265625, -0.4853515625, -0.0345458984375, 0.416259765625, 0.8670654296875, 1.31787109375, 1.7686767578125, 2.219482421875, 2.6702880859375, 3.12109375, 3.5718994140625, 4.022705078125, 4.4735107421875, 4.92431640625, 5.3751220703125, 5.825927734375, 6.2767333984375, 6.7275390625, 7.1783447265625, 7.629150390625, 8.0799560546875, 8.53076171875, 8.9815673828125, 9.432373046875, 9.8831787109375, 10.333984375, 10.7847900390625, 11.235595703125, 11.6864013671875, 12.13720703125, 12.5880126953125, 13.038818359375, 13.4896240234375, 13.9404296875, 14.3912353515625, 14.842041015625, 15.2928466796875, 15.74365234375, 16.1944580078125, 16.645263671875, 17.0960693359375, 17.546875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 6.0, 14.0, 24.0, 39.0, 55.0, 86.0, 100.0, 105.0, 116.0, 127.0, 102.0, 82.0, 68.0, 29.0, 13.0, 14.0, 3.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-152.13160705566406, -147.47019958496094, -142.80877685546875, -138.14736938476562, -133.4859619140625, -128.82455444335938, -124.16313171386719, -119.50172424316406, -114.8403091430664, -110.17889404296875, -105.51748657226562, -100.85607147216797, -96.19465637207031, -91.53324890136719, -86.87183380126953, -82.21041870117188, -77.54901123046875, -72.8875961303711, -68.22618865966797, -63.56477355957031, -58.90336227416992, -54.24195098876953, -49.580535888671875, -44.919124603271484, -40.257713317871094, -35.5963020324707, -30.93488883972168, -26.273475646972656, -21.612064361572266, -16.950653076171875, -12.289239883422852, -7.627826690673828, -2.966400146484375, 1.695012092590332, 6.356424331665039, 11.017836570739746, 15.679248809814453, 20.340660095214844, 25.002073287963867, 29.66348648071289, 34.32489776611328, 38.98630905151367, 43.64772033691406, 48.30913543701172, 52.97054672241211, 57.6319580078125, 62.293373107910156, 66.95478820800781, 71.61619567871094, 76.2776107788086, 80.93901824951172, 85.60043334960938, 90.2618408203125, 94.92325592041016, 99.58467102050781, 104.24607849121094, 108.9074935913086, 113.56890869140625, 118.23031616210938, 122.89173126220703, 127.55314636230469, 132.2145538330078, 136.87596130371094, 141.53738403320312, 146.19879150390625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 5.0, 9.0, 11.0, 12.0, 18.0, 15.0, 19.0, 21.0, 31.0, 25.0, 25.0, 24.0, 41.0, 42.0, 34.0, 41.0, 45.0, 41.0, 51.0, 47.0, 43.0, 48.0, 42.0, 39.0, 44.0, 41.0, 34.0, 26.0, 23.0, 13.0, 11.0, 3.0, 19.0, 15.0, 4.0, 4.0, 4.0, 3.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-80.70736694335938, -78.14178466796875, -75.57620239257812, -73.0106201171875, -70.44503784179688, -67.87945556640625, -65.31387329101562, -62.748287200927734, -60.18270492553711, -57.617122650146484, -55.05154037475586, -52.485958099365234, -49.920372009277344, -47.35478973388672, -44.789207458496094, -42.22362518310547, -39.658042907714844, -37.09246063232422, -34.526878356933594, -31.961294174194336, -29.39571189880371, -26.830129623413086, -24.264545440673828, -21.698963165283203, -19.133380889892578, -16.567798614501953, -14.002215385437012, -11.43663215637207, -8.871049880981445, -6.30546760559082, -3.739884376525879, -1.1743011474609375, 1.3912887573242188, 3.956871509552002, 6.522454261779785, 9.088037490844727, 11.653619766235352, 14.219202041625977, 16.784786224365234, 19.35036849975586, 21.915950775146484, 24.48153305053711, 27.047115325927734, 29.612699508666992, 32.17828369140625, 34.743865966796875, 37.3094482421875, 39.875030517578125, 42.44061279296875, 45.006195068359375, 47.57177734375, 50.137359619140625, 52.70294189453125, 55.268524169921875, 57.834110260009766, 60.39969253540039, 62.965274810791016, 65.5308609008789, 68.09644317626953, 70.66202545166016, 73.22760772705078, 75.7931900024414, 78.35877227783203, 80.92435455322266, 83.48993682861328]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 17.0, 10.0, 16.0, 36.0, 39.0, 79.0, 118.0, 183.0, 336.0, 553.0, 1087.0, 2386.0, 6495.0, 20223.0, 91230.0, 3452286.0, 540421.0, 56170.0, 14152.0, 4550.0, 1846.0, 859.0, 431.0, 260.0, 163.0, 108.0, 62.0, 64.0, 31.0, 28.0, 11.0, 11.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.71875, -54.81884765625, -52.9189453125, -51.01904296875, -49.119140625, -47.21923828125, -45.3193359375, -43.41943359375, -41.51953125, -39.61962890625, -37.7197265625, -35.81982421875, -33.919921875, -32.02001953125, -30.1201171875, -28.22021484375, -26.3203125, -24.42041015625, -22.5205078125, -20.62060546875, -18.720703125, -16.82080078125, -14.9208984375, -13.02099609375, -11.12109375, -9.22119140625, -7.3212890625, -5.42138671875, -3.521484375, -1.62158203125, 0.2783203125, 2.17822265625, 4.078125, 5.97802734375, 7.8779296875, 9.77783203125, 11.677734375, 13.57763671875, 15.4775390625, 17.37744140625, 19.27734375, 21.17724609375, 23.0771484375, 24.97705078125, 26.876953125, 28.77685546875, 30.6767578125, 32.57666015625, 34.4765625, 36.37646484375, 38.2763671875, 40.17626953125, 42.076171875, 43.97607421875, 45.8759765625, 47.77587890625, 49.67578125, 51.57568359375, 53.4755859375, 55.37548828125, 57.275390625, 59.17529296875, 61.0751953125, 62.97509765625, 64.875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 8.0, 8.0, 10.0, 16.0, 14.0, 20.0, 31.0, 29.0, 37.0, 45.0, 54.0, 50.0, 66.0, 51.0, 66.0, 66.0, 70.0, 57.0, 47.0, 59.0, 38.0, 33.0, 30.0, 26.0, 17.0, 14.0, 13.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.12115478515625, -3.9610595703125, -3.80096435546875, -3.640869140625, -3.48077392578125, -3.3206787109375, -3.16058349609375, -3.00048828125, -2.84039306640625, -2.6802978515625, -2.52020263671875, -2.360107421875, -2.20001220703125, -2.0399169921875, -1.87982177734375, -1.7197265625, -1.55963134765625, -1.3995361328125, -1.23944091796875, -1.079345703125, -0.91925048828125, -0.7591552734375, -0.59906005859375, -0.43896484375, -0.27886962890625, -0.1187744140625, 0.04132080078125, 0.201416015625, 0.36151123046875, 0.5216064453125, 0.68170166015625, 0.841796875, 1.00189208984375, 1.1619873046875, 1.32208251953125, 1.482177734375, 1.64227294921875, 1.8023681640625, 1.96246337890625, 2.12255859375, 2.28265380859375, 2.4427490234375, 2.60284423828125, 2.762939453125, 2.92303466796875, 3.0831298828125, 3.24322509765625, 3.4033203125, 3.56341552734375, 3.7235107421875, 3.88360595703125, 4.043701171875, 4.20379638671875, 4.3638916015625, 4.52398681640625, 4.68408203125, 4.84417724609375, 5.0042724609375, 5.16436767578125, 5.324462890625, 5.48455810546875, 5.6446533203125, 5.80474853515625, 5.96484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 11.0, 19.0, 24.0, 33.0, 46.0, 81.0, 82.0, 127.0, 205.0, 299.0, 492.0, 634.0, 1067.0, 1729.0, 2824.0, 4783.0, 8588.0, 16226.0, 32317.0, 71008.0, 186237.0, 1085165.0, 2402847.0, 221744.0, 81345.0, 36308.0, 17698.0, 9124.0, 5170.0, 3013.0, 1813.0, 1071.0, 726.0, 481.0, 284.0, 209.0, 155.0, 98.0, 59.0, 44.0, 35.0, 14.0, 16.0, 13.0, 6.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.796875, -19.115966796875, -18.43505859375, -17.754150390625, -17.0732421875, -16.392333984375, -15.71142578125, -15.030517578125, -14.349609375, -13.668701171875, -12.98779296875, -12.306884765625, -11.6259765625, -10.945068359375, -10.26416015625, -9.583251953125, -8.90234375, -8.221435546875, -7.54052734375, -6.859619140625, -6.1787109375, -5.497802734375, -4.81689453125, -4.135986328125, -3.455078125, -2.774169921875, -2.09326171875, -1.412353515625, -0.7314453125, -0.050537109375, 0.63037109375, 1.311279296875, 1.9921875, 2.673095703125, 3.35400390625, 4.034912109375, 4.7158203125, 5.396728515625, 6.07763671875, 6.758544921875, 7.439453125, 8.120361328125, 8.80126953125, 9.482177734375, 10.1630859375, 10.843994140625, 11.52490234375, 12.205810546875, 12.88671875, 13.567626953125, 14.24853515625, 14.929443359375, 15.6103515625, 16.291259765625, 16.97216796875, 17.653076171875, 18.333984375, 19.014892578125, 19.69580078125, 20.376708984375, 21.0576171875, 21.738525390625, 22.41943359375, 23.100341796875, 23.78125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 7.0, 10.0, 7.0, 16.0, 12.0, 14.0, 35.0, 27.0, 52.0, 54.0, 90.0, 123.0, 228.0, 510.0, 1690.0, 466.0, 207.0, 147.0, 88.0, 62.0, 52.0, 42.0, 26.0, 25.0, 17.0, 13.0, 5.0, 3.0, 7.0, 5.0, 6.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.6640625, -12.30712890625, -11.9501953125, -11.59326171875, -11.236328125, -10.87939453125, -10.5224609375, -10.16552734375, -9.80859375, -9.45166015625, -9.0947265625, -8.73779296875, -8.380859375, -8.02392578125, -7.6669921875, -7.31005859375, -6.953125, -6.59619140625, -6.2392578125, -5.88232421875, -5.525390625, -5.16845703125, -4.8115234375, -4.45458984375, -4.09765625, -3.74072265625, -3.3837890625, -3.02685546875, -2.669921875, -2.31298828125, -1.9560546875, -1.59912109375, -1.2421875, -0.88525390625, -0.5283203125, -0.17138671875, 0.185546875, 0.54248046875, 0.8994140625, 1.25634765625, 1.61328125, 1.97021484375, 2.3271484375, 2.68408203125, 3.041015625, 3.39794921875, 3.7548828125, 4.11181640625, 4.46875, 4.82568359375, 5.1826171875, 5.53955078125, 5.896484375, 6.25341796875, 6.6103515625, 6.96728515625, 7.32421875, 7.68115234375, 8.0380859375, 8.39501953125, 8.751953125, 9.10888671875, 9.4658203125, 9.82275390625, 10.1796875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 9.0, 18.0, 52.0, 114.0, 233.0, 282.0, 185.0, 74.0, 36.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.41409301757812, -116.60543823242188, -109.7967758178711, -102.98811340332031, -96.17945861816406, -89.37080383300781, -82.56214141845703, -75.75347900390625, -68.94482421875, -62.136165618896484, -55.32750701904297, -48.51884841918945, -41.71018981933594, -34.90153121948242, -28.092872619628906, -21.28421401977539, -14.475555419921875, -7.666896820068359, -0.8582382202148438, 5.950420379638672, 12.759078979492188, 19.567737579345703, 26.37639617919922, 33.185054779052734, 39.99371337890625, 46.802371978759766, 53.61103057861328, 60.4196891784668, 67.22834777832031, 74.03700256347656, 80.84566497802734, 87.65432739257812, 94.46298217773438, 101.27163696289062, 108.0802993774414, 114.88896179199219, 121.69761657714844, 128.5062713623047, 135.31494140625, 142.12359619140625, 148.9322509765625, 155.74090576171875, 162.549560546875, 169.3582305908203, 176.16688537597656, 182.9755401611328, 189.78421020507812, 196.59286499023438, 203.40151977539062, 210.21017456054688, 217.01882934570312, 223.82749938964844, 230.6361541748047, 237.44480895996094, 244.25347900390625, 251.0621337890625, 257.87078857421875, 264.679443359375, 271.48809814453125, 278.2967529296875, 285.10540771484375, 291.9140930175781, 298.7227478027344, 305.5314025878906, 312.3400573730469]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 4.0, 7.0, 13.0, 13.0, 18.0, 17.0, 29.0, 33.0, 27.0, 36.0, 34.0, 30.0, 47.0, 41.0, 46.0, 39.0, 51.0, 50.0, 48.0, 57.0, 42.0, 28.0, 32.0, 34.0, 29.0, 30.0, 27.0, 22.0, 18.0, 26.0, 24.0, 12.0, 5.0, 10.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-50.9149169921875, -49.38372039794922, -47.85252380371094, -46.32133102416992, -44.79013442993164, -43.25893783569336, -41.727745056152344, -40.19654846191406, -38.66535186767578, -37.1341552734375, -35.60295867919922, -34.0717658996582, -32.54056930541992, -31.00937271118164, -29.478178024291992, -27.946983337402344, -26.415786743164062, -24.88459014892578, -23.353395462036133, -21.822200775146484, -20.291004180908203, -18.759807586669922, -17.228612899780273, -15.697417259216309, -14.166221618652344, -12.635025978088379, -11.103830337524414, -9.57263469696045, -8.041439056396484, -6.5102434158325195, -4.979047775268555, -3.44785213470459, -1.9166526794433594, -0.38545703887939453, 1.1457386016845703, 2.676934242248535, 4.2081298828125, 5.739325523376465, 7.27052116394043, 8.801716804504395, 10.33291244506836, 11.864108085632324, 13.395303726196289, 14.926499366760254, 16.45769500732422, 17.9888916015625, 19.52008628845215, 21.051280975341797, 22.582477569580078, 24.11367416381836, 25.644868850708008, 27.176063537597656, 28.707260131835938, 30.23845672607422, 31.769651412963867, 33.300846099853516, 34.8320426940918, 36.36323928833008, 37.894432067871094, 39.425628662109375, 40.956825256347656, 42.48802185058594, 44.01921844482422, 45.550411224365234, 47.081607818603516]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 14.0, 17.0, 28.0, 42.0, 70.0, 91.0, 155.0, 241.0, 407.0, 719.0, 1386.0, 2777.0, 6583.0, 17130.0, 48835.0, 139608.0, 400324.0, 279939.0, 95353.0, 33195.0, 12084.0, 4715.0, 2186.0, 1058.0, 598.0, 348.0, 228.0, 131.0, 95.0, 59.0, 47.0, 30.0, 19.0, 7.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.03125, -28.118896484375, -27.20654296875, -26.294189453125, -25.3818359375, -24.469482421875, -23.55712890625, -22.644775390625, -21.732421875, -20.820068359375, -19.90771484375, -18.995361328125, -18.0830078125, -17.170654296875, -16.25830078125, -15.345947265625, -14.43359375, -13.521240234375, -12.60888671875, -11.696533203125, -10.7841796875, -9.871826171875, -8.95947265625, -8.047119140625, -7.134765625, -6.222412109375, -5.31005859375, -4.397705078125, -3.4853515625, -2.572998046875, -1.66064453125, -0.748291015625, 0.1640625, 1.076416015625, 1.98876953125, 2.901123046875, 3.8134765625, 4.725830078125, 5.63818359375, 6.550537109375, 7.462890625, 8.375244140625, 9.28759765625, 10.199951171875, 11.1123046875, 12.024658203125, 12.93701171875, 13.849365234375, 14.76171875, 15.674072265625, 16.58642578125, 17.498779296875, 18.4111328125, 19.323486328125, 20.23583984375, 21.148193359375, 22.060546875, 22.972900390625, 23.88525390625, 24.797607421875, 25.7099609375, 26.622314453125, 27.53466796875, 28.447021484375, 29.359375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 9.0, 9.0, 11.0, 15.0, 18.0, 14.0, 15.0, 24.0, 26.0, 31.0, 33.0, 33.0, 49.0, 58.0, 43.0, 68.0, 59.0, 65.0, 53.0, 60.0, 40.0, 55.0, 33.0, 25.0, 44.0, 25.0, 18.0, 19.0, 11.0, 7.0, 12.0, 5.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.6063232421875, -4.439208984375, -4.2720947265625, -4.10498046875, -3.9378662109375, -3.770751953125, -3.6036376953125, -3.4365234375, -3.2694091796875, -3.102294921875, -2.9351806640625, -2.76806640625, -2.6009521484375, -2.433837890625, -2.2667236328125, -2.099609375, -1.9324951171875, -1.765380859375, -1.5982666015625, -1.43115234375, -1.2640380859375, -1.096923828125, -0.9298095703125, -0.7626953125, -0.5955810546875, -0.428466796875, -0.2613525390625, -0.09423828125, 0.0728759765625, 0.239990234375, 0.4071044921875, 0.57421875, 0.7413330078125, 0.908447265625, 1.0755615234375, 1.24267578125, 1.4097900390625, 1.576904296875, 1.7440185546875, 1.9111328125, 2.0782470703125, 2.245361328125, 2.4124755859375, 2.57958984375, 2.7467041015625, 2.913818359375, 3.0809326171875, 3.248046875, 3.4151611328125, 3.582275390625, 3.7493896484375, 3.91650390625, 4.0836181640625, 4.250732421875, 4.4178466796875, 4.5849609375, 4.7520751953125, 4.919189453125, 5.0863037109375, 5.25341796875, 5.4205322265625, 5.587646484375, 5.7547607421875, 5.921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 6.0, 13.0, 6.0, 13.0, 20.0, 26.0, 23.0, 44.0, 50.0, 81.0, 121.0, 141.0, 192.0, 299.0, 407.0, 751.0, 1525.0, 4575.0, 17284.0, 76280.0, 389911.0, 443248.0, 85385.0, 19100.0, 4990.0, 1735.0, 814.0, 444.0, 284.0, 195.0, 143.0, 99.0, 85.0, 63.0, 42.0, 32.0, 36.0, 15.0, 19.0, 15.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-32.25, -31.2109375, -30.171875, -29.1328125, -28.09375, -27.0546875, -26.015625, -24.9765625, -23.9375, -22.8984375, -21.859375, -20.8203125, -19.78125, -18.7421875, -17.703125, -16.6640625, -15.625, -14.5859375, -13.546875, -12.5078125, -11.46875, -10.4296875, -9.390625, -8.3515625, -7.3125, -6.2734375, -5.234375, -4.1953125, -3.15625, -2.1171875, -1.078125, -0.0390625, 1.0, 2.0390625, 3.078125, 4.1171875, 5.15625, 6.1953125, 7.234375, 8.2734375, 9.3125, 10.3515625, 11.390625, 12.4296875, 13.46875, 14.5078125, 15.546875, 16.5859375, 17.625, 18.6640625, 19.703125, 20.7421875, 21.78125, 22.8203125, 23.859375, 24.8984375, 25.9375, 26.9765625, 28.015625, 29.0546875, 30.09375, 31.1328125, 32.171875, 33.2109375, 34.25]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 2.0, 4.0, 10.0, 16.0, 12.0, 15.0, 19.0, 22.0, 27.0, 28.0, 26.0, 48.0, 39.0, 41.0, 71.0, 57.0, 53.0, 59.0, 51.0, 51.0, 45.0, 40.0, 42.0, 43.0, 24.0, 38.0, 21.0, 25.0, 16.0, 19.0, 10.0, 5.0, 3.0, 7.0, 1.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -26.3271484375, -25.560546875, -24.7939453125, -24.02734375, -23.2607421875, -22.494140625, -21.7275390625, -20.9609375, -20.1943359375, -19.427734375, -18.6611328125, -17.89453125, -17.1279296875, -16.361328125, -15.5947265625, -14.828125, -14.0615234375, -13.294921875, -12.5283203125, -11.76171875, -10.9951171875, -10.228515625, -9.4619140625, -8.6953125, -7.9287109375, -7.162109375, -6.3955078125, -5.62890625, -4.8623046875, -4.095703125, -3.3291015625, -2.5625, -1.7958984375, -1.029296875, -0.2626953125, 0.50390625, 1.2705078125, 2.037109375, 2.8037109375, 3.5703125, 4.3369140625, 5.103515625, 5.8701171875, 6.63671875, 7.4033203125, 8.169921875, 8.9365234375, 9.703125, 10.4697265625, 11.236328125, 12.0029296875, 12.76953125, 13.5361328125, 14.302734375, 15.0693359375, 15.8359375, 16.6025390625, 17.369140625, 18.1357421875, 18.90234375, 19.6689453125, 20.435546875, 21.2021484375, 21.96875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 8.0, 11.0, 15.0, 35.0, 59.0, 59.0, 142.0, 222.0, 441.0, 988.0, 2316.0, 5681.0, 16757.0, 63238.0, 342313.0, 499312.0, 84011.0, 21259.0, 6767.0, 2565.0, 1091.0, 596.0, 262.0, 165.0, 80.0, 55.0, 32.0, 26.0, 13.0, 9.0, 11.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4453125, -13.9952392578125, -13.545166015625, -13.0950927734375, -12.64501953125, -12.1949462890625, -11.744873046875, -11.2947998046875, -10.8447265625, -10.3946533203125, -9.944580078125, -9.4945068359375, -9.04443359375, -8.5943603515625, -8.144287109375, -7.6942138671875, -7.244140625, -6.7940673828125, -6.343994140625, -5.8939208984375, -5.44384765625, -4.9937744140625, -4.543701171875, -4.0936279296875, -3.6435546875, -3.1934814453125, -2.743408203125, -2.2933349609375, -1.84326171875, -1.3931884765625, -0.943115234375, -0.4930419921875, -0.04296875, 0.4071044921875, 0.857177734375, 1.3072509765625, 1.75732421875, 2.2073974609375, 2.657470703125, 3.1075439453125, 3.5576171875, 4.0076904296875, 4.457763671875, 4.9078369140625, 5.35791015625, 5.8079833984375, 6.258056640625, 6.7081298828125, 7.158203125, 7.6082763671875, 8.058349609375, 8.5084228515625, 8.95849609375, 9.4085693359375, 9.858642578125, 10.3087158203125, 10.7587890625, 11.2088623046875, 11.658935546875, 12.1090087890625, 12.55908203125, 13.0091552734375, 13.459228515625, 13.9093017578125, 14.359375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 4.0, 7.0, 9.0, 9.0, 16.0, 23.0, 21.0, 34.0, 32.0, 38.0, 60.0, 107.0, 244.0, 124.0, 69.0, 42.0, 32.0, 24.0, 27.0, 14.0, 16.0, 16.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0032558441162109375, -0.0031644105911254883, -0.003072977066040039, -0.00298154354095459, -0.0028901100158691406, -0.0027986764907836914, -0.002707242965698242, -0.002615809440612793, -0.0025243759155273438, -0.0024329423904418945, -0.0023415088653564453, -0.002250075340270996, -0.002158641815185547, -0.0020672082901000977, -0.0019757747650146484, -0.0018843412399291992, -0.00179290771484375, -0.0017014741897583008, -0.0016100406646728516, -0.0015186071395874023, -0.0014271736145019531, -0.001335740089416504, -0.0012443065643310547, -0.0011528730392456055, -0.0010614395141601562, -0.000970005989074707, -0.0008785724639892578, -0.0007871389389038086, -0.0006957054138183594, -0.0006042718887329102, -0.0005128383636474609, -0.0004214048385620117, -0.0003299713134765625, -0.00023853778839111328, -0.00014710426330566406, -5.5670738220214844e-05, 3.5762786865234375e-05, 0.0001271963119506836, 0.0002186298370361328, 0.00031006336212158203, 0.00040149688720703125, 0.0004929304122924805, 0.0005843639373779297, 0.0006757974624633789, 0.0007672309875488281, 0.0008586645126342773, 0.0009500980377197266, 0.0010415315628051758, 0.001132965087890625, 0.0012243986129760742, 0.0013158321380615234, 0.0014072656631469727, 0.0014986991882324219, 0.001590132713317871, 0.0016815662384033203, 0.0017729997634887695, 0.0018644332885742188, 0.001955866813659668, 0.002047300338745117, 0.0021387338638305664, 0.0022301673889160156, 0.002321600914001465, 0.002413034439086914, 0.0025044679641723633, 0.0025959014892578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 4.0, 14.0, 24.0, 34.0, 51.0, 111.0, 195.0, 397.0, 877.0, 2388.0, 11291.0, 102238.0, 808606.0, 106702.0, 11492.0, 2465.0, 819.0, 367.0, 196.0, 114.0, 43.0, 50.0, 30.0, 13.0, 11.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.546875, -25.730224609375, -24.91357421875, -24.096923828125, -23.2802734375, -22.463623046875, -21.64697265625, -20.830322265625, -20.013671875, -19.197021484375, -18.38037109375, -17.563720703125, -16.7470703125, -15.930419921875, -15.11376953125, -14.297119140625, -13.48046875, -12.663818359375, -11.84716796875, -11.030517578125, -10.2138671875, -9.397216796875, -8.58056640625, -7.763916015625, -6.947265625, -6.130615234375, -5.31396484375, -4.497314453125, -3.6806640625, -2.864013671875, -2.04736328125, -1.230712890625, -0.4140625, 0.402587890625, 1.21923828125, 2.035888671875, 2.8525390625, 3.669189453125, 4.48583984375, 5.302490234375, 6.119140625, 6.935791015625, 7.75244140625, 8.569091796875, 9.3857421875, 10.202392578125, 11.01904296875, 11.835693359375, 12.65234375, 13.468994140625, 14.28564453125, 15.102294921875, 15.9189453125, 16.735595703125, 17.55224609375, 18.368896484375, 19.185546875, 20.002197265625, 20.81884765625, 21.635498046875, 22.4521484375, 23.268798828125, 24.08544921875, 24.902099609375, 25.71875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 10.0, 9.0, 17.0, 46.0, 65.0, 91.0, 160.0, 218.0, 151.0, 93.0, 48.0, 43.0, 18.0, 16.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.59375, -19.86865234375, -19.1435546875, -18.41845703125, -17.693359375, -16.96826171875, -16.2431640625, -15.51806640625, -14.79296875, -14.06787109375, -13.3427734375, -12.61767578125, -11.892578125, -11.16748046875, -10.4423828125, -9.71728515625, -8.9921875, -8.26708984375, -7.5419921875, -6.81689453125, -6.091796875, -5.36669921875, -4.6416015625, -3.91650390625, -3.19140625, -2.46630859375, -1.7412109375, -1.01611328125, -0.291015625, 0.43408203125, 1.1591796875, 1.88427734375, 2.609375, 3.33447265625, 4.0595703125, 4.78466796875, 5.509765625, 6.23486328125, 6.9599609375, 7.68505859375, 8.41015625, 9.13525390625, 9.8603515625, 10.58544921875, 11.310546875, 12.03564453125, 12.7607421875, 13.48583984375, 14.2109375, 14.93603515625, 15.6611328125, 16.38623046875, 17.111328125, 17.83642578125, 18.5615234375, 19.28662109375, 20.01171875, 20.73681640625, 21.4619140625, 22.18701171875, 22.912109375, 23.63720703125, 24.3623046875, 25.08740234375, 25.8125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 26.0, 69.0, 157.0, 244.0, 253.0, 156.0, 69.0, 21.0, 4.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.71096801757812, -195.8920135498047, -182.07305908203125, -168.25408935546875, -154.4351348876953, -140.61618041992188, -126.7972183227539, -112.97825622558594, -99.1593017578125, -85.34034729003906, -71.5213851928711, -57.70242691040039, -43.88346862792969, -30.06451416015625, -16.24555206298828, -2.4265899658203125, 11.392364501953125, 25.211322784423828, 39.03028106689453, 52.849239349365234, 66.66819763183594, 80.48715209960938, 94.30611419677734, 108.12507629394531, 121.94403076171875, 135.7629852294922, 149.58193969726562, 163.40090942382812, 177.21986389160156, 191.038818359375, 204.8577880859375, 218.67674255371094, 232.4957275390625, 246.31468200683594, 260.1336364746094, 273.9526062011719, 287.77154541015625, 301.59051513671875, 315.40948486328125, 329.22845458984375, 343.0473937988281, 356.8663635253906, 370.685302734375, 384.5042724609375, 398.3232421875, 412.1421813964844, 425.9611511230469, 439.78009033203125, 453.59906005859375, 467.41802978515625, 481.2369689941406, 495.0559387207031, 508.8748779296875, 522.69384765625, 536.5128173828125, 550.331787109375, 564.1507568359375, 577.9697265625, 591.7886962890625, 605.6076049804688, 619.4265747070312, 633.2455444335938, 647.0645141601562, 660.8834838867188, 674.702392578125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 5.0, 7.0, 4.0, 7.0, 7.0, 13.0, 15.0, 14.0, 18.0, 15.0, 17.0, 16.0, 19.0, 23.0, 25.0, 30.0, 37.0, 26.0, 37.0, 34.0, 41.0, 43.0, 38.0, 54.0, 35.0, 50.0, 35.0, 32.0, 32.0, 31.0, 30.0, 27.0, 29.0, 17.0, 21.0, 21.0, 16.0, 11.0, 12.0, 16.0, 10.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0], "bins": [-107.6606674194336, -104.48535919189453, -101.31005096435547, -98.1347427368164, -94.95943450927734, -91.78412628173828, -88.60881805419922, -85.43350982666016, -82.2582015991211, -79.08289337158203, -75.90758514404297, -72.7322769165039, -69.55696868896484, -66.38166046142578, -63.20635223388672, -60.031044006347656, -56.85573196411133, -53.680423736572266, -50.5051155090332, -47.32980728149414, -44.15449905395508, -40.979190826416016, -37.80387878417969, -34.628570556640625, -31.453264236450195, -28.277956008911133, -25.10264778137207, -21.927337646484375, -18.752029418945312, -15.576722145080566, -12.401412963867188, -9.226104736328125, -6.0507965087890625, -2.875488042831421, 0.2998204231262207, 3.4751291275024414, 6.650437355041504, 9.825745582580566, 13.001054763793945, 16.176362991333008, 19.35167121887207, 22.526979446411133, 25.702287673950195, 28.87759780883789, 32.05290603637695, 35.228214263916016, 38.40352249145508, 41.57883071899414, 44.7541389465332, 47.929447174072266, 51.10475540161133, 54.28006362915039, 57.45537185668945, 60.630680084228516, 63.805992126464844, 66.9813003540039, 70.15660858154297, 73.33191680908203, 76.5072250366211, 79.68253326416016, 82.85784149169922, 86.03314971923828, 89.20845794677734, 92.3837661743164, 95.55907440185547]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 12.0, 22.0, 23.0, 42.0, 63.0, 111.0, 159.0, 280.0, 473.0, 863.0, 1776.0, 3917.0, 9983.0, 31445.0, 139836.0, 3306619.0, 592050.0, 74364.0, 19963.0, 6732.0, 2684.0, 1316.0, 639.0, 323.0, 184.0, 134.0, 77.0, 46.0, 45.0, 30.0, 20.0, 13.0, 8.0, 5.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.21875, -39.9228515625, -38.626953125, -37.3310546875, -36.03515625, -34.7392578125, -33.443359375, -32.1474609375, -30.8515625, -29.5556640625, -28.259765625, -26.9638671875, -25.66796875, -24.3720703125, -23.076171875, -21.7802734375, -20.484375, -19.1884765625, -17.892578125, -16.5966796875, -15.30078125, -14.0048828125, -12.708984375, -11.4130859375, -10.1171875, -8.8212890625, -7.525390625, -6.2294921875, -4.93359375, -3.6376953125, -2.341796875, -1.0458984375, 0.25, 1.5458984375, 2.841796875, 4.1376953125, 5.43359375, 6.7294921875, 8.025390625, 9.3212890625, 10.6171875, 11.9130859375, 13.208984375, 14.5048828125, 15.80078125, 17.0966796875, 18.392578125, 19.6884765625, 20.984375, 22.2802734375, 23.576171875, 24.8720703125, 26.16796875, 27.4638671875, 28.759765625, 30.0556640625, 31.3515625, 32.6474609375, 33.943359375, 35.2392578125, 36.53515625, 37.8310546875, 39.126953125, 40.4228515625, 41.71875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 8.0, 3.0, 7.0, 9.0, 16.0, 19.0, 25.0, 12.0, 15.0, 21.0, 25.0, 26.0, 26.0, 40.0, 51.0, 46.0, 53.0, 52.0, 66.0, 69.0, 39.0, 56.0, 53.0, 50.0, 40.0, 33.0, 35.0, 29.0, 16.0, 20.0, 11.0, 6.0, 7.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.6207275390625, -4.452392578125, -4.2840576171875, -4.11572265625, -3.9473876953125, -3.779052734375, -3.6107177734375, -3.4423828125, -3.2740478515625, -3.105712890625, -2.9373779296875, -2.76904296875, -2.6007080078125, -2.432373046875, -2.2640380859375, -2.095703125, -1.9273681640625, -1.759033203125, -1.5906982421875, -1.42236328125, -1.2540283203125, -1.085693359375, -0.9173583984375, -0.7490234375, -0.5806884765625, -0.412353515625, -0.2440185546875, -0.07568359375, 0.0926513671875, 0.260986328125, 0.4293212890625, 0.59765625, 0.7659912109375, 0.934326171875, 1.1026611328125, 1.27099609375, 1.4393310546875, 1.607666015625, 1.7760009765625, 1.9443359375, 2.1126708984375, 2.281005859375, 2.4493408203125, 2.61767578125, 2.7860107421875, 2.954345703125, 3.1226806640625, 3.291015625, 3.4593505859375, 3.627685546875, 3.7960205078125, 3.96435546875, 4.1326904296875, 4.301025390625, 4.4693603515625, 4.6376953125, 4.8060302734375, 4.974365234375, 5.1427001953125, 5.31103515625, 5.4793701171875, 5.647705078125, 5.8160400390625, 5.984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 12.0, 9.0, 13.0, 21.0, 30.0, 44.0, 82.0, 78.0, 138.0, 224.0, 345.0, 690.0, 1348.0, 2979.0, 7534.0, 23472.0, 93005.0, 656501.0, 3134849.0, 207711.0, 43785.0, 12601.0, 4630.0, 1931.0, 928.0, 492.0, 282.0, 172.0, 130.0, 79.0, 54.0, 28.0, 22.0, 21.0, 11.0, 8.0, 9.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.1875, -34.12890625, -33.0703125, -32.01171875, -30.953125, -29.89453125, -28.8359375, -27.77734375, -26.71875, -25.66015625, -24.6015625, -23.54296875, -22.484375, -21.42578125, -20.3671875, -19.30859375, -18.25, -17.19140625, -16.1328125, -15.07421875, -14.015625, -12.95703125, -11.8984375, -10.83984375, -9.78125, -8.72265625, -7.6640625, -6.60546875, -5.546875, -4.48828125, -3.4296875, -2.37109375, -1.3125, -0.25390625, 0.8046875, 1.86328125, 2.921875, 3.98046875, 5.0390625, 6.09765625, 7.15625, 8.21484375, 9.2734375, 10.33203125, 11.390625, 12.44921875, 13.5078125, 14.56640625, 15.625, 16.68359375, 17.7421875, 18.80078125, 19.859375, 20.91796875, 21.9765625, 23.03515625, 24.09375, 25.15234375, 26.2109375, 27.26953125, 28.328125, 29.38671875, 30.4453125, 31.50390625, 32.5625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 8.0, 4.0, 9.0, 4.0, 8.0, 15.0, 16.0, 18.0, 28.0, 36.0, 54.0, 75.0, 127.0, 224.0, 366.0, 985.0, 1204.0, 346.0, 202.0, 102.0, 80.0, 41.0, 34.0, 24.0, 18.0, 6.0, 12.0, 6.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.40625, -16.948486328125, -16.49072265625, -16.032958984375, -15.5751953125, -15.117431640625, -14.65966796875, -14.201904296875, -13.744140625, -13.286376953125, -12.82861328125, -12.370849609375, -11.9130859375, -11.455322265625, -10.99755859375, -10.539794921875, -10.08203125, -9.624267578125, -9.16650390625, -8.708740234375, -8.2509765625, -7.793212890625, -7.33544921875, -6.877685546875, -6.419921875, -5.962158203125, -5.50439453125, -5.046630859375, -4.5888671875, -4.131103515625, -3.67333984375, -3.215576171875, -2.7578125, -2.300048828125, -1.84228515625, -1.384521484375, -0.9267578125, -0.468994140625, -0.01123046875, 0.446533203125, 0.904296875, 1.362060546875, 1.81982421875, 2.277587890625, 2.7353515625, 3.193115234375, 3.65087890625, 4.108642578125, 4.56640625, 5.024169921875, 5.48193359375, 5.939697265625, 6.3974609375, 6.855224609375, 7.31298828125, 7.770751953125, 8.228515625, 8.686279296875, 9.14404296875, 9.601806640625, 10.0595703125, 10.517333984375, 10.97509765625, 11.432861328125, 11.890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 7.0, 2.0, 5.0, 1.0, 7.0, 13.0, 20.0, 36.0, 57.0, 77.0, 106.0, 131.0, 119.0, 131.0, 108.0, 67.0, 53.0, 37.0, 12.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-190.9217071533203, -187.27719116210938, -183.6326904296875, -179.98817443847656, -176.34365844726562, -172.6991424560547, -169.05462646484375, -165.41012573242188, -161.76560974121094, -158.12109375, -154.47659301757812, -150.8320770263672, -147.18756103515625, -143.5430450439453, -139.89852905273438, -136.2540283203125, -132.60951232910156, -128.96499633789062, -125.32048797607422, -121.67597961425781, -118.03146362304688, -114.38694763183594, -110.74243927001953, -107.09793090820312, -103.45341491699219, -99.80889892578125, -96.16439056396484, -92.51988220214844, -88.8753662109375, -85.23085021972656, -81.58634185791016, -77.94183349609375, -74.29731750488281, -70.65280151367188, -67.00829315185547, -63.3637809753418, -59.719268798828125, -56.07475662231445, -52.43024444580078, -48.78573226928711, -45.1412239074707, -41.49671173095703, -37.85219955444336, -34.20768737792969, -30.563175201416016, -26.918663024902344, -23.274150848388672, -19.629638671875, -15.985126495361328, -12.340614318847656, -8.696102142333984, -5.0515899658203125, -1.4070777893066406, 2.2374343872070312, 5.881946563720703, 9.526458740234375, 13.170970916748047, 16.81548309326172, 20.45999526977539, 24.104507446289062, 27.749019622802734, 31.393531799316406, 35.03804397583008, 38.68255615234375, 42.32706832885742]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 8.0, 18.0, 12.0, 18.0, 23.0, 17.0, 30.0, 26.0, 26.0, 33.0, 44.0, 51.0, 49.0, 56.0, 51.0, 55.0, 44.0, 51.0, 46.0, 54.0, 46.0, 38.0, 38.0, 29.0, 26.0, 16.0, 13.0, 19.0, 17.0, 15.0, 8.0, 6.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.61534881591797, -59.53145980834961, -57.447574615478516, -55.363685607910156, -53.27980041503906, -51.1959114074707, -49.112022399902344, -47.02813720703125, -44.94424819946289, -42.86035919189453, -40.77647399902344, -38.69258499145508, -36.60869598388672, -34.524810791015625, -32.440921783447266, -30.35703468322754, -28.273147583007812, -26.189260482788086, -24.10537338256836, -22.021484375, -19.937597274780273, -17.853710174560547, -15.769822120666504, -13.685934066772461, -11.602046966552734, -9.518159866333008, -7.434271812438965, -5.35038423538208, -3.2664966583251953, -1.1826095581054688, 0.9012784957885742, 2.985166549682617, 5.0690460205078125, 7.152933597564697, 9.236821174621582, 11.320709228515625, 13.404596328735352, 15.488483428955078, 17.572372436523438, 19.656259536743164, 21.74014663696289, 23.824033737182617, 25.907920837402344, 27.991809844970703, 30.07569694519043, 32.159584045410156, 34.243473052978516, 36.327362060546875, 38.41124725341797, 40.49513626098633, 42.57902145385742, 44.66291046142578, 46.746795654296875, 48.830684661865234, 50.914573669433594, 52.99845886230469, 55.08234786987305, 57.166236877441406, 59.2501220703125, 61.33401107788086, 63.41790008544922, 65.50178527832031, 67.5856704711914, 69.66956329345703, 71.75344848632812]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 4.0, 6.0, 10.0, 16.0, 20.0, 24.0, 29.0, 84.0, 95.0, 153.0, 283.0, 483.0, 965.0, 2149.0, 5194.0, 14716.0, 48366.0, 182669.0, 460824.0, 239799.0, 62823.0, 18502.0, 6388.0, 2522.0, 1077.0, 584.0, 300.0, 169.0, 104.0, 81.0, 32.0, 32.0, 20.0, 12.0, 10.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.953125, -26.975830078125, -25.99853515625, -25.021240234375, -24.0439453125, -23.066650390625, -22.08935546875, -21.112060546875, -20.134765625, -19.157470703125, -18.18017578125, -17.202880859375, -16.2255859375, -15.248291015625, -14.27099609375, -13.293701171875, -12.31640625, -11.339111328125, -10.36181640625, -9.384521484375, -8.4072265625, -7.429931640625, -6.45263671875, -5.475341796875, -4.498046875, -3.520751953125, -2.54345703125, -1.566162109375, -0.5888671875, 0.388427734375, 1.36572265625, 2.343017578125, 3.3203125, 4.297607421875, 5.27490234375, 6.252197265625, 7.2294921875, 8.206787109375, 9.18408203125, 10.161376953125, 11.138671875, 12.115966796875, 13.09326171875, 14.070556640625, 15.0478515625, 16.025146484375, 17.00244140625, 17.979736328125, 18.95703125, 19.934326171875, 20.91162109375, 21.888916015625, 22.8662109375, 23.843505859375, 24.82080078125, 25.798095703125, 26.775390625, 27.752685546875, 28.72998046875, 29.707275390625, 30.6845703125, 31.661865234375, 32.63916015625, 33.616455078125, 34.59375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 8.0, 9.0, 18.0, 13.0, 17.0, 18.0, 22.0, 27.0, 33.0, 26.0, 40.0, 36.0, 52.0, 43.0, 47.0, 61.0, 48.0, 54.0, 53.0, 56.0, 39.0, 45.0, 32.0, 40.0, 28.0, 21.0, 18.0, 22.0, 15.0, 13.0, 5.0, 4.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.9453125, -4.77545166015625, -4.6055908203125, -4.43572998046875, -4.265869140625, -4.09600830078125, -3.9261474609375, -3.75628662109375, -3.58642578125, -3.41656494140625, -3.2467041015625, -3.07684326171875, -2.906982421875, -2.73712158203125, -2.5672607421875, -2.39739990234375, -2.2275390625, -2.05767822265625, -1.8878173828125, -1.71795654296875, -1.548095703125, -1.37823486328125, -1.2083740234375, -1.03851318359375, -0.86865234375, -0.69879150390625, -0.5289306640625, -0.35906982421875, -0.189208984375, -0.01934814453125, 0.1505126953125, 0.32037353515625, 0.490234375, 0.66009521484375, 0.8299560546875, 0.99981689453125, 1.169677734375, 1.33953857421875, 1.5093994140625, 1.67926025390625, 1.84912109375, 2.01898193359375, 2.1888427734375, 2.35870361328125, 2.528564453125, 2.69842529296875, 2.8682861328125, 3.03814697265625, 3.2080078125, 3.37786865234375, 3.5477294921875, 3.71759033203125, 3.887451171875, 4.05731201171875, 4.2271728515625, 4.39703369140625, 4.56689453125, 4.73675537109375, 4.9066162109375, 5.07647705078125, 5.246337890625, 5.41619873046875, 5.5860595703125, 5.75592041015625, 5.92578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 3.0, 4.0, 3.0, 8.0, 3.0, 9.0, 17.0, 25.0, 27.0, 36.0, 44.0, 59.0, 76.0, 118.0, 144.0, 259.0, 335.0, 473.0, 876.0, 1796.0, 4602.0, 15893.0, 68577.0, 378549.0, 461982.0, 85311.0, 19373.0, 5260.0, 1897.0, 957.0, 575.0, 353.0, 242.0, 166.0, 120.0, 109.0, 69.0, 46.0, 50.0, 36.0, 16.0, 15.0, 14.0, 9.0, 5.0, 5.0, 2.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.890625, -25.897216796875, -24.90380859375, -23.910400390625, -22.9169921875, -21.923583984375, -20.93017578125, -19.936767578125, -18.943359375, -17.949951171875, -16.95654296875, -15.963134765625, -14.9697265625, -13.976318359375, -12.98291015625, -11.989501953125, -10.99609375, -10.002685546875, -9.00927734375, -8.015869140625, -7.0224609375, -6.029052734375, -5.03564453125, -4.042236328125, -3.048828125, -2.055419921875, -1.06201171875, -0.068603515625, 0.9248046875, 1.918212890625, 2.91162109375, 3.905029296875, 4.8984375, 5.891845703125, 6.88525390625, 7.878662109375, 8.8720703125, 9.865478515625, 10.85888671875, 11.852294921875, 12.845703125, 13.839111328125, 14.83251953125, 15.825927734375, 16.8193359375, 17.812744140625, 18.80615234375, 19.799560546875, 20.79296875, 21.786376953125, 22.77978515625, 23.773193359375, 24.7666015625, 25.760009765625, 26.75341796875, 27.746826171875, 28.740234375, 29.733642578125, 30.72705078125, 31.720458984375, 32.7138671875, 33.707275390625, 34.70068359375, 35.694091796875, 36.6875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 5.0, 10.0, 17.0, 11.0, 18.0, 12.0, 18.0, 25.0, 25.0, 28.0, 31.0, 35.0, 44.0, 45.0, 43.0, 48.0, 55.0, 62.0, 47.0, 41.0, 37.0, 49.0, 48.0, 36.0, 37.0, 27.0, 12.0, 22.0, 23.0, 16.0, 10.0, 15.0, 9.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.765625, -24.982666015625, -24.19970703125, -23.416748046875, -22.6337890625, -21.850830078125, -21.06787109375, -20.284912109375, -19.501953125, -18.718994140625, -17.93603515625, -17.153076171875, -16.3701171875, -15.587158203125, -14.80419921875, -14.021240234375, -13.23828125, -12.455322265625, -11.67236328125, -10.889404296875, -10.1064453125, -9.323486328125, -8.54052734375, -7.757568359375, -6.974609375, -6.191650390625, -5.40869140625, -4.625732421875, -3.8427734375, -3.059814453125, -2.27685546875, -1.493896484375, -0.7109375, 0.072021484375, 0.85498046875, 1.637939453125, 2.4208984375, 3.203857421875, 3.98681640625, 4.769775390625, 5.552734375, 6.335693359375, 7.11865234375, 7.901611328125, 8.6845703125, 9.467529296875, 10.25048828125, 11.033447265625, 11.81640625, 12.599365234375, 13.38232421875, 14.165283203125, 14.9482421875, 15.731201171875, 16.51416015625, 17.297119140625, 18.080078125, 18.863037109375, 19.64599609375, 20.428955078125, 21.2119140625, 21.994873046875, 22.77783203125, 23.560791015625, 24.34375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 8.0, 17.0, 20.0, 37.0, 50.0, 85.0, 139.0, 270.0, 643.0, 1454.0, 4009.0, 13122.0, 51658.0, 224598.0, 499953.0, 191465.0, 43497.0, 11460.0, 3576.0, 1309.0, 563.0, 273.0, 133.0, 86.0, 43.0, 30.0, 19.0, 12.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5859375, -10.249267578125, -9.91259765625, -9.575927734375, -9.2392578125, -8.902587890625, -8.56591796875, -8.229248046875, -7.892578125, -7.555908203125, -7.21923828125, -6.882568359375, -6.5458984375, -6.209228515625, -5.87255859375, -5.535888671875, -5.19921875, -4.862548828125, -4.52587890625, -4.189208984375, -3.8525390625, -3.515869140625, -3.17919921875, -2.842529296875, -2.505859375, -2.169189453125, -1.83251953125, -1.495849609375, -1.1591796875, -0.822509765625, -0.48583984375, -0.149169921875, 0.1875, 0.524169921875, 0.86083984375, 1.197509765625, 1.5341796875, 1.870849609375, 2.20751953125, 2.544189453125, 2.880859375, 3.217529296875, 3.55419921875, 3.890869140625, 4.2275390625, 4.564208984375, 4.90087890625, 5.237548828125, 5.57421875, 5.910888671875, 6.24755859375, 6.584228515625, 6.9208984375, 7.257568359375, 7.59423828125, 7.930908203125, 8.267578125, 8.604248046875, 8.94091796875, 9.277587890625, 9.6142578125, 9.950927734375, 10.28759765625, 10.624267578125, 10.9609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 7.0, 1.0, 6.0, 9.0, 12.0, 16.0, 28.0, 33.0, 49.0, 77.0, 117.0, 167.0, 167.0, 118.0, 77.0, 48.0, 20.0, 16.0, 10.0, 9.0, 4.0, 9.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002475738525390625, -0.0023717284202575684, -0.0022677183151245117, -0.002163708209991455, -0.0020596981048583984, -0.001955687999725342, -0.0018516778945922852, -0.0017476677894592285, -0.0016436576843261719, -0.0015396475791931152, -0.0014356374740600586, -0.001331627368927002, -0.0012276172637939453, -0.0011236071586608887, -0.001019597053527832, -0.0009155869483947754, -0.0008115768432617188, -0.0007075667381286621, -0.0006035566329956055, -0.0004995465278625488, -0.0003955364227294922, -0.00029152631759643555, -0.0001875162124633789, -8.350610733032227e-05, 2.0503997802734375e-05, 0.00012451410293579102, 0.00022852420806884766, 0.0003325343132019043, 0.00043654441833496094, 0.0005405545234680176, 0.0006445646286010742, 0.0007485747337341309, 0.0008525848388671875, 0.0009565949440002441, 0.0010606050491333008, 0.0011646151542663574, 0.001268625259399414, 0.0013726353645324707, 0.0014766454696655273, 0.001580655574798584, 0.0016846656799316406, 0.0017886757850646973, 0.001892685890197754, 0.0019966959953308105, 0.002100706100463867, 0.002204716205596924, 0.0023087263107299805, 0.002412736415863037, 0.0025167465209960938, 0.0026207566261291504, 0.002724766731262207, 0.0028287768363952637, 0.0029327869415283203, 0.003036797046661377, 0.0031408071517944336, 0.0032448172569274902, 0.003348827362060547, 0.0034528374671936035, 0.00355684757232666, 0.003660857677459717, 0.0037648677825927734, 0.00386887788772583, 0.003972887992858887, 0.004076898097991943, 0.004180908203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 14.0, 24.0, 32.0, 59.0, 106.0, 206.0, 440.0, 1085.0, 4213.0, 49544.0, 763150.0, 216105.0, 10565.0, 1844.0, 588.0, 309.0, 128.0, 75.0, 26.0, 16.0, 14.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.625, -22.85595703125, -22.0869140625, -21.31787109375, -20.548828125, -19.77978515625, -19.0107421875, -18.24169921875, -17.47265625, -16.70361328125, -15.9345703125, -15.16552734375, -14.396484375, -13.62744140625, -12.8583984375, -12.08935546875, -11.3203125, -10.55126953125, -9.7822265625, -9.01318359375, -8.244140625, -7.47509765625, -6.7060546875, -5.93701171875, -5.16796875, -4.39892578125, -3.6298828125, -2.86083984375, -2.091796875, -1.32275390625, -0.5537109375, 0.21533203125, 0.984375, 1.75341796875, 2.5224609375, 3.29150390625, 4.060546875, 4.82958984375, 5.5986328125, 6.36767578125, 7.13671875, 7.90576171875, 8.6748046875, 9.44384765625, 10.212890625, 10.98193359375, 11.7509765625, 12.52001953125, 13.2890625, 14.05810546875, 14.8271484375, 15.59619140625, 16.365234375, 17.13427734375, 17.9033203125, 18.67236328125, 19.44140625, 20.21044921875, 20.9794921875, 21.74853515625, 22.517578125, 23.28662109375, 24.0556640625, 24.82470703125, 25.59375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 2.0, 8.0, 6.0, 15.0, 28.0, 38.0, 46.0, 70.0, 78.0, 112.0, 126.0, 130.0, 101.0, 87.0, 50.0, 33.0, 25.0, 17.0, 17.0, 5.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.625, -19.141357421875, -18.65771484375, -18.174072265625, -17.6904296875, -17.206787109375, -16.72314453125, -16.239501953125, -15.755859375, -15.272216796875, -14.78857421875, -14.304931640625, -13.8212890625, -13.337646484375, -12.85400390625, -12.370361328125, -11.88671875, -11.403076171875, -10.91943359375, -10.435791015625, -9.9521484375, -9.468505859375, -8.98486328125, -8.501220703125, -8.017578125, -7.533935546875, -7.05029296875, -6.566650390625, -6.0830078125, -5.599365234375, -5.11572265625, -4.632080078125, -4.1484375, -3.664794921875, -3.18115234375, -2.697509765625, -2.2138671875, -1.730224609375, -1.24658203125, -0.762939453125, -0.279296875, 0.204345703125, 0.68798828125, 1.171630859375, 1.6552734375, 2.138916015625, 2.62255859375, 3.106201171875, 3.58984375, 4.073486328125, 4.55712890625, 5.040771484375, 5.5244140625, 6.008056640625, 6.49169921875, 6.975341796875, 7.458984375, 7.942626953125, 8.42626953125, 8.909912109375, 9.3935546875, 9.877197265625, 10.36083984375, 10.844482421875, 11.328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 32.0, 65.0, 128.0, 181.0, 209.0, 174.0, 99.0, 62.0, 24.0, 15.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-340.65350341796875, -330.6536865234375, -320.65386962890625, -310.654052734375, -300.65423583984375, -290.6544189453125, -280.65460205078125, -270.65478515625, -260.65496826171875, -250.6551513671875, -240.65533447265625, -230.655517578125, -220.65570068359375, -210.6558837890625, -200.6560821533203, -190.65626525878906, -180.65646362304688, -170.65664672851562, -160.65682983398438, -150.65701293945312, -140.65719604492188, -130.65737915039062, -120.65757751464844, -110.65776062011719, -100.65794372558594, -90.65812683105469, -80.65830993652344, -70.65850067138672, -60.65868377685547, -50.65886688232422, -40.659053802490234, -30.65924072265625, -20.659423828125, -10.659608840942383, -0.6597938537597656, 9.340021133422852, 19.33983612060547, 29.33965301513672, 39.3394660949707, 49.33927917480469, 59.33909606933594, 69.33891296386719, 79.33872985839844, 89.33853912353516, 99.3383560180664, 109.33817291259766, 119.33798217773438, 129.33779907226562, 139.33761596679688, 149.33743286132812, 159.33724975585938, 169.33706665039062, 179.33688354492188, 189.33670043945312, 199.3365020751953, 209.33631896972656, 219.3361358642578, 229.33595275878906, 239.3357696533203, 249.33558654785156, 259.33538818359375, 269.335205078125, 279.33502197265625, 289.3348388671875, 299.33465576171875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 8.0, 8.0, 15.0, 9.0, 13.0, 20.0, 20.0, 16.0, 27.0, 29.0, 31.0, 28.0, 32.0, 32.0, 39.0, 43.0, 49.0, 43.0, 42.0, 48.0, 27.0, 43.0, 34.0, 43.0, 37.0, 41.0, 38.0, 22.0, 26.0, 20.0, 17.0, 17.0, 21.0, 10.0, 8.0, 12.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.77908325195312, -101.2737045288086, -97.76831817626953, -94.262939453125, -90.75755310058594, -87.2521743774414, -83.74679565429688, -80.24140930175781, -76.73603057861328, -73.23065185546875, -69.72526550292969, -66.21988677978516, -62.71450424194336, -59.20912170410156, -55.70374298095703, -52.198360443115234, -48.69297790527344, -45.18759536743164, -41.682212829589844, -38.17683410644531, -34.671451568603516, -31.16606903076172, -27.660688400268555, -24.15530776977539, -20.649925231933594, -17.144542694091797, -13.639162063598633, -10.133780479431152, -6.628398895263672, -3.123016357421875, 0.38236427307128906, 3.887744903564453, 7.393119812011719, 10.8985013961792, 14.40388298034668, 17.909263610839844, 21.41464614868164, 24.920028686523438, 28.4254093170166, 31.930789947509766, 35.43617248535156, 38.94155502319336, 42.446937561035156, 45.95231628417969, 49.457698822021484, 52.96308135986328, 56.46846008300781, 59.97384262084961, 63.479225158691406, 66.98460388183594, 70.489990234375, 73.99536895751953, 77.50074768066406, 81.00613403320312, 84.51151275634766, 88.01689147949219, 91.52227783203125, 95.02765655517578, 98.53304290771484, 102.03842163085938, 105.54380798339844, 109.04918670654297, 112.5545654296875, 116.05995178222656, 119.5653305053711]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 3.0, 8.0, 7.0, 11.0, 22.0, 29.0, 25.0, 55.0, 107.0, 154.0, 287.0, 482.0, 935.0, 1818.0, 3958.0, 11294.0, 54579.0, 4054931.0, 47354.0, 10491.0, 3890.0, 1791.0, 861.0, 489.0, 260.0, 154.0, 94.0, 58.0, 42.0, 16.0, 14.0, 18.0, 9.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0, -68.08056640625, -66.1611328125, -64.24169921875, -62.322265625, -60.40283203125, -58.4833984375, -56.56396484375, -54.64453125, -52.72509765625, -50.8056640625, -48.88623046875, -46.966796875, -45.04736328125, -43.1279296875, -41.20849609375, -39.2890625, -37.36962890625, -35.4501953125, -33.53076171875, -31.611328125, -29.69189453125, -27.7724609375, -25.85302734375, -23.93359375, -22.01416015625, -20.0947265625, -18.17529296875, -16.255859375, -14.33642578125, -12.4169921875, -10.49755859375, -8.578125, -6.65869140625, -4.7392578125, -2.81982421875, -0.900390625, 1.01904296875, 2.9384765625, 4.85791015625, 6.77734375, 8.69677734375, 10.6162109375, 12.53564453125, 14.455078125, 16.37451171875, 18.2939453125, 20.21337890625, 22.1328125, 24.05224609375, 25.9716796875, 27.89111328125, 29.810546875, 31.72998046875, 33.6494140625, 35.56884765625, 37.48828125, 39.40771484375, 41.3271484375, 43.24658203125, 45.166015625, 47.08544921875, 49.0048828125, 50.92431640625, 52.84375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 8.0, 1.0, 7.0, 8.0, 8.0, 15.0, 13.0, 19.0, 20.0, 21.0, 17.0, 24.0, 32.0, 39.0, 36.0, 49.0, 48.0, 59.0, 55.0, 51.0, 45.0, 47.0, 41.0, 35.0, 39.0, 34.0, 33.0, 32.0, 40.0, 20.0, 21.0, 15.0, 16.0, 12.0, 8.0, 10.0, 3.0, 3.0, 5.0, 4.0, 2.0, 3.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.72271728515625, -4.5469970703125, -4.37127685546875, -4.195556640625, -4.01983642578125, -3.8441162109375, -3.66839599609375, -3.49267578125, -3.31695556640625, -3.1412353515625, -2.96551513671875, -2.789794921875, -2.61407470703125, -2.4383544921875, -2.26263427734375, -2.0869140625, -1.91119384765625, -1.7354736328125, -1.55975341796875, -1.384033203125, -1.20831298828125, -1.0325927734375, -0.85687255859375, -0.68115234375, -0.50543212890625, -0.3297119140625, -0.15399169921875, 0.021728515625, 0.19744873046875, 0.3731689453125, 0.54888916015625, 0.724609375, 0.90032958984375, 1.0760498046875, 1.25177001953125, 1.427490234375, 1.60321044921875, 1.7789306640625, 1.95465087890625, 2.13037109375, 2.30609130859375, 2.4818115234375, 2.65753173828125, 2.833251953125, 3.00897216796875, 3.1846923828125, 3.36041259765625, 3.5361328125, 3.71185302734375, 3.8875732421875, 4.06329345703125, 4.239013671875, 4.41473388671875, 4.5904541015625, 4.76617431640625, 4.94189453125, 5.11761474609375, 5.2933349609375, 5.46905517578125, 5.644775390625, 5.82049560546875, 5.9962158203125, 6.17193603515625, 6.34765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 9.0, 18.0, 30.0, 53.0, 78.0, 144.0, 209.0, 342.0, 520.0, 855.0, 1484.0, 2740.0, 5143.0, 11241.0, 28630.0, 145966.0, 3881324.0, 76318.0, 20783.0, 8721.0, 4177.0, 2286.0, 1269.0, 750.0, 463.0, 264.0, 184.0, 131.0, 54.0, 39.0, 13.0, 11.0, 13.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.0, -26.1904296875, -25.380859375, -24.5712890625, -23.76171875, -22.9521484375, -22.142578125, -21.3330078125, -20.5234375, -19.7138671875, -18.904296875, -18.0947265625, -17.28515625, -16.4755859375, -15.666015625, -14.8564453125, -14.046875, -13.2373046875, -12.427734375, -11.6181640625, -10.80859375, -9.9990234375, -9.189453125, -8.3798828125, -7.5703125, -6.7607421875, -5.951171875, -5.1416015625, -4.33203125, -3.5224609375, -2.712890625, -1.9033203125, -1.09375, -0.2841796875, 0.525390625, 1.3349609375, 2.14453125, 2.9541015625, 3.763671875, 4.5732421875, 5.3828125, 6.1923828125, 7.001953125, 7.8115234375, 8.62109375, 9.4306640625, 10.240234375, 11.0498046875, 11.859375, 12.6689453125, 13.478515625, 14.2880859375, 15.09765625, 15.9072265625, 16.716796875, 17.5263671875, 18.3359375, 19.1455078125, 19.955078125, 20.7646484375, 21.57421875, 22.3837890625, 23.193359375, 24.0029296875, 24.8125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 4.0, 11.0, 8.0, 15.0, 17.0, 24.0, 25.0, 33.0, 90.0, 199.0, 3032.0, 330.0, 104.0, 54.0, 29.0, 14.0, 15.0, 10.0, 8.0, 14.0, 4.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.0078125, -4.867584228515625, -4.72735595703125, -4.587127685546875, -4.4468994140625, -4.306671142578125, -4.16644287109375, -4.026214599609375, -3.885986328125, -3.745758056640625, -3.60552978515625, -3.465301513671875, -3.3250732421875, -3.184844970703125, -3.04461669921875, -2.904388427734375, -2.76416015625, -2.623931884765625, -2.48370361328125, -2.343475341796875, -2.2032470703125, -2.063018798828125, -1.92279052734375, -1.782562255859375, -1.642333984375, -1.502105712890625, -1.36187744140625, -1.221649169921875, -1.0814208984375, -0.941192626953125, -0.80096435546875, -0.660736083984375, -0.5205078125, -0.380279541015625, -0.24005126953125, -0.099822998046875, 0.0404052734375, 0.180633544921875, 0.32086181640625, 0.461090087890625, 0.601318359375, 0.741546630859375, 0.88177490234375, 1.022003173828125, 1.1622314453125, 1.302459716796875, 1.44268798828125, 1.582916259765625, 1.72314453125, 1.863372802734375, 2.00360107421875, 2.143829345703125, 2.2840576171875, 2.424285888671875, 2.56451416015625, 2.704742431640625, 2.844970703125, 2.985198974609375, 3.12542724609375, 3.265655517578125, 3.4058837890625, 3.546112060546875, 3.68634033203125, 3.826568603515625, 3.966796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 11.0, 8.0, 29.0, 39.0, 86.0, 101.0, 139.0, 160.0, 152.0, 120.0, 76.0, 47.0, 18.0, 11.0, 5.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0], "bins": [-54.106842041015625, -53.04995346069336, -51.99306869506836, -50.936180114746094, -49.879295349121094, -48.82240676879883, -47.76551818847656, -46.70863342285156, -45.6517448425293, -44.59485626220703, -43.53797149658203, -42.481082916259766, -41.424198150634766, -40.3673095703125, -39.3104248046875, -38.253536224365234, -37.19664764404297, -36.1397590637207, -35.0828742980957, -34.02598571777344, -32.96910095214844, -31.912212371826172, -30.85532569885254, -29.798439025878906, -28.741554260253906, -27.684667587280273, -26.62778091430664, -25.570892333984375, -24.514005661010742, -23.45711898803711, -22.400232315063477, -21.343345642089844, -20.286457061767578, -19.229570388793945, -18.172683715820312, -17.115795135498047, -16.058908462524414, -15.002021789550781, -13.945135116577148, -12.888248443603516, -11.83135986328125, -10.774473190307617, -9.717585563659668, -8.660698890686035, -7.603811740875244, -6.546924591064453, -5.49003791809082, -4.433150768280029, -3.3762636184692383, -2.3193764686584473, -1.2624895572662354, -0.20560264587402344, 0.8512845039367676, 1.9081716537475586, 2.9650583267211914, 4.021945476531982, 5.078832626342773, 6.1357197761535645, 7.1926069259643555, 8.249493598937988, 9.306381225585938, 10.36326789855957, 11.420154571533203, 12.477041244506836, 13.533928871154785]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 9.0, 8.0, 20.0, 11.0, 10.0, 14.0, 14.0, 20.0, 21.0, 26.0, 33.0, 28.0, 34.0, 31.0, 35.0, 26.0, 46.0, 42.0, 42.0, 51.0, 41.0, 41.0, 34.0, 32.0, 40.0, 45.0, 31.0, 25.0, 25.0, 33.0, 21.0, 14.0, 19.0, 10.0, 9.0, 11.0, 11.0, 10.0, 10.0, 3.0, 4.0, 4.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.904415130615234, -11.51807689666748, -11.131739616394043, -10.745401382446289, -10.359063148498535, -9.972724914550781, -9.586387634277344, -9.20004940032959, -8.813711166381836, -8.427372932434082, -8.041035652160645, -7.654697418212891, -7.268359184265137, -6.882021427154541, -6.495683670043945, -6.109345436096191, -5.723008155822754, -5.336670398712158, -4.950332164764404, -4.563994407653809, -4.177656173706055, -3.791318416595459, -3.4049806594848633, -3.0186426639556885, -2.6323046684265137, -2.245966672897339, -1.8596287965774536, -1.4732909202575684, -1.0869529247283936, -0.7006149291992188, -0.31427717208862305, 0.07206082344055176, 0.45839977264404297, 0.844737708568573, 1.231075644493103, 1.6174135208129883, 2.003751516342163, 2.390089511871338, 2.7764272689819336, 3.1627652645111084, 3.549103260040283, 3.935441255569458, 4.321779251098633, 4.7081170082092285, 5.094454765319824, 5.480792999267578, 5.867130756378174, 6.2534685134887695, 6.639806747436523, 7.026144504547119, 7.412482738494873, 7.798820495605469, 8.185158729553223, 8.571496963500977, 8.957834243774414, 9.344172477722168, 9.730510711669922, 10.116848945617676, 10.503186225891113, 10.889524459838867, 11.275862693786621, 11.662200927734375, 12.048538208007812, 12.434876441955566, 12.821213722229004]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 16.0, 13.0, 20.0, 46.0, 82.0, 82.0, 141.0, 272.0, 491.0, 1060.0, 2442.0, 6465.0, 18082.0, 53784.0, 172750.0, 423039.0, 251410.0, 78091.0, 25325.0, 8831.0, 3285.0, 1362.0, 636.0, 318.0, 178.0, 108.0, 69.0, 43.0, 42.0, 21.0, 12.0, 12.0, 10.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.390625, -23.666015625, -22.94140625, -22.216796875, -21.4921875, -20.767578125, -20.04296875, -19.318359375, -18.59375, -17.869140625, -17.14453125, -16.419921875, -15.6953125, -14.970703125, -14.24609375, -13.521484375, -12.796875, -12.072265625, -11.34765625, -10.623046875, -9.8984375, -9.173828125, -8.44921875, -7.724609375, -7.0, -6.275390625, -5.55078125, -4.826171875, -4.1015625, -3.376953125, -2.65234375, -1.927734375, -1.203125, -0.478515625, 0.24609375, 0.970703125, 1.6953125, 2.419921875, 3.14453125, 3.869140625, 4.59375, 5.318359375, 6.04296875, 6.767578125, 7.4921875, 8.216796875, 8.94140625, 9.666015625, 10.390625, 11.115234375, 11.83984375, 12.564453125, 13.2890625, 14.013671875, 14.73828125, 15.462890625, 16.1875, 16.912109375, 17.63671875, 18.361328125, 19.0859375, 19.810546875, 20.53515625, 21.259765625, 21.984375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 14.0, 6.0, 8.0, 14.0, 13.0, 19.0, 14.0, 19.0, 22.0, 22.0, 29.0, 32.0, 37.0, 35.0, 44.0, 43.0, 50.0, 42.0, 38.0, 45.0, 44.0, 42.0, 44.0, 31.0, 42.0, 29.0, 28.0, 25.0, 31.0, 27.0, 17.0, 14.0, 11.0, 14.0, 10.0, 4.0, 4.0, 6.0, 4.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.6500244140625, -4.475830078125, -4.3016357421875, -4.12744140625, -3.9532470703125, -3.779052734375, -3.6048583984375, -3.4306640625, -3.2564697265625, -3.082275390625, -2.9080810546875, -2.73388671875, -2.5596923828125, -2.385498046875, -2.2113037109375, -2.037109375, -1.8629150390625, -1.688720703125, -1.5145263671875, -1.34033203125, -1.1661376953125, -0.991943359375, -0.8177490234375, -0.6435546875, -0.4693603515625, -0.295166015625, -0.1209716796875, 0.05322265625, 0.2274169921875, 0.401611328125, 0.5758056640625, 0.75, 0.9241943359375, 1.098388671875, 1.2725830078125, 1.44677734375, 1.6209716796875, 1.795166015625, 1.9693603515625, 2.1435546875, 2.3177490234375, 2.491943359375, 2.6661376953125, 2.84033203125, 3.0145263671875, 3.188720703125, 3.3629150390625, 3.537109375, 3.7113037109375, 3.885498046875, 4.0596923828125, 4.23388671875, 4.4080810546875, 4.582275390625, 4.7564697265625, 4.9306640625, 5.1048583984375, 5.279052734375, 5.4532470703125, 5.62744140625, 5.8016357421875, 5.975830078125, 6.1500244140625, 6.32421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 10.0, 8.0, 7.0, 14.0, 14.0, 21.0, 36.0, 56.0, 81.0, 98.0, 166.0, 209.0, 307.0, 449.0, 902.0, 1777.0, 5355.0, 27869.0, 250834.0, 670590.0, 72961.0, 10838.0, 2855.0, 1222.0, 608.0, 407.0, 284.0, 169.0, 116.0, 91.0, 59.0, 42.0, 28.0, 18.0, 18.0, 8.0, 6.0, 6.0, 1.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-34.6875, -33.5771484375, -32.466796875, -31.3564453125, -30.24609375, -29.1357421875, -28.025390625, -26.9150390625, -25.8046875, -24.6943359375, -23.583984375, -22.4736328125, -21.36328125, -20.2529296875, -19.142578125, -18.0322265625, -16.921875, -15.8115234375, -14.701171875, -13.5908203125, -12.48046875, -11.3701171875, -10.259765625, -9.1494140625, -8.0390625, -6.9287109375, -5.818359375, -4.7080078125, -3.59765625, -2.4873046875, -1.376953125, -0.2666015625, 0.84375, 1.9541015625, 3.064453125, 4.1748046875, 5.28515625, 6.3955078125, 7.505859375, 8.6162109375, 9.7265625, 10.8369140625, 11.947265625, 13.0576171875, 14.16796875, 15.2783203125, 16.388671875, 17.4990234375, 18.609375, 19.7197265625, 20.830078125, 21.9404296875, 23.05078125, 24.1611328125, 25.271484375, 26.3818359375, 27.4921875, 28.6025390625, 29.712890625, 30.8232421875, 31.93359375, 33.0439453125, 34.154296875, 35.2646484375, 36.375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 11.0, 8.0, 7.0, 10.0, 20.0, 26.0, 27.0, 37.0, 37.0, 49.0, 55.0, 55.0, 54.0, 70.0, 53.0, 54.0, 61.0, 53.0, 60.0, 49.0, 43.0, 34.0, 26.0, 22.0, 10.0, 17.0, 11.0, 11.0, 14.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.03125, -37.99658203125, -36.9619140625, -35.92724609375, -34.892578125, -33.85791015625, -32.8232421875, -31.78857421875, -30.75390625, -29.71923828125, -28.6845703125, -27.64990234375, -26.615234375, -25.58056640625, -24.5458984375, -23.51123046875, -22.4765625, -21.44189453125, -20.4072265625, -19.37255859375, -18.337890625, -17.30322265625, -16.2685546875, -15.23388671875, -14.19921875, -13.16455078125, -12.1298828125, -11.09521484375, -10.060546875, -9.02587890625, -7.9912109375, -6.95654296875, -5.921875, -4.88720703125, -3.8525390625, -2.81787109375, -1.783203125, -0.74853515625, 0.2861328125, 1.32080078125, 2.35546875, 3.39013671875, 4.4248046875, 5.45947265625, 6.494140625, 7.52880859375, 8.5634765625, 9.59814453125, 10.6328125, 11.66748046875, 12.7021484375, 13.73681640625, 14.771484375, 15.80615234375, 16.8408203125, 17.87548828125, 18.91015625, 19.94482421875, 20.9794921875, 22.01416015625, 23.048828125, 24.08349609375, 25.1181640625, 26.15283203125, 27.1875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 8.0, 5.0, 5.0, 7.0, 13.0, 19.0, 33.0, 44.0, 64.0, 110.0, 133.0, 241.0, 368.0, 687.0, 1228.0, 2522.0, 6057.0, 16056.0, 55153.0, 270950.0, 531560.0, 117583.0, 28417.0, 9335.0, 3803.0, 1823.0, 941.0, 493.0, 277.0, 193.0, 151.0, 72.0, 53.0, 52.0, 33.0, 17.0, 9.0, 14.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.72705078125, -10.3837890625, -10.04052734375, -9.697265625, -9.35400390625, -9.0107421875, -8.66748046875, -8.32421875, -7.98095703125, -7.6376953125, -7.29443359375, -6.951171875, -6.60791015625, -6.2646484375, -5.92138671875, -5.578125, -5.23486328125, -4.8916015625, -4.54833984375, -4.205078125, -3.86181640625, -3.5185546875, -3.17529296875, -2.83203125, -2.48876953125, -2.1455078125, -1.80224609375, -1.458984375, -1.11572265625, -0.7724609375, -0.42919921875, -0.0859375, 0.25732421875, 0.6005859375, 0.94384765625, 1.287109375, 1.63037109375, 1.9736328125, 2.31689453125, 2.66015625, 3.00341796875, 3.3466796875, 3.68994140625, 4.033203125, 4.37646484375, 4.7197265625, 5.06298828125, 5.40625, 5.74951171875, 6.0927734375, 6.43603515625, 6.779296875, 7.12255859375, 7.4658203125, 7.80908203125, 8.15234375, 8.49560546875, 8.8388671875, 9.18212890625, 9.525390625, 9.86865234375, 10.2119140625, 10.55517578125, 10.8984375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 9.0, 11.0, 13.0, 13.0, 9.0, 13.0, 21.0, 31.0, 47.0, 47.0, 60.0, 84.0, 92.0, 106.0, 95.0, 76.0, 59.0, 44.0, 41.0, 28.0, 19.0, 14.0, 15.0, 11.0, 11.0, 7.0, 5.0, 2.0, 7.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015048980712890625, -0.0014552474021911621, -0.0014055967330932617, -0.0013559460639953613, -0.001306295394897461, -0.0012566447257995605, -0.0012069940567016602, -0.0011573433876037598, -0.0011076927185058594, -0.001058042049407959, -0.0010083913803100586, -0.0009587407112121582, -0.0009090900421142578, -0.0008594393730163574, -0.000809788703918457, -0.0007601380348205566, -0.0007104873657226562, -0.0006608366966247559, -0.0006111860275268555, -0.0005615353584289551, -0.0005118846893310547, -0.0004622340202331543, -0.0004125833511352539, -0.0003629326820373535, -0.0003132820129394531, -0.00026363134384155273, -0.00021398067474365234, -0.00016433000564575195, -0.00011467933654785156, -6.502866744995117e-05, -1.537799835205078e-05, 3.427267074584961e-05, 8.392333984375e-05, 0.0001335740089416504, 0.00018322467803955078, 0.00023287534713745117, 0.00028252601623535156, 0.00033217668533325195, 0.00038182735443115234, 0.00043147802352905273, 0.0004811286926269531, 0.0005307793617248535, 0.0005804300308227539, 0.0006300806999206543, 0.0006797313690185547, 0.0007293820381164551, 0.0007790327072143555, 0.0008286833763122559, 0.0008783340454101562, 0.0009279847145080566, 0.000977635383605957, 0.0010272860527038574, 0.0010769367218017578, 0.0011265873908996582, 0.0011762380599975586, 0.001225888729095459, 0.0012755393981933594, 0.0013251900672912598, 0.0013748407363891602, 0.0014244914054870605, 0.001474142074584961, 0.0015237927436828613, 0.0015734434127807617, 0.0016230940818786621, 0.0016727447509765625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 11.0, 14.0, 22.0, 48.0, 87.0, 135.0, 230.0, 488.0, 980.0, 2626.0, 10068.0, 72924.0, 726373.0, 208117.0, 19362.0, 4210.0, 1492.0, 629.0, 303.0, 149.0, 99.0, 56.0, 45.0, 20.0, 19.0, 10.0, 10.0, 7.0, 2.0, 5.0, 1.0, 3.0, 3.0], "bins": [-26.296875, -25.695068359375, -25.09326171875, -24.491455078125, -23.8896484375, -23.287841796875, -22.68603515625, -22.084228515625, -21.482421875, -20.880615234375, -20.27880859375, -19.677001953125, -19.0751953125, -18.473388671875, -17.87158203125, -17.269775390625, -16.66796875, -16.066162109375, -15.46435546875, -14.862548828125, -14.2607421875, -13.658935546875, -13.05712890625, -12.455322265625, -11.853515625, -11.251708984375, -10.64990234375, -10.048095703125, -9.4462890625, -8.844482421875, -8.24267578125, -7.640869140625, -7.0390625, -6.437255859375, -5.83544921875, -5.233642578125, -4.6318359375, -4.030029296875, -3.42822265625, -2.826416015625, -2.224609375, -1.622802734375, -1.02099609375, -0.419189453125, 0.1826171875, 0.784423828125, 1.38623046875, 1.988037109375, 2.58984375, 3.191650390625, 3.79345703125, 4.395263671875, 4.9970703125, 5.598876953125, 6.20068359375, 6.802490234375, 7.404296875, 8.006103515625, 8.60791015625, 9.209716796875, 9.8115234375, 10.413330078125, 11.01513671875, 11.616943359375, 12.21875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 7.0, 5.0, 4.0, 13.0, 12.0, 12.0, 17.0, 41.0, 48.0, 70.0, 111.0, 113.0, 130.0, 119.0, 104.0, 60.0, 44.0, 24.0, 24.0, 16.0, 11.0, 12.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.796875, -13.31396484375, -12.8310546875, -12.34814453125, -11.865234375, -11.38232421875, -10.8994140625, -10.41650390625, -9.93359375, -9.45068359375, -8.9677734375, -8.48486328125, -8.001953125, -7.51904296875, -7.0361328125, -6.55322265625, -6.0703125, -5.58740234375, -5.1044921875, -4.62158203125, -4.138671875, -3.65576171875, -3.1728515625, -2.68994140625, -2.20703125, -1.72412109375, -1.2412109375, -0.75830078125, -0.275390625, 0.20751953125, 0.6904296875, 1.17333984375, 1.65625, 2.13916015625, 2.6220703125, 3.10498046875, 3.587890625, 4.07080078125, 4.5537109375, 5.03662109375, 5.51953125, 6.00244140625, 6.4853515625, 6.96826171875, 7.451171875, 7.93408203125, 8.4169921875, 8.89990234375, 9.3828125, 9.86572265625, 10.3486328125, 10.83154296875, 11.314453125, 11.79736328125, 12.2802734375, 12.76318359375, 13.24609375, 13.72900390625, 14.2119140625, 14.69482421875, 15.177734375, 15.66064453125, 16.1435546875, 16.62646484375, 17.109375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 9.0, 60.0, 254.0, 458.0, 178.0, 36.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-632.3053588867188, -609.2362060546875, -586.1669921875, -563.0978393554688, -540.0286865234375, -516.9595336914062, -493.8903503417969, -470.8211669921875, -447.75201416015625, -424.682861328125, -401.6136779785156, -378.54449462890625, -355.475341796875, -332.40618896484375, -309.3370056152344, -286.267822265625, -263.19866943359375, -240.12950134277344, -217.06033325195312, -193.9911651611328, -170.9219970703125, -147.8528289794922, -124.78366088867188, -101.71449279785156, -78.64532470703125, -55.57615661621094, -32.506988525390625, -9.437820434570312, 13.63134765625, 36.70051574707031, 59.769683837890625, 82.83885192871094, 105.9080810546875, 128.9772491455078, 152.04641723632812, 175.11558532714844, 198.18475341796875, 221.25392150878906, 244.32308959960938, 267.39227294921875, 290.46142578125, 313.53057861328125, 336.5997619628906, 359.6689453125, 382.73809814453125, 405.8072509765625, 428.8764343261719, 451.94561767578125, 475.0147705078125, 498.08392333984375, 521.153076171875, 544.2222900390625, 567.2914428710938, 590.360595703125, 613.4298095703125, 636.4989624023438, 659.568115234375, 682.6372680664062, 705.7064208984375, 728.775634765625, 751.8447875976562, 774.9139404296875, 797.983154296875, 821.0523071289062, 844.1214599609375]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 5.0, 9.0, 9.0, 7.0, 4.0, 13.0, 23.0, 23.0, 31.0, 17.0, 34.0, 31.0, 43.0, 66.0, 57.0, 42.0, 39.0, 65.0, 50.0, 57.0, 52.0, 45.0, 46.0, 32.0, 35.0, 25.0, 19.0, 20.0, 20.0, 15.0, 11.0, 12.0, 10.0, 9.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.51470947265625, -137.2794952392578, -133.0442657470703, -128.80905151367188, -124.5738296508789, -120.33860778808594, -116.1033935546875, -111.86817169189453, -107.63294982910156, -103.3977279663086, -99.16250610351562, -94.92729187011719, -90.69207000732422, -86.45684814453125, -82.22163391113281, -77.98641204833984, -73.75119018554688, -69.5159683227539, -65.28074645996094, -61.0455322265625, -56.81031036376953, -52.57508850097656, -48.33987045288086, -44.104652404785156, -39.86943054199219, -35.63420867919922, -31.398990631103516, -27.16377067565918, -22.928550720214844, -18.693330764770508, -14.458110809326172, -10.222890853881836, -5.9876708984375, -1.752450942993164, 2.482769012451172, 6.717988967895508, 10.953208923339844, 15.18842887878418, 19.423648834228516, 23.65886878967285, 27.894088745117188, 32.129310607910156, 36.36452865600586, 40.59974670410156, 44.83496856689453, 49.0701904296875, 53.3054084777832, 57.540626525878906, 61.775848388671875, 66.01107025146484, 70.24629211425781, 74.48150634765625, 78.71672821044922, 82.95195007324219, 87.18716430664062, 91.4223861694336, 95.65760803222656, 99.89282989501953, 104.1280517578125, 108.36326599121094, 112.5984878540039, 116.83370971679688, 121.06892395019531, 125.30414581298828, 129.53936767578125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 7.0, 8.0, 4.0, 13.0, 18.0, 17.0, 29.0, 30.0, 51.0, 64.0, 80.0, 141.0, 253.0, 407.0, 746.0, 1340.0, 2776.0, 5825.0, 16340.0, 88822.0, 3989316.0, 63607.0, 13888.0, 5082.0, 2478.0, 1240.0, 687.0, 371.0, 199.0, 124.0, 85.0, 65.0, 38.0, 25.0, 32.0, 18.0, 13.0, 11.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-48.78125, -47.3642578125, -45.947265625, -44.5302734375, -43.11328125, -41.6962890625, -40.279296875, -38.8623046875, -37.4453125, -36.0283203125, -34.611328125, -33.1943359375, -31.77734375, -30.3603515625, -28.943359375, -27.5263671875, -26.109375, -24.6923828125, -23.275390625, -21.8583984375, -20.44140625, -19.0244140625, -17.607421875, -16.1904296875, -14.7734375, -13.3564453125, -11.939453125, -10.5224609375, -9.10546875, -7.6884765625, -6.271484375, -4.8544921875, -3.4375, -2.0205078125, -0.603515625, 0.8134765625, 2.23046875, 3.6474609375, 5.064453125, 6.4814453125, 7.8984375, 9.3154296875, 10.732421875, 12.1494140625, 13.56640625, 14.9833984375, 16.400390625, 17.8173828125, 19.234375, 20.6513671875, 22.068359375, 23.4853515625, 24.90234375, 26.3193359375, 27.736328125, 29.1533203125, 30.5703125, 31.9873046875, 33.404296875, 34.8212890625, 36.23828125, 37.6552734375, 39.072265625, 40.4892578125, 41.90625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 13.0, 13.0, 19.0, 21.0, 11.0, 31.0, 24.0, 32.0, 42.0, 34.0, 42.0, 51.0, 36.0, 43.0, 59.0, 39.0, 43.0, 46.0, 46.0, 43.0, 33.0, 30.0, 43.0, 26.0, 20.0, 25.0, 21.0, 13.0, 19.0, 11.0, 12.0, 9.0, 7.0, 3.0, 7.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.875, -4.6982421875, -4.521484375, -4.3447265625, -4.16796875, -3.9912109375, -3.814453125, -3.6376953125, -3.4609375, -3.2841796875, -3.107421875, -2.9306640625, -2.75390625, -2.5771484375, -2.400390625, -2.2236328125, -2.046875, -1.8701171875, -1.693359375, -1.5166015625, -1.33984375, -1.1630859375, -0.986328125, -0.8095703125, -0.6328125, -0.4560546875, -0.279296875, -0.1025390625, 0.07421875, 0.2509765625, 0.427734375, 0.6044921875, 0.78125, 0.9580078125, 1.134765625, 1.3115234375, 1.48828125, 1.6650390625, 1.841796875, 2.0185546875, 2.1953125, 2.3720703125, 2.548828125, 2.7255859375, 2.90234375, 3.0791015625, 3.255859375, 3.4326171875, 3.609375, 3.7861328125, 3.962890625, 4.1396484375, 4.31640625, 4.4931640625, 4.669921875, 4.8466796875, 5.0234375, 5.2001953125, 5.376953125, 5.5537109375, 5.73046875, 5.9072265625, 6.083984375, 6.2607421875, 6.4375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 6.0, 9.0, 7.0, 14.0, 24.0, 14.0, 32.0, 32.0, 65.0, 88.0, 115.0, 201.0, 335.0, 551.0, 1079.0, 2151.0, 5315.0, 15146.0, 62811.0, 3886333.0, 178483.0, 26852.0, 8250.0, 3146.0, 1393.0, 711.0, 395.0, 235.0, 144.0, 81.0, 71.0, 65.0, 33.0, 25.0, 20.0, 13.0, 13.0, 10.0, 1.0, 1.0, 7.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.125, -34.08349609375, -33.0419921875, -32.00048828125, -30.958984375, -29.91748046875, -28.8759765625, -27.83447265625, -26.79296875, -25.75146484375, -24.7099609375, -23.66845703125, -22.626953125, -21.58544921875, -20.5439453125, -19.50244140625, -18.4609375, -17.41943359375, -16.3779296875, -15.33642578125, -14.294921875, -13.25341796875, -12.2119140625, -11.17041015625, -10.12890625, -9.08740234375, -8.0458984375, -7.00439453125, -5.962890625, -4.92138671875, -3.8798828125, -2.83837890625, -1.796875, -0.75537109375, 0.2861328125, 1.32763671875, 2.369140625, 3.41064453125, 4.4521484375, 5.49365234375, 6.53515625, 7.57666015625, 8.6181640625, 9.65966796875, 10.701171875, 11.74267578125, 12.7841796875, 13.82568359375, 14.8671875, 15.90869140625, 16.9501953125, 17.99169921875, 19.033203125, 20.07470703125, 21.1162109375, 22.15771484375, 23.19921875, 24.24072265625, 25.2822265625, 26.32373046875, 27.365234375, 28.40673828125, 29.4482421875, 30.48974609375, 31.53125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 7.0, 9.0, 16.0, 19.0, 26.0, 37.0, 86.0, 293.0, 3204.0, 182.0, 78.0, 38.0, 30.0, 16.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66796875, -7.40667724609375, -7.1453857421875, -6.88409423828125, -6.622802734375, -6.36151123046875, -6.1002197265625, -5.83892822265625, -5.57763671875, -5.31634521484375, -5.0550537109375, -4.79376220703125, -4.532470703125, -4.27117919921875, -4.0098876953125, -3.74859619140625, -3.4873046875, -3.22601318359375, -2.9647216796875, -2.70343017578125, -2.442138671875, -2.18084716796875, -1.9195556640625, -1.65826416015625, -1.39697265625, -1.13568115234375, -0.8743896484375, -0.61309814453125, -0.351806640625, -0.09051513671875, 0.1707763671875, 0.43206787109375, 0.693359375, 0.95465087890625, 1.2159423828125, 1.47723388671875, 1.738525390625, 1.99981689453125, 2.2611083984375, 2.52239990234375, 2.78369140625, 3.04498291015625, 3.3062744140625, 3.56756591796875, 3.828857421875, 4.09014892578125, 4.3514404296875, 4.61273193359375, 4.8740234375, 5.13531494140625, 5.3966064453125, 5.65789794921875, 5.919189453125, 6.18048095703125, 6.4417724609375, 6.70306396484375, 6.96435546875, 7.22564697265625, 7.4869384765625, 7.74822998046875, 8.009521484375, 8.27081298828125, 8.5321044921875, 8.79339599609375, 9.0546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 9.0, 14.0, 25.0, 30.0, 12.0, 43.0, 51.0, 55.0, 53.0, 60.0, 71.0, 74.0, 83.0, 59.0, 71.0, 57.0, 43.0, 36.0, 36.0, 22.0, 14.0, 14.0, 20.0, 9.0, 9.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.555381774902344, -23.896461486816406, -23.23754119873047, -22.57862091064453, -21.919700622558594, -21.260780334472656, -20.60186004638672, -19.94293975830078, -19.284019470214844, -18.625099182128906, -17.96617889404297, -17.30725860595703, -16.648338317871094, -15.989418029785156, -15.330496788024902, -14.671576499938965, -14.012655258178711, -13.353734970092773, -12.694814682006836, -12.035894393920898, -11.376974105834961, -10.718053817749023, -10.05913257598877, -9.400212287902832, -8.741291999816895, -8.082371711730957, -7.4234514236450195, -6.764530658721924, -6.105610370635986, -5.446690082550049, -4.787769317626953, -4.128849029541016, -3.469928741455078, -2.8110084533691406, -2.152087926864624, -1.493167519569397, -0.8342471122741699, -0.17532682418823242, 0.4835937023162842, 1.1425142288208008, 1.8014345169067383, 2.460354804992676, 3.1192753314971924, 3.778195858001709, 4.4371161460876465, 5.096036434173584, 5.75495719909668, 6.413877487182617, 7.072797775268555, 7.731718063354492, 8.39063835144043, 9.049558639526367, 9.708478927612305, 10.367399215698242, 11.026320457458496, 11.685240745544434, 12.344161033630371, 13.003081321716309, 13.662001609802246, 14.320921897888184, 14.979843139648438, 15.638763427734375, 16.297683715820312, 16.95660400390625, 17.615524291992188]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 1.0, 5.0, 7.0, 6.0, 6.0, 11.0, 12.0, 15.0, 14.0, 25.0, 22.0, 22.0, 27.0, 30.0, 21.0, 26.0, 28.0, 35.0, 29.0, 39.0, 39.0, 38.0, 39.0, 40.0, 39.0, 47.0, 47.0, 33.0, 36.0, 41.0, 30.0, 27.0, 16.0, 29.0, 22.0, 17.0, 16.0, 12.0, 12.0, 9.0, 6.0, 6.0, 4.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.945549964904785, -13.530129432678223, -13.11470890045166, -12.699287414550781, -12.283866882324219, -11.868446350097656, -11.453025817871094, -11.037605285644531, -10.622184753417969, -10.206764221191406, -9.791343688964844, -9.375923156738281, -8.960501670837402, -8.54508113861084, -8.129660606384277, -7.714240074157715, -7.298819065093994, -6.883398532867432, -6.467977523803711, -6.052556991577148, -5.637136459350586, -5.221715927124023, -4.806294918060303, -4.39087438583374, -3.9754536151885986, -3.560032844543457, -3.1446123123168945, -2.729191541671753, -2.3137707710266113, -1.8983502388000488, -1.4829294681549072, -1.0675089359283447, -0.6520881652832031, -0.2366674840450287, 0.17875319719314575, 0.5941739082336426, 1.0095945596694946, 1.4250152111053467, 1.8404359817504883, 2.255856513977051, 2.6712772846221924, 3.086698055267334, 3.5021185874938965, 3.917539358139038, 4.33296012878418, 4.748380661010742, 5.163801193237305, 5.579221725463867, 5.994642734527588, 6.41006326675415, 6.825484275817871, 7.240904808044434, 7.656325340270996, 8.071745872497559, 8.487167358398438, 8.902587890625, 9.318008422851562, 9.733428955078125, 10.148849487304688, 10.56427001953125, 10.979691505432129, 11.395112037658691, 11.810532569885254, 12.225953102111816, 12.641373634338379]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 7.0, 5.0, 11.0, 13.0, 15.0, 23.0, 45.0, 58.0, 99.0, 137.0, 205.0, 375.0, 554.0, 1112.0, 2106.0, 4410.0, 9923.0, 23513.0, 58557.0, 150233.0, 317612.0, 278340.0, 119881.0, 46594.0, 19001.0, 7943.0, 3704.0, 1803.0, 933.0, 514.0, 296.0, 168.0, 116.0, 76.0, 58.0, 46.0, 16.0, 19.0, 10.0, 8.0, 1.0, 1.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.9375, -14.483154296875, -14.02880859375, -13.574462890625, -13.1201171875, -12.665771484375, -12.21142578125, -11.757080078125, -11.302734375, -10.848388671875, -10.39404296875, -9.939697265625, -9.4853515625, -9.031005859375, -8.57666015625, -8.122314453125, -7.66796875, -7.213623046875, -6.75927734375, -6.304931640625, -5.8505859375, -5.396240234375, -4.94189453125, -4.487548828125, -4.033203125, -3.578857421875, -3.12451171875, -2.670166015625, -2.2158203125, -1.761474609375, -1.30712890625, -0.852783203125, -0.3984375, 0.055908203125, 0.51025390625, 0.964599609375, 1.4189453125, 1.873291015625, 2.32763671875, 2.781982421875, 3.236328125, 3.690673828125, 4.14501953125, 4.599365234375, 5.0537109375, 5.508056640625, 5.96240234375, 6.416748046875, 6.87109375, 7.325439453125, 7.77978515625, 8.234130859375, 8.6884765625, 9.142822265625, 9.59716796875, 10.051513671875, 10.505859375, 10.960205078125, 11.41455078125, 11.868896484375, 12.3232421875, 12.777587890625, 13.23193359375, 13.686279296875, 14.140625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 10.0, 5.0, 9.0, 16.0, 15.0, 15.0, 12.0, 20.0, 19.0, 31.0, 25.0, 32.0, 26.0, 43.0, 39.0, 48.0, 38.0, 40.0, 51.0, 35.0, 49.0, 35.0, 45.0, 45.0, 45.0, 33.0, 30.0, 27.0, 19.0, 22.0, 17.0, 18.0, 10.0, 10.0, 10.0, 10.0, 7.0, 11.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.86328125, -4.68389892578125, -4.5045166015625, -4.32513427734375, -4.145751953125, -3.96636962890625, -3.7869873046875, -3.60760498046875, -3.42822265625, -3.24884033203125, -3.0694580078125, -2.89007568359375, -2.710693359375, -2.53131103515625, -2.3519287109375, -2.17254638671875, -1.9931640625, -1.81378173828125, -1.6343994140625, -1.45501708984375, -1.275634765625, -1.09625244140625, -0.9168701171875, -0.73748779296875, -0.55810546875, -0.37872314453125, -0.1993408203125, -0.01995849609375, 0.159423828125, 0.33880615234375, 0.5181884765625, 0.69757080078125, 0.876953125, 1.05633544921875, 1.2357177734375, 1.41510009765625, 1.594482421875, 1.77386474609375, 1.9532470703125, 2.13262939453125, 2.31201171875, 2.49139404296875, 2.6707763671875, 2.85015869140625, 3.029541015625, 3.20892333984375, 3.3883056640625, 3.56768798828125, 3.7470703125, 3.92645263671875, 4.1058349609375, 4.28521728515625, 4.464599609375, 4.64398193359375, 4.8233642578125, 5.00274658203125, 5.18212890625, 5.36151123046875, 5.5408935546875, 5.72027587890625, 5.899658203125, 6.07904052734375, 6.2584228515625, 6.43780517578125, 6.6171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 9.0, 11.0, 13.0, 19.0, 33.0, 47.0, 56.0, 103.0, 152.0, 237.0, 348.0, 626.0, 1017.0, 2074.0, 6846.0, 51568.0, 655181.0, 299449.0, 22825.0, 4060.0, 1536.0, 896.0, 509.0, 308.0, 198.0, 164.0, 96.0, 55.0, 41.0, 29.0, 13.0, 9.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.21875, -35.1787109375, -34.138671875, -33.0986328125, -32.05859375, -31.0185546875, -29.978515625, -28.9384765625, -27.8984375, -26.8583984375, -25.818359375, -24.7783203125, -23.73828125, -22.6982421875, -21.658203125, -20.6181640625, -19.578125, -18.5380859375, -17.498046875, -16.4580078125, -15.41796875, -14.3779296875, -13.337890625, -12.2978515625, -11.2578125, -10.2177734375, -9.177734375, -8.1376953125, -7.09765625, -6.0576171875, -5.017578125, -3.9775390625, -2.9375, -1.8974609375, -0.857421875, 0.1826171875, 1.22265625, 2.2626953125, 3.302734375, 4.3427734375, 5.3828125, 6.4228515625, 7.462890625, 8.5029296875, 9.54296875, 10.5830078125, 11.623046875, 12.6630859375, 13.703125, 14.7431640625, 15.783203125, 16.8232421875, 17.86328125, 18.9033203125, 19.943359375, 20.9833984375, 22.0234375, 23.0634765625, 24.103515625, 25.1435546875, 26.18359375, 27.2236328125, 28.263671875, 29.3037109375, 30.34375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 12.0, 19.0, 23.0, 25.0, 31.0, 40.0, 45.0, 39.0, 56.0, 46.0, 65.0, 49.0, 73.0, 52.0, 61.0, 60.0, 59.0, 40.0, 46.0, 34.0, 36.0, 15.0, 16.0, 13.0, 5.0, 3.0, 14.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.03515625, -29.9140625, -28.79296875, -27.671875, -26.55078125, -25.4296875, -24.30859375, -23.1875, -22.06640625, -20.9453125, -19.82421875, -18.703125, -17.58203125, -16.4609375, -15.33984375, -14.21875, -13.09765625, -11.9765625, -10.85546875, -9.734375, -8.61328125, -7.4921875, -6.37109375, -5.25, -4.12890625, -3.0078125, -1.88671875, -0.765625, 0.35546875, 1.4765625, 2.59765625, 3.71875, 4.83984375, 5.9609375, 7.08203125, 8.203125, 9.32421875, 10.4453125, 11.56640625, 12.6875, 13.80859375, 14.9296875, 16.05078125, 17.171875, 18.29296875, 19.4140625, 20.53515625, 21.65625, 22.77734375, 23.8984375, 25.01953125, 26.140625, 27.26171875, 28.3828125, 29.50390625, 30.625, 31.74609375, 32.8671875, 33.98828125, 35.109375, 36.23046875, 37.3515625, 38.47265625, 39.59375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 7.0, 18.0, 30.0, 41.0, 54.0, 83.0, 154.0, 258.0, 631.0, 1548.0, 4952.0, 22522.0, 225746.0, 717350.0, 60865.0, 9698.0, 2620.0, 963.0, 441.0, 189.0, 123.0, 63.0, 57.0, 25.0, 25.0, 17.0, 11.0, 9.0, 10.0, 7.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.84375, -16.3046875, -15.765625, -15.2265625, -14.6875, -14.1484375, -13.609375, -13.0703125, -12.53125, -11.9921875, -11.453125, -10.9140625, -10.375, -9.8359375, -9.296875, -8.7578125, -8.21875, -7.6796875, -7.140625, -6.6015625, -6.0625, -5.5234375, -4.984375, -4.4453125, -3.90625, -3.3671875, -2.828125, -2.2890625, -1.75, -1.2109375, -0.671875, -0.1328125, 0.40625, 0.9453125, 1.484375, 2.0234375, 2.5625, 3.1015625, 3.640625, 4.1796875, 4.71875, 5.2578125, 5.796875, 6.3359375, 6.875, 7.4140625, 7.953125, 8.4921875, 9.03125, 9.5703125, 10.109375, 10.6484375, 11.1875, 11.7265625, 12.265625, 12.8046875, 13.34375, 13.8828125, 14.421875, 14.9609375, 15.5, 16.0390625, 16.578125, 17.1171875, 17.65625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 7.0, 3.0, 7.0, 8.0, 15.0, 14.0, 22.0, 15.0, 30.0, 42.0, 67.0, 78.0, 109.0, 119.0, 109.0, 83.0, 73.0, 37.0, 39.0, 28.0, 17.0, 20.0, 17.0, 10.0, 11.0, 8.0, 9.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012178421020507812, -0.0011663883924484253, -0.0011149346828460693, -0.0010634809732437134, -0.0010120272636413574, -0.0009605735540390015, -0.0009091198444366455, -0.0008576661348342896, -0.0008062124252319336, -0.0007547587156295776, -0.0007033050060272217, -0.0006518512964248657, -0.0006003975868225098, -0.0005489438772201538, -0.0004974901676177979, -0.0004460364580154419, -0.00039458274841308594, -0.00034312903881073, -0.000291675329208374, -0.00024022161960601807, -0.0001887679100036621, -0.00013731420040130615, -8.58604907989502e-05, -3.440678119659424e-05, 1.704692840576172e-05, 6.850063800811768e-05, 0.00011995434761047363, 0.0001714080572128296, 0.00022286176681518555, 0.0002743154764175415, 0.00032576918601989746, 0.0003772228956222534, 0.0004286766052246094, 0.00048013031482696533, 0.0005315840244293213, 0.0005830377340316772, 0.0006344914436340332, 0.0006859451532363892, 0.0007373988628387451, 0.0007888525724411011, 0.000840306282043457, 0.000891759991645813, 0.0009432137012481689, 0.000994667410850525, 0.0010461211204528809, 0.0010975748300552368, 0.0011490285396575928, 0.0012004822492599487, 0.0012519359588623047, 0.0013033896684646606, 0.0013548433780670166, 0.0014062970876693726, 0.0014577507972717285, 0.0015092045068740845, 0.0015606582164764404, 0.0016121119260787964, 0.0016635656356811523, 0.0017150193452835083, 0.0017664730548858643, 0.0018179267644882202, 0.0018693804740905762, 0.0019208341836929321, 0.001972287893295288, 0.002023741602897644, 0.0020751953125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 12.0, 7.0, 16.0, 38.0, 62.0, 76.0, 148.0, 301.0, 611.0, 1499.0, 5175.0, 36460.0, 734544.0, 248608.0, 15854.0, 3094.0, 1045.0, 428.0, 220.0, 132.0, 88.0, 37.0, 29.0, 23.0, 10.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.346435546875, -20.63037109375, -19.914306640625, -19.1982421875, -18.482177734375, -17.76611328125, -17.050048828125, -16.333984375, -15.617919921875, -14.90185546875, -14.185791015625, -13.4697265625, -12.753662109375, -12.03759765625, -11.321533203125, -10.60546875, -9.889404296875, -9.17333984375, -8.457275390625, -7.7412109375, -7.025146484375, -6.30908203125, -5.593017578125, -4.876953125, -4.160888671875, -3.44482421875, -2.728759765625, -2.0126953125, -1.296630859375, -0.58056640625, 0.135498046875, 0.8515625, 1.567626953125, 2.28369140625, 2.999755859375, 3.7158203125, 4.431884765625, 5.14794921875, 5.864013671875, 6.580078125, 7.296142578125, 8.01220703125, 8.728271484375, 9.4443359375, 10.160400390625, 10.87646484375, 11.592529296875, 12.30859375, 13.024658203125, 13.74072265625, 14.456787109375, 15.1728515625, 15.888916015625, 16.60498046875, 17.321044921875, 18.037109375, 18.753173828125, 19.46923828125, 20.185302734375, 20.9013671875, 21.617431640625, 22.33349609375, 23.049560546875, 23.765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 27.0, 34.0, 66.0, 107.0, 118.0, 149.0, 167.0, 111.0, 65.0, 49.0, 22.0, 22.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.421875, -12.83203125, -12.2421875, -11.65234375, -11.0625, -10.47265625, -9.8828125, -9.29296875, -8.703125, -8.11328125, -7.5234375, -6.93359375, -6.34375, -5.75390625, -5.1640625, -4.57421875, -3.984375, -3.39453125, -2.8046875, -2.21484375, -1.625, -1.03515625, -0.4453125, 0.14453125, 0.734375, 1.32421875, 1.9140625, 2.50390625, 3.09375, 3.68359375, 4.2734375, 4.86328125, 5.453125, 6.04296875, 6.6328125, 7.22265625, 7.8125, 8.40234375, 8.9921875, 9.58203125, 10.171875, 10.76171875, 11.3515625, 11.94140625, 12.53125, 13.12109375, 13.7109375, 14.30078125, 14.890625, 15.48046875, 16.0703125, 16.66015625, 17.25, 17.83984375, 18.4296875, 19.01953125, 19.609375, 20.19921875, 20.7890625, 21.37890625, 21.96875, 22.55859375, 23.1484375, 23.73828125, 24.328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 17.0, 33.0, 66.0, 110.0, 146.0, 143.0, 146.0, 114.0, 75.0, 44.0, 33.0, 26.0, 14.0, 6.0, 2.0, 7.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.2418212890625, -259.2886962890625, -252.33558654785156, -245.38247680664062, -238.42935180664062, -231.4762420654297, -224.5231170654297, -217.57000732421875, -210.61688232421875, -203.6637725830078, -196.7106475830078, -189.75753784179688, -182.80441284179688, -175.85130310058594, -168.89817810058594, -161.945068359375, -154.991943359375, -148.03883361816406, -141.08570861816406, -134.13259887695312, -127.17947387695312, -120.22636413574219, -113.27323913574219, -106.32012939453125, -99.36701965332031, -92.41390228271484, -85.46078491210938, -78.5076675415039, -71.55455017089844, -64.6014404296875, -57.648319244384766, -50.6952018737793, -43.74208068847656, -36.788963317871094, -29.835845947265625, -22.88273048400879, -15.92961311340332, -8.976497650146484, -2.0233802795410156, 4.929737091064453, 11.882854461669922, 18.83597183227539, 25.78908920288086, 32.74220275878906, 39.69532012939453, 46.6484375, 53.60155487060547, 60.55467224121094, 67.5077896118164, 74.46090698242188, 81.41402435302734, 88.36714172363281, 95.32025909423828, 102.27337646484375, 109.22648620605469, 116.17961120605469, 123.13272094726562, 130.08583068847656, 137.03895568847656, 143.9920654296875, 150.9451904296875, 157.89830017089844, 164.85142517089844, 171.80453491210938, 178.75765991210938]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 6.0, 11.0, 10.0, 5.0, 15.0, 19.0, 13.0, 26.0, 30.0, 37.0, 29.0, 26.0, 39.0, 49.0, 56.0, 51.0, 51.0, 44.0, 46.0, 48.0, 58.0, 44.0, 48.0, 41.0, 38.0, 25.0, 24.0, 17.0, 16.0, 21.0, 9.0, 10.0, 5.0, 2.0, 2.0, 6.0, 7.0, 3.0, 1.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0], "bins": [-147.55712890625, -143.3653564453125, -139.173583984375, -134.98179626464844, -130.79002380371094, -126.59825134277344, -122.40647888183594, -118.21470642089844, -114.0229263305664, -109.8311538696289, -105.63937377929688, -101.44760131835938, -97.25582885742188, -93.06404876708984, -88.87227630615234, -84.68049621582031, -80.48872375488281, -76.29695129394531, -72.10517120361328, -67.91339874267578, -63.721622467041016, -59.52984619140625, -55.33807373046875, -51.146297454833984, -46.95452117919922, -42.76274490356445, -38.57096862792969, -34.37919616699219, -30.187419891357422, -25.995643615722656, -21.803869247436523, -17.61209487915039, -13.420318603515625, -9.228543281555176, -5.036767959594727, -0.8449926376342773, 3.346782684326172, 7.5385589599609375, 11.73033332824707, 15.922107696533203, 20.11388397216797, 24.305660247802734, 28.497434616088867, 32.689208984375, 36.880985260009766, 41.07276153564453, 45.26453399658203, 49.4563102722168, 53.64808654785156, 57.83986282348633, 62.031639099121094, 66.2234115600586, 70.41519165039062, 74.60696411132812, 78.79873657226562, 82.99050903320312, 87.18228912353516, 91.37406158447266, 95.56584167480469, 99.75761413574219, 103.94938659667969, 108.14116668701172, 112.33293914794922, 116.52471923828125, 120.71649169921875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 8.0, 6.0, 12.0, 15.0, 22.0, 38.0, 56.0, 82.0, 160.0, 232.0, 431.0, 1047.0, 2523.0, 8023.0, 87217.0, 4075276.0, 13030.0, 3403.0, 1342.0, 626.0, 295.0, 176.0, 90.0, 61.0, 38.0, 22.0, 10.0, 12.0, 9.0, 6.0, 4.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.3125, -65.2822265625, -63.251953125, -61.2216796875, -59.19140625, -57.1611328125, -55.130859375, -53.1005859375, -51.0703125, -49.0400390625, -47.009765625, -44.9794921875, -42.94921875, -40.9189453125, -38.888671875, -36.8583984375, -34.828125, -32.7978515625, -30.767578125, -28.7373046875, -26.70703125, -24.6767578125, -22.646484375, -20.6162109375, -18.5859375, -16.5556640625, -14.525390625, -12.4951171875, -10.46484375, -8.4345703125, -6.404296875, -4.3740234375, -2.34375, -0.3134765625, 1.716796875, 3.7470703125, 5.77734375, 7.8076171875, 9.837890625, 11.8681640625, 13.8984375, 15.9287109375, 17.958984375, 19.9892578125, 22.01953125, 24.0498046875, 26.080078125, 28.1103515625, 30.140625, 32.1708984375, 34.201171875, 36.2314453125, 38.26171875, 40.2919921875, 42.322265625, 44.3525390625, 46.3828125, 48.4130859375, 50.443359375, 52.4736328125, 54.50390625, 56.5341796875, 58.564453125, 60.5947265625, 62.625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 6.0, 11.0, 9.0, 7.0, 17.0, 15.0, 24.0, 26.0, 24.0, 41.0, 35.0, 49.0, 58.0, 45.0, 62.0, 56.0, 57.0, 57.0, 51.0, 39.0, 59.0, 36.0, 37.0, 32.0, 31.0, 18.0, 20.0, 18.0, 17.0, 9.0, 12.0, 7.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.6319580078125, -6.396728515625, -6.1614990234375, -5.92626953125, -5.6910400390625, -5.455810546875, -5.2205810546875, -4.9853515625, -4.7501220703125, -4.514892578125, -4.2796630859375, -4.04443359375, -3.8092041015625, -3.573974609375, -3.3387451171875, -3.103515625, -2.8682861328125, -2.633056640625, -2.3978271484375, -2.16259765625, -1.9273681640625, -1.692138671875, -1.4569091796875, -1.2216796875, -0.9864501953125, -0.751220703125, -0.5159912109375, -0.28076171875, -0.0455322265625, 0.189697265625, 0.4249267578125, 0.66015625, 0.8953857421875, 1.130615234375, 1.3658447265625, 1.60107421875, 1.8363037109375, 2.071533203125, 2.3067626953125, 2.5419921875, 2.7772216796875, 3.012451171875, 3.2476806640625, 3.48291015625, 3.7181396484375, 3.953369140625, 4.1885986328125, 4.423828125, 4.6590576171875, 4.894287109375, 5.1295166015625, 5.36474609375, 5.5999755859375, 5.835205078125, 6.0704345703125, 6.3056640625, 6.5408935546875, 6.776123046875, 7.0113525390625, 7.24658203125, 7.4818115234375, 7.717041015625, 7.9522705078125, 8.1875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 9.0, 17.0, 20.0, 28.0, 46.0, 53.0, 73.0, 79.0, 140.0, 261.0, 520.0, 834.0, 1457.0, 2900.0, 6509.0, 19265.0, 270259.0, 3852952.0, 24218.0, 7577.0, 3219.0, 1647.0, 833.0, 486.0, 305.0, 165.0, 119.0, 63.0, 56.0, 45.0, 23.0, 19.0, 19.0, 19.0, 9.0, 9.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.0, -33.030517578125, -32.06103515625, -31.091552734375, -30.1220703125, -29.152587890625, -28.18310546875, -27.213623046875, -26.244140625, -25.274658203125, -24.30517578125, -23.335693359375, -22.3662109375, -21.396728515625, -20.42724609375, -19.457763671875, -18.48828125, -17.518798828125, -16.54931640625, -15.579833984375, -14.6103515625, -13.640869140625, -12.67138671875, -11.701904296875, -10.732421875, -9.762939453125, -8.79345703125, -7.823974609375, -6.8544921875, -5.885009765625, -4.91552734375, -3.946044921875, -2.9765625, -2.007080078125, -1.03759765625, -0.068115234375, 0.9013671875, 1.870849609375, 2.84033203125, 3.809814453125, 4.779296875, 5.748779296875, 6.71826171875, 7.687744140625, 8.6572265625, 9.626708984375, 10.59619140625, 11.565673828125, 12.53515625, 13.504638671875, 14.47412109375, 15.443603515625, 16.4130859375, 17.382568359375, 18.35205078125, 19.321533203125, 20.291015625, 21.260498046875, 22.22998046875, 23.199462890625, 24.1689453125, 25.138427734375, 26.10791015625, 27.077392578125, 28.046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 15.0, 21.0, 81.0, 385.0, 3333.0, 79.0, 48.0, 25.0, 15.0, 14.0, 5.0, 12.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.3310546875, -5.126953125, -4.9228515625, -4.71875, -4.5146484375, -4.310546875, -4.1064453125, -3.90234375, -3.6982421875, -3.494140625, -3.2900390625, -3.0859375, -2.8818359375, -2.677734375, -2.4736328125, -2.26953125, -2.0654296875, -1.861328125, -1.6572265625, -1.453125, -1.2490234375, -1.044921875, -0.8408203125, -0.63671875, -0.4326171875, -0.228515625, -0.0244140625, 0.1796875, 0.3837890625, 0.587890625, 0.7919921875, 0.99609375, 1.2001953125, 1.404296875, 1.6083984375, 1.8125, 2.0166015625, 2.220703125, 2.4248046875, 2.62890625, 2.8330078125, 3.037109375, 3.2412109375, 3.4453125, 3.6494140625, 3.853515625, 4.0576171875, 4.26171875, 4.4658203125, 4.669921875, 4.8740234375, 5.078125, 5.2822265625, 5.486328125, 5.6904296875, 5.89453125, 6.0986328125, 6.302734375, 6.5068359375, 6.7109375, 6.9150390625, 7.119140625, 7.3232421875, 7.52734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 10.0, 5.0, 15.0, 22.0, 38.0, 47.0, 67.0, 86.0, 100.0, 106.0, 131.0, 98.0, 84.0, 53.0, 43.0, 36.0, 21.0, 15.0, 17.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.397785186767578, -20.671911239624023, -19.94603729248047, -19.220163345336914, -18.49428939819336, -17.768415451049805, -17.04254150390625, -16.316667556762695, -15.59079360961914, -14.864919662475586, -14.139045715332031, -13.413171768188477, -12.687297821044922, -11.961423873901367, -11.235549926757812, -10.509675979614258, -9.783802032470703, -9.057928085327148, -8.332054138183594, -7.606180191040039, -6.880306243896484, -6.15443229675293, -5.428558349609375, -4.70268440246582, -3.9768104553222656, -3.250936508178711, -2.5250625610351562, -1.7991886138916016, -1.0733146667480469, -0.3474407196044922, 0.3784332275390625, 1.1043071746826172, 1.830179214477539, 2.5560531616210938, 3.2819271087646484, 4.007801055908203, 4.733675003051758, 5.4595489501953125, 6.185422897338867, 6.911296844482422, 7.637170791625977, 8.363044738769531, 9.088918685913086, 9.81479263305664, 10.540666580200195, 11.26654052734375, 11.992414474487305, 12.71828842163086, 13.444162368774414, 14.170036315917969, 14.895910263061523, 15.621784210205078, 16.347658157348633, 17.073532104492188, 17.799406051635742, 18.525279998779297, 19.25115394592285, 19.977027893066406, 20.70290184020996, 21.428775787353516, 22.15464973449707, 22.880523681640625, 23.60639762878418, 24.332271575927734, 25.05814552307129]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 5.0, 3.0, 2.0, 7.0, 9.0, 7.0, 7.0, 10.0, 13.0, 16.0, 20.0, 26.0, 26.0, 20.0, 36.0, 34.0, 34.0, 41.0, 41.0, 43.0, 42.0, 46.0, 44.0, 48.0, 45.0, 36.0, 45.0, 44.0, 30.0, 45.0, 36.0, 23.0, 18.0, 16.0, 17.0, 14.0, 12.0, 9.0, 8.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.715166091918945, -11.347990989685059, -10.980815887451172, -10.613640785217285, -10.246465682983398, -9.879291534423828, -9.512116432189941, -9.144941329956055, -8.777766227722168, -8.410591125488281, -8.043416023254395, -7.676241397857666, -7.309066295623779, -6.941891193389893, -6.574716567993164, -6.207541465759277, -5.840366363525391, -5.473191261291504, -5.106016159057617, -4.738841533660889, -4.371666431427002, -4.004491329193115, -3.6373164653778076, -3.2701416015625, -2.9029664993286133, -2.5357913970947266, -2.168616533279419, -1.8014415502548218, -1.4342665672302246, -1.0670915842056274, -0.6999166011810303, -0.33274173736572266, 0.03443336486816406, 0.40160834789276123, 0.7687833309173584, 1.1359583139419556, 1.5031332969665527, 1.87030827999115, 2.237483263015747, 2.6046581268310547, 2.9718332290649414, 3.339008331298828, 3.7061831951141357, 4.073358058929443, 4.44053316116333, 4.807708263397217, 5.174882888793945, 5.542057991027832, 5.909233093261719, 6.2764081954956055, 6.643583297729492, 7.010757923126221, 7.377933025360107, 7.745108127593994, 8.112282752990723, 8.47945785522461, 8.846632957458496, 9.213808059692383, 9.58098316192627, 9.948158264160156, 10.315332412719727, 10.682507514953613, 11.0496826171875, 11.416857719421387, 11.784032821655273]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 16.0, 21.0, 36.0, 72.0, 117.0, 216.0, 361.0, 633.0, 1241.0, 2909.0, 6820.0, 17651.0, 50233.0, 144028.0, 358394.0, 295431.0, 109291.0, 37670.0, 13487.0, 5403.0, 2184.0, 1032.0, 558.0, 327.0, 168.0, 96.0, 54.0, 28.0, 17.0, 12.0, 18.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-17.171875, -16.7183837890625, -16.264892578125, -15.8114013671875, -15.35791015625, -14.9044189453125, -14.450927734375, -13.9974365234375, -13.5439453125, -13.0904541015625, -12.636962890625, -12.1834716796875, -11.72998046875, -11.2764892578125, -10.822998046875, -10.3695068359375, -9.916015625, -9.4625244140625, -9.009033203125, -8.5555419921875, -8.10205078125, -7.6485595703125, -7.195068359375, -6.7415771484375, -6.2880859375, -5.8345947265625, -5.381103515625, -4.9276123046875, -4.47412109375, -4.0206298828125, -3.567138671875, -3.1136474609375, -2.66015625, -2.2066650390625, -1.753173828125, -1.2996826171875, -0.84619140625, -0.3927001953125, 0.060791015625, 0.5142822265625, 0.9677734375, 1.4212646484375, 1.874755859375, 2.3282470703125, 2.78173828125, 3.2352294921875, 3.688720703125, 4.1422119140625, 4.595703125, 5.0491943359375, 5.502685546875, 5.9561767578125, 6.40966796875, 6.8631591796875, 7.316650390625, 7.7701416015625, 8.2236328125, 8.6771240234375, 9.130615234375, 9.5841064453125, 10.03759765625, 10.4910888671875, 10.944580078125, 11.3980712890625, 11.8515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 10.0, 4.0, 3.0, 7.0, 9.0, 14.0, 13.0, 18.0, 18.0, 27.0, 37.0, 31.0, 40.0, 53.0, 45.0, 50.0, 54.0, 61.0, 70.0, 51.0, 33.0, 42.0, 46.0, 42.0, 38.0, 37.0, 25.0, 22.0, 22.0, 15.0, 16.0, 20.0, 2.0, 7.0, 7.0, 2.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.2578125, -7.02557373046875, -6.7933349609375, -6.56109619140625, -6.328857421875, -6.09661865234375, -5.8643798828125, -5.63214111328125, -5.39990234375, -5.16766357421875, -4.9354248046875, -4.70318603515625, -4.470947265625, -4.23870849609375, -4.0064697265625, -3.77423095703125, -3.5419921875, -3.30975341796875, -3.0775146484375, -2.84527587890625, -2.613037109375, -2.38079833984375, -2.1485595703125, -1.91632080078125, -1.68408203125, -1.45184326171875, -1.2196044921875, -0.98736572265625, -0.755126953125, -0.52288818359375, -0.2906494140625, -0.05841064453125, 0.173828125, 0.40606689453125, 0.6383056640625, 0.87054443359375, 1.102783203125, 1.33502197265625, 1.5672607421875, 1.79949951171875, 2.03173828125, 2.26397705078125, 2.4962158203125, 2.72845458984375, 2.960693359375, 3.19293212890625, 3.4251708984375, 3.65740966796875, 3.8896484375, 4.12188720703125, 4.3541259765625, 4.58636474609375, 4.818603515625, 5.05084228515625, 5.2830810546875, 5.51531982421875, 5.74755859375, 5.97979736328125, 6.2120361328125, 6.44427490234375, 6.676513671875, 6.90875244140625, 7.1409912109375, 7.37322998046875, 7.60546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 17.0, 21.0, 37.0, 37.0, 78.0, 131.0, 186.0, 331.0, 479.0, 892.0, 1945.0, 7128.0, 72852.0, 832661.0, 117685.0, 9441.0, 2204.0, 973.0, 509.0, 326.0, 207.0, 137.0, 85.0, 64.0, 49.0, 24.0, 20.0, 11.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.52197265625, -30.4189453125, -29.31591796875, -28.212890625, -27.10986328125, -26.0068359375, -24.90380859375, -23.80078125, -22.69775390625, -21.5947265625, -20.49169921875, -19.388671875, -18.28564453125, -17.1826171875, -16.07958984375, -14.9765625, -13.87353515625, -12.7705078125, -11.66748046875, -10.564453125, -9.46142578125, -8.3583984375, -7.25537109375, -6.15234375, -5.04931640625, -3.9462890625, -2.84326171875, -1.740234375, -0.63720703125, 0.4658203125, 1.56884765625, 2.671875, 3.77490234375, 4.8779296875, 5.98095703125, 7.083984375, 8.18701171875, 9.2900390625, 10.39306640625, 11.49609375, 12.59912109375, 13.7021484375, 14.80517578125, 15.908203125, 17.01123046875, 18.1142578125, 19.21728515625, 20.3203125, 21.42333984375, 22.5263671875, 23.62939453125, 24.732421875, 25.83544921875, 26.9384765625, 28.04150390625, 29.14453125, 30.24755859375, 31.3505859375, 32.45361328125, 33.556640625, 34.65966796875, 35.7626953125, 36.86572265625, 37.96875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 6.0, 6.0, 5.0, 6.0, 8.0, 16.0, 18.0, 21.0, 16.0, 26.0, 28.0, 40.0, 38.0, 51.0, 30.0, 35.0, 43.0, 59.0, 54.0, 47.0, 53.0, 33.0, 42.0, 41.0, 38.0, 37.0, 42.0, 25.0, 27.0, 24.0, 20.0, 15.0, 10.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.109375, -28.184326171875, -27.25927734375, -26.334228515625, -25.4091796875, -24.484130859375, -23.55908203125, -22.634033203125, -21.708984375, -20.783935546875, -19.85888671875, -18.933837890625, -18.0087890625, -17.083740234375, -16.15869140625, -15.233642578125, -14.30859375, -13.383544921875, -12.45849609375, -11.533447265625, -10.6083984375, -9.683349609375, -8.75830078125, -7.833251953125, -6.908203125, -5.983154296875, -5.05810546875, -4.133056640625, -3.2080078125, -2.282958984375, -1.35791015625, -0.432861328125, 0.4921875, 1.417236328125, 2.34228515625, 3.267333984375, 4.1923828125, 5.117431640625, 6.04248046875, 6.967529296875, 7.892578125, 8.817626953125, 9.74267578125, 10.667724609375, 11.5927734375, 12.517822265625, 13.44287109375, 14.367919921875, 15.29296875, 16.218017578125, 17.14306640625, 18.068115234375, 18.9931640625, 19.918212890625, 20.84326171875, 21.768310546875, 22.693359375, 23.618408203125, 24.54345703125, 25.468505859375, 26.3935546875, 27.318603515625, 28.24365234375, 29.168701171875, 30.09375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 8.0, 6.0, 9.0, 6.0, 12.0, 20.0, 24.0, 31.0, 43.0, 54.0, 91.0, 156.0, 266.0, 460.0, 851.0, 1939.0, 5827.0, 25289.0, 241562.0, 695415.0, 60297.0, 10391.0, 3084.0, 1226.0, 617.0, 308.0, 173.0, 108.0, 75.0, 59.0, 39.0, 25.0, 19.0, 15.0, 11.0, 15.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.6640625, -12.2584228515625, -11.852783203125, -11.4471435546875, -11.04150390625, -10.6358642578125, -10.230224609375, -9.8245849609375, -9.4189453125, -9.0133056640625, -8.607666015625, -8.2020263671875, -7.79638671875, -7.3907470703125, -6.985107421875, -6.5794677734375, -6.173828125, -5.7681884765625, -5.362548828125, -4.9569091796875, -4.55126953125, -4.1456298828125, -3.739990234375, -3.3343505859375, -2.9287109375, -2.5230712890625, -2.117431640625, -1.7117919921875, -1.30615234375, -0.9005126953125, -0.494873046875, -0.0892333984375, 0.31640625, 0.7220458984375, 1.127685546875, 1.5333251953125, 1.93896484375, 2.3446044921875, 2.750244140625, 3.1558837890625, 3.5615234375, 3.9671630859375, 4.372802734375, 4.7784423828125, 5.18408203125, 5.5897216796875, 5.995361328125, 6.4010009765625, 6.806640625, 7.2122802734375, 7.617919921875, 8.0235595703125, 8.42919921875, 8.8348388671875, 9.240478515625, 9.6461181640625, 10.0517578125, 10.4573974609375, 10.863037109375, 11.2686767578125, 11.67431640625, 12.0799560546875, 12.485595703125, 12.8912353515625, 13.296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 13.0, 7.0, 16.0, 13.0, 21.0, 18.0, 25.0, 37.0, 44.0, 61.0, 124.0, 154.0, 129.0, 101.0, 61.0, 37.0, 29.0, 20.0, 15.0, 19.0, 10.0, 8.0, 10.0, 6.0, 3.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0015211105346679688, -0.001471981406211853, -0.0014228522777557373, -0.0013737231492996216, -0.0013245940208435059, -0.0012754648923873901, -0.0012263357639312744, -0.0011772066354751587, -0.001128077507019043, -0.0010789483785629272, -0.0010298192501068115, -0.0009806901216506958, -0.0009315609931945801, -0.0008824318647384644, -0.0008333027362823486, -0.0007841736078262329, -0.0007350444793701172, -0.0006859153509140015, -0.0006367862224578857, -0.00058765709400177, -0.0005385279655456543, -0.0004893988370895386, -0.00044026970863342285, -0.00039114058017730713, -0.0003420114517211914, -0.0002928823232650757, -0.00024375319480895996, -0.00019462406635284424, -0.00014549493789672852, -9.636580944061279e-05, -4.723668098449707e-05, 1.8924474716186523e-06, 5.1021575927734375e-05, 0.0001001507043838501, 0.00014927983283996582, 0.00019840896129608154, 0.00024753808975219727, 0.000296667218208313, 0.0003457963466644287, 0.00039492547512054443, 0.00044405460357666016, 0.0004931837320327759, 0.0005423128604888916, 0.0005914419889450073, 0.000640571117401123, 0.0006897002458572388, 0.0007388293743133545, 0.0007879585027694702, 0.0008370876312255859, 0.0008862167596817017, 0.0009353458881378174, 0.000984475016593933, 0.0010336041450500488, 0.0010827332735061646, 0.0011318624019622803, 0.001180991530418396, 0.0012301206588745117, 0.0012792497873306274, 0.0013283789157867432, 0.0013775080442428589, 0.0014266371726989746, 0.0014757663011550903, 0.001524895429611206, 0.0015740245580673218, 0.0016231536865234375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 19.0, 17.0, 19.0, 31.0, 65.0, 69.0, 156.0, 254.0, 497.0, 940.0, 2084.0, 5374.0, 21661.0, 183491.0, 721520.0, 91466.0, 13476.0, 3936.0, 1661.0, 759.0, 419.0, 233.0, 148.0, 90.0, 45.0, 29.0, 29.0, 19.0, 11.0, 6.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-15.6484375, -15.218017578125, -14.78759765625, -14.357177734375, -13.9267578125, -13.496337890625, -13.06591796875, -12.635498046875, -12.205078125, -11.774658203125, -11.34423828125, -10.913818359375, -10.4833984375, -10.052978515625, -9.62255859375, -9.192138671875, -8.76171875, -8.331298828125, -7.90087890625, -7.470458984375, -7.0400390625, -6.609619140625, -6.17919921875, -5.748779296875, -5.318359375, -4.887939453125, -4.45751953125, -4.027099609375, -3.5966796875, -3.166259765625, -2.73583984375, -2.305419921875, -1.875, -1.444580078125, -1.01416015625, -0.583740234375, -0.1533203125, 0.277099609375, 0.70751953125, 1.137939453125, 1.568359375, 1.998779296875, 2.42919921875, 2.859619140625, 3.2900390625, 3.720458984375, 4.15087890625, 4.581298828125, 5.01171875, 5.442138671875, 5.87255859375, 6.302978515625, 6.7333984375, 7.163818359375, 7.59423828125, 8.024658203125, 8.455078125, 8.885498046875, 9.31591796875, 9.746337890625, 10.1767578125, 10.607177734375, 11.03759765625, 11.468017578125, 11.8984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 2.0, 13.0, 12.0, 14.0, 22.0, 41.0, 38.0, 53.0, 67.0, 119.0, 110.0, 110.0, 112.0, 78.0, 52.0, 40.0, 35.0, 20.0, 12.0, 16.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.064208984375, -9.69091796875, -9.317626953125, -8.9443359375, -8.571044921875, -8.19775390625, -7.824462890625, -7.451171875, -7.077880859375, -6.70458984375, -6.331298828125, -5.9580078125, -5.584716796875, -5.21142578125, -4.838134765625, -4.46484375, -4.091552734375, -3.71826171875, -3.344970703125, -2.9716796875, -2.598388671875, -2.22509765625, -1.851806640625, -1.478515625, -1.105224609375, -0.73193359375, -0.358642578125, 0.0146484375, 0.387939453125, 0.76123046875, 1.134521484375, 1.5078125, 1.881103515625, 2.25439453125, 2.627685546875, 3.0009765625, 3.374267578125, 3.74755859375, 4.120849609375, 4.494140625, 4.867431640625, 5.24072265625, 5.614013671875, 5.9873046875, 6.360595703125, 6.73388671875, 7.107177734375, 7.48046875, 7.853759765625, 8.22705078125, 8.600341796875, 8.9736328125, 9.346923828125, 9.72021484375, 10.093505859375, 10.466796875, 10.840087890625, 11.21337890625, 11.586669921875, 11.9599609375, 12.333251953125, 12.70654296875, 13.079833984375, 13.453125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 9.0, 14.0, 50.0, 169.0, 341.0, 275.0, 93.0, 31.0, 11.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-577.6637573242188, -564.19189453125, -550.719970703125, -537.2481079101562, -523.7762451171875, -510.3043518066406, -496.83245849609375, -483.360595703125, -469.8887023925781, -456.41680908203125, -442.9449462890625, -429.4730529785156, -416.00115966796875, -402.529296875, -389.0574035644531, -375.58551025390625, -362.1136474609375, -348.6417541503906, -335.1698913574219, -321.697998046875, -308.2261047363281, -294.7542419433594, -281.2823486328125, -267.81048583984375, -254.33856201171875, -240.86668395996094, -227.39479064941406, -213.92291259765625, -200.45103454589844, -186.97915649414062, -173.50726318359375, -160.03538513183594, -146.56350708007812, -133.0916290283203, -119.61974334716797, -106.14785766601562, -92.67597961425781, -79.20409393310547, -65.73220825195312, -52.26033020019531, -38.78844451904297, -25.31656265258789, -11.84467887878418, 1.6272048950195312, 15.09908676147461, 28.570968627929688, 42.04285430908203, 55.514732360839844, 68.98661804199219, 82.45850372314453, 95.93038177490234, 109.40226745605469, 122.8741455078125, 136.34603881835938, 149.8179168701172, 163.289794921875, 176.76168823242188, 190.2335662841797, 203.70545959472656, 217.17733764648438, 230.6492156982422, 244.12109375, 257.5929870605469, 271.06488037109375, 284.5367431640625]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 13.0, 8.0, 15.0, 12.0, 13.0, 14.0, 18.0, 25.0, 35.0, 33.0, 42.0, 31.0, 51.0, 59.0, 42.0, 60.0, 63.0, 62.0, 44.0, 48.0, 38.0, 47.0, 32.0, 29.0, 26.0, 20.0, 22.0, 23.0, 17.0, 12.0, 10.0, 10.0, 3.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 4.0, 2.0, 3.0], "bins": [-171.3012237548828, -166.85560607910156, -162.4099884033203, -157.96437072753906, -153.5187530517578, -149.07313537597656, -144.6275177001953, -140.18190002441406, -135.7362823486328, -131.29066467285156, -126.84504699707031, -122.39942932128906, -117.95381164550781, -113.50819396972656, -109.06257629394531, -104.61695861816406, -100.17134857177734, -95.7257308959961, -91.28011322021484, -86.8344955444336, -82.38887786865234, -77.9432601928711, -73.49765014648438, -69.05203247070312, -64.60641479492188, -60.160797119140625, -55.715179443359375, -51.269561767578125, -46.823944091796875, -42.378326416015625, -37.93271255493164, -33.48709487915039, -29.041465759277344, -24.595848083496094, -20.150230407714844, -15.704614639282227, -11.258996963500977, -6.813379287719727, -2.3677635192871094, 2.0778541564941406, 6.523471832275391, 10.96908950805664, 15.414706230163574, 19.860322952270508, 24.305940628051758, 28.751558303833008, 33.197174072265625, 37.642791748046875, 42.088409423828125, 46.534027099609375, 50.979644775390625, 55.425262451171875, 59.870880126953125, 64.31649780273438, 68.76211547851562, 73.20773315429688, 77.65335083007812, 82.09896850585938, 86.54458618164062, 90.99020385742188, 95.43582153320312, 99.88143920898438, 104.32705688476562, 108.77267456054688, 113.2182846069336]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 4.0, 13.0, 21.0, 16.0, 22.0, 32.0, 44.0, 50.0, 75.0, 90.0, 118.0, 178.0, 291.0, 446.0, 685.0, 1126.0, 2110.0, 4171.0, 9863.0, 33371.0, 3723504.0, 373755.0, 26850.0, 8698.0, 3786.0, 1953.0, 1112.0, 609.0, 362.0, 270.0, 185.0, 125.0, 85.0, 61.0, 50.0, 38.0, 32.0, 17.0, 12.0, 11.0, 4.0, 11.0, 4.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-29.734375, -28.831298828125, -27.92822265625, -27.025146484375, -26.1220703125, -25.218994140625, -24.31591796875, -23.412841796875, -22.509765625, -21.606689453125, -20.70361328125, -19.800537109375, -18.8974609375, -17.994384765625, -17.09130859375, -16.188232421875, -15.28515625, -14.382080078125, -13.47900390625, -12.575927734375, -11.6728515625, -10.769775390625, -9.86669921875, -8.963623046875, -8.060546875, -7.157470703125, -6.25439453125, -5.351318359375, -4.4482421875, -3.545166015625, -2.64208984375, -1.739013671875, -0.8359375, 0.067138671875, 0.97021484375, 1.873291015625, 2.7763671875, 3.679443359375, 4.58251953125, 5.485595703125, 6.388671875, 7.291748046875, 8.19482421875, 9.097900390625, 10.0009765625, 10.904052734375, 11.80712890625, 12.710205078125, 13.61328125, 14.516357421875, 15.41943359375, 16.322509765625, 17.2255859375, 18.128662109375, 19.03173828125, 19.934814453125, 20.837890625, 21.740966796875, 22.64404296875, 23.547119140625, 24.4501953125, 25.353271484375, 26.25634765625, 27.159423828125, 28.0625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 8.0, 7.0, 10.0, 8.0, 15.0, 26.0, 23.0, 21.0, 54.0, 40.0, 47.0, 52.0, 44.0, 46.0, 55.0, 59.0, 76.0, 56.0, 43.0, 37.0, 50.0, 35.0, 37.0, 26.0, 29.0, 14.0, 18.0, 22.0, 8.0, 10.0, 10.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.73046875, -7.4935302734375, -7.256591796875, -7.0196533203125, -6.78271484375, -6.5457763671875, -6.308837890625, -6.0718994140625, -5.8349609375, -5.5980224609375, -5.361083984375, -5.1241455078125, -4.88720703125, -4.6502685546875, -4.413330078125, -4.1763916015625, -3.939453125, -3.7025146484375, -3.465576171875, -3.2286376953125, -2.99169921875, -2.7547607421875, -2.517822265625, -2.2808837890625, -2.0439453125, -1.8070068359375, -1.570068359375, -1.3331298828125, -1.09619140625, -0.8592529296875, -0.622314453125, -0.3853759765625, -0.1484375, 0.0885009765625, 0.325439453125, 0.5623779296875, 0.79931640625, 1.0362548828125, 1.273193359375, 1.5101318359375, 1.7470703125, 1.9840087890625, 2.220947265625, 2.4578857421875, 2.69482421875, 2.9317626953125, 3.168701171875, 3.4056396484375, 3.642578125, 3.8795166015625, 4.116455078125, 4.3533935546875, 4.59033203125, 4.8272705078125, 5.064208984375, 5.3011474609375, 5.5380859375, 5.7750244140625, 6.011962890625, 6.2489013671875, 6.48583984375, 6.7227783203125, 6.959716796875, 7.1966552734375, 7.43359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 11.0, 8.0, 12.0, 9.0, 16.0, 21.0, 17.0, 43.0, 33.0, 60.0, 49.0, 78.0, 143.0, 181.0, 318.0, 587.0, 1510.0, 4217.0, 15735.0, 130010.0, 3981152.0, 46128.0, 8890.0, 2656.0, 995.0, 484.0, 240.0, 149.0, 118.0, 79.0, 64.0, 58.0, 50.0, 38.0, 25.0, 23.0, 13.0, 17.0, 10.0, 9.0, 5.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.09375, -32.0693359375, -31.044921875, -30.0205078125, -28.99609375, -27.9716796875, -26.947265625, -25.9228515625, -24.8984375, -23.8740234375, -22.849609375, -21.8251953125, -20.80078125, -19.7763671875, -18.751953125, -17.7275390625, -16.703125, -15.6787109375, -14.654296875, -13.6298828125, -12.60546875, -11.5810546875, -10.556640625, -9.5322265625, -8.5078125, -7.4833984375, -6.458984375, -5.4345703125, -4.41015625, -3.3857421875, -2.361328125, -1.3369140625, -0.3125, 0.7119140625, 1.736328125, 2.7607421875, 3.78515625, 4.8095703125, 5.833984375, 6.8583984375, 7.8828125, 8.9072265625, 9.931640625, 10.9560546875, 11.98046875, 13.0048828125, 14.029296875, 15.0537109375, 16.078125, 17.1025390625, 18.126953125, 19.1513671875, 20.17578125, 21.2001953125, 22.224609375, 23.2490234375, 24.2734375, 25.2978515625, 26.322265625, 27.3466796875, 28.37109375, 29.3955078125, 30.419921875, 31.4443359375, 32.46875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 14.0, 26.0, 46.0, 94.0, 407.0, 3234.0, 136.0, 53.0, 24.0, 13.0, 11.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.7275390625, -7.220703125, -6.7138671875, -6.20703125, -5.7001953125, -5.193359375, -4.6865234375, -4.1796875, -3.6728515625, -3.166015625, -2.6591796875, -2.15234375, -1.6455078125, -1.138671875, -0.6318359375, -0.125, 0.3818359375, 0.888671875, 1.3955078125, 1.90234375, 2.4091796875, 2.916015625, 3.4228515625, 3.9296875, 4.4365234375, 4.943359375, 5.4501953125, 5.95703125, 6.4638671875, 6.970703125, 7.4775390625, 7.984375, 8.4912109375, 8.998046875, 9.5048828125, 10.01171875, 10.5185546875, 11.025390625, 11.5322265625, 12.0390625, 12.5458984375, 13.052734375, 13.5595703125, 14.06640625, 14.5732421875, 15.080078125, 15.5869140625, 16.09375, 16.6005859375, 17.107421875, 17.6142578125, 18.12109375, 18.6279296875, 19.134765625, 19.6416015625, 20.1484375, 20.6552734375, 21.162109375, 21.6689453125, 22.17578125, 22.6826171875, 23.189453125, 23.6962890625, 24.203125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 0.0, 5.0, 10.0, 17.0, 10.0, 30.0, 44.0, 67.0, 88.0, 153.0, 140.0, 133.0, 103.0, 82.0, 44.0, 33.0, 12.0, 10.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.354522705078125, -30.718544006347656, -29.082563400268555, -27.446584701538086, -25.810604095458984, -24.174625396728516, -22.538646697998047, -20.902666091918945, -19.266685485839844, -17.630706787109375, -15.994726181030273, -14.358747482299805, -12.722766876220703, -11.086788177490234, -9.45080852508545, -7.814828872680664, -6.178850173950195, -4.54287052154541, -2.906891107559204, -1.270911693572998, 0.3650679588317871, 2.001047134399414, 3.637026786804199, 5.273006439208984, 6.9089860916137695, 8.544965744018555, 10.18094539642334, 11.816925048828125, 13.452903747558594, 15.088883399963379, 16.724863052368164, 18.360843658447266, 19.996822357177734, 21.632801055908203, 23.268781661987305, 24.904760360717773, 26.540740966796875, 28.176719665527344, 29.812698364257812, 31.448678970336914, 33.084659576416016, 34.720638275146484, 36.35661697387695, 37.99259948730469, 39.628578186035156, 41.264556884765625, 42.900535583496094, 44.53651428222656, 46.17249298095703, 47.8084716796875, 49.44445037841797, 51.0804328918457, 52.71641159057617, 54.35239028930664, 55.98836898803711, 57.624351501464844, 59.26033020019531, 60.89630889892578, 62.53228759765625, 64.16826629638672, 65.80424499511719, 67.44023132324219, 69.07621002197266, 70.71218872070312, 72.3481674194336]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 10.0, 14.0, 15.0, 21.0, 30.0, 40.0, 49.0, 62.0, 84.0, 73.0, 80.0, 91.0, 86.0, 74.0, 67.0, 60.0, 42.0, 27.0, 22.0, 18.0, 11.0, 12.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.758331298828125, -53.35428237915039, -51.950233459472656, -50.546180725097656, -49.14213180541992, -47.73808288574219, -46.33403396606445, -44.92998504638672, -43.52593231201172, -42.121883392333984, -40.71783447265625, -39.31378173828125, -37.909732818603516, -36.50568389892578, -35.10163497924805, -33.69758605957031, -32.29353713989258, -30.889488220214844, -29.485437393188477, -28.081388473510742, -26.677337646484375, -25.27328872680664, -23.869239807128906, -22.465190887451172, -21.061140060424805, -19.65709114074707, -18.253040313720703, -16.84899139404297, -15.444941520690918, -14.040891647338867, -12.636842727661133, -11.232792854309082, -9.828746795654297, -8.424696922302246, -7.0206475257873535, -5.616598129272461, -4.21254825592041, -2.8084983825683594, -1.404449462890625, -0.00039958953857421875, 1.4036502838134766, 2.8076999187469482, 4.21174955368042, 5.6157989501953125, 7.019848823547363, 8.423898696899414, 9.827947616577148, 11.2319974899292, 12.63604736328125, 14.0400972366333, 15.444147109985352, 16.848196029663086, 18.252246856689453, 19.656295776367188, 21.060344696044922, 22.464393615722656, 23.868444442749023, 25.272493362426758, 26.676544189453125, 28.08059310913086, 29.484642028808594, 30.88869285583496, 32.29273986816406, 33.69679260253906, 35.1008415222168]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 9.0, 11.0, 10.0, 17.0, 27.0, 45.0, 60.0, 96.0, 153.0, 215.0, 366.0, 556.0, 977.0, 1677.0, 3272.0, 6770.0, 14495.0, 34246.0, 81065.0, 192033.0, 367426.0, 196754.0, 83743.0, 35124.0, 14949.0, 6745.0, 3421.0, 1724.0, 998.0, 616.0, 351.0, 206.0, 141.0, 74.0, 59.0, 34.0, 32.0, 16.0, 11.0, 8.0, 8.0, 7.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.015625, -16.4580078125, -15.900390625, -15.3427734375, -14.78515625, -14.2275390625, -13.669921875, -13.1123046875, -12.5546875, -11.9970703125, -11.439453125, -10.8818359375, -10.32421875, -9.7666015625, -9.208984375, -8.6513671875, -8.09375, -7.5361328125, -6.978515625, -6.4208984375, -5.86328125, -5.3056640625, -4.748046875, -4.1904296875, -3.6328125, -3.0751953125, -2.517578125, -1.9599609375, -1.40234375, -0.8447265625, -0.287109375, 0.2705078125, 0.828125, 1.3857421875, 1.943359375, 2.5009765625, 3.05859375, 3.6162109375, 4.173828125, 4.7314453125, 5.2890625, 5.8466796875, 6.404296875, 6.9619140625, 7.51953125, 8.0771484375, 8.634765625, 9.1923828125, 9.75, 10.3076171875, 10.865234375, 11.4228515625, 11.98046875, 12.5380859375, 13.095703125, 13.6533203125, 14.2109375, 14.7685546875, 15.326171875, 15.8837890625, 16.44140625, 16.9990234375, 17.556640625, 18.1142578125, 18.671875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 5.0, 12.0, 9.0, 12.0, 17.0, 24.0, 24.0, 24.0, 37.0, 30.0, 34.0, 44.0, 41.0, 49.0, 44.0, 38.0, 62.0, 51.0, 60.0, 40.0, 43.0, 44.0, 37.0, 33.0, 25.0, 33.0, 18.0, 14.0, 21.0, 18.0, 12.0, 8.0, 11.0, 6.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.80859375, -7.583740234375, -7.35888671875, -7.134033203125, -6.9091796875, -6.684326171875, -6.45947265625, -6.234619140625, -6.009765625, -5.784912109375, -5.56005859375, -5.335205078125, -5.1103515625, -4.885498046875, -4.66064453125, -4.435791015625, -4.2109375, -3.986083984375, -3.76123046875, -3.536376953125, -3.3115234375, -3.086669921875, -2.86181640625, -2.636962890625, -2.412109375, -2.187255859375, -1.96240234375, -1.737548828125, -1.5126953125, -1.287841796875, -1.06298828125, -0.838134765625, -0.61328125, -0.388427734375, -0.16357421875, 0.061279296875, 0.2861328125, 0.510986328125, 0.73583984375, 0.960693359375, 1.185546875, 1.410400390625, 1.63525390625, 1.860107421875, 2.0849609375, 2.309814453125, 2.53466796875, 2.759521484375, 2.984375, 3.209228515625, 3.43408203125, 3.658935546875, 3.8837890625, 4.108642578125, 4.33349609375, 4.558349609375, 4.783203125, 5.008056640625, 5.23291015625, 5.457763671875, 5.6826171875, 5.907470703125, 6.13232421875, 6.357177734375, 6.58203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 6.0, 10.0, 13.0, 22.0, 30.0, 50.0, 58.0, 94.0, 120.0, 216.0, 325.0, 625.0, 1105.0, 2705.0, 11252.0, 122003.0, 802360.0, 93176.0, 9336.0, 2510.0, 1031.0, 565.0, 337.0, 185.0, 123.0, 87.0, 63.0, 46.0, 17.0, 21.0, 13.0, 12.0, 17.0, 4.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-46.6875, -45.37060546875, -44.0537109375, -42.73681640625, -41.419921875, -40.10302734375, -38.7861328125, -37.46923828125, -36.15234375, -34.83544921875, -33.5185546875, -32.20166015625, -30.884765625, -29.56787109375, -28.2509765625, -26.93408203125, -25.6171875, -24.30029296875, -22.9833984375, -21.66650390625, -20.349609375, -19.03271484375, -17.7158203125, -16.39892578125, -15.08203125, -13.76513671875, -12.4482421875, -11.13134765625, -9.814453125, -8.49755859375, -7.1806640625, -5.86376953125, -4.546875, -3.22998046875, -1.9130859375, -0.59619140625, 0.720703125, 2.03759765625, 3.3544921875, 4.67138671875, 5.98828125, 7.30517578125, 8.6220703125, 9.93896484375, 11.255859375, 12.57275390625, 13.8896484375, 15.20654296875, 16.5234375, 17.84033203125, 19.1572265625, 20.47412109375, 21.791015625, 23.10791015625, 24.4248046875, 25.74169921875, 27.05859375, 28.37548828125, 29.6923828125, 31.00927734375, 32.326171875, 33.64306640625, 34.9599609375, 36.27685546875, 37.59375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 5.0, 10.0, 29.0, 28.0, 36.0, 62.0, 71.0, 84.0, 108.0, 82.0, 96.0, 77.0, 101.0, 56.0, 56.0, 40.0, 17.0, 17.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.3125, -71.46826171875, -69.6240234375, -67.77978515625, -65.935546875, -64.09130859375, -62.2470703125, -60.40283203125, -58.55859375, -56.71435546875, -54.8701171875, -53.02587890625, -51.181640625, -49.33740234375, -47.4931640625, -45.64892578125, -43.8046875, -41.96044921875, -40.1162109375, -38.27197265625, -36.427734375, -34.58349609375, -32.7392578125, -30.89501953125, -29.05078125, -27.20654296875, -25.3623046875, -23.51806640625, -21.673828125, -19.82958984375, -17.9853515625, -16.14111328125, -14.296875, -12.45263671875, -10.6083984375, -8.76416015625, -6.919921875, -5.07568359375, -3.2314453125, -1.38720703125, 0.45703125, 2.30126953125, 4.1455078125, 5.98974609375, 7.833984375, 9.67822265625, 11.5224609375, 13.36669921875, 15.2109375, 17.05517578125, 18.8994140625, 20.74365234375, 22.587890625, 24.43212890625, 26.2763671875, 28.12060546875, 29.96484375, 31.80908203125, 33.6533203125, 35.49755859375, 37.341796875, 39.18603515625, 41.0302734375, 42.87451171875, 44.71875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 5.0, 12.0, 10.0, 18.0, 15.0, 26.0, 31.0, 55.0, 95.0, 139.0, 305.0, 600.0, 1377.0, 3905.0, 14718.0, 79106.0, 591508.0, 297720.0, 44637.0, 9331.0, 2770.0, 1037.0, 479.0, 233.0, 138.0, 97.0, 63.0, 36.0, 16.0, 18.0, 17.0, 7.0, 4.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.796875, -9.4571533203125, -9.117431640625, -8.7777099609375, -8.43798828125, -8.0982666015625, -7.758544921875, -7.4188232421875, -7.0791015625, -6.7393798828125, -6.399658203125, -6.0599365234375, -5.72021484375, -5.3804931640625, -5.040771484375, -4.7010498046875, -4.361328125, -4.0216064453125, -3.681884765625, -3.3421630859375, -3.00244140625, -2.6627197265625, -2.322998046875, -1.9832763671875, -1.6435546875, -1.3038330078125, -0.964111328125, -0.6243896484375, -0.28466796875, 0.0550537109375, 0.394775390625, 0.7344970703125, 1.07421875, 1.4139404296875, 1.753662109375, 2.0933837890625, 2.43310546875, 2.7728271484375, 3.112548828125, 3.4522705078125, 3.7919921875, 4.1317138671875, 4.471435546875, 4.8111572265625, 5.15087890625, 5.4906005859375, 5.830322265625, 6.1700439453125, 6.509765625, 6.8494873046875, 7.189208984375, 7.5289306640625, 7.86865234375, 8.2083740234375, 8.548095703125, 8.8878173828125, 9.2275390625, 9.5672607421875, 9.906982421875, 10.2467041015625, 10.58642578125, 10.9261474609375, 11.265869140625, 11.6055908203125, 11.9453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 11.0, 18.0, 13.0, 13.0, 13.0, 33.0, 31.0, 42.0, 40.0, 53.0, 90.0, 160.0, 138.0, 64.0, 61.0, 55.0, 32.0, 23.0, 23.0, 16.0, 18.0, 8.0, 10.0, 11.0, 5.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0022869110107421875, -0.00222131609916687, -0.0021557211875915527, -0.0020901262760162354, -0.002024531364440918, -0.0019589364528656006, -0.0018933415412902832, -0.0018277466297149658, -0.0017621517181396484, -0.001696556806564331, -0.0016309618949890137, -0.0015653669834136963, -0.001499772071838379, -0.0014341771602630615, -0.0013685822486877441, -0.0013029873371124268, -0.0012373924255371094, -0.001171797513961792, -0.0011062026023864746, -0.0010406076908111572, -0.0009750127792358398, -0.0009094178676605225, -0.0008438229560852051, -0.0007782280445098877, -0.0007126331329345703, -0.0006470382213592529, -0.0005814433097839355, -0.0005158483982086182, -0.0004502534866333008, -0.0003846585750579834, -0.000319063663482666, -0.00025346875190734863, -0.00018787384033203125, -0.00012227892875671387, -5.6684017181396484e-05, 8.910894393920898e-06, 7.450580596923828e-05, 0.00014010071754455566, 0.00020569562911987305, 0.00027129054069519043, 0.0003368854522705078, 0.0004024803638458252, 0.0004680752754211426, 0.00053367018699646, 0.0005992650985717773, 0.0006648600101470947, 0.0007304549217224121, 0.0007960498332977295, 0.0008616447448730469, 0.0009272396564483643, 0.0009928345680236816, 0.001058429479598999, 0.0011240243911743164, 0.0011896193027496338, 0.0012552142143249512, 0.0013208091259002686, 0.001386404037475586, 0.0014519989490509033, 0.0015175938606262207, 0.001583188772201538, 0.0016487836837768555, 0.0017143785953521729, 0.0017799735069274902, 0.0018455684185028076, 0.001911163330078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 9.0, 6.0, 10.0, 9.0, 18.0, 15.0, 31.0, 37.0, 53.0, 107.0, 177.0, 272.0, 501.0, 1007.0, 2656.0, 9607.0, 58767.0, 560924.0, 362557.0, 40431.0, 7299.0, 2144.0, 819.0, 424.0, 248.0, 170.0, 79.0, 54.0, 45.0, 28.0, 23.0, 8.0, 6.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.2578125, -13.8607177734375, -13.463623046875, -13.0665283203125, -12.66943359375, -12.2723388671875, -11.875244140625, -11.4781494140625, -11.0810546875, -10.6839599609375, -10.286865234375, -9.8897705078125, -9.49267578125, -9.0955810546875, -8.698486328125, -8.3013916015625, -7.904296875, -7.5072021484375, -7.110107421875, -6.7130126953125, -6.31591796875, -5.9188232421875, -5.521728515625, -5.1246337890625, -4.7275390625, -4.3304443359375, -3.933349609375, -3.5362548828125, -3.13916015625, -2.7420654296875, -2.344970703125, -1.9478759765625, -1.55078125, -1.1536865234375, -0.756591796875, -0.3594970703125, 0.03759765625, 0.4346923828125, 0.831787109375, 1.2288818359375, 1.6259765625, 2.0230712890625, 2.420166015625, 2.8172607421875, 3.21435546875, 3.6114501953125, 4.008544921875, 4.4056396484375, 4.802734375, 5.1998291015625, 5.596923828125, 5.9940185546875, 6.39111328125, 6.7882080078125, 7.185302734375, 7.5823974609375, 7.9794921875, 8.3765869140625, 8.773681640625, 9.1707763671875, 9.56787109375, 9.9649658203125, 10.362060546875, 10.7591552734375, 11.15625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 11.0, 9.0, 6.0, 16.0, 18.0, 28.0, 26.0, 43.0, 34.0, 55.0, 76.0, 99.0, 125.0, 101.0, 95.0, 57.0, 56.0, 32.0, 31.0, 23.0, 22.0, 14.0, 11.0, 6.0, 4.0, 4.0, 5.0, 3.0], "bins": [-17.25, -16.89483642578125, -16.5396728515625, -16.18450927734375, -15.829345703125, -15.47418212890625, -15.1190185546875, -14.76385498046875, -14.40869140625, -14.05352783203125, -13.6983642578125, -13.34320068359375, -12.988037109375, -12.63287353515625, -12.2777099609375, -11.92254638671875, -11.5673828125, -11.21221923828125, -10.8570556640625, -10.50189208984375, -10.146728515625, -9.79156494140625, -9.4364013671875, -9.08123779296875, -8.72607421875, -8.37091064453125, -8.0157470703125, -7.66058349609375, -7.305419921875, -6.95025634765625, -6.5950927734375, -6.23992919921875, -5.884765625, -5.52960205078125, -5.1744384765625, -4.81927490234375, -4.464111328125, -4.10894775390625, -3.7537841796875, -3.39862060546875, -3.04345703125, -2.68829345703125, -2.3331298828125, -1.97796630859375, -1.622802734375, -1.26763916015625, -0.9124755859375, -0.55731201171875, -0.2021484375, 0.15301513671875, 0.5081787109375, 0.86334228515625, 1.218505859375, 1.57366943359375, 1.9288330078125, 2.28399658203125, 2.63916015625, 2.99432373046875, 3.3494873046875, 3.70465087890625, 4.059814453125, 4.41497802734375, 4.7701416015625, 5.12530517578125, 5.48046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 5.0, 9.0, 21.0, 89.0, 156.0, 204.0, 223.0, 149.0, 87.0, 38.0, 11.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-573.8876953125, -562.5856323242188, -551.2835693359375, -539.9815063476562, -528.679443359375, -517.3773803710938, -506.0753173828125, -494.77325439453125, -483.47119140625, -472.16912841796875, -460.8670654296875, -449.56500244140625, -438.262939453125, -426.96087646484375, -415.6588134765625, -404.35675048828125, -393.0546569824219, -381.7525939941406, -370.4505310058594, -359.1484680175781, -347.8464050292969, -336.5443420410156, -325.24224853515625, -313.940185546875, -302.63812255859375, -291.3360595703125, -280.03399658203125, -268.73193359375, -257.42987060546875, -246.1278076171875, -234.8257293701172, -223.52366638183594, -212.22161865234375, -200.9195556640625, -189.61749267578125, -178.3154296875, -167.01336669921875, -155.7113037109375, -144.4092254638672, -133.10716247558594, -121.80509948730469, -110.50303649902344, -99.20097351074219, -87.8989028930664, -76.59683990478516, -65.2947769165039, -53.992706298828125, -42.690643310546875, -31.388580322265625, -20.086515426635742, -8.78445053100586, 2.5176162719726562, 13.819679260253906, 25.121742248535156, 36.42381286621094, 47.72587585449219, 59.02793884277344, 70.33000183105469, 81.63206481933594, 92.93413543701172, 104.23619842529297, 115.53826141357422, 126.84033203125, 138.14239501953125, 149.4444580078125]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 4.0, 7.0, 16.0, 12.0, 22.0, 24.0, 21.0, 21.0, 27.0, 40.0, 34.0, 36.0, 48.0, 33.0, 47.0, 42.0, 48.0, 52.0, 35.0, 49.0, 54.0, 43.0, 30.0, 32.0, 28.0, 30.0, 36.0, 17.0, 10.0, 20.0, 10.0, 10.0, 11.0, 10.0, 7.0, 5.0, 2.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-127.1452407836914, -123.16547393798828, -119.18571472167969, -115.20594787597656, -111.22618103027344, -107.24641418457031, -103.26664733886719, -99.2868881225586, -95.30712127685547, -91.32735443115234, -87.34759521484375, -83.36782836914062, -79.3880615234375, -75.40829467773438, -71.42852783203125, -67.44876861572266, -63.46900177001953, -59.489234924316406, -55.50947189331055, -51.52970886230469, -47.54994201660156, -43.57017517089844, -39.59041213989258, -35.61064910888672, -31.630882263183594, -27.6511173248291, -23.67135238647461, -19.691587448120117, -15.711822509765625, -11.732057571411133, -7.752292633056641, -3.7725276947021484, 0.2072296142578125, 4.186994552612305, 8.166759490966797, 12.146524429321289, 16.12628936767578, 20.106054306030273, 24.085819244384766, 28.065584182739258, 32.04534912109375, 36.025115966796875, 40.004878997802734, 43.984642028808594, 47.96440887451172, 51.944175720214844, 55.9239387512207, 59.90370178222656, 63.88346862792969, 67.86323547363281, 71.84300231933594, 75.82276153564453, 79.80252838134766, 83.78229522705078, 87.76205444335938, 91.7418212890625, 95.72158813476562, 99.70135498046875, 103.68112182617188, 107.66088104248047, 111.6406478881836, 115.62041473388672, 119.60017395019531, 123.57994079589844, 127.55970764160156]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 9.0, 16.0, 23.0, 29.0, 40.0, 49.0, 76.0, 102.0, 163.0, 247.0, 423.0, 556.0, 942.0, 1563.0, 2795.0, 5095.0, 9942.0, 21245.0, 50343.0, 149316.0, 928039.0, 2570522.0, 308170.0, 82247.0, 31755.0, 14390.0, 7089.0, 3766.0, 2076.0, 1150.0, 728.0, 459.0, 274.0, 198.0, 133.0, 75.0, 68.0, 43.0, 30.0, 21.0, 20.0, 17.0, 8.0, 6.0, 4.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0], "bins": [-12.2265625, -11.8695068359375, -11.512451171875, -11.1553955078125, -10.79833984375, -10.4412841796875, -10.084228515625, -9.7271728515625, -9.3701171875, -9.0130615234375, -8.656005859375, -8.2989501953125, -7.94189453125, -7.5848388671875, -7.227783203125, -6.8707275390625, -6.513671875, -6.1566162109375, -5.799560546875, -5.4425048828125, -5.08544921875, -4.7283935546875, -4.371337890625, -4.0142822265625, -3.6572265625, -3.3001708984375, -2.943115234375, -2.5860595703125, -2.22900390625, -1.8719482421875, -1.514892578125, -1.1578369140625, -0.80078125, -0.4437255859375, -0.086669921875, 0.2703857421875, 0.62744140625, 0.9844970703125, 1.341552734375, 1.6986083984375, 2.0556640625, 2.4127197265625, 2.769775390625, 3.1268310546875, 3.48388671875, 3.8409423828125, 4.197998046875, 4.5550537109375, 4.912109375, 5.2691650390625, 5.626220703125, 5.9832763671875, 6.34033203125, 6.6973876953125, 7.054443359375, 7.4114990234375, 7.7685546875, 8.1256103515625, 8.482666015625, 8.8397216796875, 9.19677734375, 9.5538330078125, 9.910888671875, 10.2679443359375, 10.625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 2.0, 11.0, 12.0, 20.0, 19.0, 32.0, 29.0, 41.0, 60.0, 35.0, 51.0, 56.0, 59.0, 63.0, 62.0, 67.0, 69.0, 57.0, 48.0, 39.0, 31.0, 25.0, 30.0, 14.0, 12.0, 14.0, 11.0, 7.0, 6.0, 6.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.940185546875, -8.67724609375, -8.414306640625, -8.1513671875, -7.888427734375, -7.62548828125, -7.362548828125, -7.099609375, -6.836669921875, -6.57373046875, -6.310791015625, -6.0478515625, -5.784912109375, -5.52197265625, -5.259033203125, -4.99609375, -4.733154296875, -4.47021484375, -4.207275390625, -3.9443359375, -3.681396484375, -3.41845703125, -3.155517578125, -2.892578125, -2.629638671875, -2.36669921875, -2.103759765625, -1.8408203125, -1.577880859375, -1.31494140625, -1.052001953125, -0.7890625, -0.526123046875, -0.26318359375, -0.000244140625, 0.2626953125, 0.525634765625, 0.78857421875, 1.051513671875, 1.314453125, 1.577392578125, 1.84033203125, 2.103271484375, 2.3662109375, 2.629150390625, 2.89208984375, 3.155029296875, 3.41796875, 3.680908203125, 3.94384765625, 4.206787109375, 4.4697265625, 4.732666015625, 4.99560546875, 5.258544921875, 5.521484375, 5.784423828125, 6.04736328125, 6.310302734375, 6.5732421875, 6.836181640625, 7.09912109375, 7.362060546875, 7.625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 5.0, 6.0, 11.0, 10.0, 13.0, 16.0, 37.0, 67.0, 93.0, 211.0, 473.0, 1144.0, 3032.0, 8992.0, 33719.0, 224626.0, 3469368.0, 388131.0, 46328.0, 11825.0, 3774.0, 1359.0, 517.0, 218.0, 118.0, 61.0, 38.0, 25.0, 19.0, 16.0, 7.0, 6.0, 7.0, 4.0, 0.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.804443359375, -20.12451171875, -19.444580078125, -18.7646484375, -18.084716796875, -17.40478515625, -16.724853515625, -16.044921875, -15.364990234375, -14.68505859375, -14.005126953125, -13.3251953125, -12.645263671875, -11.96533203125, -11.285400390625, -10.60546875, -9.925537109375, -9.24560546875, -8.565673828125, -7.8857421875, -7.205810546875, -6.52587890625, -5.845947265625, -5.166015625, -4.486083984375, -3.80615234375, -3.126220703125, -2.4462890625, -1.766357421875, -1.08642578125, -0.406494140625, 0.2734375, 0.953369140625, 1.63330078125, 2.313232421875, 2.9931640625, 3.673095703125, 4.35302734375, 5.032958984375, 5.712890625, 6.392822265625, 7.07275390625, 7.752685546875, 8.4326171875, 9.112548828125, 9.79248046875, 10.472412109375, 11.15234375, 11.832275390625, 12.51220703125, 13.192138671875, 13.8720703125, 14.552001953125, 15.23193359375, 15.911865234375, 16.591796875, 17.271728515625, 17.95166015625, 18.631591796875, 19.3115234375, 19.991455078125, 20.67138671875, 21.351318359375, 22.03125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 9.0, 3.0, 2.0, 4.0, 4.0, 8.0, 9.0, 11.0, 12.0, 17.0, 28.0, 52.0, 70.0, 94.0, 168.0, 275.0, 535.0, 913.0, 704.0, 420.0, 247.0, 154.0, 96.0, 61.0, 42.0, 29.0, 26.0, 16.0, 15.0, 8.0, 8.0, 5.0, 8.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.78125, -16.237060546875, -15.69287109375, -15.148681640625, -14.6044921875, -14.060302734375, -13.51611328125, -12.971923828125, -12.427734375, -11.883544921875, -11.33935546875, -10.795166015625, -10.2509765625, -9.706787109375, -9.16259765625, -8.618408203125, -8.07421875, -7.530029296875, -6.98583984375, -6.441650390625, -5.8974609375, -5.353271484375, -4.80908203125, -4.264892578125, -3.720703125, -3.176513671875, -2.63232421875, -2.088134765625, -1.5439453125, -0.999755859375, -0.45556640625, 0.088623046875, 0.6328125, 1.177001953125, 1.72119140625, 2.265380859375, 2.8095703125, 3.353759765625, 3.89794921875, 4.442138671875, 4.986328125, 5.530517578125, 6.07470703125, 6.618896484375, 7.1630859375, 7.707275390625, 8.25146484375, 8.795654296875, 9.33984375, 9.884033203125, 10.42822265625, 10.972412109375, 11.5166015625, 12.060791015625, 12.60498046875, 13.149169921875, 13.693359375, 14.237548828125, 14.78173828125, 15.325927734375, 15.8701171875, 16.414306640625, 16.95849609375, 17.502685546875, 18.046875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 14.0, 7.0, 27.0, 44.0, 73.0, 100.0, 127.0, 146.0, 132.0, 105.0, 76.0, 49.0, 21.0, 29.0, 11.0, 9.0, 4.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-116.73361206054688, -112.25304412841797, -107.77247619628906, -103.29190826416016, -98.81134033203125, -94.33077239990234, -89.85020446777344, -85.36964416503906, -80.88906860351562, -76.40850067138672, -71.92793273925781, -67.4473648071289, -62.966796875, -58.486228942871094, -54.00566482543945, -49.52509689331055, -45.044532775878906, -40.56396484375, -36.083396911621094, -31.60283088684082, -27.122262954711914, -22.641695022583008, -18.161128997802734, -13.680561065673828, -9.199993133544922, -4.719425678253174, -0.23885822296142578, 4.241708755493164, 8.72227668762207, 13.202844619750977, 17.68341064453125, 22.163978576660156, 26.644546508789062, 31.12511444091797, 35.605682373046875, 40.08625030517578, 44.56681823730469, 49.047386169433594, 53.527950286865234, 58.00851821899414, 62.48908615112305, 66.96965026855469, 71.4502182006836, 75.9307861328125, 80.4113540649414, 84.89192199707031, 89.37248992919922, 93.85305786132812, 98.33362579345703, 102.81419372558594, 107.29476165771484, 111.77532958984375, 116.25589752197266, 120.73646545410156, 125.21702575683594, 129.69760131835938, 134.17816162109375, 138.65872192382812, 143.13929748535156, 147.61985778808594, 152.10043334960938, 156.58099365234375, 161.0615692138672, 165.54212951660156, 170.022705078125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 5.0, 9.0, 3.0, 11.0, 13.0, 22.0, 19.0, 26.0, 18.0, 23.0, 38.0, 34.0, 44.0, 50.0, 44.0, 56.0, 50.0, 54.0, 55.0, 55.0, 44.0, 52.0, 51.0, 45.0, 40.0, 27.0, 20.0, 17.0, 12.0, 10.0, 9.0, 9.0, 6.0, 10.0, 5.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.94559478759766, -69.26214599609375, -66.57870483398438, -63.89525604248047, -61.21180725097656, -58.528358459472656, -55.844913482666016, -53.161468505859375, -50.47801971435547, -47.79457092285156, -45.11112594604492, -42.42768096923828, -39.744232177734375, -37.06078338623047, -34.37733840942383, -31.693891525268555, -29.01044464111328, -26.326997756958008, -23.643550872802734, -20.96010398864746, -18.276657104492188, -15.593210220336914, -12.90976333618164, -10.226316452026367, -7.542869567871094, -4.85942268371582, -2.175975799560547, 0.5074710845947266, 3.19091796875, 5.874364852905273, 8.557811737060547, 11.24125862121582, 13.924713134765625, 16.6081600189209, 19.291606903076172, 21.975053787231445, 24.65850067138672, 27.341947555541992, 30.025394439697266, 32.708839416503906, 35.39228820800781, 38.07573699951172, 40.75918197631836, 43.442626953125, 46.126075744628906, 48.80952453613281, 51.49296951293945, 54.176414489746094, 56.85986328125, 59.543312072753906, 62.22675704956055, 64.91020202636719, 67.5936508178711, 70.277099609375, 72.96054077148438, 75.64398956298828, 78.32743835449219, 81.0108871459961, 83.6943359375, 86.37777709960938, 89.06122589111328, 91.74467468261719, 94.42811584472656, 97.11156463623047, 99.79501342773438]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 8.0, 8.0, 23.0, 28.0, 48.0, 64.0, 98.0, 163.0, 287.0, 469.0, 765.0, 1349.0, 2523.0, 4958.0, 10451.0, 22906.0, 55378.0, 145200.0, 393773.0, 257475.0, 87077.0, 35053.0, 15175.0, 7207.0, 3607.0, 1912.0, 1092.0, 581.0, 330.0, 198.0, 119.0, 83.0, 45.0, 31.0, 20.0, 15.0, 11.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.28125, -16.783935546875, -16.28662109375, -15.789306640625, -15.2919921875, -14.794677734375, -14.29736328125, -13.800048828125, -13.302734375, -12.805419921875, -12.30810546875, -11.810791015625, -11.3134765625, -10.816162109375, -10.31884765625, -9.821533203125, -9.32421875, -8.826904296875, -8.32958984375, -7.832275390625, -7.3349609375, -6.837646484375, -6.34033203125, -5.843017578125, -5.345703125, -4.848388671875, -4.35107421875, -3.853759765625, -3.3564453125, -2.859130859375, -2.36181640625, -1.864501953125, -1.3671875, -0.869873046875, -0.37255859375, 0.124755859375, 0.6220703125, 1.119384765625, 1.61669921875, 2.114013671875, 2.611328125, 3.108642578125, 3.60595703125, 4.103271484375, 4.6005859375, 5.097900390625, 5.59521484375, 6.092529296875, 6.58984375, 7.087158203125, 7.58447265625, 8.081787109375, 8.5791015625, 9.076416015625, 9.57373046875, 10.071044921875, 10.568359375, 11.065673828125, 11.56298828125, 12.060302734375, 12.5576171875, 13.054931640625, 13.55224609375, 14.049560546875, 14.546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 10.0, 12.0, 8.0, 20.0, 17.0, 21.0, 27.0, 28.0, 27.0, 42.0, 44.0, 34.0, 49.0, 47.0, 46.0, 54.0, 40.0, 49.0, 42.0, 45.0, 47.0, 55.0, 39.0, 31.0, 26.0, 24.0, 22.0, 13.0, 11.0, 10.0, 8.0, 7.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.5635986328125, -6.357666015625, -6.1517333984375, -5.94580078125, -5.7398681640625, -5.533935546875, -5.3280029296875, -5.1220703125, -4.9161376953125, -4.710205078125, -4.5042724609375, -4.29833984375, -4.0924072265625, -3.886474609375, -3.6805419921875, -3.474609375, -3.2686767578125, -3.062744140625, -2.8568115234375, -2.65087890625, -2.4449462890625, -2.239013671875, -2.0330810546875, -1.8271484375, -1.6212158203125, -1.415283203125, -1.2093505859375, -1.00341796875, -0.7974853515625, -0.591552734375, -0.3856201171875, -0.1796875, 0.0262451171875, 0.232177734375, 0.4381103515625, 0.64404296875, 0.8499755859375, 1.055908203125, 1.2618408203125, 1.4677734375, 1.6737060546875, 1.879638671875, 2.0855712890625, 2.29150390625, 2.4974365234375, 2.703369140625, 2.9093017578125, 3.115234375, 3.3211669921875, 3.527099609375, 3.7330322265625, 3.93896484375, 4.1448974609375, 4.350830078125, 4.5567626953125, 4.7626953125, 4.9686279296875, 5.174560546875, 5.3804931640625, 5.58642578125, 5.7923583984375, 5.998291015625, 6.2042236328125, 6.41015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 7.0, 1.0, 5.0, 12.0, 7.0, 12.0, 18.0, 25.0, 30.0, 34.0, 50.0, 61.0, 103.0, 119.0, 187.0, 291.0, 487.0, 908.0, 2114.0, 6739.0, 46245.0, 709819.0, 252746.0, 20826.0, 4209.0, 1487.0, 769.0, 420.0, 222.0, 162.0, 105.0, 79.0, 61.0, 47.0, 36.0, 29.0, 19.0, 9.0, 6.0, 12.0, 11.0, 7.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-33.4375, -32.3525390625, -31.267578125, -30.1826171875, -29.09765625, -28.0126953125, -26.927734375, -25.8427734375, -24.7578125, -23.6728515625, -22.587890625, -21.5029296875, -20.41796875, -19.3330078125, -18.248046875, -17.1630859375, -16.078125, -14.9931640625, -13.908203125, -12.8232421875, -11.73828125, -10.6533203125, -9.568359375, -8.4833984375, -7.3984375, -6.3134765625, -5.228515625, -4.1435546875, -3.05859375, -1.9736328125, -0.888671875, 0.1962890625, 1.28125, 2.3662109375, 3.451171875, 4.5361328125, 5.62109375, 6.7060546875, 7.791015625, 8.8759765625, 9.9609375, 11.0458984375, 12.130859375, 13.2158203125, 14.30078125, 15.3857421875, 16.470703125, 17.5556640625, 18.640625, 19.7255859375, 20.810546875, 21.8955078125, 22.98046875, 24.0654296875, 25.150390625, 26.2353515625, 27.3203125, 28.4052734375, 29.490234375, 30.5751953125, 31.66015625, 32.7451171875, 33.830078125, 34.9150390625, 36.0]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 5.0, 13.0, 9.0, 15.0, 15.0, 15.0, 27.0, 37.0, 32.0, 43.0, 60.0, 57.0, 51.0, 52.0, 72.0, 61.0, 65.0, 55.0, 50.0, 47.0, 39.0, 33.0, 29.0, 23.0, 17.0, 15.0, 16.0, 10.0, 6.0, 5.0, 9.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.765625, -28.760009765625, -27.75439453125, -26.748779296875, -25.7431640625, -24.737548828125, -23.73193359375, -22.726318359375, -21.720703125, -20.715087890625, -19.70947265625, -18.703857421875, -17.6982421875, -16.692626953125, -15.68701171875, -14.681396484375, -13.67578125, -12.670166015625, -11.66455078125, -10.658935546875, -9.6533203125, -8.647705078125, -7.64208984375, -6.636474609375, -5.630859375, -4.625244140625, -3.61962890625, -2.614013671875, -1.6083984375, -0.602783203125, 0.40283203125, 1.408447265625, 2.4140625, 3.419677734375, 4.42529296875, 5.430908203125, 6.4365234375, 7.442138671875, 8.44775390625, 9.453369140625, 10.458984375, 11.464599609375, 12.47021484375, 13.475830078125, 14.4814453125, 15.487060546875, 16.49267578125, 17.498291015625, 18.50390625, 19.509521484375, 20.51513671875, 21.520751953125, 22.5263671875, 23.531982421875, 24.53759765625, 25.543212890625, 26.548828125, 27.554443359375, 28.56005859375, 29.565673828125, 30.5712890625, 31.576904296875, 32.58251953125, 33.588134765625, 34.59375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 9.0, 15.0, 10.0, 19.0, 23.0, 29.0, 70.0, 87.0, 176.0, 316.0, 725.0, 2354.0, 11207.0, 106338.0, 838407.0, 76418.0, 8975.0, 1966.0, 693.0, 276.0, 144.0, 96.0, 56.0, 39.0, 22.0, 16.0, 14.0, 3.0, 10.0, 7.0, 1.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.453125, -13.993408203125, -13.53369140625, -13.073974609375, -12.6142578125, -12.154541015625, -11.69482421875, -11.235107421875, -10.775390625, -10.315673828125, -9.85595703125, -9.396240234375, -8.9365234375, -8.476806640625, -8.01708984375, -7.557373046875, -7.09765625, -6.637939453125, -6.17822265625, -5.718505859375, -5.2587890625, -4.799072265625, -4.33935546875, -3.879638671875, -3.419921875, -2.960205078125, -2.50048828125, -2.040771484375, -1.5810546875, -1.121337890625, -0.66162109375, -0.201904296875, 0.2578125, 0.717529296875, 1.17724609375, 1.636962890625, 2.0966796875, 2.556396484375, 3.01611328125, 3.475830078125, 3.935546875, 4.395263671875, 4.85498046875, 5.314697265625, 5.7744140625, 6.234130859375, 6.69384765625, 7.153564453125, 7.61328125, 8.072998046875, 8.53271484375, 8.992431640625, 9.4521484375, 9.911865234375, 10.37158203125, 10.831298828125, 11.291015625, 11.750732421875, 12.21044921875, 12.670166015625, 13.1298828125, 13.589599609375, 14.04931640625, 14.509033203125, 14.96875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 5.0, 5.0, 13.0, 14.0, 10.0, 18.0, 23.0, 28.0, 35.0, 37.0, 68.0, 110.0, 163.0, 151.0, 87.0, 58.0, 34.0, 31.0, 29.0, 10.0, 12.0, 8.0, 11.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0021839141845703125, -0.0021189749240875244, -0.0020540356636047363, -0.0019890964031219482, -0.0019241571426391602, -0.001859217882156372, -0.001794278621673584, -0.001729339361190796, -0.0016644001007080078, -0.0015994608402252197, -0.0015345215797424316, -0.0014695823192596436, -0.0014046430587768555, -0.0013397037982940674, -0.0012747645378112793, -0.0012098252773284912, -0.0011448860168457031, -0.001079946756362915, -0.001015007495880127, -0.0009500682353973389, -0.0008851289749145508, -0.0008201897144317627, -0.0007552504539489746, -0.0006903111934661865, -0.0006253719329833984, -0.0005604326725006104, -0.0004954934120178223, -0.0004305541515350342, -0.0003656148910522461, -0.000300675630569458, -0.00023573637008666992, -0.00017079710960388184, -0.00010585784912109375, -4.0918588638305664e-05, 2.4020671844482422e-05, 8.895993232727051e-05, 0.0001538991928100586, 0.00021883845329284668, 0.00028377771377563477, 0.00034871697425842285, 0.00041365623474121094, 0.000478595495223999, 0.0005435347557067871, 0.0006084740161895752, 0.0006734132766723633, 0.0007383525371551514, 0.0008032917976379395, 0.0008682310581207275, 0.0009331703186035156, 0.0009981095790863037, 0.0010630488395690918, 0.0011279881000518799, 0.001192927360534668, 0.001257866621017456, 0.0013228058815002441, 0.0013877451419830322, 0.0014526844024658203, 0.0015176236629486084, 0.0015825629234313965, 0.0016475021839141846, 0.0017124414443969727, 0.0017773807048797607, 0.0018423199653625488, 0.001907259225845337, 0.001972198486328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 4.0, 4.0, 6.0, 13.0, 7.0, 9.0, 19.0, 18.0, 47.0, 77.0, 109.0, 159.0, 311.0, 644.0, 1416.0, 4544.0, 28006.0, 582208.0, 401391.0, 22871.0, 4091.0, 1289.0, 539.0, 295.0, 159.0, 110.0, 75.0, 45.0, 37.0, 22.0, 11.0, 10.0, 8.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.78125, -9.314453125, -8.84765625, -8.380859375, -7.9140625, -7.447265625, -6.98046875, -6.513671875, -6.046875, -5.580078125, -5.11328125, -4.646484375, -4.1796875, -3.712890625, -3.24609375, -2.779296875, -2.3125, -1.845703125, -1.37890625, -0.912109375, -0.4453125, 0.021484375, 0.48828125, 0.955078125, 1.421875, 1.888671875, 2.35546875, 2.822265625, 3.2890625, 3.755859375, 4.22265625, 4.689453125, 5.15625, 5.623046875, 6.08984375, 6.556640625, 7.0234375, 7.490234375, 7.95703125, 8.423828125, 8.890625, 9.357421875, 9.82421875, 10.291015625, 10.7578125, 11.224609375, 11.69140625, 12.158203125, 12.625, 13.091796875, 13.55859375, 14.025390625, 14.4921875, 14.958984375, 15.42578125, 15.892578125, 16.359375, 16.826171875, 17.29296875, 17.759765625, 18.2265625, 18.693359375, 19.16015625, 19.626953125, 20.09375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 8.0, 8.0, 16.0, 10.0, 10.0, 12.0, 21.0, 33.0, 33.0, 45.0, 70.0, 96.0, 97.0, 118.0, 84.0, 88.0, 49.0, 44.0, 53.0, 28.0, 19.0, 16.0, 15.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.455810546875, -9.12255859375, -8.789306640625, -8.4560546875, -8.122802734375, -7.78955078125, -7.456298828125, -7.123046875, -6.789794921875, -6.45654296875, -6.123291015625, -5.7900390625, -5.456787109375, -5.12353515625, -4.790283203125, -4.45703125, -4.123779296875, -3.79052734375, -3.457275390625, -3.1240234375, -2.790771484375, -2.45751953125, -2.124267578125, -1.791015625, -1.457763671875, -1.12451171875, -0.791259765625, -0.4580078125, -0.124755859375, 0.20849609375, 0.541748046875, 0.875, 1.208251953125, 1.54150390625, 1.874755859375, 2.2080078125, 2.541259765625, 2.87451171875, 3.207763671875, 3.541015625, 3.874267578125, 4.20751953125, 4.540771484375, 4.8740234375, 5.207275390625, 5.54052734375, 5.873779296875, 6.20703125, 6.540283203125, 6.87353515625, 7.206787109375, 7.5400390625, 7.873291015625, 8.20654296875, 8.539794921875, 8.873046875, 9.206298828125, 9.53955078125, 9.872802734375, 10.2060546875, 10.539306640625, 10.87255859375, 11.205810546875, 11.5390625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 24.0, 55.0, 119.0, 141.0, 227.0, 183.0, 127.0, 58.0, 28.0, 13.0, 8.0, 2.0, 5.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.61138916015625, -133.35787963867188, -126.10436248779297, -118.8508529663086, -111.59733581542969, -104.34382629394531, -97.09031677246094, -89.83680725097656, -82.58329010009766, -75.32978057861328, -68.07626342773438, -60.82275390625, -53.56924057006836, -46.31572723388672, -39.062217712402344, -31.808704376220703, -24.555191040039062, -17.301677703857422, -10.048166275024414, -2.7946548461914062, 4.458858489990234, 11.712371826171875, 18.96588134765625, 26.21939468383789, 33.47290802001953, 40.72642135620117, 47.97993469238281, 55.23344421386719, 62.48695755004883, 69.74047088623047, 76.99398040771484, 84.24749755859375, 91.50100708007812, 98.7545166015625, 106.0080337524414, 113.26154327392578, 120.51506042480469, 127.76856994628906, 135.02207946777344, 142.2755889892578, 149.52911376953125, 156.78262329101562, 164.0361328125, 171.28964233398438, 178.5431671142578, 185.7966766357422, 193.05018615722656, 200.30369567871094, 207.5572052001953, 214.8107147216797, 222.06422424316406, 229.3177490234375, 236.57125854492188, 243.82476806640625, 251.07827758789062, 258.331787109375, 265.5852966308594, 272.83880615234375, 280.0923156738281, 287.3458251953125, 294.5993347167969, 301.85284423828125, 309.10638427734375, 316.3598937988281, 323.6134033203125]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 9.0, 15.0, 6.0, 7.0, 7.0, 14.0, 19.0, 19.0, 22.0, 19.0, 26.0, 41.0, 30.0, 35.0, 39.0, 39.0, 48.0, 59.0, 46.0, 49.0, 32.0, 44.0, 41.0, 40.0, 30.0, 19.0, 27.0, 25.0, 30.0, 21.0, 19.0, 16.0, 16.0, 12.0, 9.0, 15.0, 10.0, 4.0, 6.0, 8.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0], "bins": [-97.423095703125, -94.56591796875, -91.708740234375, -88.8515625, -85.994384765625, -83.13721466064453, -80.28003692626953, -77.42285919189453, -74.56568145751953, -71.70850372314453, -68.85132598876953, -65.99414825439453, -63.1369743347168, -60.2797966003418, -57.42262268066406, -54.56544494628906, -51.70826721191406, -48.85108947753906, -45.99391174316406, -43.13673782348633, -40.27956008911133, -37.42238235473633, -34.565208435058594, -31.708030700683594, -28.850852966308594, -25.993675231933594, -23.136499404907227, -20.27932357788086, -17.42214584350586, -14.564969062805176, -11.707792282104492, -8.850616455078125, -5.993438720703125, -3.1362619400024414, -0.2790851593017578, 2.578091621398926, 5.435268402099609, 8.292445182800293, 11.149621963500977, 14.006797790527344, 16.863975524902344, 19.721153259277344, 22.57832908630371, 25.435504913330078, 28.292682647705078, 31.149860382080078, 34.00703430175781, 36.86421203613281, 39.72138977050781, 42.57856750488281, 45.43574523925781, 48.29291915893555, 51.15009689331055, 54.00727462768555, 56.86444854736328, 59.72162628173828, 62.57880401611328, 65.43598175048828, 68.29315948486328, 71.15033721923828, 74.00750732421875, 76.86468505859375, 79.72186279296875, 82.57904052734375, 85.43621826171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 17.0, 15.0, 26.0, 39.0, 49.0, 70.0, 120.0, 146.0, 273.0, 1245.0, 92480.0, 4093131.0, 5566.0, 452.0, 205.0, 131.0, 83.0, 71.0, 45.0, 22.0, 26.0, 16.0, 10.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-88.5, -86.0576171875, -83.615234375, -81.1728515625, -78.73046875, -76.2880859375, -73.845703125, -71.4033203125, -68.9609375, -66.5185546875, -64.076171875, -61.6337890625, -59.19140625, -56.7490234375, -54.306640625, -51.8642578125, -49.421875, -46.9794921875, -44.537109375, -42.0947265625, -39.65234375, -37.2099609375, -34.767578125, -32.3251953125, -29.8828125, -27.4404296875, -24.998046875, -22.5556640625, -20.11328125, -17.6708984375, -15.228515625, -12.7861328125, -10.34375, -7.9013671875, -5.458984375, -3.0166015625, -0.57421875, 1.8681640625, 4.310546875, 6.7529296875, 9.1953125, 11.6376953125, 14.080078125, 16.5224609375, 18.96484375, 21.4072265625, 23.849609375, 26.2919921875, 28.734375, 31.1767578125, 33.619140625, 36.0615234375, 38.50390625, 40.9462890625, 43.388671875, 45.8310546875, 48.2734375, 50.7158203125, 53.158203125, 55.6005859375, 58.04296875, 60.4853515625, 62.927734375, 65.3701171875, 67.8125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 14.0, 16.0, 21.0, 39.0, 46.0, 53.0, 56.0, 53.0, 71.0, 71.0, 79.0, 69.0, 87.0, 76.0, 53.0, 49.0, 40.0, 28.0, 21.0, 10.0, 8.0, 8.0, 7.0, 4.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.4837646484375, -7.178466796875, -6.8731689453125, -6.56787109375, -6.2625732421875, -5.957275390625, -5.6519775390625, -5.3466796875, -5.0413818359375, -4.736083984375, -4.4307861328125, -4.12548828125, -3.8201904296875, -3.514892578125, -3.2095947265625, -2.904296875, -2.5989990234375, -2.293701171875, -1.9884033203125, -1.68310546875, -1.3778076171875, -1.072509765625, -0.7672119140625, -0.4619140625, -0.1566162109375, 0.148681640625, 0.4539794921875, 0.75927734375, 1.0645751953125, 1.369873046875, 1.6751708984375, 1.98046875, 2.2857666015625, 2.591064453125, 2.8963623046875, 3.20166015625, 3.5069580078125, 3.812255859375, 4.1175537109375, 4.4228515625, 4.7281494140625, 5.033447265625, 5.3387451171875, 5.64404296875, 5.9493408203125, 6.254638671875, 6.5599365234375, 6.865234375, 7.1705322265625, 7.475830078125, 7.7811279296875, 8.08642578125, 8.3917236328125, 8.697021484375, 9.0023193359375, 9.3076171875, 9.6129150390625, 9.918212890625, 10.2235107421875, 10.52880859375, 10.8341064453125, 11.139404296875, 11.4447021484375, 11.75]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 8.0, 8.0, 18.0, 15.0, 28.0, 30.0, 55.0, 126.0, 192.0, 318.0, 630.0, 1193.0, 2362.0, 4713.0, 10432.0, 24725.0, 70969.0, 314086.0, 2753327.0, 826306.0, 121513.0, 36972.0, 14290.0, 6207.0, 2871.0, 1350.0, 699.0, 366.0, 195.0, 115.0, 58.0, 45.0, 26.0, 13.0, 12.0, 8.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1953125, -11.822509765625, -11.44970703125, -11.076904296875, -10.7041015625, -10.331298828125, -9.95849609375, -9.585693359375, -9.212890625, -8.840087890625, -8.46728515625, -8.094482421875, -7.7216796875, -7.348876953125, -6.97607421875, -6.603271484375, -6.23046875, -5.857666015625, -5.48486328125, -5.112060546875, -4.7392578125, -4.366455078125, -3.99365234375, -3.620849609375, -3.248046875, -2.875244140625, -2.50244140625, -2.129638671875, -1.7568359375, -1.384033203125, -1.01123046875, -0.638427734375, -0.265625, 0.107177734375, 0.47998046875, 0.852783203125, 1.2255859375, 1.598388671875, 1.97119140625, 2.343994140625, 2.716796875, 3.089599609375, 3.46240234375, 3.835205078125, 4.2080078125, 4.580810546875, 4.95361328125, 5.326416015625, 5.69921875, 6.072021484375, 6.44482421875, 6.817626953125, 7.1904296875, 7.563232421875, 7.93603515625, 8.308837890625, 8.681640625, 9.054443359375, 9.42724609375, 9.800048828125, 10.1728515625, 10.545654296875, 10.91845703125, 11.291259765625, 11.6640625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 9.0, 7.0, 7.0, 17.0, 20.0, 25.0, 34.0, 33.0, 57.0, 64.0, 130.0, 203.0, 314.0, 588.0, 831.0, 677.0, 420.0, 208.0, 113.0, 83.0, 57.0, 45.0, 31.0, 21.0, 15.0, 14.0, 8.0, 9.0, 5.0, 1.0, 11.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.21875, -14.7662353515625, -14.313720703125, -13.8612060546875, -13.40869140625, -12.9561767578125, -12.503662109375, -12.0511474609375, -11.5986328125, -11.1461181640625, -10.693603515625, -10.2410888671875, -9.78857421875, -9.3360595703125, -8.883544921875, -8.4310302734375, -7.978515625, -7.5260009765625, -7.073486328125, -6.6209716796875, -6.16845703125, -5.7159423828125, -5.263427734375, -4.8109130859375, -4.3583984375, -3.9058837890625, -3.453369140625, -3.0008544921875, -2.54833984375, -2.0958251953125, -1.643310546875, -1.1907958984375, -0.73828125, -0.2857666015625, 0.166748046875, 0.6192626953125, 1.07177734375, 1.5242919921875, 1.976806640625, 2.4293212890625, 2.8818359375, 3.3343505859375, 3.786865234375, 4.2393798828125, 4.69189453125, 5.1444091796875, 5.596923828125, 6.0494384765625, 6.501953125, 6.9544677734375, 7.406982421875, 7.8594970703125, 8.31201171875, 8.7645263671875, 9.217041015625, 9.6695556640625, 10.1220703125, 10.5745849609375, 11.027099609375, 11.4796142578125, 11.93212890625, 12.3846435546875, 12.837158203125, 13.2896728515625, 13.7421875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 21.0, 38.0, 73.0, 142.0, 197.0, 195.0, 159.0, 86.0, 37.0, 14.0, 6.0, 7.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.47695922851562, -169.2062530517578, -163.935546875, -158.66482543945312, -153.3941192626953, -148.1234130859375, -142.8527069091797, -137.58200073242188, -132.311279296875, -127.04057312011719, -121.76985931396484, -116.49915313720703, -111.22843933105469, -105.95773315429688, -100.68702697753906, -95.41631317138672, -90.1456069946289, -84.8749008178711, -79.60418701171875, -74.33348083496094, -69.0627670288086, -63.79206085205078, -58.5213508605957, -53.250640869140625, -47.97993087768555, -42.70922088623047, -37.43851089477539, -32.16780090332031, -26.897092819213867, -21.62638282775879, -16.355674743652344, -11.084964752197266, -5.8142547607421875, -0.5435452461242676, 4.727164268493652, 9.997873306274414, 15.268583297729492, 20.53929328918457, 25.810001373291016, 31.080711364746094, 36.35142135620117, 41.62213134765625, 46.89284133911133, 52.163551330566406, 57.43425750732422, 62.70497131347656, 67.97567749023438, 73.24638366699219, 78.51709747314453, 83.78780364990234, 89.05851745605469, 94.3292236328125, 99.59993743896484, 104.87064361572266, 110.141357421875, 115.41206359863281, 120.68276977539062, 125.95347595214844, 131.22418212890625, 136.49490356445312, 141.76560974121094, 147.03631591796875, 152.30702209472656, 157.57772827148438, 162.84844970703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 1.0, 5.0, 4.0, 5.0, 8.0, 11.0, 10.0, 18.0, 19.0, 32.0, 35.0, 33.0, 43.0, 57.0, 51.0, 65.0, 76.0, 78.0, 65.0, 66.0, 66.0, 50.0, 31.0, 40.0, 41.0, 22.0, 15.0, 16.0, 16.0, 14.0, 2.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.43794250488281, -84.58455657958984, -81.73117065429688, -78.87779235839844, -76.02440643310547, -73.1710205078125, -70.31763458251953, -67.46424865722656, -64.6108627319336, -61.757476806640625, -58.90409469604492, -56.05070877075195, -53.197322845458984, -50.34394073486328, -47.49055480957031, -44.637168884277344, -41.78378677368164, -38.93040084838867, -36.07701873779297, -33.2236328125, -30.37024688720703, -27.516862869262695, -24.66347885131836, -21.81009292602539, -18.956708908081055, -16.10332489013672, -13.24993896484375, -10.396554946899414, -7.543169975280762, -4.689785003662109, -1.8364009857177734, 1.0169849395751953, 3.8703689575195312, 6.723753929138184, 9.577138900756836, 12.430522918701172, 15.283907890319824, 18.137292861938477, 20.990676879882812, 23.84406280517578, 26.697446823120117, 29.550830841064453, 32.40421676635742, 35.257598876953125, 38.110984802246094, 40.96437072753906, 43.81775665283203, 46.671142578125, 49.5245246887207, 52.37791061401367, 55.231292724609375, 58.084678649902344, 60.93806457519531, 63.79145050048828, 66.64483642578125, 69.49821472167969, 72.35160064697266, 75.20498657226562, 78.0583724975586, 80.91175842285156, 83.76513671875, 86.61852264404297, 89.47190856933594, 92.3252944946289, 95.17868041992188]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 5.0, 18.0, 24.0, 32.0, 52.0, 71.0, 108.0, 186.0, 293.0, 488.0, 835.0, 1499.0, 2801.0, 5304.0, 10649.0, 23082.0, 54383.0, 142473.0, 373836.0, 267378.0, 93999.0, 37246.0, 16708.0, 8063.0, 4002.0, 2049.0, 1199.0, 656.0, 406.0, 256.0, 151.0, 96.0, 62.0, 49.0, 22.0, 16.0, 15.0, 13.0, 2.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8515625, -11.43994140625, -11.0283203125, -10.61669921875, -10.205078125, -9.79345703125, -9.3818359375, -8.97021484375, -8.55859375, -8.14697265625, -7.7353515625, -7.32373046875, -6.912109375, -6.50048828125, -6.0888671875, -5.67724609375, -5.265625, -4.85400390625, -4.4423828125, -4.03076171875, -3.619140625, -3.20751953125, -2.7958984375, -2.38427734375, -1.97265625, -1.56103515625, -1.1494140625, -0.73779296875, -0.326171875, 0.08544921875, 0.4970703125, 0.90869140625, 1.3203125, 1.73193359375, 2.1435546875, 2.55517578125, 2.966796875, 3.37841796875, 3.7900390625, 4.20166015625, 4.61328125, 5.02490234375, 5.4365234375, 5.84814453125, 6.259765625, 6.67138671875, 7.0830078125, 7.49462890625, 7.90625, 8.31787109375, 8.7294921875, 9.14111328125, 9.552734375, 9.96435546875, 10.3759765625, 10.78759765625, 11.19921875, 11.61083984375, 12.0224609375, 12.43408203125, 12.845703125, 13.25732421875, 13.6689453125, 14.08056640625, 14.4921875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 11.0, 16.0, 12.0, 18.0, 13.0, 21.0, 36.0, 17.0, 27.0, 36.0, 43.0, 36.0, 35.0, 55.0, 45.0, 57.0, 39.0, 37.0, 49.0, 49.0, 52.0, 29.0, 40.0, 33.0, 33.0, 25.0, 11.0, 18.0, 21.0, 13.0, 13.0, 7.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.8671875, -5.672119140625, -5.47705078125, -5.281982421875, -5.0869140625, -4.891845703125, -4.69677734375, -4.501708984375, -4.306640625, -4.111572265625, -3.91650390625, -3.721435546875, -3.5263671875, -3.331298828125, -3.13623046875, -2.941162109375, -2.74609375, -2.551025390625, -2.35595703125, -2.160888671875, -1.9658203125, -1.770751953125, -1.57568359375, -1.380615234375, -1.185546875, -0.990478515625, -0.79541015625, -0.600341796875, -0.4052734375, -0.210205078125, -0.01513671875, 0.179931640625, 0.375, 0.570068359375, 0.76513671875, 0.960205078125, 1.1552734375, 1.350341796875, 1.54541015625, 1.740478515625, 1.935546875, 2.130615234375, 2.32568359375, 2.520751953125, 2.7158203125, 2.910888671875, 3.10595703125, 3.301025390625, 3.49609375, 3.691162109375, 3.88623046875, 4.081298828125, 4.2763671875, 4.471435546875, 4.66650390625, 4.861572265625, 5.056640625, 5.251708984375, 5.44677734375, 5.641845703125, 5.8369140625, 6.031982421875, 6.22705078125, 6.422119140625, 6.6171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 9.0, 13.0, 6.0, 9.0, 24.0, 29.0, 34.0, 79.0, 84.0, 111.0, 207.0, 345.0, 590.0, 1232.0, 2786.0, 8399.0, 32957.0, 186051.0, 667526.0, 114522.0, 22876.0, 6086.0, 2207.0, 1003.0, 493.0, 297.0, 169.0, 93.0, 87.0, 50.0, 37.0, 31.0, 26.0, 16.0, 15.0, 13.0, 7.0, 3.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-24.546875, -23.832763671875, -23.11865234375, -22.404541015625, -21.6904296875, -20.976318359375, -20.26220703125, -19.548095703125, -18.833984375, -18.119873046875, -17.40576171875, -16.691650390625, -15.9775390625, -15.263427734375, -14.54931640625, -13.835205078125, -13.12109375, -12.406982421875, -11.69287109375, -10.978759765625, -10.2646484375, -9.550537109375, -8.83642578125, -8.122314453125, -7.408203125, -6.694091796875, -5.97998046875, -5.265869140625, -4.5517578125, -3.837646484375, -3.12353515625, -2.409423828125, -1.6953125, -0.981201171875, -0.26708984375, 0.447021484375, 1.1611328125, 1.875244140625, 2.58935546875, 3.303466796875, 4.017578125, 4.731689453125, 5.44580078125, 6.159912109375, 6.8740234375, 7.588134765625, 8.30224609375, 9.016357421875, 9.73046875, 10.444580078125, 11.15869140625, 11.872802734375, 12.5869140625, 13.301025390625, 14.01513671875, 14.729248046875, 15.443359375, 16.157470703125, 16.87158203125, 17.585693359375, 18.2998046875, 19.013916015625, 19.72802734375, 20.442138671875, 21.15625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 1.0, 7.0, 10.0, 12.0, 16.0, 11.0, 17.0, 20.0, 15.0, 31.0, 53.0, 54.0, 43.0, 49.0, 57.0, 70.0, 65.0, 60.0, 61.0, 62.0, 45.0, 43.0, 41.0, 25.0, 30.0, 19.0, 14.0, 18.0, 12.0, 9.0, 8.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-36.4375, -35.491943359375, -34.54638671875, -33.600830078125, -32.6552734375, -31.709716796875, -30.76416015625, -29.818603515625, -28.873046875, -27.927490234375, -26.98193359375, -26.036376953125, -25.0908203125, -24.145263671875, -23.19970703125, -22.254150390625, -21.30859375, -20.363037109375, -19.41748046875, -18.471923828125, -17.5263671875, -16.580810546875, -15.63525390625, -14.689697265625, -13.744140625, -12.798583984375, -11.85302734375, -10.907470703125, -9.9619140625, -9.016357421875, -8.07080078125, -7.125244140625, -6.1796875, -5.234130859375, -4.28857421875, -3.343017578125, -2.3974609375, -1.451904296875, -0.50634765625, 0.439208984375, 1.384765625, 2.330322265625, 3.27587890625, 4.221435546875, 5.1669921875, 6.112548828125, 7.05810546875, 8.003662109375, 8.94921875, 9.894775390625, 10.84033203125, 11.785888671875, 12.7314453125, 13.677001953125, 14.62255859375, 15.568115234375, 16.513671875, 17.459228515625, 18.40478515625, 19.350341796875, 20.2958984375, 21.241455078125, 22.18701171875, 23.132568359375, 24.078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 10.0, 5.0, 3.0, 7.0, 13.0, 15.0, 18.0, 31.0, 48.0, 97.0, 217.0, 540.0, 1911.0, 11063.0, 339464.0, 675711.0, 15858.0, 2274.0, 720.0, 238.0, 126.0, 57.0, 31.0, 25.0, 15.0, 3.0, 8.0, 7.0, 6.0, 7.0, 3.0, 1.0, 8.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.3125, -18.69091796875, -18.0693359375, -17.44775390625, -16.826171875, -16.20458984375, -15.5830078125, -14.96142578125, -14.33984375, -13.71826171875, -13.0966796875, -12.47509765625, -11.853515625, -11.23193359375, -10.6103515625, -9.98876953125, -9.3671875, -8.74560546875, -8.1240234375, -7.50244140625, -6.880859375, -6.25927734375, -5.6376953125, -5.01611328125, -4.39453125, -3.77294921875, -3.1513671875, -2.52978515625, -1.908203125, -1.28662109375, -0.6650390625, -0.04345703125, 0.578125, 1.19970703125, 1.8212890625, 2.44287109375, 3.064453125, 3.68603515625, 4.3076171875, 4.92919921875, 5.55078125, 6.17236328125, 6.7939453125, 7.41552734375, 8.037109375, 8.65869140625, 9.2802734375, 9.90185546875, 10.5234375, 11.14501953125, 11.7666015625, 12.38818359375, 13.009765625, 13.63134765625, 14.2529296875, 14.87451171875, 15.49609375, 16.11767578125, 16.7392578125, 17.36083984375, 17.982421875, 18.60400390625, 19.2255859375, 19.84716796875, 20.46875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 4.0, 9.0, 12.0, 12.0, 22.0, 21.0, 27.0, 43.0, 59.0, 105.0, 154.0, 183.0, 113.0, 69.0, 43.0, 34.0, 16.0, 12.0, 11.0, 9.0, 7.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016984939575195312, -0.0016356557607650757, -0.0015728175640106201, -0.0015099793672561646, -0.001447141170501709, -0.0013843029737472534, -0.0013214647769927979, -0.0012586265802383423, -0.0011957883834838867, -0.0011329501867294312, -0.0010701119899749756, -0.00100727379322052, -0.0009444355964660645, -0.0008815973997116089, -0.0008187592029571533, -0.0007559210062026978, -0.0006930828094482422, -0.0006302446126937866, -0.0005674064159393311, -0.0005045682191848755, -0.0004417300224304199, -0.00037889182567596436, -0.0003160536289215088, -0.0002532154321670532, -0.00019037723541259766, -0.0001275390386581421, -6.470084190368652e-05, -1.862645149230957e-06, 6.097555160522461e-05, 0.00012381374835968018, 0.00018665194511413574, 0.0002494901418685913, 0.0003123283386230469, 0.00037516653537750244, 0.000438004732131958, 0.0005008429288864136, 0.0005636811256408691, 0.0006265193223953247, 0.0006893575191497803, 0.0007521957159042358, 0.0008150339126586914, 0.000877872109413147, 0.0009407103061676025, 0.001003548502922058, 0.0010663866996765137, 0.0011292248964309692, 0.0011920630931854248, 0.0012549012899398804, 0.001317739486694336, 0.0013805776834487915, 0.001443415880203247, 0.0015062540769577026, 0.0015690922737121582, 0.0016319304704666138, 0.0016947686672210693, 0.001757606863975525, 0.0018204450607299805, 0.001883283257484436, 0.0019461214542388916, 0.002008959650993347, 0.0020717978477478027, 0.0021346360445022583, 0.002197474241256714, 0.0022603124380111694, 0.002323150634765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 11.0, 25.0, 24.0, 45.0, 68.0, 113.0, 227.0, 453.0, 987.0, 2551.0, 9885.0, 83507.0, 795854.0, 135791.0, 13478.0, 3253.0, 1180.0, 508.0, 246.0, 123.0, 72.0, 36.0, 31.0, 17.0, 11.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.015625, -11.622802734375, -11.22998046875, -10.837158203125, -10.4443359375, -10.051513671875, -9.65869140625, -9.265869140625, -8.873046875, -8.480224609375, -8.08740234375, -7.694580078125, -7.3017578125, -6.908935546875, -6.51611328125, -6.123291015625, -5.73046875, -5.337646484375, -4.94482421875, -4.552001953125, -4.1591796875, -3.766357421875, -3.37353515625, -2.980712890625, -2.587890625, -2.195068359375, -1.80224609375, -1.409423828125, -1.0166015625, -0.623779296875, -0.23095703125, 0.161865234375, 0.5546875, 0.947509765625, 1.34033203125, 1.733154296875, 2.1259765625, 2.518798828125, 2.91162109375, 3.304443359375, 3.697265625, 4.090087890625, 4.48291015625, 4.875732421875, 5.2685546875, 5.661376953125, 6.05419921875, 6.447021484375, 6.83984375, 7.232666015625, 7.62548828125, 8.018310546875, 8.4111328125, 8.803955078125, 9.19677734375, 9.589599609375, 9.982421875, 10.375244140625, 10.76806640625, 11.160888671875, 11.5537109375, 11.946533203125, 12.33935546875, 12.732177734375, 13.125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 13.0, 11.0, 20.0, 28.0, 28.0, 32.0, 57.0, 78.0, 60.0, 88.0, 90.0, 100.0, 80.0, 66.0, 69.0, 32.0, 34.0, 18.0, 20.0, 16.0, 12.0, 8.0, 5.0, 10.0, 3.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.3125, -8.0509033203125, -7.789306640625, -7.5277099609375, -7.26611328125, -7.0045166015625, -6.742919921875, -6.4813232421875, -6.2197265625, -5.9581298828125, -5.696533203125, -5.4349365234375, -5.17333984375, -4.9117431640625, -4.650146484375, -4.3885498046875, -4.126953125, -3.8653564453125, -3.603759765625, -3.3421630859375, -3.08056640625, -2.8189697265625, -2.557373046875, -2.2957763671875, -2.0341796875, -1.7725830078125, -1.510986328125, -1.2493896484375, -0.98779296875, -0.7261962890625, -0.464599609375, -0.2030029296875, 0.05859375, 0.3201904296875, 0.581787109375, 0.8433837890625, 1.10498046875, 1.3665771484375, 1.628173828125, 1.8897705078125, 2.1513671875, 2.4129638671875, 2.674560546875, 2.9361572265625, 3.19775390625, 3.4593505859375, 3.720947265625, 3.9825439453125, 4.244140625, 4.5057373046875, 4.767333984375, 5.0289306640625, 5.29052734375, 5.5521240234375, 5.813720703125, 6.0753173828125, 6.3369140625, 6.5985107421875, 6.860107421875, 7.1217041015625, 7.38330078125, 7.6448974609375, 7.906494140625, 8.1680908203125, 8.4296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 9.0, 12.0, 39.0, 94.0, 231.0, 317.0, 176.0, 77.0, 21.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-318.7530822753906, -310.2478942871094, -301.7427062988281, -293.2375183105469, -284.73236083984375, -276.2271728515625, -267.72198486328125, -259.216796875, -250.71160888671875, -242.2064208984375, -233.70123291015625, -225.19606018066406, -216.6908721923828, -208.18568420410156, -199.68051147460938, -191.17532348632812, -182.67013549804688, -174.16494750976562, -165.65975952148438, -157.1545867919922, -148.64939880371094, -140.1442108154297, -131.6390380859375, -123.13385009765625, -114.628662109375, -106.12347412109375, -97.61829376220703, -89.11311340332031, -80.60792541503906, -72.10273742675781, -63.597557067871094, -55.09237289428711, -46.587158203125, -38.081974029541016, -29.57678985595703, -21.071605682373047, -12.566421508789062, -4.061237335205078, 4.443946838378906, 12.94913101196289, 21.454315185546875, 29.95949935913086, 38.464683532714844, 46.96986770629883, 55.47505187988281, 63.9802360534668, 72.48542022705078, 80.9906005859375, 89.49578857421875, 98.0009765625, 106.50615692138672, 115.01133728027344, 123.51652526855469, 132.02171325683594, 140.52688598632812, 149.03207397460938, 157.53726196289062, 166.04244995117188, 174.54763793945312, 183.0528106689453, 191.55799865722656, 200.0631866455078, 208.568359375, 217.07354736328125, 225.5787353515625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 9.0, 10.0, 11.0, 14.0, 14.0, 23.0, 23.0, 31.0, 25.0, 34.0, 38.0, 36.0, 44.0, 51.0, 80.0, 57.0, 68.0, 64.0, 61.0, 47.0, 36.0, 39.0, 35.0, 24.0, 20.0, 8.0, 20.0, 15.0, 7.0, 10.0, 7.0, 5.0, 8.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.76423645019531, -98.24395751953125, -94.72367858886719, -91.20339965820312, -87.68312072753906, -84.162841796875, -80.6425552368164, -77.12227630615234, -73.60199737548828, -70.08171844482422, -66.56143951416016, -63.04115676879883, -59.520877838134766, -56.0005989074707, -52.480316162109375, -48.96003723144531, -45.43975830078125, -41.91947937011719, -38.399200439453125, -34.8789176940918, -31.358638763427734, -27.838359832763672, -24.318078994750977, -20.79779815673828, -17.27751922607422, -13.75723934173584, -10.236959457397461, -6.716679573059082, -3.196399688720703, 0.3238792419433594, 3.8441600799560547, 7.36444091796875, 10.884719848632812, 14.404999732971191, 17.92527961730957, 21.445560455322266, 24.965839385986328, 28.48611831665039, 32.00640106201172, 35.52667999267578, 39.046958923339844, 42.567237854003906, 46.08751678466797, 49.6077995300293, 53.12807846069336, 56.64835739135742, 60.16864013671875, 63.68891906738281, 67.20919799804688, 70.72947692871094, 74.249755859375, 77.77003479003906, 81.29031372070312, 84.81059265136719, 88.33087921142578, 91.85115814208984, 95.3714370727539, 98.89171600341797, 102.41199493408203, 105.9322738647461, 109.45256042480469, 112.97283935546875, 116.49311828613281, 120.01339721679688, 123.53367614746094]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 9.0, 7.0, 11.0, 18.0, 24.0, 43.0, 60.0, 128.0, 213.0, 384.0, 785.0, 1742.0, 4101.0, 11465.0, 38179.0, 179708.0, 1538148.0, 2094384.0, 253550.0, 48060.0, 14290.0, 5169.0, 2019.0, 887.0, 407.0, 207.0, 100.0, 65.0, 41.0, 25.0, 16.0, 12.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.796875, -11.460693359375, -11.12451171875, -10.788330078125, -10.4521484375, -10.115966796875, -9.77978515625, -9.443603515625, -9.107421875, -8.771240234375, -8.43505859375, -8.098876953125, -7.7626953125, -7.426513671875, -7.09033203125, -6.754150390625, -6.41796875, -6.081787109375, -5.74560546875, -5.409423828125, -5.0732421875, -4.737060546875, -4.40087890625, -4.064697265625, -3.728515625, -3.392333984375, -3.05615234375, -2.719970703125, -2.3837890625, -2.047607421875, -1.71142578125, -1.375244140625, -1.0390625, -0.702880859375, -0.36669921875, -0.030517578125, 0.3056640625, 0.641845703125, 0.97802734375, 1.314208984375, 1.650390625, 1.986572265625, 2.32275390625, 2.658935546875, 2.9951171875, 3.331298828125, 3.66748046875, 4.003662109375, 4.33984375, 4.676025390625, 5.01220703125, 5.348388671875, 5.6845703125, 6.020751953125, 6.35693359375, 6.693115234375, 7.029296875, 7.365478515625, 7.70166015625, 8.037841796875, 8.3740234375, 8.710205078125, 9.04638671875, 9.382568359375, 9.71875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 2.0, 8.0, 15.0, 17.0, 23.0, 20.0, 19.0, 42.0, 43.0, 47.0, 55.0, 47.0, 48.0, 60.0, 55.0, 58.0, 66.0, 69.0, 53.0, 41.0, 51.0, 38.0, 33.0, 16.0, 20.0, 11.0, 14.0, 15.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.25, -9.01129150390625, -8.7725830078125, -8.53387451171875, -8.295166015625, -8.05645751953125, -7.8177490234375, -7.57904052734375, -7.34033203125, -7.10162353515625, -6.8629150390625, -6.62420654296875, -6.385498046875, -6.14678955078125, -5.9080810546875, -5.66937255859375, -5.4306640625, -5.19195556640625, -4.9532470703125, -4.71453857421875, -4.475830078125, -4.23712158203125, -3.9984130859375, -3.75970458984375, -3.52099609375, -3.28228759765625, -3.0435791015625, -2.80487060546875, -2.566162109375, -2.32745361328125, -2.0887451171875, -1.85003662109375, -1.611328125, -1.37261962890625, -1.1339111328125, -0.89520263671875, -0.656494140625, -0.41778564453125, -0.1790771484375, 0.05963134765625, 0.29833984375, 0.53704833984375, 0.7757568359375, 1.01446533203125, 1.253173828125, 1.49188232421875, 1.7305908203125, 1.96929931640625, 2.2080078125, 2.44671630859375, 2.6854248046875, 2.92413330078125, 3.162841796875, 3.40155029296875, 3.6402587890625, 3.87896728515625, 4.11767578125, 4.35638427734375, 4.5950927734375, 4.83380126953125, 5.072509765625, 5.31121826171875, 5.5499267578125, 5.78863525390625, 6.02734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 19.0, 20.0, 37.0, 40.0, 52.0, 86.0, 171.0, 335.0, 798.0, 1762.0, 4833.0, 15363.0, 60058.0, 373749.0, 2965703.0, 652654.0, 86884.0, 20847.0, 6485.0, 2435.0, 931.0, 438.0, 245.0, 121.0, 78.0, 38.0, 40.0, 15.0, 12.0, 9.0, 2.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.453125, -12.0179443359375, -11.582763671875, -11.1475830078125, -10.71240234375, -10.2772216796875, -9.842041015625, -9.4068603515625, -8.9716796875, -8.5364990234375, -8.101318359375, -7.6661376953125, -7.23095703125, -6.7957763671875, -6.360595703125, -5.9254150390625, -5.490234375, -5.0550537109375, -4.619873046875, -4.1846923828125, -3.74951171875, -3.3143310546875, -2.879150390625, -2.4439697265625, -2.0087890625, -1.5736083984375, -1.138427734375, -0.7032470703125, -0.26806640625, 0.1671142578125, 0.602294921875, 1.0374755859375, 1.47265625, 1.9078369140625, 2.343017578125, 2.7781982421875, 3.21337890625, 3.6485595703125, 4.083740234375, 4.5189208984375, 4.9541015625, 5.3892822265625, 5.824462890625, 6.2596435546875, 6.69482421875, 7.1300048828125, 7.565185546875, 8.0003662109375, 8.435546875, 8.8707275390625, 9.305908203125, 9.7410888671875, 10.17626953125, 10.6114501953125, 11.046630859375, 11.4818115234375, 11.9169921875, 12.3521728515625, 12.787353515625, 13.2225341796875, 13.65771484375, 14.0928955078125, 14.528076171875, 14.9632568359375, 15.3984375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 10.0, 7.0, 18.0, 36.0, 47.0, 64.0, 87.0, 111.0, 212.0, 351.0, 613.0, 720.0, 599.0, 422.0, 261.0, 163.0, 95.0, 68.0, 53.0, 34.0, 28.0, 21.0, 12.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46875, -16.91845703125, -16.3681640625, -15.81787109375, -15.267578125, -14.71728515625, -14.1669921875, -13.61669921875, -13.06640625, -12.51611328125, -11.9658203125, -11.41552734375, -10.865234375, -10.31494140625, -9.7646484375, -9.21435546875, -8.6640625, -8.11376953125, -7.5634765625, -7.01318359375, -6.462890625, -5.91259765625, -5.3623046875, -4.81201171875, -4.26171875, -3.71142578125, -3.1611328125, -2.61083984375, -2.060546875, -1.51025390625, -0.9599609375, -0.40966796875, 0.140625, 0.69091796875, 1.2412109375, 1.79150390625, 2.341796875, 2.89208984375, 3.4423828125, 3.99267578125, 4.54296875, 5.09326171875, 5.6435546875, 6.19384765625, 6.744140625, 7.29443359375, 7.8447265625, 8.39501953125, 8.9453125, 9.49560546875, 10.0458984375, 10.59619140625, 11.146484375, 11.69677734375, 12.2470703125, 12.79736328125, 13.34765625, 13.89794921875, 14.4482421875, 14.99853515625, 15.548828125, 16.09912109375, 16.6494140625, 17.19970703125, 17.75]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 11.0, 13.0, 36.0, 68.0, 139.0, 207.0, 213.0, 139.0, 86.0, 33.0, 24.0, 7.0, 7.0, 12.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-184.69189453125, -178.52099609375, -172.35011291503906, -166.17921447753906, -160.00831604003906, -153.83741760253906, -147.66653442382812, -141.49563598632812, -135.32473754882812, -129.15383911132812, -122.98294830322266, -116.81205749511719, -110.64115905761719, -104.47026824951172, -98.29937744140625, -92.12847900390625, -85.95758819580078, -79.78669738769531, -73.61579895019531, -67.44490814208984, -61.274009704589844, -55.103118896484375, -48.93222427368164, -42.761329650878906, -36.59043502807617, -30.419540405273438, -24.248645782470703, -18.0777530670166, -11.906858444213867, -5.735963821411133, 0.43492889404296875, 6.605823516845703, 12.776718139648438, 18.947612762451172, 25.118507385253906, 31.289400100708008, 37.460296630859375, 43.631187438964844, 49.80208206176758, 55.97297668457031, 62.14387130737305, 68.31476593017578, 74.48565673828125, 80.65655517578125, 86.82744598388672, 92.99834442138672, 99.16923522949219, 105.34013366699219, 111.51102447509766, 117.68191528320312, 123.85281372070312, 130.02371215820312, 136.19459533691406, 142.36549377441406, 148.53639221191406, 154.707275390625, 160.878173828125, 167.049072265625, 173.21995544433594, 179.39085388183594, 185.56175231933594, 191.73265075683594, 197.90353393554688, 204.07443237304688, 210.24533081054688]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 6.0, 13.0, 6.0, 8.0, 12.0, 18.0, 13.0, 23.0, 17.0, 36.0, 35.0, 34.0, 29.0, 53.0, 56.0, 48.0, 46.0, 54.0, 55.0, 52.0, 43.0, 59.0, 33.0, 37.0, 43.0, 23.0, 29.0, 24.0, 16.0, 12.0, 19.0, 9.0, 8.0, 9.0, 7.0, 4.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-98.24458312988281, -95.57222747802734, -92.89987182617188, -90.22750854492188, -87.5551528930664, -84.88279724121094, -82.21044158935547, -79.5380859375, -76.86572265625, -74.19336700439453, -71.52101135253906, -68.84864807128906, -66.1762924194336, -63.503936767578125, -60.831581115722656, -58.15922546386719, -55.48686981201172, -52.81451416015625, -50.142154693603516, -47.46979904174805, -44.79743957519531, -42.125083923339844, -39.452728271484375, -36.780372619628906, -34.10801315307617, -31.43565559387207, -28.76329803466797, -26.0909423828125, -23.4185848236084, -20.746227264404297, -18.073871612548828, -15.401514053344727, -12.729156494140625, -10.056798934936523, -7.384442329406738, -4.712085723876953, -2.0397281646728516, 0.63262939453125, 3.3049850463867188, 5.97734260559082, 8.649700164794922, 11.322057723999023, 13.994414329528809, 16.666770935058594, 19.339128494262695, 22.011486053466797, 24.683841705322266, 27.356199264526367, 30.02855682373047, 32.70091247558594, 35.37327194213867, 38.04562759399414, 40.717987060546875, 43.390342712402344, 46.06269836425781, 48.73505401611328, 51.407413482666016, 54.079769134521484, 56.75212860107422, 59.42448425292969, 62.096839904785156, 64.76919555664062, 67.44155883789062, 70.1139144897461, 72.78627014160156]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 9.0, 13.0, 14.0, 18.0, 28.0, 42.0, 82.0, 105.0, 173.0, 278.0, 436.0, 746.0, 1281.0, 2621.0, 5555.0, 12050.0, 28007.0, 66532.0, 155571.0, 321829.0, 256141.0, 111830.0, 47671.0, 19993.0, 8808.0, 4038.0, 1951.0, 1097.0, 642.0, 360.0, 194.0, 152.0, 87.0, 59.0, 47.0, 24.0, 23.0, 14.0, 9.0, 6.0, 4.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.109375, -11.7286376953125, -11.347900390625, -10.9671630859375, -10.58642578125, -10.2056884765625, -9.824951171875, -9.4442138671875, -9.0634765625, -8.6827392578125, -8.302001953125, -7.9212646484375, -7.54052734375, -7.1597900390625, -6.779052734375, -6.3983154296875, -6.017578125, -5.6368408203125, -5.256103515625, -4.8753662109375, -4.49462890625, -4.1138916015625, -3.733154296875, -3.3524169921875, -2.9716796875, -2.5909423828125, -2.210205078125, -1.8294677734375, -1.44873046875, -1.0679931640625, -0.687255859375, -0.3065185546875, 0.07421875, 0.4549560546875, 0.835693359375, 1.2164306640625, 1.59716796875, 1.9779052734375, 2.358642578125, 2.7393798828125, 3.1201171875, 3.5008544921875, 3.881591796875, 4.2623291015625, 4.64306640625, 5.0238037109375, 5.404541015625, 5.7852783203125, 6.166015625, 6.5467529296875, 6.927490234375, 7.3082275390625, 7.68896484375, 8.0697021484375, 8.450439453125, 8.8311767578125, 9.2119140625, 9.5926513671875, 9.973388671875, 10.3541259765625, 10.73486328125, 11.1156005859375, 11.496337890625, 11.8770751953125, 12.2578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 9.0, 11.0, 11.0, 9.0, 10.0, 14.0, 15.0, 31.0, 22.0, 29.0, 38.0, 33.0, 32.0, 45.0, 37.0, 42.0, 56.0, 48.0, 49.0, 36.0, 34.0, 55.0, 45.0, 31.0, 41.0, 31.0, 31.0, 18.0, 18.0, 22.0, 17.0, 15.0, 18.0, 10.0, 10.0, 9.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.1171875, -4.9429931640625, -4.768798828125, -4.5946044921875, -4.42041015625, -4.2462158203125, -4.072021484375, -3.8978271484375, -3.7236328125, -3.5494384765625, -3.375244140625, -3.2010498046875, -3.02685546875, -2.8526611328125, -2.678466796875, -2.5042724609375, -2.330078125, -2.1558837890625, -1.981689453125, -1.8074951171875, -1.63330078125, -1.4591064453125, -1.284912109375, -1.1107177734375, -0.9365234375, -0.7623291015625, -0.588134765625, -0.4139404296875, -0.23974609375, -0.0655517578125, 0.108642578125, 0.2828369140625, 0.45703125, 0.6312255859375, 0.805419921875, 0.9796142578125, 1.15380859375, 1.3280029296875, 1.502197265625, 1.6763916015625, 1.8505859375, 2.0247802734375, 2.198974609375, 2.3731689453125, 2.54736328125, 2.7215576171875, 2.895751953125, 3.0699462890625, 3.244140625, 3.4183349609375, 3.592529296875, 3.7667236328125, 3.94091796875, 4.1151123046875, 4.289306640625, 4.4635009765625, 4.6376953125, 4.8118896484375, 4.986083984375, 5.1602783203125, 5.33447265625, 5.5086669921875, 5.682861328125, 5.8570556640625, 6.03125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 10.0, 7.0, 7.0, 16.0, 14.0, 24.0, 28.0, 42.0, 67.0, 100.0, 166.0, 254.0, 489.0, 885.0, 1887.0, 4978.0, 33057.0, 671674.0, 307486.0, 19958.0, 3972.0, 1562.0, 740.0, 416.0, 261.0, 135.0, 92.0, 67.0, 47.0, 37.0, 29.0, 16.0, 6.0, 8.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.40625, -32.25, -31.09375, -29.9375, -28.78125, -27.625, -26.46875, -25.3125, -24.15625, -23.0, -21.84375, -20.6875, -19.53125, -18.375, -17.21875, -16.0625, -14.90625, -13.75, -12.59375, -11.4375, -10.28125, -9.125, -7.96875, -6.8125, -5.65625, -4.5, -3.34375, -2.1875, -1.03125, 0.125, 1.28125, 2.4375, 3.59375, 4.75, 5.90625, 7.0625, 8.21875, 9.375, 10.53125, 11.6875, 12.84375, 14.0, 15.15625, 16.3125, 17.46875, 18.625, 19.78125, 20.9375, 22.09375, 23.25, 24.40625, 25.5625, 26.71875, 27.875, 29.03125, 30.1875, 31.34375, 32.5, 33.65625, 34.8125, 35.96875, 37.125, 38.28125, 39.4375, 40.59375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 9.0, 5.0, 5.0, 10.0, 12.0, 18.0, 12.0, 13.0, 23.0, 28.0, 14.0, 24.0, 31.0, 29.0, 24.0, 53.0, 41.0, 44.0, 47.0, 45.0, 42.0, 47.0, 43.0, 49.0, 50.0, 41.0, 32.0, 33.0, 32.0, 18.0, 25.0, 19.0, 16.0, 11.0, 7.0, 18.0, 8.0, 7.0, 1.0, 7.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.75, -22.035400390625, -21.32080078125, -20.606201171875, -19.8916015625, -19.177001953125, -18.46240234375, -17.747802734375, -17.033203125, -16.318603515625, -15.60400390625, -14.889404296875, -14.1748046875, -13.460205078125, -12.74560546875, -12.031005859375, -11.31640625, -10.601806640625, -9.88720703125, -9.172607421875, -8.4580078125, -7.743408203125, -7.02880859375, -6.314208984375, -5.599609375, -4.885009765625, -4.17041015625, -3.455810546875, -2.7412109375, -2.026611328125, -1.31201171875, -0.597412109375, 0.1171875, 0.831787109375, 1.54638671875, 2.260986328125, 2.9755859375, 3.690185546875, 4.40478515625, 5.119384765625, 5.833984375, 6.548583984375, 7.26318359375, 7.977783203125, 8.6923828125, 9.406982421875, 10.12158203125, 10.836181640625, 11.55078125, 12.265380859375, 12.97998046875, 13.694580078125, 14.4091796875, 15.123779296875, 15.83837890625, 16.552978515625, 17.267578125, 17.982177734375, 18.69677734375, 19.411376953125, 20.1259765625, 20.840576171875, 21.55517578125, 22.269775390625, 22.984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 4.0, 16.0, 19.0, 43.0, 52.0, 78.0, 120.0, 254.0, 530.0, 1606.0, 8925.0, 97047.0, 824871.0, 102573.0, 9457.0, 1765.0, 560.0, 249.0, 147.0, 66.0, 49.0, 20.0, 23.0, 16.0, 10.0, 11.0, 8.0, 4.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9190673828125, -10.549072265625, -10.1790771484375, -9.80908203125, -9.4390869140625, -9.069091796875, -8.6990966796875, -8.3291015625, -7.9591064453125, -7.589111328125, -7.2191162109375, -6.84912109375, -6.4791259765625, -6.109130859375, -5.7391357421875, -5.369140625, -4.9991455078125, -4.629150390625, -4.2591552734375, -3.88916015625, -3.5191650390625, -3.149169921875, -2.7791748046875, -2.4091796875, -2.0391845703125, -1.669189453125, -1.2991943359375, -0.92919921875, -0.5592041015625, -0.189208984375, 0.1807861328125, 0.55078125, 0.9207763671875, 1.290771484375, 1.6607666015625, 2.03076171875, 2.4007568359375, 2.770751953125, 3.1407470703125, 3.5107421875, 3.8807373046875, 4.250732421875, 4.6207275390625, 4.99072265625, 5.3607177734375, 5.730712890625, 6.1007080078125, 6.470703125, 6.8406982421875, 7.210693359375, 7.5806884765625, 7.95068359375, 8.3206787109375, 8.690673828125, 9.0606689453125, 9.4306640625, 9.8006591796875, 10.170654296875, 10.5406494140625, 10.91064453125, 11.2806396484375, 11.650634765625, 12.0206298828125, 12.390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 6.0, 4.0, 7.0, 8.0, 16.0, 11.0, 16.0, 14.0, 19.0, 25.0, 32.0, 34.0, 44.0, 56.0, 84.0, 116.0, 131.0, 73.0, 66.0, 43.0, 41.0, 22.0, 21.0, 17.0, 19.0, 13.0, 7.0, 18.0, 12.0, 9.0, 10.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0021343231201171875, -0.002076566219329834, -0.0020188093185424805, -0.001961052417755127, -0.0019032955169677734, -0.00184553861618042, -0.0017877817153930664, -0.0017300248146057129, -0.0016722679138183594, -0.0016145110130310059, -0.0015567541122436523, -0.0014989972114562988, -0.0014412403106689453, -0.0013834834098815918, -0.0013257265090942383, -0.0012679696083068848, -0.0012102127075195312, -0.0011524558067321777, -0.0010946989059448242, -0.0010369420051574707, -0.0009791851043701172, -0.0009214282035827637, -0.0008636713027954102, -0.0008059144020080566, -0.0007481575012207031, -0.0006904006004333496, -0.0006326436996459961, -0.0005748867988586426, -0.0005171298980712891, -0.00045937299728393555, -0.00040161609649658203, -0.0003438591957092285, -0.000286102294921875, -0.00022834539413452148, -0.00017058849334716797, -0.00011283159255981445, -5.507469177246094e-05, 2.682209014892578e-06, 6.0439109802246094e-05, 0.00011819601058959961, 0.00017595291137695312, 0.00023370981216430664, 0.00029146671295166016, 0.00034922361373901367, 0.0004069805145263672, 0.0004647374153137207, 0.0005224943161010742, 0.0005802512168884277, 0.0006380081176757812, 0.0006957650184631348, 0.0007535219192504883, 0.0008112788200378418, 0.0008690357208251953, 0.0009267926216125488, 0.0009845495223999023, 0.0010423064231872559, 0.0011000633239746094, 0.0011578202247619629, 0.0012155771255493164, 0.00127333402633667, 0.0013310909271240234, 0.001388847827911377, 0.0014466047286987305, 0.001504361629486084, 0.0015621185302734375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 14.0, 15.0, 22.0, 24.0, 45.0, 53.0, 92.0, 137.0, 239.0, 420.0, 786.0, 1717.0, 4384.0, 17819.0, 137233.0, 755196.0, 107915.0, 15119.0, 4053.0, 1495.0, 734.0, 373.0, 233.0, 147.0, 98.0, 48.0, 41.0, 28.0, 18.0, 11.0, 7.0, 2.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.09503173828125, -6.8267822265625, -6.55853271484375, -6.290283203125, -6.02203369140625, -5.7537841796875, -5.48553466796875, -5.21728515625, -4.94903564453125, -4.6807861328125, -4.41253662109375, -4.144287109375, -3.87603759765625, -3.6077880859375, -3.33953857421875, -3.0712890625, -2.80303955078125, -2.5347900390625, -2.26654052734375, -1.998291015625, -1.73004150390625, -1.4617919921875, -1.19354248046875, -0.92529296875, -0.65704345703125, -0.3887939453125, -0.12054443359375, 0.147705078125, 0.41595458984375, 0.6842041015625, 0.95245361328125, 1.220703125, 1.48895263671875, 1.7572021484375, 2.02545166015625, 2.293701171875, 2.56195068359375, 2.8302001953125, 3.09844970703125, 3.36669921875, 3.63494873046875, 3.9031982421875, 4.17144775390625, 4.439697265625, 4.70794677734375, 4.9761962890625, 5.24444580078125, 5.5126953125, 5.78094482421875, 6.0491943359375, 6.31744384765625, 6.585693359375, 6.85394287109375, 7.1221923828125, 7.39044189453125, 7.65869140625, 7.92694091796875, 8.1951904296875, 8.46343994140625, 8.731689453125, 8.99993896484375, 9.2681884765625, 9.53643798828125, 9.8046875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 6.0, 1.0, 4.0, 11.0, 14.0, 16.0, 14.0, 17.0, 23.0, 31.0, 31.0, 50.0, 44.0, 51.0, 58.0, 65.0, 77.0, 86.0, 60.0, 62.0, 63.0, 49.0, 43.0, 36.0, 22.0, 14.0, 12.0, 9.0, 12.0, 7.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.203125, -6.99713134765625, -6.7911376953125, -6.58514404296875, -6.379150390625, -6.17315673828125, -5.9671630859375, -5.76116943359375, -5.55517578125, -5.34918212890625, -5.1431884765625, -4.93719482421875, -4.731201171875, -4.52520751953125, -4.3192138671875, -4.11322021484375, -3.9072265625, -3.70123291015625, -3.4952392578125, -3.28924560546875, -3.083251953125, -2.87725830078125, -2.6712646484375, -2.46527099609375, -2.25927734375, -2.05328369140625, -1.8472900390625, -1.64129638671875, -1.435302734375, -1.22930908203125, -1.0233154296875, -0.81732177734375, -0.611328125, -0.40533447265625, -0.1993408203125, 0.00665283203125, 0.212646484375, 0.41864013671875, 0.6246337890625, 0.83062744140625, 1.03662109375, 1.24261474609375, 1.4486083984375, 1.65460205078125, 1.860595703125, 2.06658935546875, 2.2725830078125, 2.47857666015625, 2.6845703125, 2.89056396484375, 3.0965576171875, 3.30255126953125, 3.508544921875, 3.71453857421875, 3.9205322265625, 4.12652587890625, 4.33251953125, 4.53851318359375, 4.7445068359375, 4.95050048828125, 5.156494140625, 5.36248779296875, 5.5684814453125, 5.77447509765625, 5.98046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 11.0, 31.0, 55.0, 168.0, 319.0, 239.0, 105.0, 42.0, 15.0, 10.0, 6.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.81739807128906, -76.09461975097656, -67.37184143066406, -58.6490592956543, -49.9262809753418, -41.2035026550293, -32.48072052001953, -23.75794219970703, -15.035163879394531, -6.312384605407715, 2.4103946685791016, 11.133174896240234, 19.855953216552734, 28.578731536865234, 37.301513671875, 46.0242919921875, 54.7470703125, 63.4698486328125, 72.192626953125, 80.9154052734375, 89.63818359375, 98.3609619140625, 107.08374786376953, 115.80652618408203, 124.52930450439453, 133.25209045410156, 141.97486877441406, 150.69764709472656, 159.42042541503906, 168.14320373535156, 176.86598205566406, 185.58876037597656, 194.31155395507812, 203.03433227539062, 211.75711059570312, 220.47988891601562, 229.20266723632812, 237.92544555664062, 246.64822387695312, 255.37100219726562, 264.0937805175781, 272.8165588378906, 281.5393371582031, 290.2621154785156, 298.9848937988281, 307.7076721191406, 316.4304504394531, 325.1532287597656, 333.87603759765625, 342.59881591796875, 351.32159423828125, 360.04437255859375, 368.76715087890625, 377.48992919921875, 386.21270751953125, 394.93548583984375, 403.65826416015625, 412.38104248046875, 421.10382080078125, 429.82659912109375, 438.54937744140625, 447.27215576171875, 455.99493408203125, 464.71771240234375, 473.44049072265625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 10.0, 19.0, 10.0, 26.0, 29.0, 27.0, 32.0, 47.0, 46.0, 64.0, 81.0, 94.0, 98.0, 93.0, 53.0, 55.0, 39.0, 37.0, 33.0, 33.0, 17.0, 19.0, 7.0, 4.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.45133972167969, -110.85551452636719, -106.25968933105469, -101.66386413574219, -97.06803894042969, -92.47221374511719, -87.87638854980469, -83.28056335449219, -78.68473815917969, -74.08891296386719, -69.49308776855469, -64.89726257324219, -60.30143737792969, -55.70561218261719, -51.10978698730469, -46.51396179199219, -41.91813659667969, -37.32231140136719, -32.72648620605469, -28.130661010742188, -23.534835815429688, -18.939010620117188, -14.343185424804688, -9.747360229492188, -5.1515350341796875, -0.5557098388671875, 4.0401153564453125, 8.635940551757812, 13.231765747070312, 17.827590942382812, 22.423416137695312, 27.019241333007812, 31.615081787109375, 36.210906982421875, 40.806732177734375, 45.402557373046875, 49.998382568359375, 54.594207763671875, 59.190032958984375, 63.785858154296875, 68.38168334960938, 72.97750854492188, 77.57333374023438, 82.16915893554688, 86.76498413085938, 91.36080932617188, 95.95663452148438, 100.55245971679688, 105.14828491210938, 109.74411010742188, 114.33993530273438, 118.93576049804688, 123.53158569335938, 128.12741088867188, 132.72323608398438, 137.31906127929688, 141.91488647460938, 146.51071166992188, 151.10653686523438, 155.70236206054688, 160.29818725585938, 164.89401245117188, 169.48983764648438, 174.08566284179688, 178.68148803710938]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 14.0, 30.0, 56.0, 114.0, 258.0, 677.0, 1605.0, 4414.0, 14552.0, 65385.0, 752546.0, 3064360.0, 244069.0, 33386.0, 8466.0, 2590.0, 925.0, 417.0, 174.0, 91.0, 66.0, 34.0, 20.0, 11.0, 9.0, 7.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59375, -6.1630859375, -5.732421875, -5.3017578125, -4.87109375, -4.4404296875, -4.009765625, -3.5791015625, -3.1484375, -2.7177734375, -2.287109375, -1.8564453125, -1.42578125, -0.9951171875, -0.564453125, -0.1337890625, 0.296875, 0.7275390625, 1.158203125, 1.5888671875, 2.01953125, 2.4501953125, 2.880859375, 3.3115234375, 3.7421875, 4.1728515625, 4.603515625, 5.0341796875, 5.46484375, 5.8955078125, 6.326171875, 6.7568359375, 7.1875, 7.6181640625, 8.048828125, 8.4794921875, 8.91015625, 9.3408203125, 9.771484375, 10.2021484375, 10.6328125, 11.0634765625, 11.494140625, 11.9248046875, 12.35546875, 12.7861328125, 13.216796875, 13.6474609375, 14.078125, 14.5087890625, 14.939453125, 15.3701171875, 15.80078125, 16.2314453125, 16.662109375, 17.0927734375, 17.5234375, 17.9541015625, 18.384765625, 18.8154296875, 19.24609375, 19.6767578125, 20.107421875, 20.5380859375, 20.96875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [5.0, 6.0, 8.0, 13.0, 24.0, 49.0, 65.0, 67.0, 82.0, 110.0, 115.0, 107.0, 101.0, 79.0, 58.0, 44.0, 31.0, 23.0, 14.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.085693359375, -3.67138671875, -3.257080078125, -2.8427734375, -2.428466796875, -2.01416015625, -1.599853515625, -1.185546875, -0.771240234375, -0.35693359375, 0.057373046875, 0.4716796875, 0.885986328125, 1.30029296875, 1.714599609375, 2.12890625, 2.543212890625, 2.95751953125, 3.371826171875, 3.7861328125, 4.200439453125, 4.61474609375, 5.029052734375, 5.443359375, 5.857666015625, 6.27197265625, 6.686279296875, 7.1005859375, 7.514892578125, 7.92919921875, 8.343505859375, 8.7578125, 9.172119140625, 9.58642578125, 10.000732421875, 10.4150390625, 10.829345703125, 11.24365234375, 11.657958984375, 12.072265625, 12.486572265625, 12.90087890625, 13.315185546875, 13.7294921875, 14.143798828125, 14.55810546875, 14.972412109375, 15.38671875, 15.801025390625, 16.21533203125, 16.629638671875, 17.0439453125, 17.458251953125, 17.87255859375, 18.286865234375, 18.701171875, 19.115478515625, 19.52978515625, 19.944091796875, 20.3583984375, 20.772705078125, 21.18701171875, 21.601318359375, 22.015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 12.0, 11.0, 29.0, 37.0, 45.0, 103.0, 139.0, 364.0, 872.0, 2221.0, 7013.0, 26606.0, 152598.0, 2717414.0, 1182221.0, 81553.0, 15878.0, 4182.0, 1482.0, 648.0, 327.0, 199.0, 119.0, 83.0, 40.0, 29.0, 17.0, 17.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.703125, -16.161865234375, -15.62060546875, -15.079345703125, -14.5380859375, -13.996826171875, -13.45556640625, -12.914306640625, -12.373046875, -11.831787109375, -11.29052734375, -10.749267578125, -10.2080078125, -9.666748046875, -9.12548828125, -8.584228515625, -8.04296875, -7.501708984375, -6.96044921875, -6.419189453125, -5.8779296875, -5.336669921875, -4.79541015625, -4.254150390625, -3.712890625, -3.171630859375, -2.63037109375, -2.089111328125, -1.5478515625, -1.006591796875, -0.46533203125, 0.075927734375, 0.6171875, 1.158447265625, 1.69970703125, 2.240966796875, 2.7822265625, 3.323486328125, 3.86474609375, 4.406005859375, 4.947265625, 5.488525390625, 6.02978515625, 6.571044921875, 7.1123046875, 7.653564453125, 8.19482421875, 8.736083984375, 9.27734375, 9.818603515625, 10.35986328125, 10.901123046875, 11.4423828125, 11.983642578125, 12.52490234375, 13.066162109375, 13.607421875, 14.148681640625, 14.68994140625, 15.231201171875, 15.7724609375, 16.313720703125, 16.85498046875, 17.396240234375, 17.9375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 7.0, 7.0, 10.0, 16.0, 29.0, 23.0, 38.0, 75.0, 105.0, 184.0, 281.0, 542.0, 836.0, 793.0, 483.0, 244.0, 146.0, 79.0, 59.0, 36.0, 21.0, 18.0, 10.0, 9.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.18603515625, -11.5751953125, -10.96435546875, -10.353515625, -9.74267578125, -9.1318359375, -8.52099609375, -7.91015625, -7.29931640625, -6.6884765625, -6.07763671875, -5.466796875, -4.85595703125, -4.2451171875, -3.63427734375, -3.0234375, -2.41259765625, -1.8017578125, -1.19091796875, -0.580078125, 0.03076171875, 0.6416015625, 1.25244140625, 1.86328125, 2.47412109375, 3.0849609375, 3.69580078125, 4.306640625, 4.91748046875, 5.5283203125, 6.13916015625, 6.75, 7.36083984375, 7.9716796875, 8.58251953125, 9.193359375, 9.80419921875, 10.4150390625, 11.02587890625, 11.63671875, 12.24755859375, 12.8583984375, 13.46923828125, 14.080078125, 14.69091796875, 15.3017578125, 15.91259765625, 16.5234375, 17.13427734375, 17.7451171875, 18.35595703125, 18.966796875, 19.57763671875, 20.1884765625, 20.79931640625, 21.41015625, 22.02099609375, 22.6318359375, 23.24267578125, 23.853515625, 24.46435546875, 25.0751953125, 25.68603515625, 26.296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 8.0, 12.0, 37.0, 56.0, 128.0, 254.0, 231.0, 148.0, 69.0, 27.0, 7.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-373.190185546875, -365.7127990722656, -358.23541259765625, -350.758056640625, -343.2806701660156, -335.80328369140625, -328.3258972167969, -320.8485107421875, -313.37115478515625, -305.8937683105469, -298.4163818359375, -290.93902587890625, -283.4616394042969, -275.9842529296875, -268.5068664550781, -261.02947998046875, -253.55209350585938, -246.07470703125, -238.5973358154297, -231.1199493408203, -223.642578125, -216.16519165039062, -208.68780517578125, -201.21041870117188, -193.73304748535156, -186.2556610107422, -178.77828979492188, -171.3009033203125, -163.82351684570312, -156.3461456298828, -148.86875915527344, -141.39138793945312, -133.91400146484375, -126.4366226196289, -118.95924377441406, -111.48185729980469, -104.00447845458984, -96.527099609375, -89.04971313476562, -81.57233428955078, -74.09496307373047, -66.61758422851562, -59.140201568603516, -51.662818908691406, -44.18544006347656, -36.70806121826172, -29.23067855834961, -21.7532958984375, -14.275917053222656, -6.79853630065918, 0.6788444519042969, 8.156225204467773, 15.63360595703125, 23.110984802246094, 30.588367462158203, 38.06575012207031, 45.543128967285156, 53.0205078125, 60.49789047241211, 67.97527313232422, 75.45265197753906, 82.9300308227539, 90.40740966796875, 97.88479614257812, 105.36217498779297]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 13.0, 13.0, 27.0, 20.0, 20.0, 33.0, 44.0, 37.0, 63.0, 51.0, 63.0, 76.0, 54.0, 72.0, 63.0, 57.0, 63.0, 51.0, 37.0, 36.0, 26.0, 26.0, 19.0, 11.0, 9.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.67156982421875, -138.99705505371094, -135.3225555419922, -131.64804077148438, -127.97352600097656, -124.29901885986328, -120.62451171875, -116.94999694824219, -113.2754898071289, -109.60098266601562, -105.92646789550781, -102.25196075439453, -98.57745361328125, -94.90293884277344, -91.22843170166016, -87.55392456054688, -83.87940979003906, -80.20490264892578, -76.53038787841797, -72.85588073730469, -69.18136596679688, -65.5068588256836, -61.83235168457031, -58.157840728759766, -54.48332977294922, -50.80881881713867, -47.134307861328125, -43.459800720214844, -39.7852897644043, -36.11077880859375, -32.43627166748047, -28.761760711669922, -25.087242126464844, -21.412731170654297, -17.738222122192383, -14.063712120056152, -10.389202117919922, -6.714691162109375, -3.040182113647461, 0.6343269348144531, 4.308837890625, 7.9833478927612305, 11.657857894897461, 15.332367897033691, 19.006877899169922, 22.68138885498047, 26.355897903442383, 30.030406951904297, 33.704917907714844, 37.37942886352539, 41.05393981933594, 44.72844696044922, 48.402957916259766, 52.07746887207031, 55.751976013183594, 59.42648696899414, 63.10099792480469, 66.77550506591797, 70.45001983642578, 74.12452697753906, 77.79904174804688, 81.47354888916016, 85.14805603027344, 88.82257080078125, 92.49707794189453]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 5.0, 6.0, 7.0, 11.0, 18.0, 26.0, 28.0, 51.0, 64.0, 127.0, 167.0, 294.0, 434.0, 687.0, 1148.0, 2012.0, 3364.0, 6231.0, 11707.0, 23770.0, 50251.0, 113701.0, 267578.0, 306427.0, 141068.0, 60376.0, 28243.0, 13996.0, 7146.0, 3878.0, 2265.0, 1342.0, 761.0, 493.0, 291.0, 206.0, 133.0, 85.0, 49.0, 34.0, 17.0, 18.0, 12.0, 13.0, 7.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.203369140625, -9.87548828125, -9.547607421875, -9.2197265625, -8.891845703125, -8.56396484375, -8.236083984375, -7.908203125, -7.580322265625, -7.25244140625, -6.924560546875, -6.5966796875, -6.268798828125, -5.94091796875, -5.613037109375, -5.28515625, -4.957275390625, -4.62939453125, -4.301513671875, -3.9736328125, -3.645751953125, -3.31787109375, -2.989990234375, -2.662109375, -2.334228515625, -2.00634765625, -1.678466796875, -1.3505859375, -1.022705078125, -0.69482421875, -0.366943359375, -0.0390625, 0.288818359375, 0.61669921875, 0.944580078125, 1.2724609375, 1.600341796875, 1.92822265625, 2.256103515625, 2.583984375, 2.911865234375, 3.23974609375, 3.567626953125, 3.8955078125, 4.223388671875, 4.55126953125, 4.879150390625, 5.20703125, 5.534912109375, 5.86279296875, 6.190673828125, 6.5185546875, 6.846435546875, 7.17431640625, 7.502197265625, 7.830078125, 8.157958984375, 8.48583984375, 8.813720703125, 9.1416015625, 9.469482421875, 9.79736328125, 10.125244140625, 10.453125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 4.0, 1.0, 12.0, 6.0, 13.0, 20.0, 24.0, 20.0, 29.0, 26.0, 22.0, 29.0, 25.0, 37.0, 34.0, 38.0, 34.0, 36.0, 48.0, 40.0, 48.0, 42.0, 36.0, 38.0, 34.0, 32.0, 36.0, 35.0, 36.0, 26.0, 21.0, 21.0, 12.0, 20.0, 10.0, 12.0, 5.0, 9.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.328125, -5.14849853515625, -4.9688720703125, -4.78924560546875, -4.609619140625, -4.42999267578125, -4.2503662109375, -4.07073974609375, -3.89111328125, -3.71148681640625, -3.5318603515625, -3.35223388671875, -3.172607421875, -2.99298095703125, -2.8133544921875, -2.63372802734375, -2.4541015625, -2.27447509765625, -2.0948486328125, -1.91522216796875, -1.735595703125, -1.55596923828125, -1.3763427734375, -1.19671630859375, -1.01708984375, -0.83746337890625, -0.6578369140625, -0.47821044921875, -0.298583984375, -0.11895751953125, 0.0606689453125, 0.24029541015625, 0.419921875, 0.59954833984375, 0.7791748046875, 0.95880126953125, 1.138427734375, 1.31805419921875, 1.4976806640625, 1.67730712890625, 1.85693359375, 2.03656005859375, 2.2161865234375, 2.39581298828125, 2.575439453125, 2.75506591796875, 2.9346923828125, 3.11431884765625, 3.2939453125, 3.47357177734375, 3.6531982421875, 3.83282470703125, 4.012451171875, 4.19207763671875, 4.3717041015625, 4.55133056640625, 4.73095703125, 4.91058349609375, 5.0902099609375, 5.26983642578125, 5.449462890625, 5.62908935546875, 5.8087158203125, 5.98834228515625, 6.16796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 5.0, 10.0, 6.0, 12.0, 21.0, 21.0, 32.0, 48.0, 60.0, 62.0, 98.0, 134.0, 195.0, 268.0, 392.0, 665.0, 968.0, 1801.0, 4045.0, 12109.0, 53303.0, 374878.0, 519036.0, 58026.0, 13144.0, 4315.0, 1918.0, 1034.0, 617.0, 362.0, 266.0, 198.0, 127.0, 104.0, 69.0, 52.0, 32.0, 18.0, 19.0, 21.0, 9.0, 7.0, 7.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.171875, -21.457275390625, -20.74267578125, -20.028076171875, -19.3134765625, -18.598876953125, -17.88427734375, -17.169677734375, -16.455078125, -15.740478515625, -15.02587890625, -14.311279296875, -13.5966796875, -12.882080078125, -12.16748046875, -11.452880859375, -10.73828125, -10.023681640625, -9.30908203125, -8.594482421875, -7.8798828125, -7.165283203125, -6.45068359375, -5.736083984375, -5.021484375, -4.306884765625, -3.59228515625, -2.877685546875, -2.1630859375, -1.448486328125, -0.73388671875, -0.019287109375, 0.6953125, 1.409912109375, 2.12451171875, 2.839111328125, 3.5537109375, 4.268310546875, 4.98291015625, 5.697509765625, 6.412109375, 7.126708984375, 7.84130859375, 8.555908203125, 9.2705078125, 9.985107421875, 10.69970703125, 11.414306640625, 12.12890625, 12.843505859375, 13.55810546875, 14.272705078125, 14.9873046875, 15.701904296875, 16.41650390625, 17.131103515625, 17.845703125, 18.560302734375, 19.27490234375, 19.989501953125, 20.7041015625, 21.418701171875, 22.13330078125, 22.847900390625, 23.5625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 3.0, 7.0, 3.0, 7.0, 9.0, 17.0, 21.0, 15.0, 20.0, 36.0, 35.0, 38.0, 38.0, 48.0, 48.0, 48.0, 59.0, 68.0, 57.0, 46.0, 70.0, 52.0, 42.0, 38.0, 33.0, 32.0, 19.0, 21.0, 11.0, 18.0, 12.0, 7.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.265625, -26.317626953125, -25.36962890625, -24.421630859375, -23.4736328125, -22.525634765625, -21.57763671875, -20.629638671875, -19.681640625, -18.733642578125, -17.78564453125, -16.837646484375, -15.8896484375, -14.941650390625, -13.99365234375, -13.045654296875, -12.09765625, -11.149658203125, -10.20166015625, -9.253662109375, -8.3056640625, -7.357666015625, -6.40966796875, -5.461669921875, -4.513671875, -3.565673828125, -2.61767578125, -1.669677734375, -0.7216796875, 0.226318359375, 1.17431640625, 2.122314453125, 3.0703125, 4.018310546875, 4.96630859375, 5.914306640625, 6.8623046875, 7.810302734375, 8.75830078125, 9.706298828125, 10.654296875, 11.602294921875, 12.55029296875, 13.498291015625, 14.4462890625, 15.394287109375, 16.34228515625, 17.290283203125, 18.23828125, 19.186279296875, 20.13427734375, 21.082275390625, 22.0302734375, 22.978271484375, 23.92626953125, 24.874267578125, 25.822265625, 26.770263671875, 27.71826171875, 28.666259765625, 29.6142578125, 30.562255859375, 31.51025390625, 32.458251953125, 33.40625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 10.0, 12.0, 12.0, 24.0, 37.0, 50.0, 110.0, 134.0, 275.0, 584.0, 1612.0, 5649.0, 28765.0, 251305.0, 690412.0, 56076.0, 9418.0, 2450.0, 820.0, 367.0, 158.0, 88.0, 73.0, 40.0, 18.0, 14.0, 6.0, 10.0, 10.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0911865234375, -8.799560546875, -8.5079345703125, -8.21630859375, -7.9246826171875, -7.633056640625, -7.3414306640625, -7.0498046875, -6.7581787109375, -6.466552734375, -6.1749267578125, -5.88330078125, -5.5916748046875, -5.300048828125, -5.0084228515625, -4.716796875, -4.4251708984375, -4.133544921875, -3.8419189453125, -3.55029296875, -3.2586669921875, -2.967041015625, -2.6754150390625, -2.3837890625, -2.0921630859375, -1.800537109375, -1.5089111328125, -1.21728515625, -0.9256591796875, -0.634033203125, -0.3424072265625, -0.05078125, 0.2408447265625, 0.532470703125, 0.8240966796875, 1.11572265625, 1.4073486328125, 1.698974609375, 1.9906005859375, 2.2822265625, 2.5738525390625, 2.865478515625, 3.1571044921875, 3.44873046875, 3.7403564453125, 4.031982421875, 4.3236083984375, 4.615234375, 4.9068603515625, 5.198486328125, 5.4901123046875, 5.78173828125, 6.0733642578125, 6.364990234375, 6.6566162109375, 6.9482421875, 7.2398681640625, 7.531494140625, 7.8231201171875, 8.11474609375, 8.4063720703125, 8.697998046875, 8.9896240234375, 9.28125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 8.0, 10.0, 9.0, 12.0, 12.0, 12.0, 14.0, 26.0, 21.0, 29.0, 54.0, 102.0, 145.0, 153.0, 119.0, 72.0, 43.0, 40.0, 32.0, 13.0, 14.0, 10.0, 14.0, 10.0, 3.0, 6.0, 5.0, 2.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.0024776458740234375, -0.0024145543575286865, -0.0023514628410339355, -0.0022883713245391846, -0.0022252798080444336, -0.0021621882915496826, -0.0020990967750549316, -0.0020360052585601807, -0.0019729137420654297, -0.0019098222255706787, -0.0018467307090759277, -0.0017836391925811768, -0.0017205476760864258, -0.0016574561595916748, -0.0015943646430969238, -0.0015312731266021729, -0.0014681816101074219, -0.001405090093612671, -0.00134199857711792, -0.001278907060623169, -0.001215815544128418, -0.001152724027633667, -0.001089632511138916, -0.001026540994644165, -0.0009634494781494141, -0.0009003579616546631, -0.0008372664451599121, -0.0007741749286651611, -0.0007110834121704102, -0.0006479918956756592, -0.0005849003791809082, -0.0005218088626861572, -0.00045871734619140625, -0.0003956258296966553, -0.0003325343132019043, -0.0002694427967071533, -0.00020635128021240234, -0.00014325976371765137, -8.016824722290039e-05, -1.7076730728149414e-05, 4.601478576660156e-05, 0.00010910630226135254, 0.00017219781875610352, 0.0002352893352508545, 0.00029838085174560547, 0.00036147236824035645, 0.0004245638847351074, 0.0004876554012298584, 0.0005507469177246094, 0.0006138384342193604, 0.0006769299507141113, 0.0007400214672088623, 0.0008031129837036133, 0.0008662045001983643, 0.0009292960166931152, 0.0009923875331878662, 0.0010554790496826172, 0.0011185705661773682, 0.0011816620826721191, 0.0012447535991668701, 0.001307845115661621, 0.001370936632156372, 0.001434028148651123, 0.001497119665145874, 0.001560211181640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 9.0, 20.0, 28.0, 42.0, 59.0, 106.0, 175.0, 316.0, 635.0, 1458.0, 3988.0, 15050.0, 121257.0, 781700.0, 103741.0, 13623.0, 3625.0, 1392.0, 624.0, 294.0, 161.0, 93.0, 59.0, 24.0, 16.0, 8.0, 10.0, 15.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.3203125, -8.055908203125, -7.79150390625, -7.527099609375, -7.2626953125, -6.998291015625, -6.73388671875, -6.469482421875, -6.205078125, -5.940673828125, -5.67626953125, -5.411865234375, -5.1474609375, -4.883056640625, -4.61865234375, -4.354248046875, -4.08984375, -3.825439453125, -3.56103515625, -3.296630859375, -3.0322265625, -2.767822265625, -2.50341796875, -2.239013671875, -1.974609375, -1.710205078125, -1.44580078125, -1.181396484375, -0.9169921875, -0.652587890625, -0.38818359375, -0.123779296875, 0.140625, 0.405029296875, 0.66943359375, 0.933837890625, 1.1982421875, 1.462646484375, 1.72705078125, 1.991455078125, 2.255859375, 2.520263671875, 2.78466796875, 3.049072265625, 3.3134765625, 3.577880859375, 3.84228515625, 4.106689453125, 4.37109375, 4.635498046875, 4.89990234375, 5.164306640625, 5.4287109375, 5.693115234375, 5.95751953125, 6.221923828125, 6.486328125, 6.750732421875, 7.01513671875, 7.279541015625, 7.5439453125, 7.808349609375, 8.07275390625, 8.337158203125, 8.6015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 10.0, 16.0, 13.0, 15.0, 15.0, 33.0, 39.0, 53.0, 64.0, 73.0, 93.0, 92.0, 105.0, 71.0, 68.0, 61.0, 49.0, 27.0, 20.0, 20.0, 12.0, 15.0, 7.0, 6.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0859375, -4.8626708984375, -4.639404296875, -4.4161376953125, -4.19287109375, -3.9696044921875, -3.746337890625, -3.5230712890625, -3.2998046875, -3.0765380859375, -2.853271484375, -2.6300048828125, -2.40673828125, -2.1834716796875, -1.960205078125, -1.7369384765625, -1.513671875, -1.2904052734375, -1.067138671875, -0.8438720703125, -0.62060546875, -0.3973388671875, -0.174072265625, 0.0491943359375, 0.2724609375, 0.4957275390625, 0.718994140625, 0.9422607421875, 1.16552734375, 1.3887939453125, 1.612060546875, 1.8353271484375, 2.05859375, 2.2818603515625, 2.505126953125, 2.7283935546875, 2.95166015625, 3.1749267578125, 3.398193359375, 3.6214599609375, 3.8447265625, 4.0679931640625, 4.291259765625, 4.5145263671875, 4.73779296875, 4.9610595703125, 5.184326171875, 5.4075927734375, 5.630859375, 5.8541259765625, 6.077392578125, 6.3006591796875, 6.52392578125, 6.7471923828125, 6.970458984375, 7.1937255859375, 7.4169921875, 7.6402587890625, 7.863525390625, 8.0867919921875, 8.31005859375, 8.5333251953125, 8.756591796875, 8.9798583984375, 9.203125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 2.0, 3.0, 6.0, 8.0, 24.0, 36.0, 70.0, 117.0, 194.0, 236.0, 130.0, 70.0, 42.0, 31.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.21054077148438, -160.87326049804688, -155.53598022460938, -150.19869995117188, -144.86141967773438, -139.52415466308594, -134.18687438964844, -128.84959411621094, -123.51231384277344, -118.17503356933594, -112.83775329589844, -107.50048065185547, -102.16320037841797, -96.82592010498047, -91.4886474609375, -86.1513671875, -80.8140869140625, -75.476806640625, -70.1395263671875, -64.80225372314453, -59.46497344970703, -54.12769317626953, -48.7904167175293, -43.45314025878906, -38.11585998535156, -32.77857971191406, -27.441303253173828, -22.10402488708496, -16.766746520996094, -11.429468154907227, -6.092189788818359, -0.754913330078125, 4.582366943359375, 9.919645309448242, 15.25692367553711, 20.594202041625977, 25.931480407714844, 31.26875877380371, 36.60603713989258, 41.94331359863281, 47.28059387207031, 52.61787414550781, 57.95515060424805, 63.29242706298828, 68.62970733642578, 73.96698760986328, 79.30426025390625, 84.64154052734375, 89.97882080078125, 95.31610107421875, 100.65338134765625, 105.99065399169922, 111.32793426513672, 116.66521453857422, 122.00248718261719, 127.33976745605469, 132.6770477294922, 138.0143280029297, 143.3516082763672, 148.6888885498047, 154.02615356445312, 159.36343383789062, 164.70071411132812, 170.03799438476562, 175.37527465820312]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 6.0, 12.0, 10.0, 16.0, 12.0, 20.0, 24.0, 32.0, 30.0, 32.0, 27.0, 24.0, 44.0, 45.0, 60.0, 55.0, 70.0, 71.0, 61.0, 45.0, 29.0, 36.0, 30.0, 25.0, 26.0, 26.0, 21.0, 20.0, 10.0, 11.0, 12.0, 10.0, 4.0, 5.0, 7.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-132.44412231445312, -128.76947021484375, -125.09483337402344, -121.4201889038086, -117.74554443359375, -114.0708999633789, -110.39625549316406, -106.72160339355469, -103.04696655273438, -99.37232208251953, -95.69767761230469, -92.02303314208984, -88.348388671875, -84.67374420166016, -80.99909973144531, -77.32444763183594, -73.6498031616211, -69.97515869140625, -66.3005142211914, -62.62586975097656, -58.95122528076172, -55.276580810546875, -51.601932525634766, -47.92728805541992, -44.25264358520508, -40.577999114990234, -36.90335464477539, -33.22870635986328, -29.55406379699707, -25.879419326782227, -22.20477294921875, -18.530128479003906, -14.855491638183594, -11.18084716796875, -7.50620174407959, -3.8315563201904297, -0.15691184997558594, 3.517732620239258, 7.192378997802734, 10.867023468017578, 14.541667938232422, 18.216312408447266, 21.89095687866211, 25.565603256225586, 29.24024772644043, 32.914894104003906, 36.58953857421875, 40.264183044433594, 43.93882751464844, 47.61347198486328, 51.288116455078125, 54.96276092529297, 58.63740539550781, 62.312049865722656, 65.9866943359375, 69.66134643554688, 73.33598327636719, 77.01062774658203, 80.68527221679688, 84.35991668701172, 88.03456115722656, 91.7092056274414, 95.38385009765625, 99.05850219726562, 102.73314666748047]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 12.0, 6.0, 16.0, 7.0, 22.0, 41.0, 51.0, 73.0, 98.0, 153.0, 211.0, 329.0, 511.0, 819.0, 1485.0, 2724.0, 5878.0, 14584.0, 46924.0, 254339.0, 1988119.0, 1619689.0, 194723.0, 38901.0, 12808.0, 5551.0, 2588.0, 1448.0, 779.0, 490.0, 285.0, 200.0, 150.0, 84.0, 52.0, 44.0, 23.0, 23.0, 13.0, 6.0, 5.0, 6.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.7578125, -7.4801025390625, -7.202392578125, -6.9246826171875, -6.64697265625, -6.3692626953125, -6.091552734375, -5.8138427734375, -5.5361328125, -5.2584228515625, -4.980712890625, -4.7030029296875, -4.42529296875, -4.1475830078125, -3.869873046875, -3.5921630859375, -3.314453125, -3.0367431640625, -2.759033203125, -2.4813232421875, -2.20361328125, -1.9259033203125, -1.648193359375, -1.3704833984375, -1.0927734375, -0.8150634765625, -0.537353515625, -0.2596435546875, 0.01806640625, 0.2957763671875, 0.573486328125, 0.8511962890625, 1.12890625, 1.4066162109375, 1.684326171875, 1.9620361328125, 2.23974609375, 2.5174560546875, 2.795166015625, 3.0728759765625, 3.3505859375, 3.6282958984375, 3.906005859375, 4.1837158203125, 4.46142578125, 4.7391357421875, 5.016845703125, 5.2945556640625, 5.572265625, 5.8499755859375, 6.127685546875, 6.4053955078125, 6.68310546875, 6.9608154296875, 7.238525390625, 7.5162353515625, 7.7939453125, 8.0716552734375, 8.349365234375, 8.6270751953125, 8.90478515625, 9.1824951171875, 9.460205078125, 9.7379150390625, 10.015625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 5.0, 8.0, 8.0, 13.0, 15.0, 12.0, 26.0, 30.0, 19.0, 27.0, 29.0, 35.0, 33.0, 39.0, 27.0, 43.0, 45.0, 52.0, 49.0, 35.0, 37.0, 48.0, 37.0, 30.0, 39.0, 28.0, 27.0, 35.0, 16.0, 22.0, 21.0, 21.0, 14.0, 13.0, 11.0, 12.0, 6.0, 4.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.48828125, -5.30853271484375, -5.1287841796875, -4.94903564453125, -4.769287109375, -4.58953857421875, -4.4097900390625, -4.23004150390625, -4.05029296875, -3.87054443359375, -3.6907958984375, -3.51104736328125, -3.331298828125, -3.15155029296875, -2.9718017578125, -2.79205322265625, -2.6123046875, -2.43255615234375, -2.2528076171875, -2.07305908203125, -1.893310546875, -1.71356201171875, -1.5338134765625, -1.35406494140625, -1.17431640625, -0.99456787109375, -0.8148193359375, -0.63507080078125, -0.455322265625, -0.27557373046875, -0.0958251953125, 0.08392333984375, 0.263671875, 0.44342041015625, 0.6231689453125, 0.80291748046875, 0.982666015625, 1.16241455078125, 1.3421630859375, 1.52191162109375, 1.70166015625, 1.88140869140625, 2.0611572265625, 2.24090576171875, 2.420654296875, 2.60040283203125, 2.7801513671875, 2.95989990234375, 3.1396484375, 3.31939697265625, 3.4991455078125, 3.67889404296875, 3.858642578125, 4.03839111328125, 4.2181396484375, 4.39788818359375, 4.57763671875, 4.75738525390625, 4.9371337890625, 5.11688232421875, 5.296630859375, 5.47637939453125, 5.6561279296875, 5.83587646484375, 6.015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 11.0, 18.0, 15.0, 19.0, 36.0, 66.0, 110.0, 180.0, 406.0, 834.0, 1968.0, 6134.0, 26511.0, 247783.0, 3602984.0, 266852.0, 29156.0, 7018.0, 2199.0, 899.0, 458.0, 235.0, 143.0, 87.0, 46.0, 39.0, 15.0, 13.0, 15.0, 6.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.453125, -13.863525390625, -13.27392578125, -12.684326171875, -12.0947265625, -11.505126953125, -10.91552734375, -10.325927734375, -9.736328125, -9.146728515625, -8.55712890625, -7.967529296875, -7.3779296875, -6.788330078125, -6.19873046875, -5.609130859375, -5.01953125, -4.429931640625, -3.84033203125, -3.250732421875, -2.6611328125, -2.071533203125, -1.48193359375, -0.892333984375, -0.302734375, 0.286865234375, 0.87646484375, 1.466064453125, 2.0556640625, 2.645263671875, 3.23486328125, 3.824462890625, 4.4140625, 5.003662109375, 5.59326171875, 6.182861328125, 6.7724609375, 7.362060546875, 7.95166015625, 8.541259765625, 9.130859375, 9.720458984375, 10.31005859375, 10.899658203125, 11.4892578125, 12.078857421875, 12.66845703125, 13.258056640625, 13.84765625, 14.437255859375, 15.02685546875, 15.616455078125, 16.2060546875, 16.795654296875, 17.38525390625, 17.974853515625, 18.564453125, 19.154052734375, 19.74365234375, 20.333251953125, 20.9228515625, 21.512451171875, 22.10205078125, 22.691650390625, 23.28125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 6.0, 5.0, 8.0, 15.0, 12.0, 15.0, 25.0, 37.0, 48.0, 83.0, 134.0, 221.0, 362.0, 587.0, 817.0, 653.0, 372.0, 236.0, 136.0, 77.0, 58.0, 32.0, 25.0, 24.0, 14.0, 12.0, 18.0, 11.0, 5.0, 3.0, 4.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.5234375, -14.049072265625, -13.57470703125, -13.100341796875, -12.6259765625, -12.151611328125, -11.67724609375, -11.202880859375, -10.728515625, -10.254150390625, -9.77978515625, -9.305419921875, -8.8310546875, -8.356689453125, -7.88232421875, -7.407958984375, -6.93359375, -6.459228515625, -5.98486328125, -5.510498046875, -5.0361328125, -4.561767578125, -4.08740234375, -3.613037109375, -3.138671875, -2.664306640625, -2.18994140625, -1.715576171875, -1.2412109375, -0.766845703125, -0.29248046875, 0.181884765625, 0.65625, 1.130615234375, 1.60498046875, 2.079345703125, 2.5537109375, 3.028076171875, 3.50244140625, 3.976806640625, 4.451171875, 4.925537109375, 5.39990234375, 5.874267578125, 6.3486328125, 6.822998046875, 7.29736328125, 7.771728515625, 8.24609375, 8.720458984375, 9.19482421875, 9.669189453125, 10.1435546875, 10.617919921875, 11.09228515625, 11.566650390625, 12.041015625, 12.515380859375, 12.98974609375, 13.464111328125, 13.9384765625, 14.412841796875, 14.88720703125, 15.361572265625, 15.8359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 24.0, 97.0, 310.0, 360.0, 128.0, 37.0, 10.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-277.3424072265625, -267.80377197265625, -258.2651672363281, -248.72654724121094, -239.18792724609375, -229.6492919921875, -220.1106719970703, -210.57205200195312, -201.03343200683594, -191.49481201171875, -181.95619201660156, -172.41757202148438, -162.87893676757812, -153.34033203125, -143.80169677734375, -134.26307678222656, -124.72445678710938, -115.18583679199219, -105.647216796875, -96.10858917236328, -86.5699691772461, -77.0313491821289, -67.49272155761719, -57.9541015625, -48.41548156738281, -38.876861572265625, -29.338237762451172, -19.79961585998535, -10.260993957519531, -0.7223739624023438, 8.81624984741211, 18.354873657226562, 27.89349365234375, 37.43211364746094, 46.97073745727539, 56.509361267089844, 66.04798126220703, 75.58660125732422, 85.12522888183594, 94.66384887695312, 104.20246887207031, 113.7410888671875, 123.27970886230469, 132.81832885742188, 142.35696411132812, 151.89556884765625, 161.4342041015625, 170.9728240966797, 180.51144409179688, 190.05006408691406, 199.58868408203125, 209.12730407714844, 218.66592407226562, 228.20455932617188, 237.74317932128906, 247.28179931640625, 256.8204345703125, 266.35906982421875, 275.8976745605469, 285.4363098144531, 294.97491455078125, 304.5135498046875, 314.0521545410156, 323.5907897949219, 333.12939453125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 10.0, 7.0, 10.0, 16.0, 27.0, 30.0, 30.0, 38.0, 33.0, 48.0, 50.0, 64.0, 59.0, 68.0, 63.0, 54.0, 58.0, 52.0, 45.0, 37.0, 35.0, 33.0, 31.0, 20.0, 17.0, 14.0, 14.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.96266174316406, -67.32160186767578, -64.6805419921875, -62.03947448730469, -59.398414611816406, -56.757354736328125, -54.11629104614258, -51.47522735595703, -48.83416748046875, -46.19310760498047, -43.55204391479492, -40.910980224609375, -38.269920349121094, -35.62886047363281, -32.987796783447266, -30.34673500061035, -27.705673217773438, -25.064611434936523, -22.42354965209961, -19.782487869262695, -17.14142608642578, -14.500364303588867, -11.859302520751953, -9.218240737915039, -6.577178955078125, -3.936117172241211, -1.2950553894042969, 1.3460063934326172, 3.9870681762695312, 6.628129959106445, 9.26919174194336, 11.910253524780273, 14.551315307617188, 17.1923770904541, 19.833438873291016, 22.47450065612793, 25.115562438964844, 27.756624221801758, 30.397686004638672, 33.03874969482422, 35.6798095703125, 38.32086944580078, 40.96193313598633, 43.602996826171875, 46.244056701660156, 48.88511657714844, 51.526180267333984, 54.16724395751953, 56.80830383300781, 59.449363708496094, 62.09042739868164, 64.73149108886719, 67.37255096435547, 70.01361083984375, 72.65467834472656, 75.29573822021484, 77.93679809570312, 80.5778579711914, 83.21891784667969, 85.8599853515625, 88.50104522705078, 91.14210510253906, 93.78317260742188, 96.42423248291016, 99.06529235839844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 10.0, 20.0, 25.0, 48.0, 91.0, 137.0, 210.0, 441.0, 791.0, 1668.0, 3636.0, 8548.0, 21227.0, 58683.0, 168720.0, 355434.0, 268536.0, 100783.0, 35576.0, 13388.0, 5491.0, 2507.0, 1234.0, 577.0, 332.0, 187.0, 95.0, 68.0, 42.0, 26.0, 7.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6875, -7.376953125, -7.06640625, -6.755859375, -6.4453125, -6.134765625, -5.82421875, -5.513671875, -5.203125, -4.892578125, -4.58203125, -4.271484375, -3.9609375, -3.650390625, -3.33984375, -3.029296875, -2.71875, -2.408203125, -2.09765625, -1.787109375, -1.4765625, -1.166015625, -0.85546875, -0.544921875, -0.234375, 0.076171875, 0.38671875, 0.697265625, 1.0078125, 1.318359375, 1.62890625, 1.939453125, 2.25, 2.560546875, 2.87109375, 3.181640625, 3.4921875, 3.802734375, 4.11328125, 4.423828125, 4.734375, 5.044921875, 5.35546875, 5.666015625, 5.9765625, 6.287109375, 6.59765625, 6.908203125, 7.21875, 7.529296875, 7.83984375, 8.150390625, 8.4609375, 8.771484375, 9.08203125, 9.392578125, 9.703125, 10.013671875, 10.32421875, 10.634765625, 10.9453125, 11.255859375, 11.56640625, 11.876953125, 12.1875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 8.0, 13.0, 8.0, 11.0, 11.0, 12.0, 17.0, 21.0, 23.0, 28.0, 26.0, 41.0, 41.0, 36.0, 46.0, 48.0, 39.0, 57.0, 52.0, 56.0, 41.0, 34.0, 48.0, 34.0, 35.0, 25.0, 28.0, 20.0, 25.0, 19.0, 16.0, 11.0, 20.0, 19.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-7.0078125, -6.80377197265625, -6.5997314453125, -6.39569091796875, -6.191650390625, -5.98760986328125, -5.7835693359375, -5.57952880859375, -5.37548828125, -5.17144775390625, -4.9674072265625, -4.76336669921875, -4.559326171875, -4.35528564453125, -4.1512451171875, -3.94720458984375, -3.7431640625, -3.53912353515625, -3.3350830078125, -3.13104248046875, -2.927001953125, -2.72296142578125, -2.5189208984375, -2.31488037109375, -2.11083984375, -1.90679931640625, -1.7027587890625, -1.49871826171875, -1.294677734375, -1.09063720703125, -0.8865966796875, -0.68255615234375, -0.478515625, -0.27447509765625, -0.0704345703125, 0.13360595703125, 0.337646484375, 0.54168701171875, 0.7457275390625, 0.94976806640625, 1.15380859375, 1.35784912109375, 1.5618896484375, 1.76593017578125, 1.969970703125, 2.17401123046875, 2.3780517578125, 2.58209228515625, 2.7861328125, 2.99017333984375, 3.1942138671875, 3.39825439453125, 3.602294921875, 3.80633544921875, 4.0103759765625, 4.21441650390625, 4.41845703125, 4.62249755859375, 4.8265380859375, 5.03057861328125, 5.234619140625, 5.43865966796875, 5.6427001953125, 5.84674072265625, 6.05078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 1.0, 5.0, 8.0, 10.0, 9.0, 12.0, 20.0, 26.0, 37.0, 69.0, 103.0, 129.0, 269.0, 493.0, 1016.0, 2213.0, 4913.0, 14266.0, 48832.0, 206852.0, 584069.0, 134286.0, 33084.0, 10297.0, 3991.0, 1703.0, 792.0, 415.0, 237.0, 127.0, 73.0, 54.0, 34.0, 22.0, 12.0, 20.0, 15.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0], "bins": [-15.7734375, -15.3272705078125, -14.881103515625, -14.4349365234375, -13.98876953125, -13.5426025390625, -13.096435546875, -12.6502685546875, -12.2041015625, -11.7579345703125, -11.311767578125, -10.8656005859375, -10.41943359375, -9.9732666015625, -9.527099609375, -9.0809326171875, -8.634765625, -8.1885986328125, -7.742431640625, -7.2962646484375, -6.85009765625, -6.4039306640625, -5.957763671875, -5.5115966796875, -5.0654296875, -4.6192626953125, -4.173095703125, -3.7269287109375, -3.28076171875, -2.8345947265625, -2.388427734375, -1.9422607421875, -1.49609375, -1.0499267578125, -0.603759765625, -0.1575927734375, 0.28857421875, 0.7347412109375, 1.180908203125, 1.6270751953125, 2.0732421875, 2.5194091796875, 2.965576171875, 3.4117431640625, 3.85791015625, 4.3040771484375, 4.750244140625, 5.1964111328125, 5.642578125, 6.0887451171875, 6.534912109375, 6.9810791015625, 7.42724609375, 7.8734130859375, 8.319580078125, 8.7657470703125, 9.2119140625, 9.6580810546875, 10.104248046875, 10.5504150390625, 10.99658203125, 11.4427490234375, 11.888916015625, 12.3350830078125, 12.78125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 10.0, 7.0, 10.0, 6.0, 11.0, 17.0, 22.0, 19.0, 22.0, 22.0, 31.0, 31.0, 42.0, 45.0, 32.0, 55.0, 55.0, 52.0, 45.0, 50.0, 43.0, 60.0, 52.0, 41.0, 41.0, 39.0, 19.0, 26.0, 20.0, 11.0, 11.0, 11.0, 12.0, 6.0, 6.0, 7.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.859375, -22.052001953125, -21.24462890625, -20.437255859375, -19.6298828125, -18.822509765625, -18.01513671875, -17.207763671875, -16.400390625, -15.593017578125, -14.78564453125, -13.978271484375, -13.1708984375, -12.363525390625, -11.55615234375, -10.748779296875, -9.94140625, -9.134033203125, -8.32666015625, -7.519287109375, -6.7119140625, -5.904541015625, -5.09716796875, -4.289794921875, -3.482421875, -2.675048828125, -1.86767578125, -1.060302734375, -0.2529296875, 0.554443359375, 1.36181640625, 2.169189453125, 2.9765625, 3.783935546875, 4.59130859375, 5.398681640625, 6.2060546875, 7.013427734375, 7.82080078125, 8.628173828125, 9.435546875, 10.242919921875, 11.05029296875, 11.857666015625, 12.6650390625, 13.472412109375, 14.27978515625, 15.087158203125, 15.89453125, 16.701904296875, 17.50927734375, 18.316650390625, 19.1240234375, 19.931396484375, 20.73876953125, 21.546142578125, 22.353515625, 23.160888671875, 23.96826171875, 24.775634765625, 25.5830078125, 26.390380859375, 27.19775390625, 28.005126953125, 28.8125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 11.0, 11.0, 19.0, 35.0, 36.0, 71.0, 96.0, 152.0, 222.0, 393.0, 625.0, 1173.0, 2194.0, 4815.0, 12110.0, 42440.0, 223393.0, 628183.0, 96275.0, 21934.0, 7383.0, 3184.0, 1571.0, 839.0, 547.0, 310.0, 190.0, 107.0, 74.0, 57.0, 40.0, 19.0, 12.0, 10.0, 8.0, 5.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.2001953125, -4.056640625, -3.9130859375, -3.76953125, -3.6259765625, -3.482421875, -3.3388671875, -3.1953125, -3.0517578125, -2.908203125, -2.7646484375, -2.62109375, -2.4775390625, -2.333984375, -2.1904296875, -2.046875, -1.9033203125, -1.759765625, -1.6162109375, -1.47265625, -1.3291015625, -1.185546875, -1.0419921875, -0.8984375, -0.7548828125, -0.611328125, -0.4677734375, -0.32421875, -0.1806640625, -0.037109375, 0.1064453125, 0.25, 0.3935546875, 0.537109375, 0.6806640625, 0.82421875, 0.9677734375, 1.111328125, 1.2548828125, 1.3984375, 1.5419921875, 1.685546875, 1.8291015625, 1.97265625, 2.1162109375, 2.259765625, 2.4033203125, 2.546875, 2.6904296875, 2.833984375, 2.9775390625, 3.12109375, 3.2646484375, 3.408203125, 3.5517578125, 3.6953125, 3.8388671875, 3.982421875, 4.1259765625, 4.26953125, 4.4130859375, 4.556640625, 4.7001953125, 4.84375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 15.0, 32.0, 124.0, 352.0, 313.0, 99.0, 24.0, 9.0, 2.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003993988037109375, -0.003879457712173462, -0.003764927387237549, -0.0036503970623016357, -0.0035358667373657227, -0.0034213364124298096, -0.0033068060874938965, -0.0031922757625579834, -0.0030777454376220703, -0.0029632151126861572, -0.002848684787750244, -0.002734154462814331, -0.002619624137878418, -0.002505093812942505, -0.002390563488006592, -0.0022760331630706787, -0.0021615028381347656, -0.0020469725131988525, -0.0019324421882629395, -0.0018179118633270264, -0.0017033815383911133, -0.0015888512134552002, -0.0014743208885192871, -0.001359790563583374, -0.001245260238647461, -0.0011307299137115479, -0.0010161995887756348, -0.0009016692638397217, -0.0007871389389038086, -0.0006726086139678955, -0.0005580782890319824, -0.00044354796409606934, -0.00032901763916015625, -0.00021448731422424316, -9.995698928833008e-05, 1.4573335647583008e-05, 0.0001291036605834961, 0.00024363398551940918, 0.00035816431045532227, 0.00047269463539123535, 0.0005872249603271484, 0.0007017552852630615, 0.0008162856101989746, 0.0009308159351348877, 0.0010453462600708008, 0.0011598765850067139, 0.001274406909942627, 0.00138893723487854, 0.0015034675598144531, 0.0016179978847503662, 0.0017325282096862793, 0.0018470585346221924, 0.0019615888595581055, 0.0020761191844940186, 0.0021906495094299316, 0.0023051798343658447, 0.002419710159301758, 0.002534240484237671, 0.002648770809173584, 0.002763301134109497, 0.00287783145904541, 0.0029923617839813232, 0.0031068921089172363, 0.0032214224338531494, 0.0033359527587890625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 8.0, 12.0, 11.0, 18.0, 35.0, 45.0, 74.0, 113.0, 196.0, 364.0, 651.0, 1121.0, 2282.0, 4679.0, 11520.0, 34790.0, 129953.0, 583642.0, 200749.0, 50609.0, 15658.0, 5967.0, 2794.0, 1434.0, 745.0, 434.0, 237.0, 163.0, 75.0, 57.0, 25.0, 20.0, 17.0, 13.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.93414306640625, -3.8057861328125, -3.67742919921875, -3.549072265625, -3.42071533203125, -3.2923583984375, -3.16400146484375, -3.03564453125, -2.90728759765625, -2.7789306640625, -2.65057373046875, -2.522216796875, -2.39385986328125, -2.2655029296875, -2.13714599609375, -2.0087890625, -1.88043212890625, -1.7520751953125, -1.62371826171875, -1.495361328125, -1.36700439453125, -1.2386474609375, -1.11029052734375, -0.98193359375, -0.85357666015625, -0.7252197265625, -0.59686279296875, -0.468505859375, -0.34014892578125, -0.2117919921875, -0.08343505859375, 0.044921875, 0.17327880859375, 0.3016357421875, 0.42999267578125, 0.558349609375, 0.68670654296875, 0.8150634765625, 0.94342041015625, 1.07177734375, 1.20013427734375, 1.3284912109375, 1.45684814453125, 1.585205078125, 1.71356201171875, 1.8419189453125, 1.97027587890625, 2.0986328125, 2.22698974609375, 2.3553466796875, 2.48370361328125, 2.612060546875, 2.74041748046875, 2.8687744140625, 2.99713134765625, 3.12548828125, 3.25384521484375, 3.3822021484375, 3.51055908203125, 3.638916015625, 3.76727294921875, 3.8956298828125, 4.02398681640625, 4.15234375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 5.0, 2.0, 3.0, 10.0, 6.0, 9.0, 18.0, 22.0, 33.0, 19.0, 48.0, 56.0, 60.0, 82.0, 82.0, 77.0, 82.0, 93.0, 65.0, 47.0, 42.0, 32.0, 31.0, 13.0, 10.0, 6.0, 9.0, 3.0, 4.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-5.40625, -5.253173828125, -5.10009765625, -4.947021484375, -4.7939453125, -4.640869140625, -4.48779296875, -4.334716796875, -4.181640625, -4.028564453125, -3.87548828125, -3.722412109375, -3.5693359375, -3.416259765625, -3.26318359375, -3.110107421875, -2.95703125, -2.803955078125, -2.65087890625, -2.497802734375, -2.3447265625, -2.191650390625, -2.03857421875, -1.885498046875, -1.732421875, -1.579345703125, -1.42626953125, -1.273193359375, -1.1201171875, -0.967041015625, -0.81396484375, -0.660888671875, -0.5078125, -0.354736328125, -0.20166015625, -0.048583984375, 0.1044921875, 0.257568359375, 0.41064453125, 0.563720703125, 0.716796875, 0.869873046875, 1.02294921875, 1.176025390625, 1.3291015625, 1.482177734375, 1.63525390625, 1.788330078125, 1.94140625, 2.094482421875, 2.24755859375, 2.400634765625, 2.5537109375, 2.706787109375, 2.85986328125, 3.012939453125, 3.166015625, 3.319091796875, 3.47216796875, 3.625244140625, 3.7783203125, 3.931396484375, 4.08447265625, 4.237548828125, 4.390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 18.0, 34.0, 111.0, 259.0, 337.0, 139.0, 44.0, 14.0, 18.0, 6.0, 8.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-272.1866149902344, -265.4140930175781, -258.6416015625, -251.86907958984375, -245.0965576171875, -238.32403564453125, -231.55152893066406, -224.77902221679688, -218.00650024414062, -211.23397827148438, -204.4614715576172, -197.68896484375, -190.91644287109375, -184.1439208984375, -177.3714141845703, -170.59890747070312, -163.82638549804688, -157.05386352539062, -150.28135681152344, -143.50885009765625, -136.736328125, -129.96380615234375, -123.19129943847656, -116.41878509521484, -109.64627075195312, -102.8737564086914, -96.10124206542969, -89.32872772216797, -82.55621337890625, -75.78369903564453, -69.01118469238281, -62.238670349121094, -55.466156005859375, -48.693641662597656, -41.92112731933594, -35.14861297607422, -28.3760986328125, -21.60358428955078, -14.831069946289062, -8.058555603027344, -1.286041259765625, 5.486473083496094, 12.258987426757812, 19.03150177001953, 25.80401611328125, 32.57653045654297, 39.34904479980469, 46.121559143066406, 52.894073486328125, 59.666587829589844, 66.43910217285156, 73.21161651611328, 79.984130859375, 86.75664520263672, 93.52915954589844, 100.30167388916016, 107.07418823242188, 113.8467025756836, 120.61921691894531, 127.39173126220703, 134.16424560546875, 140.936767578125, 147.7092742919922, 154.48178100585938, 161.25430297851562]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 11.0, 12.0, 8.0, 12.0, 11.0, 9.0, 13.0, 21.0, 30.0, 23.0, 18.0, 26.0, 23.0, 28.0, 42.0, 47.0, 49.0, 60.0, 68.0, 77.0, 59.0, 49.0, 25.0, 38.0, 24.0, 25.0, 18.0, 21.0, 20.0, 21.0, 19.0, 9.0, 13.0, 11.0, 10.0, 7.0, 7.0, 4.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-92.05586242675781, -89.19159698486328, -86.32733154296875, -83.46307373046875, -80.59880828857422, -77.73454284667969, -74.87028503417969, -72.00601959228516, -69.14175415039062, -66.2774887084961, -63.41322708129883, -60.54896545410156, -57.68470001220703, -54.8204345703125, -51.956172943115234, -49.09191131591797, -46.22764587402344, -43.363380432128906, -40.49911880493164, -37.634857177734375, -34.770591735839844, -31.906328201293945, -29.042064666748047, -26.17780113220215, -23.31353759765625, -20.44927406311035, -17.585010528564453, -14.720746994018555, -11.856483459472656, -8.992219924926758, -6.127956390380859, -3.263692855834961, -0.3994293212890625, 2.464834213256836, 5.329097747802734, 8.193361282348633, 11.057624816894531, 13.92188835144043, 16.786151885986328, 19.650415420532227, 22.514678955078125, 25.378942489624023, 28.243206024169922, 31.10746955871582, 33.97173309326172, 36.83599853515625, 39.700260162353516, 42.56452178955078, 45.42878723144531, 48.293052673339844, 51.15731430053711, 54.021575927734375, 56.885841369628906, 59.75010681152344, 62.6143684387207, 65.47863006591797, 68.3428955078125, 71.20716094970703, 74.07142639160156, 76.93568420410156, 79.7999496459961, 82.66421508789062, 85.52847290039062, 88.39273834228516, 91.25700378417969]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 14.0, 14.0, 22.0, 15.0, 42.0, 51.0, 81.0, 134.0, 197.0, 270.0, 436.0, 721.0, 1313.0, 2458.0, 4809.0, 11309.0, 29159.0, 92040.0, 355819.0, 1315947.0, 1665720.0, 521995.0, 128819.0, 37050.0, 13320.0, 5840.0, 2931.0, 1542.0, 845.0, 489.0, 302.0, 163.0, 136.0, 86.0, 43.0, 33.0, 36.0, 25.0, 12.0, 9.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.32421875, -5.14752197265625, -4.9708251953125, -4.79412841796875, -4.617431640625, -4.44073486328125, -4.2640380859375, -4.08734130859375, -3.91064453125, -3.73394775390625, -3.5572509765625, -3.38055419921875, -3.203857421875, -3.02716064453125, -2.8504638671875, -2.67376708984375, -2.4970703125, -2.32037353515625, -2.1436767578125, -1.96697998046875, -1.790283203125, -1.61358642578125, -1.4368896484375, -1.26019287109375, -1.08349609375, -0.90679931640625, -0.7301025390625, -0.55340576171875, -0.376708984375, -0.20001220703125, -0.0233154296875, 0.15338134765625, 0.330078125, 0.50677490234375, 0.6834716796875, 0.86016845703125, 1.036865234375, 1.21356201171875, 1.3902587890625, 1.56695556640625, 1.74365234375, 1.92034912109375, 2.0970458984375, 2.27374267578125, 2.450439453125, 2.62713623046875, 2.8038330078125, 2.98052978515625, 3.1572265625, 3.33392333984375, 3.5106201171875, 3.68731689453125, 3.864013671875, 4.04071044921875, 4.2174072265625, 4.39410400390625, 4.57080078125, 4.74749755859375, 4.9241943359375, 5.10089111328125, 5.277587890625, 5.45428466796875, 5.6309814453125, 5.80767822265625, 5.984375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 9.0, 9.0, 5.0, 9.0, 8.0, 18.0, 11.0, 12.0, 29.0, 28.0, 29.0, 27.0, 37.0, 31.0, 37.0, 32.0, 37.0, 50.0, 39.0, 47.0, 47.0, 50.0, 41.0, 29.0, 39.0, 43.0, 30.0, 24.0, 27.0, 29.0, 28.0, 12.0, 19.0, 12.0, 13.0, 12.0, 8.0, 9.0, 9.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.8394775390625, -4.651611328125, -4.4637451171875, -4.27587890625, -4.0880126953125, -3.900146484375, -3.7122802734375, -3.5244140625, -3.3365478515625, -3.148681640625, -2.9608154296875, -2.77294921875, -2.5850830078125, -2.397216796875, -2.2093505859375, -2.021484375, -1.8336181640625, -1.645751953125, -1.4578857421875, -1.27001953125, -1.0821533203125, -0.894287109375, -0.7064208984375, -0.5185546875, -0.3306884765625, -0.142822265625, 0.0450439453125, 0.23291015625, 0.4207763671875, 0.608642578125, 0.7965087890625, 0.984375, 1.1722412109375, 1.360107421875, 1.5479736328125, 1.73583984375, 1.9237060546875, 2.111572265625, 2.2994384765625, 2.4873046875, 2.6751708984375, 2.863037109375, 3.0509033203125, 3.23876953125, 3.4266357421875, 3.614501953125, 3.8023681640625, 3.990234375, 4.1781005859375, 4.365966796875, 4.5538330078125, 4.74169921875, 4.9295654296875, 5.117431640625, 5.3052978515625, 5.4931640625, 5.6810302734375, 5.868896484375, 6.0567626953125, 6.24462890625, 6.4324951171875, 6.620361328125, 6.8082275390625, 6.99609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 4.0, 9.0, 11.0, 11.0, 28.0, 29.0, 58.0, 95.0, 177.0, 422.0, 1033.0, 3667.0, 25264.0, 607089.0, 3453927.0, 90574.0, 8793.0, 1796.0, 633.0, 289.0, 138.0, 86.0, 49.0, 38.0, 21.0, 13.0, 5.0, 3.0, 8.0, 5.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.34375, -21.727294921875, -21.11083984375, -20.494384765625, -19.8779296875, -19.261474609375, -18.64501953125, -18.028564453125, -17.412109375, -16.795654296875, -16.17919921875, -15.562744140625, -14.9462890625, -14.329833984375, -13.71337890625, -13.096923828125, -12.48046875, -11.864013671875, -11.24755859375, -10.631103515625, -10.0146484375, -9.398193359375, -8.78173828125, -8.165283203125, -7.548828125, -6.932373046875, -6.31591796875, -5.699462890625, -5.0830078125, -4.466552734375, -3.85009765625, -3.233642578125, -2.6171875, -2.000732421875, -1.38427734375, -0.767822265625, -0.1513671875, 0.465087890625, 1.08154296875, 1.697998046875, 2.314453125, 2.930908203125, 3.54736328125, 4.163818359375, 4.7802734375, 5.396728515625, 6.01318359375, 6.629638671875, 7.24609375, 7.862548828125, 8.47900390625, 9.095458984375, 9.7119140625, 10.328369140625, 10.94482421875, 11.561279296875, 12.177734375, 12.794189453125, 13.41064453125, 14.027099609375, 14.6435546875, 15.260009765625, 15.87646484375, 16.492919921875, 17.109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 4.0, 3.0, 7.0, 5.0, 9.0, 10.0, 17.0, 24.0, 32.0, 79.0, 114.0, 193.0, 309.0, 540.0, 759.0, 726.0, 501.0, 314.0, 163.0, 85.0, 62.0, 38.0, 17.0, 21.0, 14.0, 8.0, 14.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.34375, -14.8775634765625, -14.411376953125, -13.9451904296875, -13.47900390625, -13.0128173828125, -12.546630859375, -12.0804443359375, -11.6142578125, -11.1480712890625, -10.681884765625, -10.2156982421875, -9.74951171875, -9.2833251953125, -8.817138671875, -8.3509521484375, -7.884765625, -7.4185791015625, -6.952392578125, -6.4862060546875, -6.02001953125, -5.5538330078125, -5.087646484375, -4.6214599609375, -4.1552734375, -3.6890869140625, -3.222900390625, -2.7567138671875, -2.29052734375, -1.8243408203125, -1.358154296875, -0.8919677734375, -0.42578125, 0.0404052734375, 0.506591796875, 0.9727783203125, 1.43896484375, 1.9051513671875, 2.371337890625, 2.8375244140625, 3.3037109375, 3.7698974609375, 4.236083984375, 4.7022705078125, 5.16845703125, 5.6346435546875, 6.100830078125, 6.5670166015625, 7.033203125, 7.4993896484375, 7.965576171875, 8.4317626953125, 8.89794921875, 9.3641357421875, 9.830322265625, 10.2965087890625, 10.7626953125, 11.2288818359375, 11.695068359375, 12.1612548828125, 12.62744140625, 13.0936279296875, 13.559814453125, 14.0260009765625, 14.4921875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 9.0, 10.0, 16.0, 41.0, 81.0, 109.0, 177.0, 176.0, 174.0, 86.0, 56.0, 25.0, 16.0, 13.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.73074340820312, -136.6337127685547, -132.53668212890625, -128.43963623046875, -124.34260559082031, -120.24557495117188, -116.1485366821289, -112.05149841308594, -107.9544677734375, -103.85743713378906, -99.7603988647461, -95.66336059570312, -91.56632995605469, -87.46929931640625, -83.37226104736328, -79.27522277832031, -75.17819213867188, -71.08116149902344, -66.98412322998047, -62.887088775634766, -58.79005432128906, -54.69301986694336, -50.595985412597656, -46.49895095825195, -42.40191650390625, -38.30488204956055, -34.207847595214844, -30.11081314086914, -26.013778686523438, -21.916744232177734, -17.81970977783203, -13.722675323486328, -9.625656127929688, -5.528621673583984, -1.4315872192382812, 2.665447235107422, 6.762481689453125, 10.859516143798828, 14.956550598144531, 19.053585052490234, 23.150619506835938, 27.24765396118164, 31.344688415527344, 35.44172286987305, 39.53875732421875, 43.63579177856445, 47.732826232910156, 51.82986068725586, 55.92689514160156, 60.023929595947266, 64.12096405029297, 68.21800231933594, 72.31503295898438, 76.41206359863281, 80.50910186767578, 84.60614013671875, 88.70317077636719, 92.80020141601562, 96.8972396850586, 100.99427795410156, 105.09130859375, 109.18833923339844, 113.2853775024414, 117.38241577148438, 121.47944641113281]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 4.0, 8.0, 1.0, 1.0, 13.0, 9.0, 14.0, 15.0, 17.0, 11.0, 21.0, 27.0, 28.0, 32.0, 31.0, 31.0, 34.0, 45.0, 34.0, 43.0, 53.0, 43.0, 51.0, 48.0, 38.0, 36.0, 35.0, 40.0, 30.0, 32.0, 27.0, 17.0, 22.0, 16.0, 17.0, 15.0, 12.0, 12.0, 9.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-51.79722213745117, -50.25037384033203, -48.703521728515625, -47.156673431396484, -45.60982131958008, -44.06297302246094, -42.51612091064453, -40.96927261352539, -39.42242431640625, -37.87557601928711, -36.3287239074707, -34.78187561035156, -33.235023498535156, -31.688175201416016, -30.141324996948242, -28.59447479248047, -27.047624588012695, -25.500774383544922, -23.95392417907715, -22.407073974609375, -20.860225677490234, -19.31337547302246, -17.766525268554688, -16.219676971435547, -14.672825813293457, -13.125975608825684, -11.579126358032227, -10.032276153564453, -8.48542594909668, -6.938576698303223, -5.391726493835449, -3.844877243041992, -2.2980270385742188, -0.751177191734314, 0.7956726551055908, 2.342522621154785, 3.8893723487854004, 5.436222076416016, 6.983072280883789, 8.529921531677246, 10.07677173614502, 11.623621940612793, 13.17047119140625, 14.717321395874023, 16.264171600341797, 17.811019897460938, 19.357872009277344, 20.904720306396484, 22.451570510864258, 23.99842071533203, 25.545270919799805, 27.092121124267578, 28.63896942138672, 30.185819625854492, 31.732669830322266, 33.279518127441406, 34.82637023925781, 36.37321853637695, 37.92007064819336, 39.4669189453125, 41.013771057128906, 42.56061935424805, 44.10746765136719, 45.654319763183594, 47.201168060302734]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 14.0, 16.0, 14.0, 35.0, 46.0, 65.0, 92.0, 154.0, 250.0, 412.0, 661.0, 1198.0, 2116.0, 3976.0, 7959.0, 16381.0, 35835.0, 82547.0, 185967.0, 302107.0, 221502.0, 102775.0, 44243.0, 20038.0, 9517.0, 4849.0, 2434.0, 1317.0, 798.0, 480.0, 266.0, 161.0, 128.0, 75.0, 45.0, 20.0, 22.0, 10.0, 8.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.80078125, -6.5787353515625, -6.356689453125, -6.1346435546875, -5.91259765625, -5.6905517578125, -5.468505859375, -5.2464599609375, -5.0244140625, -4.8023681640625, -4.580322265625, -4.3582763671875, -4.13623046875, -3.9141845703125, -3.692138671875, -3.4700927734375, -3.248046875, -3.0260009765625, -2.803955078125, -2.5819091796875, -2.35986328125, -2.1378173828125, -1.915771484375, -1.6937255859375, -1.4716796875, -1.2496337890625, -1.027587890625, -0.8055419921875, -0.58349609375, -0.3614501953125, -0.139404296875, 0.0826416015625, 0.3046875, 0.5267333984375, 0.748779296875, 0.9708251953125, 1.19287109375, 1.4149169921875, 1.636962890625, 1.8590087890625, 2.0810546875, 2.3031005859375, 2.525146484375, 2.7471923828125, 2.96923828125, 3.1912841796875, 3.413330078125, 3.6353759765625, 3.857421875, 4.0794677734375, 4.301513671875, 4.5235595703125, 4.74560546875, 4.9676513671875, 5.189697265625, 5.4117431640625, 5.6337890625, 5.8558349609375, 6.077880859375, 6.2999267578125, 6.52197265625, 6.7440185546875, 6.966064453125, 7.1881103515625, 7.41015625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 7.0, 0.0, 5.0, 9.0, 5.0, 10.0, 6.0, 17.0, 13.0, 26.0, 13.0, 15.0, 28.0, 20.0, 41.0, 34.0, 34.0, 40.0, 47.0, 60.0, 35.0, 48.0, 43.0, 49.0, 45.0, 46.0, 50.0, 29.0, 32.0, 36.0, 32.0, 17.0, 21.0, 12.0, 15.0, 17.0, 10.0, 9.0, 15.0, 6.0, 3.0, 2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-6.9765625, -6.77044677734375, -6.5643310546875, -6.35821533203125, -6.152099609375, -5.94598388671875, -5.7398681640625, -5.53375244140625, -5.32763671875, -5.12152099609375, -4.9154052734375, -4.70928955078125, -4.503173828125, -4.29705810546875, -4.0909423828125, -3.88482666015625, -3.6787109375, -3.47259521484375, -3.2664794921875, -3.06036376953125, -2.854248046875, -2.64813232421875, -2.4420166015625, -2.23590087890625, -2.02978515625, -1.82366943359375, -1.6175537109375, -1.41143798828125, -1.205322265625, -0.99920654296875, -0.7930908203125, -0.58697509765625, -0.380859375, -0.17474365234375, 0.0313720703125, 0.23748779296875, 0.443603515625, 0.64971923828125, 0.8558349609375, 1.06195068359375, 1.26806640625, 1.47418212890625, 1.6802978515625, 1.88641357421875, 2.092529296875, 2.29864501953125, 2.5047607421875, 2.71087646484375, 2.9169921875, 3.12310791015625, 3.3292236328125, 3.53533935546875, 3.741455078125, 3.94757080078125, 4.1536865234375, 4.35980224609375, 4.56591796875, 4.77203369140625, 4.9781494140625, 5.18426513671875, 5.390380859375, 5.59649658203125, 5.8026123046875, 6.00872802734375, 6.21484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 12.0, 12.0, 12.0, 31.0, 34.0, 66.0, 68.0, 132.0, 129.0, 245.0, 365.0, 626.0, 1257.0, 2892.0, 8320.0, 34859.0, 217748.0, 669574.0, 86501.0, 16611.0, 4845.0, 1886.0, 890.0, 535.0, 272.0, 170.0, 131.0, 91.0, 77.0, 36.0, 37.0, 14.0, 16.0, 11.0, 9.0, 7.0, 4.0, 2.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.4375, -12.92578125, -12.4140625, -11.90234375, -11.390625, -10.87890625, -10.3671875, -9.85546875, -9.34375, -8.83203125, -8.3203125, -7.80859375, -7.296875, -6.78515625, -6.2734375, -5.76171875, -5.25, -4.73828125, -4.2265625, -3.71484375, -3.203125, -2.69140625, -2.1796875, -1.66796875, -1.15625, -0.64453125, -0.1328125, 0.37890625, 0.890625, 1.40234375, 1.9140625, 2.42578125, 2.9375, 3.44921875, 3.9609375, 4.47265625, 4.984375, 5.49609375, 6.0078125, 6.51953125, 7.03125, 7.54296875, 8.0546875, 8.56640625, 9.078125, 9.58984375, 10.1015625, 10.61328125, 11.125, 11.63671875, 12.1484375, 12.66015625, 13.171875, 13.68359375, 14.1953125, 14.70703125, 15.21875, 15.73046875, 16.2421875, 16.75390625, 17.265625, 17.77734375, 18.2890625, 18.80078125, 19.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 4.0, 6.0, 1.0, 4.0, 4.0, 7.0, 6.0, 6.0, 12.0, 12.0, 14.0, 28.0, 31.0, 38.0, 34.0, 43.0, 59.0, 47.0, 73.0, 83.0, 61.0, 63.0, 69.0, 51.0, 53.0, 32.0, 33.0, 30.0, 25.0, 21.0, 15.0, 16.0, 8.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.579833984375, -19.64404296875, -18.708251953125, -17.7724609375, -16.836669921875, -15.90087890625, -14.965087890625, -14.029296875, -13.093505859375, -12.15771484375, -11.221923828125, -10.2861328125, -9.350341796875, -8.41455078125, -7.478759765625, -6.54296875, -5.607177734375, -4.67138671875, -3.735595703125, -2.7998046875, -1.864013671875, -0.92822265625, 0.007568359375, 0.943359375, 1.879150390625, 2.81494140625, 3.750732421875, 4.6865234375, 5.622314453125, 6.55810546875, 7.493896484375, 8.4296875, 9.365478515625, 10.30126953125, 11.237060546875, 12.1728515625, 13.108642578125, 14.04443359375, 14.980224609375, 15.916015625, 16.851806640625, 17.78759765625, 18.723388671875, 19.6591796875, 20.594970703125, 21.53076171875, 22.466552734375, 23.40234375, 24.338134765625, 25.27392578125, 26.209716796875, 27.1455078125, 28.081298828125, 29.01708984375, 29.952880859375, 30.888671875, 31.824462890625, 32.76025390625, 33.696044921875, 34.6318359375, 35.567626953125, 36.50341796875, 37.439208984375, 38.375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 10.0, 17.0, 18.0, 36.0, 52.0, 55.0, 123.0, 218.0, 445.0, 1025.0, 2736.0, 8272.0, 30595.0, 160220.0, 720767.0, 94170.0, 20388.0, 5763.0, 1968.0, 825.0, 362.0, 198.0, 108.0, 60.0, 31.0, 23.0, 23.0, 13.0, 7.0, 5.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.40234375, -4.27783203125, -4.1533203125, -4.02880859375, -3.904296875, -3.77978515625, -3.6552734375, -3.53076171875, -3.40625, -3.28173828125, -3.1572265625, -3.03271484375, -2.908203125, -2.78369140625, -2.6591796875, -2.53466796875, -2.41015625, -2.28564453125, -2.1611328125, -2.03662109375, -1.912109375, -1.78759765625, -1.6630859375, -1.53857421875, -1.4140625, -1.28955078125, -1.1650390625, -1.04052734375, -0.916015625, -0.79150390625, -0.6669921875, -0.54248046875, -0.41796875, -0.29345703125, -0.1689453125, -0.04443359375, 0.080078125, 0.20458984375, 0.3291015625, 0.45361328125, 0.578125, 0.70263671875, 0.8271484375, 0.95166015625, 1.076171875, 1.20068359375, 1.3251953125, 1.44970703125, 1.57421875, 1.69873046875, 1.8232421875, 1.94775390625, 2.072265625, 2.19677734375, 2.3212890625, 2.44580078125, 2.5703125, 2.69482421875, 2.8193359375, 2.94384765625, 3.068359375, 3.19287109375, 3.3173828125, 3.44189453125, 3.56640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 7.0, 3.0, 13.0, 5.0, 16.0, 24.0, 37.0, 51.0, 67.0, 121.0, 139.0, 137.0, 97.0, 71.0, 36.0, 40.0, 28.0, 24.0, 17.0, 11.0, 11.0, 3.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008206367492675781, -0.0007902011275291443, -0.0007597655057907104, -0.0007293298840522766, -0.0006988942623138428, -0.0006684586405754089, -0.0006380230188369751, -0.0006075873970985413, -0.0005771517753601074, -0.0005467161536216736, -0.0005162805318832397, -0.0004858449101448059, -0.00045540928840637207, -0.00042497366666793823, -0.0003945380449295044, -0.00036410242319107056, -0.0003336668014526367, -0.0003032311797142029, -0.00027279555797576904, -0.0002423599362373352, -0.00021192431449890137, -0.00018148869276046753, -0.0001510530710220337, -0.00012061744928359985, -9.018182754516602e-05, -5.974620580673218e-05, -2.931058406829834e-05, 1.125037670135498e-06, 3.1560659408569336e-05, 6.199628114700317e-05, 9.243190288543701e-05, 0.00012286752462387085, 0.0001533031463623047, 0.00018373876810073853, 0.00021417438983917236, 0.0002446100115776062, 0.00027504563331604004, 0.0003054812550544739, 0.0003359168767929077, 0.00036635249853134155, 0.0003967881202697754, 0.00042722374200820923, 0.00045765936374664307, 0.0004880949854850769, 0.0005185306072235107, 0.0005489662289619446, 0.0005794018507003784, 0.0006098374724388123, 0.0006402730941772461, 0.0006707087159156799, 0.0007011443376541138, 0.0007315799593925476, 0.0007620155811309814, 0.0007924512028694153, 0.0008228868246078491, 0.000853322446346283, 0.0008837580680847168, 0.0009141936898231506, 0.0009446293115615845, 0.0009750649333000183, 0.0010055005550384521, 0.001035936176776886, 0.0010663717985153198, 0.0010968074202537537, 0.0011272430419921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 6.0, 13.0, 27.0, 27.0, 26.0, 61.0, 112.0, 140.0, 281.0, 545.0, 1076.0, 2853.0, 8762.0, 38471.0, 257245.0, 656813.0, 62328.0, 13004.0, 3849.0, 1441.0, 693.0, 303.0, 170.0, 89.0, 56.0, 46.0, 33.0, 18.0, 12.0, 17.0, 6.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.40087890625, -4.2548828125, -4.10888671875, -3.962890625, -3.81689453125, -3.6708984375, -3.52490234375, -3.37890625, -3.23291015625, -3.0869140625, -2.94091796875, -2.794921875, -2.64892578125, -2.5029296875, -2.35693359375, -2.2109375, -2.06494140625, -1.9189453125, -1.77294921875, -1.626953125, -1.48095703125, -1.3349609375, -1.18896484375, -1.04296875, -0.89697265625, -0.7509765625, -0.60498046875, -0.458984375, -0.31298828125, -0.1669921875, -0.02099609375, 0.125, 0.27099609375, 0.4169921875, 0.56298828125, 0.708984375, 0.85498046875, 1.0009765625, 1.14697265625, 1.29296875, 1.43896484375, 1.5849609375, 1.73095703125, 1.876953125, 2.02294921875, 2.1689453125, 2.31494140625, 2.4609375, 2.60693359375, 2.7529296875, 2.89892578125, 3.044921875, 3.19091796875, 3.3369140625, 3.48291015625, 3.62890625, 3.77490234375, 3.9208984375, 4.06689453125, 4.212890625, 4.35888671875, 4.5048828125, 4.65087890625, 4.796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 10.0, 4.0, 4.0, 14.0, 13.0, 11.0, 20.0, 17.0, 21.0, 31.0, 42.0, 71.0, 80.0, 121.0, 101.0, 118.0, 82.0, 70.0, 47.0, 23.0, 26.0, 9.0, 14.0, 13.0, 11.0, 5.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46484375, -3.327880859375, -3.19091796875, -3.053955078125, -2.9169921875, -2.780029296875, -2.64306640625, -2.506103515625, -2.369140625, -2.232177734375, -2.09521484375, -1.958251953125, -1.8212890625, -1.684326171875, -1.54736328125, -1.410400390625, -1.2734375, -1.136474609375, -0.99951171875, -0.862548828125, -0.7255859375, -0.588623046875, -0.45166015625, -0.314697265625, -0.177734375, -0.040771484375, 0.09619140625, 0.233154296875, 0.3701171875, 0.507080078125, 0.64404296875, 0.781005859375, 0.91796875, 1.054931640625, 1.19189453125, 1.328857421875, 1.4658203125, 1.602783203125, 1.73974609375, 1.876708984375, 2.013671875, 2.150634765625, 2.28759765625, 2.424560546875, 2.5615234375, 2.698486328125, 2.83544921875, 2.972412109375, 3.109375, 3.246337890625, 3.38330078125, 3.520263671875, 3.6572265625, 3.794189453125, 3.93115234375, 4.068115234375, 4.205078125, 4.342041015625, 4.47900390625, 4.615966796875, 4.7529296875, 4.889892578125, 5.02685546875, 5.163818359375, 5.30078125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 16.0, 17.0, 36.0, 67.0, 80.0, 163.0, 279.0, 138.0, 72.0, 51.0, 24.0, 14.0, 9.0, 7.0, 7.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.70768737792969, -98.24492645263672, -94.78215789794922, -91.31939697265625, -87.85663604736328, -84.39387512207031, -80.93110656738281, -77.46834564208984, -74.00558471679688, -70.5428237915039, -67.0800552368164, -63.61729431152344, -60.15453338623047, -56.691768646240234, -53.22900390625, -49.76624298095703, -46.30347442626953, -42.8407096862793, -39.37794876098633, -35.915184020996094, -32.452423095703125, -28.98965835571289, -25.526893615722656, -22.064130783081055, -18.601367950439453, -15.138605117797852, -11.675841331481934, -8.213077545166016, -4.750314712524414, -1.2875518798828125, 2.175212860107422, 5.637975692749023, 9.100730895996094, 12.563493728637695, 16.026256561279297, 19.48902130126953, 22.951784133911133, 26.414546966552734, 29.87731170654297, 33.34007263183594, 36.80283737182617, 40.265602111816406, 43.728363037109375, 47.19112777709961, 50.653892517089844, 54.11665344238281, 57.57941818237305, 61.04218292236328, 64.50494384765625, 67.96770477294922, 71.43047332763672, 74.89323425292969, 78.35599517822266, 81.81875610351562, 85.28152465820312, 88.7442855834961, 92.20704650878906, 95.66980743408203, 99.13257598876953, 102.5953369140625, 106.05809783935547, 109.52085876464844, 112.98362731933594, 116.4463882446289, 119.9091567993164]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 10.0, 8.0, 11.0, 11.0, 14.0, 18.0, 26.0, 23.0, 37.0, 29.0, 37.0, 34.0, 53.0, 55.0, 92.0, 87.0, 82.0, 41.0, 41.0, 32.0, 33.0, 16.0, 33.0, 29.0, 20.0, 11.0, 16.0, 8.0, 14.0, 8.0, 12.0, 4.0, 6.0, 6.0, 7.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.31713104248047, -71.57486724853516, -68.83260345458984, -66.09033966064453, -63.34807205200195, -60.60580825805664, -57.86354064941406, -55.12127685546875, -52.37901306152344, -49.636749267578125, -46.89448547363281, -44.152217864990234, -41.40995407104492, -38.66769027709961, -35.92542266845703, -33.18315887451172, -30.440895080566406, -27.698631286621094, -24.95636558532715, -22.214099884033203, -19.47183609008789, -16.729572296142578, -13.987306594848633, -11.245040893554688, -8.502777099609375, -5.760512351989746, -3.018247604370117, -0.2759828567504883, 2.4662818908691406, 5.2085466384887695, 7.950811386108398, 10.693077087402344, 13.435333251953125, 16.177597045898438, 18.919862747192383, 21.662128448486328, 24.40439224243164, 27.146656036376953, 29.8889217376709, 32.631187438964844, 35.373451232910156, 38.11571502685547, 40.85797882080078, 43.60024642944336, 46.34251022338867, 49.084774017333984, 51.82704162597656, 54.569305419921875, 57.31156921386719, 60.0538330078125, 62.79609680175781, 65.53836059570312, 68.28062438964844, 71.02289581298828, 73.7651596069336, 76.5074234008789, 79.24968719482422, 81.99195098876953, 84.73421478271484, 87.47647857666016, 90.21875, 92.96101379394531, 95.70327758789062, 98.44554138183594, 101.18780517578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 5.0, 8.0, 19.0, 15.0, 29.0, 16.0, 25.0, 59.0, 90.0, 122.0, 243.0, 413.0, 827.0, 1853.0, 4663.0, 13079.0, 44434.0, 203458.0, 1163725.0, 2155327.0, 484111.0, 86792.0, 21827.0, 7460.0, 3049.0, 1285.0, 582.0, 309.0, 158.0, 91.0, 57.0, 39.0, 26.0, 23.0, 8.0, 10.0, 9.0, 6.0, 7.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.68359375, -7.43768310546875, -7.1917724609375, -6.94586181640625, -6.699951171875, -6.45404052734375, -6.2081298828125, -5.96221923828125, -5.71630859375, -5.47039794921875, -5.2244873046875, -4.97857666015625, -4.732666015625, -4.48675537109375, -4.2408447265625, -3.99493408203125, -3.7490234375, -3.50311279296875, -3.2572021484375, -3.01129150390625, -2.765380859375, -2.51947021484375, -2.2735595703125, -2.02764892578125, -1.78173828125, -1.53582763671875, -1.2899169921875, -1.04400634765625, -0.798095703125, -0.55218505859375, -0.3062744140625, -0.06036376953125, 0.185546875, 0.43145751953125, 0.6773681640625, 0.92327880859375, 1.169189453125, 1.41510009765625, 1.6610107421875, 1.90692138671875, 2.15283203125, 2.39874267578125, 2.6446533203125, 2.89056396484375, 3.136474609375, 3.38238525390625, 3.6282958984375, 3.87420654296875, 4.1201171875, 4.36602783203125, 4.6119384765625, 4.85784912109375, 5.103759765625, 5.34967041015625, 5.5955810546875, 5.84149169921875, 6.08740234375, 6.33331298828125, 6.5792236328125, 6.82513427734375, 7.071044921875, 7.31695556640625, 7.5628662109375, 7.80877685546875, 8.0546875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 8.0, 7.0, 8.0, 8.0, 5.0, 5.0, 8.0, 8.0, 10.0, 12.0, 19.0, 23.0, 15.0, 34.0, 32.0, 33.0, 34.0, 34.0, 38.0, 30.0, 44.0, 51.0, 45.0, 43.0, 43.0, 32.0, 53.0, 43.0, 33.0, 41.0, 30.0, 28.0, 25.0, 17.0, 15.0, 10.0, 7.0, 16.0, 11.0, 10.0, 7.0, 8.0, 10.0, 7.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.08984375, -4.9139404296875, -4.738037109375, -4.5621337890625, -4.38623046875, -4.2103271484375, -4.034423828125, -3.8585205078125, -3.6826171875, -3.5067138671875, -3.330810546875, -3.1549072265625, -2.97900390625, -2.8031005859375, -2.627197265625, -2.4512939453125, -2.275390625, -2.0994873046875, -1.923583984375, -1.7476806640625, -1.57177734375, -1.3958740234375, -1.219970703125, -1.0440673828125, -0.8681640625, -0.6922607421875, -0.516357421875, -0.3404541015625, -0.16455078125, 0.0113525390625, 0.187255859375, 0.3631591796875, 0.5390625, 0.7149658203125, 0.890869140625, 1.0667724609375, 1.24267578125, 1.4185791015625, 1.594482421875, 1.7703857421875, 1.9462890625, 2.1221923828125, 2.298095703125, 2.4739990234375, 2.64990234375, 2.8258056640625, 3.001708984375, 3.1776123046875, 3.353515625, 3.5294189453125, 3.705322265625, 3.8812255859375, 4.05712890625, 4.2330322265625, 4.408935546875, 4.5848388671875, 4.7607421875, 4.9366455078125, 5.112548828125, 5.2884521484375, 5.46435546875, 5.6402587890625, 5.816162109375, 5.9920654296875, 6.16796875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 10.0, 13.0, 31.0, 56.0, 92.0, 233.0, 499.0, 1254.0, 6213.0, 168780.0, 3955904.0, 55378.0, 3891.0, 1044.0, 467.0, 201.0, 95.0, 52.0, 26.0, 11.0, 15.0, 2.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.28125, -32.31298828125, -31.3447265625, -30.37646484375, -29.408203125, -28.43994140625, -27.4716796875, -26.50341796875, -25.53515625, -24.56689453125, -23.5986328125, -22.63037109375, -21.662109375, -20.69384765625, -19.7255859375, -18.75732421875, -17.7890625, -16.82080078125, -15.8525390625, -14.88427734375, -13.916015625, -12.94775390625, -11.9794921875, -11.01123046875, -10.04296875, -9.07470703125, -8.1064453125, -7.13818359375, -6.169921875, -5.20166015625, -4.2333984375, -3.26513671875, -2.296875, -1.32861328125, -0.3603515625, 0.60791015625, 1.576171875, 2.54443359375, 3.5126953125, 4.48095703125, 5.44921875, 6.41748046875, 7.3857421875, 8.35400390625, 9.322265625, 10.29052734375, 11.2587890625, 12.22705078125, 13.1953125, 14.16357421875, 15.1318359375, 16.10009765625, 17.068359375, 18.03662109375, 19.0048828125, 19.97314453125, 20.94140625, 21.90966796875, 22.8779296875, 23.84619140625, 24.814453125, 25.78271484375, 26.7509765625, 27.71923828125, 28.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 7.0, 17.0, 19.0, 32.0, 66.0, 142.0, 299.0, 706.0, 1103.0, 860.0, 384.0, 199.0, 98.0, 54.0, 26.0, 30.0, 12.0, 8.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.53125, -20.8056640625, -20.080078125, -19.3544921875, -18.62890625, -17.9033203125, -17.177734375, -16.4521484375, -15.7265625, -15.0009765625, -14.275390625, -13.5498046875, -12.82421875, -12.0986328125, -11.373046875, -10.6474609375, -9.921875, -9.1962890625, -8.470703125, -7.7451171875, -7.01953125, -6.2939453125, -5.568359375, -4.8427734375, -4.1171875, -3.3916015625, -2.666015625, -1.9404296875, -1.21484375, -0.4892578125, 0.236328125, 0.9619140625, 1.6875, 2.4130859375, 3.138671875, 3.8642578125, 4.58984375, 5.3154296875, 6.041015625, 6.7666015625, 7.4921875, 8.2177734375, 8.943359375, 9.6689453125, 10.39453125, 11.1201171875, 11.845703125, 12.5712890625, 13.296875, 14.0224609375, 14.748046875, 15.4736328125, 16.19921875, 16.9248046875, 17.650390625, 18.3759765625, 19.1015625, 19.8271484375, 20.552734375, 21.2783203125, 22.00390625, 22.7294921875, 23.455078125, 24.1806640625, 24.90625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 14.0, 23.0, 52.0, 91.0, 169.0, 167.0, 182.0, 126.0, 66.0, 49.0, 16.0, 16.0, 12.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.00992202758789, -49.64582443237305, -45.28172302246094, -40.917625427246094, -36.55352783203125, -32.18942642211914, -27.825328826904297, -23.46122932434082, -19.097129821777344, -14.733030319213867, -10.368931770324707, -6.004833221435547, -1.6407337188720703, 2.7233657836914062, 7.08746337890625, 11.451562881469727, 15.815662384033203, 20.17976188659668, 24.543861389160156, 28.907958984375, 33.272056579589844, 37.63615798950195, 42.0002555847168, 46.364356994628906, 50.72845458984375, 55.092552185058594, 59.4566535949707, 63.82075119018555, 68.18485260009766, 72.5489501953125, 76.91304779052734, 81.27714538574219, 85.64125061035156, 90.0053482055664, 94.36944580078125, 98.73355102539062, 103.09764862060547, 107.46174621582031, 111.82584381103516, 116.18994140625, 120.55404663085938, 124.91814422607422, 129.28224182128906, 133.64634704589844, 138.01043701171875, 142.37454223632812, 146.7386474609375, 151.1027374267578, 155.46682739257812, 159.8309326171875, 164.1950225830078, 168.5591278076172, 172.9232177734375, 177.28732299804688, 181.65142822265625, 186.01551818847656, 190.37962341308594, 194.7437286376953, 199.10781860351562, 203.471923828125, 207.8360137939453, 212.2001190185547, 216.564208984375, 220.92831420898438, 225.29241943359375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 10.0, 6.0, 10.0, 8.0, 11.0, 12.0, 18.0, 21.0, 17.0, 28.0, 20.0, 28.0, 30.0, 28.0, 51.0, 47.0, 41.0, 39.0, 42.0, 38.0, 29.0, 37.0, 37.0, 31.0, 36.0, 42.0, 39.0, 42.0, 36.0, 23.0, 18.0, 27.0, 20.0, 12.0, 14.0, 13.0, 9.0, 7.0, 6.0, 4.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 3.0], "bins": [-69.38880920410156, -67.54672241210938, -65.70463562011719, -63.862552642822266, -62.020469665527344, -60.178382873535156, -58.33629608154297, -56.49421310424805, -54.652130126953125, -52.81004333496094, -50.967960357666016, -49.12587356567383, -47.283790588378906, -45.44170379638672, -43.59961700439453, -41.75753402709961, -39.91544723510742, -38.073360443115234, -36.23127746582031, -34.389190673828125, -32.5471076965332, -30.705020904541016, -28.86293601989746, -27.020851135253906, -25.17876625061035, -23.336681365966797, -21.494596481323242, -19.652511596679688, -17.8104248046875, -15.968340873718262, -14.12625503540039, -12.284170150756836, -10.442085266113281, -8.600000381469727, -6.757915019989014, -4.915829658508301, -3.073744773864746, -1.2316598892211914, 0.6104259490966797, 2.4525108337402344, 4.294595718383789, 6.136680603027344, 7.978765964508057, 9.82085132598877, 11.662936210632324, 13.505021095275879, 15.34710693359375, 17.189191818237305, 19.03127670288086, 20.873361587524414, 22.71544647216797, 24.557533264160156, 26.399616241455078, 28.241703033447266, 30.08378791809082, 31.925872802734375, 33.76795959472656, 35.61004638671875, 37.45212936401367, 39.29421615600586, 41.13629913330078, 42.97838592529297, 44.820472717285156, 46.66255569458008, 48.504638671875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 11.0, 25.0, 26.0, 33.0, 58.0, 66.0, 133.0, 176.0, 330.0, 554.0, 891.0, 1486.0, 2826.0, 5237.0, 10286.0, 21499.0, 46144.0, 107498.0, 247769.0, 316470.0, 159475.0, 67420.0, 30203.0, 14330.0, 7079.0, 3674.0, 2028.0, 1097.0, 625.0, 392.0, 253.0, 144.0, 106.0, 52.0, 58.0, 30.0, 14.0, 17.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5703125, -8.3123779296875, -8.054443359375, -7.7965087890625, -7.53857421875, -7.2806396484375, -7.022705078125, -6.7647705078125, -6.5068359375, -6.2489013671875, -5.990966796875, -5.7330322265625, -5.47509765625, -5.2171630859375, -4.959228515625, -4.7012939453125, -4.443359375, -4.1854248046875, -3.927490234375, -3.6695556640625, -3.41162109375, -3.1536865234375, -2.895751953125, -2.6378173828125, -2.3798828125, -2.1219482421875, -1.864013671875, -1.6060791015625, -1.34814453125, -1.0902099609375, -0.832275390625, -0.5743408203125, -0.31640625, -0.0584716796875, 0.199462890625, 0.4573974609375, 0.71533203125, 0.9732666015625, 1.231201171875, 1.4891357421875, 1.7470703125, 2.0050048828125, 2.262939453125, 2.5208740234375, 2.77880859375, 3.0367431640625, 3.294677734375, 3.5526123046875, 3.810546875, 4.0684814453125, 4.326416015625, 4.5843505859375, 4.84228515625, 5.1002197265625, 5.358154296875, 5.6160888671875, 5.8740234375, 6.1319580078125, 6.389892578125, 6.6478271484375, 6.90576171875, 7.1636962890625, 7.421630859375, 7.6795654296875, 7.9375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 9.0, 11.0, 11.0, 14.0, 19.0, 24.0, 26.0, 22.0, 30.0, 27.0, 33.0, 39.0, 39.0, 49.0, 48.0, 40.0, 41.0, 35.0, 57.0, 57.0, 43.0, 38.0, 46.0, 25.0, 32.0, 27.0, 23.0, 25.0, 23.0, 15.0, 11.0, 10.0, 8.0, 14.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.375, -5.16705322265625, -4.9591064453125, -4.75115966796875, -4.543212890625, -4.33526611328125, -4.1273193359375, -3.91937255859375, -3.71142578125, -3.50347900390625, -3.2955322265625, -3.08758544921875, -2.879638671875, -2.67169189453125, -2.4637451171875, -2.25579833984375, -2.0478515625, -1.83990478515625, -1.6319580078125, -1.42401123046875, -1.216064453125, -1.00811767578125, -0.8001708984375, -0.59222412109375, -0.38427734375, -0.17633056640625, 0.0316162109375, 0.23956298828125, 0.447509765625, 0.65545654296875, 0.8634033203125, 1.07135009765625, 1.279296875, 1.48724365234375, 1.6951904296875, 1.90313720703125, 2.111083984375, 2.31903076171875, 2.5269775390625, 2.73492431640625, 2.94287109375, 3.15081787109375, 3.3587646484375, 3.56671142578125, 3.774658203125, 3.98260498046875, 4.1905517578125, 4.39849853515625, 4.6064453125, 4.81439208984375, 5.0223388671875, 5.23028564453125, 5.438232421875, 5.64617919921875, 5.8541259765625, 6.06207275390625, 6.27001953125, 6.47796630859375, 6.6859130859375, 6.89385986328125, 7.101806640625, 7.30975341796875, 7.5177001953125, 7.72564697265625, 7.93359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 13.0, 12.0, 17.0, 19.0, 22.0, 29.0, 44.0, 55.0, 67.0, 79.0, 128.0, 188.0, 240.0, 356.0, 469.0, 833.0, 1298.0, 2555.0, 5930.0, 19158.0, 90359.0, 702475.0, 175880.0, 32004.0, 8728.0, 3332.0, 1539.0, 824.0, 532.0, 367.0, 279.0, 184.0, 125.0, 96.0, 79.0, 66.0, 35.0, 36.0, 31.0, 17.0, 9.0, 12.0, 9.0, 7.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-16.1875, -15.692138671875, -15.19677734375, -14.701416015625, -14.2060546875, -13.710693359375, -13.21533203125, -12.719970703125, -12.224609375, -11.729248046875, -11.23388671875, -10.738525390625, -10.2431640625, -9.747802734375, -9.25244140625, -8.757080078125, -8.26171875, -7.766357421875, -7.27099609375, -6.775634765625, -6.2802734375, -5.784912109375, -5.28955078125, -4.794189453125, -4.298828125, -3.803466796875, -3.30810546875, -2.812744140625, -2.3173828125, -1.822021484375, -1.32666015625, -0.831298828125, -0.3359375, 0.159423828125, 0.65478515625, 1.150146484375, 1.6455078125, 2.140869140625, 2.63623046875, 3.131591796875, 3.626953125, 4.122314453125, 4.61767578125, 5.113037109375, 5.6083984375, 6.103759765625, 6.59912109375, 7.094482421875, 7.58984375, 8.085205078125, 8.58056640625, 9.075927734375, 9.5712890625, 10.066650390625, 10.56201171875, 11.057373046875, 11.552734375, 12.048095703125, 12.54345703125, 13.038818359375, 13.5341796875, 14.029541015625, 14.52490234375, 15.020263671875, 15.515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 2.0, 8.0, 8.0, 9.0, 7.0, 14.0, 18.0, 20.0, 13.0, 15.0, 16.0, 33.0, 27.0, 44.0, 48.0, 43.0, 49.0, 53.0, 48.0, 48.0, 55.0, 51.0, 54.0, 38.0, 40.0, 30.0, 40.0, 32.0, 18.0, 25.0, 16.0, 17.0, 8.0, 11.0, 6.0, 5.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.265625, -22.525634765625, -21.78564453125, -21.045654296875, -20.3056640625, -19.565673828125, -18.82568359375, -18.085693359375, -17.345703125, -16.605712890625, -15.86572265625, -15.125732421875, -14.3857421875, -13.645751953125, -12.90576171875, -12.165771484375, -11.42578125, -10.685791015625, -9.94580078125, -9.205810546875, -8.4658203125, -7.725830078125, -6.98583984375, -6.245849609375, -5.505859375, -4.765869140625, -4.02587890625, -3.285888671875, -2.5458984375, -1.805908203125, -1.06591796875, -0.325927734375, 0.4140625, 1.154052734375, 1.89404296875, 2.634033203125, 3.3740234375, 4.114013671875, 4.85400390625, 5.593994140625, 6.333984375, 7.073974609375, 7.81396484375, 8.553955078125, 9.2939453125, 10.033935546875, 10.77392578125, 11.513916015625, 12.25390625, 12.993896484375, 13.73388671875, 14.473876953125, 15.2138671875, 15.953857421875, 16.69384765625, 17.433837890625, 18.173828125, 18.913818359375, 19.65380859375, 20.393798828125, 21.1337890625, 21.873779296875, 22.61376953125, 23.353759765625, 24.09375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 7.0, 8.0, 6.0, 22.0, 19.0, 25.0, 40.0, 69.0, 103.0, 135.0, 202.0, 371.0, 597.0, 1159.0, 2912.0, 8607.0, 33010.0, 243241.0, 691136.0, 48553.0, 11279.0, 3629.0, 1516.0, 778.0, 406.0, 208.0, 146.0, 92.0, 70.0, 59.0, 44.0, 23.0, 19.0, 19.0, 4.0, 15.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.34375, -4.21258544921875, -4.0814208984375, -3.95025634765625, -3.819091796875, -3.68792724609375, -3.5567626953125, -3.42559814453125, -3.29443359375, -3.16326904296875, -3.0321044921875, -2.90093994140625, -2.769775390625, -2.63861083984375, -2.5074462890625, -2.37628173828125, -2.2451171875, -2.11395263671875, -1.9827880859375, -1.85162353515625, -1.720458984375, -1.58929443359375, -1.4581298828125, -1.32696533203125, -1.19580078125, -1.06463623046875, -0.9334716796875, -0.80230712890625, -0.671142578125, -0.53997802734375, -0.4088134765625, -0.27764892578125, -0.146484375, -0.01531982421875, 0.1158447265625, 0.24700927734375, 0.378173828125, 0.50933837890625, 0.6405029296875, 0.77166748046875, 0.90283203125, 1.03399658203125, 1.1651611328125, 1.29632568359375, 1.427490234375, 1.55865478515625, 1.6898193359375, 1.82098388671875, 1.9521484375, 2.08331298828125, 2.2144775390625, 2.34564208984375, 2.476806640625, 2.60797119140625, 2.7391357421875, 2.87030029296875, 3.00146484375, 3.13262939453125, 3.2637939453125, 3.39495849609375, 3.526123046875, 3.65728759765625, 3.7884521484375, 3.91961669921875, 4.05078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 7.0, 5.0, 6.0, 7.0, 7.0, 9.0, 16.0, 16.0, 24.0, 41.0, 75.0, 126.0, 198.0, 158.0, 99.0, 57.0, 35.0, 18.0, 9.0, 12.0, 9.0, 13.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 2.0, 7.0, 2.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0013914108276367188, -0.0013515353202819824, -0.001311659812927246, -0.0012717843055725098, -0.0012319087982177734, -0.0011920332908630371, -0.0011521577835083008, -0.0011122822761535645, -0.0010724067687988281, -0.0010325312614440918, -0.0009926557540893555, -0.0009527802467346191, -0.0009129047393798828, -0.0008730292320251465, -0.0008331537246704102, -0.0007932782173156738, -0.0007534027099609375, -0.0007135272026062012, -0.0006736516952514648, -0.0006337761878967285, -0.0005939006805419922, -0.0005540251731872559, -0.0005141496658325195, -0.0004742741584777832, -0.0004343986511230469, -0.00039452314376831055, -0.0003546476364135742, -0.0003147721290588379, -0.00027489662170410156, -0.00023502111434936523, -0.0001951456069946289, -0.00015527009963989258, -0.00011539459228515625, -7.551908493041992e-05, -3.5643577575683594e-05, 4.231929779052734e-06, 4.410743713378906e-05, 8.398294448852539e-05, 0.00012385845184326172, 0.00016373395919799805, 0.00020360946655273438, 0.0002434849739074707, 0.00028336048126220703, 0.00032323598861694336, 0.0003631114959716797, 0.000402987003326416, 0.00044286251068115234, 0.00048273801803588867, 0.000522613525390625, 0.0005624890327453613, 0.0006023645401000977, 0.000642240047454834, 0.0006821155548095703, 0.0007219910621643066, 0.000761866569519043, 0.0008017420768737793, 0.0008416175842285156, 0.000881493091583252, 0.0009213685989379883, 0.0009612441062927246, 0.001001119613647461, 0.0010409951210021973, 0.0010808706283569336, 0.00112074613571167, 0.0011606216430664062]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 9.0, 14.0, 23.0, 34.0, 49.0, 49.0, 122.0, 160.0, 252.0, 469.0, 721.0, 1406.0, 2937.0, 7127.0, 21524.0, 89898.0, 718839.0, 155312.0, 31829.0, 9968.0, 3811.0, 1780.0, 867.0, 477.0, 314.0, 210.0, 104.0, 85.0, 58.0, 29.0, 16.0, 19.0, 5.0, 7.0, 8.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.162109375, -3.038848876953125, -2.91558837890625, -2.792327880859375, -2.6690673828125, -2.545806884765625, -2.42254638671875, -2.299285888671875, -2.176025390625, -2.052764892578125, -1.92950439453125, -1.806243896484375, -1.6829833984375, -1.559722900390625, -1.43646240234375, -1.313201904296875, -1.18994140625, -1.066680908203125, -0.94342041015625, -0.820159912109375, -0.6968994140625, -0.573638916015625, -0.45037841796875, -0.327117919921875, -0.203857421875, -0.080596923828125, 0.04266357421875, 0.165924072265625, 0.2891845703125, 0.412445068359375, 0.53570556640625, 0.658966064453125, 0.7822265625, 0.905487060546875, 1.02874755859375, 1.152008056640625, 1.2752685546875, 1.398529052734375, 1.52178955078125, 1.645050048828125, 1.768310546875, 1.891571044921875, 2.01483154296875, 2.138092041015625, 2.2613525390625, 2.384613037109375, 2.50787353515625, 2.631134033203125, 2.75439453125, 2.877655029296875, 3.00091552734375, 3.124176025390625, 3.2474365234375, 3.370697021484375, 3.49395751953125, 3.617218017578125, 3.740478515625, 3.863739013671875, 3.98699951171875, 4.110260009765625, 4.2335205078125, 4.356781005859375, 4.48004150390625, 4.603302001953125, 4.7265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 4.0, 12.0, 4.0, 14.0, 6.0, 14.0, 15.0, 18.0, 28.0, 33.0, 29.0, 48.0, 57.0, 77.0, 100.0, 102.0, 88.0, 63.0, 59.0, 41.0, 40.0, 31.0, 13.0, 18.0, 14.0, 13.0, 10.0, 9.0, 3.0, 5.0, 0.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.357421875, -3.24249267578125, -3.1275634765625, -3.01263427734375, -2.897705078125, -2.78277587890625, -2.6678466796875, -2.55291748046875, -2.43798828125, -2.32305908203125, -2.2081298828125, -2.09320068359375, -1.978271484375, -1.86334228515625, -1.7484130859375, -1.63348388671875, -1.5185546875, -1.40362548828125, -1.2886962890625, -1.17376708984375, -1.058837890625, -0.94390869140625, -0.8289794921875, -0.71405029296875, -0.59912109375, -0.48419189453125, -0.3692626953125, -0.25433349609375, -0.139404296875, -0.02447509765625, 0.0904541015625, 0.20538330078125, 0.3203125, 0.43524169921875, 0.5501708984375, 0.66510009765625, 0.780029296875, 0.89495849609375, 1.0098876953125, 1.12481689453125, 1.23974609375, 1.35467529296875, 1.4696044921875, 1.58453369140625, 1.699462890625, 1.81439208984375, 1.9293212890625, 2.04425048828125, 2.1591796875, 2.27410888671875, 2.3890380859375, 2.50396728515625, 2.618896484375, 2.73382568359375, 2.8487548828125, 2.96368408203125, 3.07861328125, 3.19354248046875, 3.3084716796875, 3.42340087890625, 3.538330078125, 3.65325927734375, 3.7681884765625, 3.88311767578125, 3.998046875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 8.0, 18.0, 34.0, 90.0, 216.0, 325.0, 136.0, 74.0, 41.0, 17.0, 10.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.99158477783203, -110.41474151611328, -105.837890625, -101.26104736328125, -96.68419647216797, -92.10735321044922, -87.53050231933594, -82.95365905761719, -78.37681579589844, -73.79997253417969, -69.2231216430664, -64.64627838134766, -60.069427490234375, -55.492584228515625, -50.91573715209961, -46.338890075683594, -41.76203918457031, -37.1851921081543, -32.60834503173828, -28.0314998626709, -23.454652786254883, -18.877805709838867, -14.300960540771484, -9.724113464355469, -5.147266387939453, -0.5704197883605957, 4.006426811218262, 8.583272933959961, 13.160120010375977, 17.736967086791992, 22.313812255859375, 26.89065933227539, 31.467514038085938, 36.04436111450195, 40.62120819091797, 45.19805145263672, 49.77490234375, 54.35174560546875, 58.928592681884766, 63.50543975830078, 68.08229064941406, 72.65913391113281, 77.2359848022461, 81.81282806396484, 86.38967895507812, 90.96652221679688, 95.54336547851562, 100.1202163696289, 104.69705963134766, 109.2739028930664, 113.85075378417969, 118.42759704589844, 123.00444793701172, 127.58129119873047, 132.15814208984375, 136.7349853515625, 141.31182861328125, 145.888671875, 150.46551513671875, 155.04237365722656, 159.6192169189453, 164.19606018066406, 168.7729034423828, 173.34976196289062, 177.92660522460938]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 4.0, 5.0, 9.0, 9.0, 11.0, 13.0, 8.0, 19.0, 26.0, 21.0, 21.0, 32.0, 40.0, 49.0, 47.0, 84.0, 174.0, 94.0, 44.0, 52.0, 23.0, 36.0, 33.0, 20.0, 19.0, 26.0, 18.0, 16.0, 11.0, 8.0, 14.0, 8.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.46981811523438, -116.02001953125, -112.57022094726562, -109.12042236328125, -105.67062377929688, -102.2208251953125, -98.77102661132812, -95.32122802734375, -91.87142944335938, -88.421630859375, -84.97183227539062, -81.52203369140625, -78.07223510742188, -74.6224365234375, -71.17263793945312, -67.72283935546875, -64.27304077148438, -60.8232421875, -57.373443603515625, -53.92364501953125, -50.473846435546875, -47.0240478515625, -43.574249267578125, -40.12445068359375, -36.674652099609375, -33.224853515625, -29.775054931640625, -26.32525634765625, -22.875457763671875, -19.4256591796875, -15.975860595703125, -12.52606201171875, -9.076271057128906, -5.626472473144531, -2.1766738891601562, 1.2731246948242188, 4.722923278808594, 8.172721862792969, 11.622520446777344, 15.072319030761719, 18.522117614746094, 21.97191619873047, 25.421714782714844, 28.87151336669922, 32.321311950683594, 35.77111053466797, 39.220909118652344, 42.67070770263672, 46.120506286621094, 49.57030487060547, 53.020103454589844, 56.46990203857422, 59.919700622558594, 63.36949920654297, 66.81929779052734, 70.26909637451172, 73.7188949584961, 77.16869354248047, 80.61849212646484, 84.06829071044922, 87.5180892944336, 90.96788787841797, 94.41768646240234, 97.86748504638672, 101.3172836303711]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 7.0, 12.0, 14.0, 23.0, 37.0, 51.0, 68.0, 107.0, 170.0, 263.0, 461.0, 721.0, 1332.0, 2413.0, 5202.0, 13192.0, 38842.0, 145421.0, 664665.0, 1884817.0, 1078980.0, 267061.0, 58702.0, 17638.0, 6932.0, 3176.0, 1674.0, 864.0, 505.0, 308.0, 198.0, 117.0, 98.0, 75.0, 31.0, 36.0, 18.0, 13.0, 7.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3203125, -7.055908203125, -6.79150390625, -6.527099609375, -6.2626953125, -5.998291015625, -5.73388671875, -5.469482421875, -5.205078125, -4.940673828125, -4.67626953125, -4.411865234375, -4.1474609375, -3.883056640625, -3.61865234375, -3.354248046875, -3.08984375, -2.825439453125, -2.56103515625, -2.296630859375, -2.0322265625, -1.767822265625, -1.50341796875, -1.239013671875, -0.974609375, -0.710205078125, -0.44580078125, -0.181396484375, 0.0830078125, 0.347412109375, 0.61181640625, 0.876220703125, 1.140625, 1.405029296875, 1.66943359375, 1.933837890625, 2.1982421875, 2.462646484375, 2.72705078125, 2.991455078125, 3.255859375, 3.520263671875, 3.78466796875, 4.049072265625, 4.3134765625, 4.577880859375, 4.84228515625, 5.106689453125, 5.37109375, 5.635498046875, 5.89990234375, 6.164306640625, 6.4287109375, 6.693115234375, 6.95751953125, 7.221923828125, 7.486328125, 7.750732421875, 8.01513671875, 8.279541015625, 8.5439453125, 8.808349609375, 9.07275390625, 9.337158203125, 9.6015625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 12.0, 17.0, 17.0, 24.0, 27.0, 27.0, 27.0, 28.0, 50.0, 42.0, 42.0, 38.0, 67.0, 63.0, 63.0, 71.0, 57.0, 45.0, 44.0, 46.0, 27.0, 39.0, 25.0, 18.0, 19.0, 11.0, 11.0, 6.0, 9.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.78399658203125, -6.5484619140625, -6.31292724609375, -6.077392578125, -5.84185791015625, -5.6063232421875, -5.37078857421875, -5.13525390625, -4.89971923828125, -4.6641845703125, -4.42864990234375, -4.193115234375, -3.95758056640625, -3.7220458984375, -3.48651123046875, -3.2509765625, -3.01544189453125, -2.7799072265625, -2.54437255859375, -2.308837890625, -2.07330322265625, -1.8377685546875, -1.60223388671875, -1.36669921875, -1.13116455078125, -0.8956298828125, -0.66009521484375, -0.424560546875, -0.18902587890625, 0.0465087890625, 0.28204345703125, 0.517578125, 0.75311279296875, 0.9886474609375, 1.22418212890625, 1.459716796875, 1.69525146484375, 1.9307861328125, 2.16632080078125, 2.40185546875, 2.63739013671875, 2.8729248046875, 3.10845947265625, 3.343994140625, 3.57952880859375, 3.8150634765625, 4.05059814453125, 4.2861328125, 4.52166748046875, 4.7572021484375, 4.99273681640625, 5.228271484375, 5.46380615234375, 5.6993408203125, 5.93487548828125, 6.17041015625, 6.40594482421875, 6.6414794921875, 6.87701416015625, 7.112548828125, 7.34808349609375, 7.5836181640625, 7.81915283203125, 8.0546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 10.0, 5.0, 12.0, 16.0, 31.0, 51.0, 70.0, 134.0, 291.0, 514.0, 1307.0, 4316.0, 55335.0, 4032539.0, 91390.0, 5384.0, 1506.0, 643.0, 322.0, 166.0, 91.0, 68.0, 29.0, 25.0, 17.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -46.1337890625, -44.798828125, -43.4638671875, -42.12890625, -40.7939453125, -39.458984375, -38.1240234375, -36.7890625, -35.4541015625, -34.119140625, -32.7841796875, -31.44921875, -30.1142578125, -28.779296875, -27.4443359375, -26.109375, -24.7744140625, -23.439453125, -22.1044921875, -20.76953125, -19.4345703125, -18.099609375, -16.7646484375, -15.4296875, -14.0947265625, -12.759765625, -11.4248046875, -10.08984375, -8.7548828125, -7.419921875, -6.0849609375, -4.75, -3.4150390625, -2.080078125, -0.7451171875, 0.58984375, 1.9248046875, 3.259765625, 4.5947265625, 5.9296875, 7.2646484375, 8.599609375, 9.9345703125, 11.26953125, 12.6044921875, 13.939453125, 15.2744140625, 16.609375, 17.9443359375, 19.279296875, 20.6142578125, 21.94921875, 23.2841796875, 24.619140625, 25.9541015625, 27.2890625, 28.6240234375, 29.958984375, 31.2939453125, 32.62890625, 33.9638671875, 35.298828125, 36.6337890625, 37.96875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 14.0, 19.0, 37.0, 41.0, 68.0, 107.0, 164.0, 280.0, 510.0, 693.0, 736.0, 539.0, 329.0, 185.0, 114.0, 69.0, 60.0, 34.0, 18.0, 10.0, 7.0, 5.0, 6.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2890625, -13.5413818359375, -12.793701171875, -12.0460205078125, -11.29833984375, -10.5506591796875, -9.802978515625, -9.0552978515625, -8.3076171875, -7.5599365234375, -6.812255859375, -6.0645751953125, -5.31689453125, -4.5692138671875, -3.821533203125, -3.0738525390625, -2.326171875, -1.5784912109375, -0.830810546875, -0.0831298828125, 0.66455078125, 1.4122314453125, 2.159912109375, 2.9075927734375, 3.6552734375, 4.4029541015625, 5.150634765625, 5.8983154296875, 6.64599609375, 7.3936767578125, 8.141357421875, 8.8890380859375, 9.63671875, 10.3843994140625, 11.132080078125, 11.8797607421875, 12.62744140625, 13.3751220703125, 14.122802734375, 14.8704833984375, 15.6181640625, 16.3658447265625, 17.113525390625, 17.8612060546875, 18.60888671875, 19.3565673828125, 20.104248046875, 20.8519287109375, 21.599609375, 22.3472900390625, 23.094970703125, 23.8426513671875, 24.59033203125, 25.3380126953125, 26.085693359375, 26.8333740234375, 27.5810546875, 28.3287353515625, 29.076416015625, 29.8240966796875, 30.57177734375, 31.3194580078125, 32.067138671875, 32.8148193359375, 33.5625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 11.0, 32.0, 48.0, 97.0, 163.0, 205.0, 167.0, 98.0, 56.0, 29.0, 24.0, 12.0, 10.0, 9.0, 4.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-207.5370330810547, -200.26132202148438, -192.985595703125, -185.7098846435547, -178.43417358398438, -171.158447265625, -163.8827362060547, -156.60702514648438, -149.331298828125, -142.0555877685547, -134.7798614501953, -127.504150390625, -120.22843170166016, -112.95271301269531, -105.677001953125, -98.40128326416016, -91.12556457519531, -83.84984588623047, -76.57412719726562, -69.29841613769531, -62.02269744873047, -54.746978759765625, -47.47126388549805, -40.19554901123047, -32.919830322265625, -25.644113540649414, -18.368396759033203, -11.092679977416992, -3.8169631958007812, 3.4587554931640625, 10.73447036743164, 18.01018524169922, 25.285888671875, 32.561607360839844, 39.83732223510742, 47.113037109375, 54.388755798339844, 61.66447448730469, 68.940185546875, 76.21590423583984, 83.49162292480469, 90.76734161376953, 98.04306030273438, 105.31877136230469, 112.59449005126953, 119.87020874023438, 127.14591979980469, 134.421630859375, 141.69735717773438, 148.9730682373047, 156.24879455566406, 163.52450561523438, 170.80023193359375, 178.07594299316406, 185.35165405273438, 192.62738037109375, 199.90309143066406, 207.17880249023438, 214.45452880859375, 221.73023986816406, 229.00595092773438, 236.28167724609375, 243.55738830566406, 250.83309936523438, 258.10882568359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 5.0, 8.0, 10.0, 16.0, 24.0, 15.0, 26.0, 35.0, 26.0, 43.0, 48.0, 42.0, 49.0, 57.0, 54.0, 74.0, 73.0, 63.0, 44.0, 45.0, 37.0, 26.0, 42.0, 30.0, 15.0, 10.0, 24.0, 15.0, 14.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.83439636230469, -111.25556182861328, -107.67672729492188, -104.097900390625, -100.5190658569336, -96.94023132324219, -93.36140441894531, -89.7825698852539, -86.2037353515625, -82.6249008178711, -79.04606628417969, -75.46723937988281, -71.8884048461914, -68.3095703125, -64.73074340820312, -61.15190887451172, -57.57307434082031, -53.994239807128906, -50.415409088134766, -46.836578369140625, -43.25774383544922, -39.67890930175781, -36.10007858276367, -32.52124786376953, -28.942413330078125, -25.36358070373535, -21.784748077392578, -18.205915451049805, -14.627082824707031, -11.048250198364258, -7.469417572021484, -3.890584945678711, -0.3117523193359375, 3.267080307006836, 6.845912933349609, 10.424745559692383, 14.003578186035156, 17.58241081237793, 21.161243438720703, 24.740076065063477, 28.31890869140625, 31.897741317749023, 35.4765739440918, 39.05540466308594, 42.634239196777344, 46.21307373046875, 49.79190444946289, 53.37073516845703, 56.94956970214844, 60.528404235839844, 64.10723876953125, 67.68606567382812, 71.26490020751953, 74.84373474121094, 78.42256164550781, 82.00139617919922, 85.58023071289062, 89.15906524658203, 92.73789978027344, 96.31672668457031, 99.89556121826172, 103.47439575195312, 107.05322265625, 110.6320571899414, 114.21089172363281]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 9.0, 20.0, 28.0, 40.0, 54.0, 98.0, 147.0, 244.0, 395.0, 749.0, 1325.0, 2420.0, 5059.0, 11947.0, 32751.0, 107814.0, 434833.0, 323947.0, 81777.0, 25787.0, 9880.0, 4349.0, 2229.0, 1083.0, 602.0, 340.0, 215.0, 157.0, 79.0, 54.0, 32.0, 21.0, 14.0, 14.0, 10.0, 3.0, 11.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.6875, -11.3426513671875, -10.997802734375, -10.6529541015625, -10.30810546875, -9.9632568359375, -9.618408203125, -9.2735595703125, -8.9287109375, -8.5838623046875, -8.239013671875, -7.8941650390625, -7.54931640625, -7.2044677734375, -6.859619140625, -6.5147705078125, -6.169921875, -5.8250732421875, -5.480224609375, -5.1353759765625, -4.79052734375, -4.4456787109375, -4.100830078125, -3.7559814453125, -3.4111328125, -3.0662841796875, -2.721435546875, -2.3765869140625, -2.03173828125, -1.6868896484375, -1.342041015625, -0.9971923828125, -0.65234375, -0.3074951171875, 0.037353515625, 0.3822021484375, 0.72705078125, 1.0718994140625, 1.416748046875, 1.7615966796875, 2.1064453125, 2.4512939453125, 2.796142578125, 3.1409912109375, 3.48583984375, 3.8306884765625, 4.175537109375, 4.5203857421875, 4.865234375, 5.2100830078125, 5.554931640625, 5.8997802734375, 6.24462890625, 6.5894775390625, 6.934326171875, 7.2791748046875, 7.6240234375, 7.9688720703125, 8.313720703125, 8.6585693359375, 9.00341796875, 9.3482666015625, 9.693115234375, 10.0379638671875, 10.3828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 11.0, 11.0, 16.0, 17.0, 23.0, 40.0, 37.0, 56.0, 74.0, 53.0, 57.0, 59.0, 81.0, 91.0, 74.0, 66.0, 53.0, 48.0, 32.0, 29.0, 31.0, 17.0, 9.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.15625, -12.8131103515625, -12.469970703125, -12.1268310546875, -11.78369140625, -11.4405517578125, -11.097412109375, -10.7542724609375, -10.4111328125, -10.0679931640625, -9.724853515625, -9.3817138671875, -9.03857421875, -8.6954345703125, -8.352294921875, -8.0091552734375, -7.666015625, -7.3228759765625, -6.979736328125, -6.6365966796875, -6.29345703125, -5.9503173828125, -5.607177734375, -5.2640380859375, -4.9208984375, -4.5777587890625, -4.234619140625, -3.8914794921875, -3.54833984375, -3.2052001953125, -2.862060546875, -2.5189208984375, -2.17578125, -1.8326416015625, -1.489501953125, -1.1463623046875, -0.80322265625, -0.4600830078125, -0.116943359375, 0.2261962890625, 0.5693359375, 0.9124755859375, 1.255615234375, 1.5987548828125, 1.94189453125, 2.2850341796875, 2.628173828125, 2.9713134765625, 3.314453125, 3.6575927734375, 4.000732421875, 4.3438720703125, 4.68701171875, 5.0301513671875, 5.373291015625, 5.7164306640625, 6.0595703125, 6.4027099609375, 6.745849609375, 7.0889892578125, 7.43212890625, 7.7752685546875, 8.118408203125, 8.4615478515625, 8.8046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 9.0, 10.0, 18.0, 17.0, 34.0, 74.0, 144.0, 270.0, 513.0, 1448.0, 7221.0, 143702.0, 871230.0, 19599.0, 2698.0, 809.0, 330.0, 165.0, 93.0, 62.0, 36.0, 19.0, 22.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.6875, -24.936767578125, -24.18603515625, -23.435302734375, -22.6845703125, -21.933837890625, -21.18310546875, -20.432373046875, -19.681640625, -18.930908203125, -18.18017578125, -17.429443359375, -16.6787109375, -15.927978515625, -15.17724609375, -14.426513671875, -13.67578125, -12.925048828125, -12.17431640625, -11.423583984375, -10.6728515625, -9.922119140625, -9.17138671875, -8.420654296875, -7.669921875, -6.919189453125, -6.16845703125, -5.417724609375, -4.6669921875, -3.916259765625, -3.16552734375, -2.414794921875, -1.6640625, -0.913330078125, -0.16259765625, 0.588134765625, 1.3388671875, 2.089599609375, 2.84033203125, 3.591064453125, 4.341796875, 5.092529296875, 5.84326171875, 6.593994140625, 7.3447265625, 8.095458984375, 8.84619140625, 9.596923828125, 10.34765625, 11.098388671875, 11.84912109375, 12.599853515625, 13.3505859375, 14.101318359375, 14.85205078125, 15.602783203125, 16.353515625, 17.104248046875, 17.85498046875, 18.605712890625, 19.3564453125, 20.107177734375, 20.85791015625, 21.608642578125, 22.359375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 4.0, 4.0, 10.0, 10.0, 7.0, 21.0, 18.0, 25.0, 31.0, 34.0, 31.0, 59.0, 55.0, 69.0, 82.0, 104.0, 94.0, 62.0, 71.0, 33.0, 36.0, 23.0, 23.0, 24.0, 16.0, 10.0, 12.0, 6.0, 6.0, 5.0, 4.0, 6.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.40625, -29.2861328125, -28.166015625, -27.0458984375, -25.92578125, -24.8056640625, -23.685546875, -22.5654296875, -21.4453125, -20.3251953125, -19.205078125, -18.0849609375, -16.96484375, -15.8447265625, -14.724609375, -13.6044921875, -12.484375, -11.3642578125, -10.244140625, -9.1240234375, -8.00390625, -6.8837890625, -5.763671875, -4.6435546875, -3.5234375, -2.4033203125, -1.283203125, -0.1630859375, 0.95703125, 2.0771484375, 3.197265625, 4.3173828125, 5.4375, 6.5576171875, 7.677734375, 8.7978515625, 9.91796875, 11.0380859375, 12.158203125, 13.2783203125, 14.3984375, 15.5185546875, 16.638671875, 17.7587890625, 18.87890625, 19.9990234375, 21.119140625, 22.2392578125, 23.359375, 24.4794921875, 25.599609375, 26.7197265625, 27.83984375, 28.9599609375, 30.080078125, 31.2001953125, 32.3203125, 33.4404296875, 34.560546875, 35.6806640625, 36.80078125, 37.9208984375, 39.041015625, 40.1611328125, 41.28125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 12.0, 16.0, 19.0, 32.0, 46.0, 51.0, 95.0, 117.0, 198.0, 337.0, 668.0, 1625.0, 4243.0, 15585.0, 93085.0, 865799.0, 50555.0, 10305.0, 3263.0, 1116.0, 552.0, 268.0, 182.0, 105.0, 64.0, 62.0, 41.0, 33.0, 21.0, 13.0, 8.0, 4.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.079925537109375, -2.01141357421875, -1.942901611328125, -1.8743896484375, -1.805877685546875, -1.73736572265625, -1.668853759765625, -1.600341796875, -1.531829833984375, -1.46331787109375, -1.394805908203125, -1.3262939453125, -1.257781982421875, -1.18927001953125, -1.120758056640625, -1.05224609375, -0.983734130859375, -0.91522216796875, -0.846710205078125, -0.7781982421875, -0.709686279296875, -0.64117431640625, -0.572662353515625, -0.504150390625, -0.435638427734375, -0.36712646484375, -0.298614501953125, -0.2301025390625, -0.161590576171875, -0.09307861328125, -0.024566650390625, 0.0439453125, 0.112457275390625, 0.18096923828125, 0.249481201171875, 0.3179931640625, 0.386505126953125, 0.45501708984375, 0.523529052734375, 0.592041015625, 0.660552978515625, 0.72906494140625, 0.797576904296875, 0.8660888671875, 0.934600830078125, 1.00311279296875, 1.071624755859375, 1.14013671875, 1.208648681640625, 1.27716064453125, 1.345672607421875, 1.4141845703125, 1.482696533203125, 1.55120849609375, 1.619720458984375, 1.688232421875, 1.756744384765625, 1.82525634765625, 1.893768310546875, 1.9622802734375, 2.030792236328125, 2.09930419921875, 2.167816162109375, 2.236328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 9.0, 12.0, 13.0, 9.0, 7.0, 14.0, 25.0, 40.0, 54.0, 60.0, 73.0, 73.0, 106.0, 93.0, 102.0, 75.0, 40.0, 28.0, 29.0, 19.0, 16.0, 17.0, 14.0, 11.0, 6.0, 4.0, 11.0, 4.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00043463706970214844, -0.00042219460010528564, -0.00040975213050842285, -0.00039730966091156006, -0.00038486719131469727, -0.00037242472171783447, -0.0003599822521209717, -0.0003475397825241089, -0.0003350973129272461, -0.0003226548433303833, -0.0003102123737335205, -0.0002977699041366577, -0.0002853274345397949, -0.00027288496494293213, -0.00026044249534606934, -0.00024800002574920654, -0.00023555755615234375, -0.00022311508655548096, -0.00021067261695861816, -0.00019823014736175537, -0.00018578767776489258, -0.00017334520816802979, -0.000160902738571167, -0.0001484602689743042, -0.0001360177993774414, -0.0001235753297805786, -0.00011113286018371582, -9.869039058685303e-05, -8.624792098999023e-05, -7.380545139312744e-05, -6.136298179626465e-05, -4.8920512199401855e-05, -3.647804260253906e-05, -2.403557300567627e-05, -1.1593103408813477e-05, 8.493661880493164e-07, 1.329183578491211e-05, 2.5734305381774902e-05, 3.8176774978637695e-05, 5.061924457550049e-05, 6.306171417236328e-05, 7.550418376922607e-05, 8.794665336608887e-05, 0.00010038912296295166, 0.00011283159255981445, 0.00012527406215667725, 0.00013771653175354004, 0.00015015900135040283, 0.00016260147094726562, 0.00017504394054412842, 0.0001874864101409912, 0.000199928879737854, 0.0002123713493347168, 0.0002248138189315796, 0.00023725628852844238, 0.0002496987581253052, 0.00026214122772216797, 0.00027458369731903076, 0.00028702616691589355, 0.00029946863651275635, 0.00031191110610961914, 0.00032435357570648193, 0.0003367960453033447, 0.0003492385149002075, 0.0003616809844970703]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 10.0, 13.0, 17.0, 34.0, 55.0, 80.0, 143.0, 199.0, 368.0, 570.0, 956.0, 1721.0, 3644.0, 8081.0, 19753.0, 63347.0, 691905.0, 196624.0, 36423.0, 13154.0, 5582.0, 2580.0, 1309.0, 761.0, 467.0, 276.0, 174.0, 105.0, 61.0, 33.0, 29.0, 12.0, 15.0, 12.0, 6.0, 5.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.308074951171875, -1.26263427734375, -1.217193603515625, -1.1717529296875, -1.126312255859375, -1.08087158203125, -1.035430908203125, -0.989990234375, -0.944549560546875, -0.89910888671875, -0.853668212890625, -0.8082275390625, -0.762786865234375, -0.71734619140625, -0.671905517578125, -0.62646484375, -0.581024169921875, -0.53558349609375, -0.490142822265625, -0.4447021484375, -0.399261474609375, -0.35382080078125, -0.308380126953125, -0.262939453125, -0.217498779296875, -0.17205810546875, -0.126617431640625, -0.0811767578125, -0.035736083984375, 0.00970458984375, 0.055145263671875, 0.1005859375, 0.146026611328125, 0.19146728515625, 0.236907958984375, 0.2823486328125, 0.327789306640625, 0.37322998046875, 0.418670654296875, 0.464111328125, 0.509552001953125, 0.55499267578125, 0.600433349609375, 0.6458740234375, 0.691314697265625, 0.73675537109375, 0.782196044921875, 0.82763671875, 0.873077392578125, 0.91851806640625, 0.963958740234375, 1.0093994140625, 1.054840087890625, 1.10028076171875, 1.145721435546875, 1.191162109375, 1.236602783203125, 1.28204345703125, 1.327484130859375, 1.3729248046875, 1.418365478515625, 1.46380615234375, 1.509246826171875, 1.5546875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 10.0, 8.0, 14.0, 14.0, 23.0, 28.0, 38.0, 33.0, 36.0, 65.0, 64.0, 101.0, 99.0, 101.0, 81.0, 57.0, 47.0, 42.0, 28.0, 19.0, 18.0, 8.0, 18.0, 13.0, 7.0, 5.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.337860107421875, -2.26165771484375, -2.185455322265625, -2.1092529296875, -2.033050537109375, -1.95684814453125, -1.880645751953125, -1.804443359375, -1.728240966796875, -1.65203857421875, -1.575836181640625, -1.4996337890625, -1.423431396484375, -1.34722900390625, -1.271026611328125, -1.19482421875, -1.118621826171875, -1.04241943359375, -0.966217041015625, -0.8900146484375, -0.813812255859375, -0.73760986328125, -0.661407470703125, -0.585205078125, -0.509002685546875, -0.43280029296875, -0.356597900390625, -0.2803955078125, -0.204193115234375, -0.12799072265625, -0.051788330078125, 0.0244140625, 0.100616455078125, 0.17681884765625, 0.253021240234375, 0.3292236328125, 0.405426025390625, 0.48162841796875, 0.557830810546875, 0.634033203125, 0.710235595703125, 0.78643798828125, 0.862640380859375, 0.9388427734375, 1.015045166015625, 1.09124755859375, 1.167449951171875, 1.24365234375, 1.319854736328125, 1.39605712890625, 1.472259521484375, 1.5484619140625, 1.624664306640625, 1.70086669921875, 1.777069091796875, 1.853271484375, 1.929473876953125, 2.00567626953125, 2.081878662109375, 2.1580810546875, 2.234283447265625, 2.31048583984375, 2.386688232421875, 2.462890625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 7.0, 27.0, 77.0, 268.0, 542.0, 55.0, 17.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-281.5025939941406, -273.7172546386719, -265.93194580078125, -258.1466064453125, -250.36126708984375, -242.57594299316406, -234.79061889648438, -227.00527954101562, -219.21994018554688, -211.4346160888672, -203.64927673339844, -195.86395263671875, -188.07861328125, -180.2932891845703, -172.50796508789062, -164.72262573242188, -156.9373016357422, -149.1519775390625, -141.36663818359375, -133.58131408691406, -125.79597473144531, -118.01065063476562, -110.2253189086914, -102.43998718261719, -94.65465545654297, -86.86932373046875, -79.08399200439453, -71.29866027832031, -63.51333236694336, -55.72800064086914, -47.94267272949219, -40.15734100341797, -32.37202453613281, -24.586692810058594, -16.801362991333008, -9.016033172607422, -1.2307014465332031, 6.554630279541016, 14.339958190917969, 22.125289916992188, 29.910621643066406, 37.695953369140625, 45.481285095214844, 53.2666130065918, 61.051944732666016, 68.8372802734375, 76.62260437011719, 84.4079360961914, 92.19326782226562, 99.97859954833984, 107.76393127441406, 115.54925537109375, 123.3345947265625, 131.1199188232422, 138.90524291992188, 146.69058227539062, 154.47592163085938, 162.26124572753906, 170.0465850830078, 177.8319091796875, 185.61724853515625, 193.40257263183594, 201.18789672851562, 208.97323608398438, 216.75856018066406]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 9.0, 19.0, 13.0, 12.0, 23.0, 27.0, 20.0, 27.0, 17.0, 44.0, 118.0, 237.0, 155.0, 50.0, 25.0, 22.0, 31.0, 18.0, 16.0, 15.0, 17.0, 15.0, 10.0, 13.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.02637481689453, -67.87860107421875, -64.73082733154297, -61.58305358886719, -58.435279846191406, -55.287506103515625, -52.13973617553711, -48.99196243286133, -45.84418869018555, -42.696414947509766, -39.548641204833984, -36.40087127685547, -33.25309753417969, -30.105321884155273, -26.957550048828125, -23.809776306152344, -20.662002563476562, -17.51422882080078, -14.366456031799316, -11.218683242797852, -8.07090950012207, -4.923135757446289, -1.7753639221191406, 1.3724098205566406, 4.520183563232422, 7.667956829071045, 10.815730094909668, 13.963502883911133, 17.111276626586914, 20.259050369262695, 23.406822204589844, 26.554595947265625, 29.702377319335938, 32.85015106201172, 35.9979248046875, 39.14569854736328, 42.29347229003906, 45.441246032714844, 48.58901596069336, 51.73678970336914, 54.88456344604492, 58.0323371887207, 61.180110931396484, 64.327880859375, 67.47565460205078, 70.62342834472656, 73.77120208740234, 76.91897583007812, 80.0667495727539, 83.21452331542969, 86.36229705810547, 89.51007080078125, 92.65784454345703, 95.80561828613281, 98.95338439941406, 102.10116577148438, 105.24893188476562, 108.3967056274414, 111.54447937011719, 114.69225311279297, 117.84002685546875, 120.98780059814453, 124.13557434082031, 127.28334045410156, 130.43112182617188]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 11.0, 2.0, 8.0, 13.0, 11.0, 19.0, 13.0, 21.0, 25.0, 25.0, 31.0, 30.0, 36.0, 52.0, 253.0, 153.0, 49.0, 32.0, 36.0, 37.0, 19.0, 27.0, 18.0, 13.0, 22.0, 13.0, 6.0, 11.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.94317626953125, -6.7027587890625, -6.46234130859375, -6.221923828125, -5.98150634765625, -5.7410888671875, -5.50067138671875, -5.26025390625, -5.01983642578125, -4.7794189453125, -4.53900146484375, -4.298583984375, -4.05816650390625, -3.8177490234375, -3.57733154296875, -3.3369140625, -3.09649658203125, -2.8560791015625, -2.61566162109375, -2.375244140625, -2.13482666015625, -1.8944091796875, -1.65399169921875, -1.41357421875, -1.17315673828125, -0.9327392578125, -0.69232177734375, -0.451904296875, -0.21148681640625, 0.0289306640625, 0.26934814453125, 0.509765625, 0.75018310546875, 0.9906005859375, 1.23101806640625, 1.471435546875, 1.71185302734375, 1.9522705078125, 2.19268798828125, 2.43310546875, 2.67352294921875, 2.9139404296875, 3.15435791015625, 3.394775390625, 3.63519287109375, 3.8756103515625, 4.11602783203125, 4.3564453125, 4.59686279296875, 4.8372802734375, 5.07769775390625, 5.318115234375, 5.55853271484375, 5.7989501953125, 6.03936767578125, 6.27978515625, 6.52020263671875, 6.7606201171875, 7.00103759765625, 7.241455078125, 7.48187255859375, 7.7222900390625, 7.96270751953125, 8.203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 4.0, 11.0, 12.0, 21.0, 31.0, 31.0, 90.0, 263.0, 1107.0, 9481.0, 8364348.0, 11551.0, 1142.0, 269.0, 93.0, 46.0, 18.0, 17.0, 14.0, 4.0, 12.0, 9.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-145.31378173828125, -141.224365234375, -137.1349639892578, -133.04556274414062, -128.95614624023438, -124.86673736572266, -120.77732849121094, -116.68791961669922, -112.5985107421875, -108.50910186767578, -104.41969299316406, -100.33028411865234, -96.24087524414062, -92.1514663696289, -88.06205749511719, -83.97264862060547, -79.88323974609375, -75.79383087158203, -71.70442199707031, -67.6150131225586, -63.525604248046875, -59.436195373535156, -55.34678649902344, -51.25737762451172, -47.16796875, -43.07855987548828, -38.98915100097656, -34.899742126464844, -30.810333251953125, -26.720924377441406, -22.631515502929688, -18.54210662841797, -14.452682495117188, -10.363273620605469, -6.27386474609375, -2.1844558715820312, 1.9049530029296875, 5.994361877441406, 10.083770751953125, 14.173179626464844, 18.262588500976562, 22.35199737548828, 26.44140625, 30.53081512451172, 34.62022399902344, 38.709632873535156, 42.799041748046875, 46.888450622558594, 50.97785949707031, 55.06726837158203, 59.15667724609375, 63.24608612060547, 67.33549499511719, 71.4249038696289, 75.51431274414062, 79.60372161865234, 83.69313049316406, 87.78253936767578, 91.8719482421875, 95.96135711669922, 100.05076599121094, 104.14017486572266, 108.22958374023438, 112.3189926147461, 116.40840148925781]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 8.0, 5.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-116.07782745361328, -112.86913299560547, -109.66043090820312, -106.45173645019531, -103.2430419921875, -100.03434753417969, -96.82564544677734, -93.61695098876953, -90.40824890136719, -87.19955444335938, -83.99085235595703, -80.78215789794922, -77.5734634399414, -74.36476135253906, -71.15606689453125, -67.94737243652344, -64.73867797851562, -61.52997970581055, -58.321285247802734, -55.112586975097656, -51.903892517089844, -48.695194244384766, -45.48649597167969, -42.277801513671875, -39.0691032409668, -35.86040496826172, -32.651710510253906, -29.443012237548828, -26.234315872192383, -23.025619506835938, -19.81692123413086, -16.608224868774414, -13.399520874023438, -10.190824508666992, -6.9821271896362305, -3.7734298706054688, -0.5647335052490234, 2.643962860107422, 5.8526611328125, 9.061357498168945, 12.27005386352539, 15.478750228881836, 18.68744659423828, 21.89614486694336, 25.104841232299805, 28.31353759765625, 31.522235870361328, 34.730934143066406, 37.93962860107422, 41.1483268737793, 44.35702133178711, 47.56571960449219, 50.7744140625, 53.98311233520508, 57.191810607910156, 60.40050506591797, 63.60920333862305, 66.81790161132812, 70.02659606933594, 73.23529052734375, 76.4439926147461, 79.6526870727539, 82.86138916015625, 86.07008361816406, 89.27877807617188]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 0.0, 3.0, 2.0, 9.0, 3.0, 8.0, 16.0, 7.0, 26.0, 42.0, 47.0, 93.0, 133.0, 191.0, 257.0, 470.0, 799.0, 1462.0, 2731.0, 5202.0, 10180.0, 20929.0, 43150.0, 88235.0, 136945.0, 105723.0, 54781.0, 26228.0, 12830.0, 6456.0, 3360.0, 1689.0, 970.0, 523.0, 294.0, 194.0, 102.0, 63.0, 42.0, 22.0, 18.0, 15.0, 5.0, 8.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0], "bins": [-44.0625, -42.8603515625, -41.658203125, -40.4560546875, -39.25390625, -38.0517578125, -36.849609375, -35.6474609375, -34.4453125, -33.2431640625, -32.041015625, -30.8388671875, -29.63671875, -28.4345703125, -27.232421875, -26.0302734375, -24.828125, -23.6259765625, -22.423828125, -21.2216796875, -20.01953125, -18.8173828125, -17.615234375, -16.4130859375, -15.2109375, -14.0087890625, -12.806640625, -11.6044921875, -10.40234375, -9.2001953125, -7.998046875, -6.7958984375, -5.59375, -4.3916015625, -3.189453125, -1.9873046875, -0.78515625, 0.4169921875, 1.619140625, 2.8212890625, 4.0234375, 5.2255859375, 6.427734375, 7.6298828125, 8.83203125, 10.0341796875, 11.236328125, 12.4384765625, 13.640625, 14.8427734375, 16.044921875, 17.2470703125, 18.44921875, 19.6513671875, 20.853515625, 22.0556640625, 23.2578125, 24.4599609375, 25.662109375, 26.8642578125, 28.06640625, 29.2685546875, 30.470703125, 31.6728515625, 32.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 6.0, 9.0, 12.0, 10.0, 18.0, 28.0, 29.0, 44.0, 67.0, 70.0, 62.0, 92.0, 80.0, 97.0, 82.0, 71.0, 51.0, 53.0, 31.0, 27.0, 13.0, 22.0, 10.0, 5.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.921875, -12.5694580078125, -12.217041015625, -11.8646240234375, -11.51220703125, -11.1597900390625, -10.807373046875, -10.4549560546875, -10.1025390625, -9.7501220703125, -9.397705078125, -9.0452880859375, -8.69287109375, -8.3404541015625, -7.988037109375, -7.6356201171875, -7.283203125, -6.9307861328125, -6.578369140625, -6.2259521484375, -5.87353515625, -5.5211181640625, -5.168701171875, -4.8162841796875, -4.4638671875, -4.1114501953125, -3.759033203125, -3.4066162109375, -3.05419921875, -2.7017822265625, -2.349365234375, -1.9969482421875, -1.64453125, -1.2921142578125, -0.939697265625, -0.5872802734375, -0.23486328125, 0.1175537109375, 0.469970703125, 0.8223876953125, 1.1748046875, 1.5272216796875, 1.879638671875, 2.2320556640625, 2.58447265625, 2.9368896484375, 3.289306640625, 3.6417236328125, 3.994140625, 4.3465576171875, 4.698974609375, 5.0513916015625, 5.40380859375, 5.7562255859375, 6.108642578125, 6.4610595703125, 6.8134765625, 7.1658935546875, 7.518310546875, 7.8707275390625, 8.22314453125, 8.5755615234375, 8.927978515625, 9.2803955078125, 9.6328125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 1.0, 13.0, 11.0, 23.0, 21.0, 76.0, 130.0, 98.0, 50.0, 25.0, 17.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.0001220703125, -124.15399169921875, -121.307861328125, -118.46173095703125, -115.6156005859375, -112.76947021484375, -109.92333984375, -107.07720947265625, -104.2310791015625, -101.38494873046875, -98.538818359375, -95.69268798828125, -92.8465576171875, -90.00042724609375, -87.154296875, -84.30816650390625, -81.46202850341797, -78.61589813232422, -75.76976776123047, -72.92363739013672, -70.07750701904297, -67.23137664794922, -64.38523864746094, -61.53911209106445, -58.6929817199707, -55.84685134887695, -53.0007209777832, -50.15458679199219, -47.30845642089844, -44.46232604980469, -41.61619567871094, -38.77006530761719, -35.92394256591797, -33.07781219482422, -30.23168182373047, -27.385549545288086, -24.539419174194336, -21.693288803100586, -18.847156524658203, -16.001026153564453, -13.154895782470703, -10.308765411376953, -7.462634086608887, -4.61650276184082, -1.7703723907470703, 1.0757579803466797, 3.9218902587890625, 6.7680206298828125, 9.614151000976562, 12.460281372070312, 15.306412696838379, 18.152544021606445, 20.998674392700195, 23.844804763793945, 26.690937042236328, 29.537067413330078, 32.38319778442383, 35.22932815551758, 38.07545852661133, 40.921592712402344, 43.767723083496094, 46.613853454589844, 49.459983825683594, 52.306114196777344, 55.152244567871094]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 16.0, 12.0, 33.0, 71.0, 103.0, 95.0, 53.0, 27.0, 20.0, 10.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.629150390625, -56.844322204589844, -55.05949401855469, -53.27466583251953, -51.489837646484375, -49.70500946044922, -47.92018127441406, -46.135353088378906, -44.35052490234375, -42.565696716308594, -40.78086853027344, -38.99604034423828, -37.211212158203125, -35.42638397216797, -33.64155578613281, -31.85672950744629, -30.071903228759766, -28.28707504272461, -26.502246856689453, -24.717418670654297, -22.93259048461914, -21.147762298583984, -19.36293601989746, -17.578107833862305, -15.793279647827148, -14.008451461791992, -12.223623275756836, -10.438796043395996, -8.65396785736084, -6.869139671325684, -5.084312438964844, -3.2994842529296875, -1.5146560668945312, 0.2701718807220459, 2.054999828338623, 3.839827537536621, 5.624655723571777, 7.409483909606934, 9.194311141967773, 10.97913932800293, 12.763967514038086, 14.548795700073242, 16.3336238861084, 18.118450164794922, 19.903278350830078, 21.688106536865234, 23.47293472290039, 25.257762908935547, 27.042591094970703, 28.82741928100586, 30.612247467041016, 32.39707565307617, 34.18190383911133, 35.966732025146484, 37.751556396484375, 39.53638458251953, 41.32121276855469, 43.106040954589844, 44.890869140625, 46.675697326660156, 48.46052551269531, 50.24535369873047, 52.030181884765625, 53.81501007080078, 55.59983825683594]}, "eval/loss": 0.8678382039070129, "eval/wer": 0.14052423755382265, "eval/runtime": 1220.9888, "eval/samples_per_second": 2.164, "eval/steps_per_second": 0.271} \ No newline at end of file +{"train/loss": 0.3805, "train/learning_rate": 2.3942992874109263e-06, "train/epoch": 18.5, "train/global_step": 16500, "_runtime": 114636, "_timestamp": 1647488913, "_step": 16510, "gradients/decoder.cls.predictions.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 9.0, 7.0, 20.0, 30344.0, 81.0, 11.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.125, -147.578125, -143.03125, -138.484375, -133.9375, -129.390625, -124.84375, -120.296875, -115.75, -111.203125, -106.65625, -102.109375, -97.5625, -93.015625, -88.46875, -83.921875, -79.375, -74.828125, -70.28125, -65.734375, -61.1875, -56.640625, -52.09375, -47.546875, -43.0, -38.453125, -33.90625, -29.359375, -24.8125, -20.265625, -15.71875, -11.171875, -6.625, -2.078125, 2.46875, 7.015625, 11.5625, 16.109375, 20.65625, 25.203125, 29.75, 34.296875, 38.84375, 43.390625, 47.9375, 52.484375, 57.03125, 61.578125, 66.125, 70.671875, 75.21875, 79.765625, 84.3125, 88.859375, 93.40625, 97.953125, 102.5, 107.046875, 111.59375, 116.140625, 120.6875, 125.234375, 129.78125, 134.328125, 138.875]}, "gradients/decoder.cls.predictions.transform.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 4.0, 9.0, 12.0, 12.0, 13.0, 11.0, 20.0, 23.0, 14.0, 29.0, 32.0, 36.0, 41.0, 35.0, 33.0, 38.0, 43.0, 49.0, 44.0, 43.0, 52.0, 61.0, 42.0, 49.0, 32.0, 35.0, 22.0, 23.0, 24.0, 28.0, 19.0, 13.0, 15.0, 10.0, 7.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-63.42264175415039, -62.10611343383789, -60.789588928222656, -59.473060607910156, -58.156532287597656, -56.84000778198242, -55.52347946166992, -54.20695495605469, -52.89042663574219, -51.57389831542969, -50.25737380981445, -48.94084548950195, -47.62432098388672, -46.30779266357422, -44.99126434326172, -43.67473602294922, -42.358211517333984, -41.041683197021484, -39.72515869140625, -38.40863037109375, -37.09210205078125, -35.775577545166016, -34.459049224853516, -33.14252471923828, -31.82599639892578, -30.509469985961914, -29.192943572998047, -27.876415252685547, -26.55988883972168, -25.243362426757812, -23.926834106445312, -22.610307693481445, -21.293785095214844, -19.977258682250977, -18.66073226928711, -17.34420394897461, -16.027677536010742, -14.711151123046875, -13.394623756408691, -12.078096389770508, -10.76156997680664, -9.445043563842773, -8.12851619720459, -6.8119893074035645, -5.495462417602539, -4.178935527801514, -2.8624086380004883, -1.5458812713623047, -0.2293548583984375, 1.087172031402588, 2.4036989212036133, 3.7202258110046387, 5.036752700805664, 6.3532795906066895, 7.669806480407715, 8.986333847045898, 10.302860260009766, 11.619386672973633, 12.935914039611816, 14.25244140625, 15.568967819213867, 16.885494232177734, 18.202022552490234, 19.5185489654541, 20.83507537841797]}, "gradients/decoder.cls.predictions.transform.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 10.0, 3.0, 15.0, 23.0, 19.0, 23.0, 35.0, 27.0, 29.0, 26.0, 41.0, 28.0, 43.0, 47.0, 51.0, 57.0, 34.0, 48.0, 46.0, 47.0, 50.0, 33.0, 34.0, 29.0, 20.0, 28.0, 31.0, 24.0, 20.0, 11.0, 10.0, 11.0, 8.0, 8.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.79653549194336, -35.52540969848633, -34.2542839050293, -32.983158111572266, -31.712034225463867, -30.440908432006836, -29.169784545898438, -27.898658752441406, -26.627532958984375, -25.356407165527344, -24.085281372070312, -22.814157485961914, -21.543031692504883, -20.27190589904785, -19.000782012939453, -17.729656219482422, -16.45853042602539, -15.18740463256836, -13.916279792785645, -12.64515495300293, -11.374029159545898, -10.102903366088867, -8.831778526306152, -7.5606536865234375, -6.289527893066406, -5.018402576446533, -3.74727725982666, -2.476151943206787, -1.205026626586914, 0.06609869003295898, 1.337224006652832, 2.608348846435547, 3.8794784545898438, 5.150603771209717, 6.42172908782959, 7.692854404449463, 8.963979721069336, 10.235105514526367, 11.506230354309082, 12.777355194091797, 14.048480987548828, 15.31960678100586, 16.59073257446289, 17.86185646057129, 19.13298225402832, 20.40410804748535, 21.67523193359375, 22.94635772705078, 24.217483520507812, 25.488609313964844, 26.759735107421875, 28.030858993530273, 29.301984786987305, 30.573110580444336, 31.844234466552734, 33.115360260009766, 34.3864860534668, 35.65761184692383, 36.92873764038086, 38.19986343383789, 39.470985412597656, 40.74211120605469, 42.01323699951172, 43.28436279296875, 44.55548858642578]}, "gradients/decoder.cls.predictions.transform.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 8.0, 18.0, 40.0, 36.0, 64.0, 110.0, 149.0, 225.0, 356.0, 517.0, 791.0, 1178.0, 1786.0, 2775.0, 4168.0, 6169.0, 9284.0, 13129.0, 19126.0, 27131.0, 37481.0, 50007.0, 64518.0, 79362.0, 92999.0, 113192.0, 112222.0, 93945.0, 79706.0, 64437.0, 49698.0, 37285.0, 26728.0, 19286.0, 13274.0, 9185.0, 6051.0, 4034.0, 2686.0, 1851.0, 1217.0, 741.0, 526.0, 325.0, 297.0, 138.0, 112.0, 61.0, 48.0, 25.0, 16.0, 20.0, 7.0, 5.0, 3.0, 1.0, 2.0], "bins": [-129.375, -125.4541015625, -121.533203125, -117.6123046875, -113.69140625, -109.7705078125, -105.849609375, -101.9287109375, -98.0078125, -94.0869140625, -90.166015625, -86.2451171875, -82.32421875, -78.4033203125, -74.482421875, -70.5615234375, -66.640625, -62.7197265625, -58.798828125, -54.8779296875, -50.95703125, -47.0361328125, -43.115234375, -39.1943359375, -35.2734375, -31.3525390625, -27.431640625, -23.5107421875, -19.58984375, -15.6689453125, -11.748046875, -7.8271484375, -3.90625, 0.0146484375, 3.935546875, 7.8564453125, 11.77734375, 15.6982421875, 19.619140625, 23.5400390625, 27.4609375, 31.3818359375, 35.302734375, 39.2236328125, 43.14453125, 47.0654296875, 50.986328125, 54.9072265625, 58.828125, 62.7490234375, 66.669921875, 70.5908203125, 74.51171875, 78.4326171875, 82.353515625, 86.2744140625, 90.1953125, 94.1162109375, 98.037109375, 101.9580078125, 105.87890625, 109.7998046875, 113.720703125, 117.6416015625, 121.5625]}, "gradients/decoder.cls.predictions.transform.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 9.0, 14.0, 9.0, 14.0, 18.0, 21.0, 38.0, 33.0, 28.0, 30.0, 43.0, 42.0, 40.0, 41.0, 53.0, 69.0, 54.0, 51.0, 50.0, 31.0, 41.0, 27.0, 43.0, 31.0, 29.0, 14.0, 21.0, 15.0, 18.0, 13.0, 14.0, 6.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.90625, -61.88623046875, -59.8662109375, -57.84619140625, -55.826171875, -53.80615234375, -51.7861328125, -49.76611328125, -47.74609375, -45.72607421875, -43.7060546875, -41.68603515625, -39.666015625, -37.64599609375, -35.6259765625, -33.60595703125, -31.5859375, -29.56591796875, -27.5458984375, -25.52587890625, -23.505859375, -21.48583984375, -19.4658203125, -17.44580078125, -15.42578125, -13.40576171875, -11.3857421875, -9.36572265625, -7.345703125, -5.32568359375, -3.3056640625, -1.28564453125, 0.734375, 2.75439453125, 4.7744140625, 6.79443359375, 8.814453125, 10.83447265625, 12.8544921875, 14.87451171875, 16.89453125, 18.91455078125, 20.9345703125, 22.95458984375, 24.974609375, 26.99462890625, 29.0146484375, 31.03466796875, 33.0546875, 35.07470703125, 37.0947265625, 39.11474609375, 41.134765625, 43.15478515625, 45.1748046875, 47.19482421875, 49.21484375, 51.23486328125, 53.2548828125, 55.27490234375, 57.294921875, 59.31494140625, 61.3349609375, 63.35498046875, 65.375]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 9.0, 14.0, 11.0, 18.0, 23.0, 25.0, 29.0, 28.0, 35.0, 26.0, 38.0, 33.0, 42.0, 54.0, 56.0, 72.0, 56.0, 54.0, 55.0, 42.0, 40.0, 45.0, 33.0, 23.0, 31.0, 17.0, 9.0, 11.0, 12.0, 9.0, 13.0, 10.0, 6.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.490638732910156, -42.03007888793945, -40.56951904296875, -39.10895919799805, -37.648399353027344, -36.18783950805664, -34.72727966308594, -33.26671600341797, -31.8061580657959, -30.345598220825195, -28.885038375854492, -27.424476623535156, -25.963916778564453, -24.50335693359375, -23.042797088623047, -21.582237243652344, -20.12167739868164, -18.661117553710938, -17.200557708740234, -15.739996910095215, -14.279437065124512, -12.818877220153809, -11.358316421508789, -9.897756576538086, -8.437196731567383, -6.97663688659668, -5.516076564788818, -4.055516242980957, -2.594956398010254, -1.1343965530395508, 0.32616424560546875, 1.7867240905761719, 3.247283935546875, 4.707843780517578, 6.1684041023254395, 7.628964424133301, 9.089524269104004, 10.550084114074707, 12.010644912719727, 13.47120475769043, 14.931764602661133, 16.392324447631836, 17.85288429260254, 19.313446044921875, 20.774005889892578, 22.23456573486328, 23.695125579833984, 25.155685424804688, 26.61624526977539, 28.076805114746094, 29.537364959716797, 30.9979248046875, 32.4584846496582, 33.919044494628906, 35.379608154296875, 36.84016418457031, 38.30072784423828, 39.761287689208984, 41.22184753417969, 42.68240737915039, 44.142967224121094, 45.6035270690918, 47.0640869140625, 48.52465057373047, 49.985206604003906]}, "gradients/decoder.bert.encoder.layer.23.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 5.0, 9.0, 11.0, 13.0, 8.0, 19.0, 22.0, 26.0, 21.0, 28.0, 28.0, 35.0, 37.0, 39.0, 45.0, 28.0, 43.0, 37.0, 39.0, 43.0, 44.0, 38.0, 46.0, 31.0, 37.0, 27.0, 24.0, 24.0, 24.0, 28.0, 19.0, 19.0, 21.0, 14.0, 10.0, 11.0, 7.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.70409393310547, -34.49701690673828, -33.289939880371094, -32.082862854003906, -30.87578582763672, -29.66870880126953, -28.461631774902344, -27.254554748535156, -26.04747772216797, -24.84040069580078, -23.633323669433594, -22.426246643066406, -21.21916961669922, -20.01209259033203, -18.805015563964844, -17.597938537597656, -16.39086151123047, -15.183784484863281, -13.976707458496094, -12.769630432128906, -11.562553405761719, -10.355476379394531, -9.148399353027344, -7.941322326660156, -6.734245300292969, -5.527168273925781, -4.320091247558594, -3.1130142211914062, -1.9059371948242188, -0.6988601684570312, 0.5082168579101562, 1.7152938842773438, 2.9223709106445312, 4.129447937011719, 5.336524963378906, 6.543601989746094, 7.750679016113281, 8.957756042480469, 10.164833068847656, 11.371910095214844, 12.578987121582031, 13.786064147949219, 14.993141174316406, 16.200218200683594, 17.40729522705078, 18.61437225341797, 19.821449279785156, 21.028526306152344, 22.23560333251953, 23.44268035888672, 24.649757385253906, 25.856834411621094, 27.06391143798828, 28.27098846435547, 29.478065490722656, 30.685142517089844, 31.89221954345703, 33.09929656982422, 34.306373596191406, 35.513450622558594, 36.72052764892578, 37.92760467529297, 39.134681701660156, 40.341758728027344, 41.54883575439453]}, "gradients/decoder.bert.encoder.layer.23.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 8.0, 12.0, 22.0, 26.0, 31.0, 64.0, 92.0, 149.0, 267.0, 453.0, 685.0, 1115.0, 1799.0, 2812.0, 4686.0, 7410.0, 11981.0, 19643.0, 32215.0, 52192.0, 87367.0, 142774.0, 235755.0, 391251.0, 642794.0, 845113.0, 667734.0, 411125.0, 248148.0, 150716.0, 91502.0, 55878.0, 33992.0, 20831.0, 12831.0, 7851.0, 4932.0, 2954.0, 1842.0, 1240.0, 717.0, 477.0, 300.0, 203.0, 112.0, 84.0, 45.0, 21.0, 20.0, 8.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0625, -57.0634765625, -55.064453125, -53.0654296875, -51.06640625, -49.0673828125, -47.068359375, -45.0693359375, -43.0703125, -41.0712890625, -39.072265625, -37.0732421875, -35.07421875, -33.0751953125, -31.076171875, -29.0771484375, -27.078125, -25.0791015625, -23.080078125, -21.0810546875, -19.08203125, -17.0830078125, -15.083984375, -13.0849609375, -11.0859375, -9.0869140625, -7.087890625, -5.0888671875, -3.08984375, -1.0908203125, 0.908203125, 2.9072265625, 4.90625, 6.9052734375, 8.904296875, 10.9033203125, 12.90234375, 14.9013671875, 16.900390625, 18.8994140625, 20.8984375, 22.8974609375, 24.896484375, 26.8955078125, 28.89453125, 30.8935546875, 32.892578125, 34.8916015625, 36.890625, 38.8896484375, 40.888671875, 42.8876953125, 44.88671875, 46.8857421875, 48.884765625, 50.8837890625, 52.8828125, 54.8818359375, 56.880859375, 58.8798828125, 60.87890625, 62.8779296875, 64.876953125, 66.8759765625, 68.875]}, "gradients/decoder.bert.encoder.layer.23.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 10.0, 10.0, 13.0, 10.0, 6.0, 10.0, 20.0, 15.0, 18.0, 30.0, 37.0, 29.0, 37.0, 41.0, 36.0, 38.0, 43.0, 39.0, 30.0, 32.0, 44.0, 34.0, 41.0, 36.0, 36.0, 34.0, 34.0, 28.0, 29.0, 31.0, 18.0, 27.0, 11.0, 17.0, 9.0, 16.0, 10.0, 7.0, 11.0, 1.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.1875, -30.12646484375, -29.0654296875, -28.00439453125, -26.943359375, -25.88232421875, -24.8212890625, -23.76025390625, -22.69921875, -21.63818359375, -20.5771484375, -19.51611328125, -18.455078125, -17.39404296875, -16.3330078125, -15.27197265625, -14.2109375, -13.14990234375, -12.0888671875, -11.02783203125, -9.966796875, -8.90576171875, -7.8447265625, -6.78369140625, -5.72265625, -4.66162109375, -3.6005859375, -2.53955078125, -1.478515625, -0.41748046875, 0.6435546875, 1.70458984375, 2.765625, 3.82666015625, 4.8876953125, 5.94873046875, 7.009765625, 8.07080078125, 9.1318359375, 10.19287109375, 11.25390625, 12.31494140625, 13.3759765625, 14.43701171875, 15.498046875, 16.55908203125, 17.6201171875, 18.68115234375, 19.7421875, 20.80322265625, 21.8642578125, 22.92529296875, 23.986328125, 25.04736328125, 26.1083984375, 27.16943359375, 28.23046875, 29.29150390625, 30.3525390625, 31.41357421875, 32.474609375, 33.53564453125, 34.5966796875, 35.65771484375, 36.71875]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 2.0, 3.0, 7.0, 11.0, 12.0, 26.0, 49.0, 54.0, 92.0, 140.0, 180.0, 313.0, 525.0, 795.0, 1176.0, 1946.0, 2977.0, 4800.0, 7550.0, 11961.0, 19577.0, 31342.0, 50626.0, 82832.0, 131337.0, 209190.0, 323936.0, 487916.0, 665310.0, 686852.0, 520390.0, 349876.0, 225004.0, 142641.0, 88389.0, 55849.0, 34026.0, 20930.0, 13179.0, 8315.0, 5175.0, 3280.0, 2007.0, 1388.0, 829.0, 517.0, 320.0, 236.0, 134.0, 89.0, 62.0, 42.0, 32.0, 15.0, 16.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-40.90625, -39.59033203125, -38.2744140625, -36.95849609375, -35.642578125, -34.32666015625, -33.0107421875, -31.69482421875, -30.37890625, -29.06298828125, -27.7470703125, -26.43115234375, -25.115234375, -23.79931640625, -22.4833984375, -21.16748046875, -19.8515625, -18.53564453125, -17.2197265625, -15.90380859375, -14.587890625, -13.27197265625, -11.9560546875, -10.64013671875, -9.32421875, -8.00830078125, -6.6923828125, -5.37646484375, -4.060546875, -2.74462890625, -1.4287109375, -0.11279296875, 1.203125, 2.51904296875, 3.8349609375, 5.15087890625, 6.466796875, 7.78271484375, 9.0986328125, 10.41455078125, 11.73046875, 13.04638671875, 14.3623046875, 15.67822265625, 16.994140625, 18.31005859375, 19.6259765625, 20.94189453125, 22.2578125, 23.57373046875, 24.8896484375, 26.20556640625, 27.521484375, 28.83740234375, 30.1533203125, 31.46923828125, 32.78515625, 34.10107421875, 35.4169921875, 36.73291015625, 38.048828125, 39.36474609375, 40.6806640625, 41.99658203125, 43.3125]}, "gradients/decoder.bert.encoder.layer.23.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 9.0, 10.0, 17.0, 22.0, 22.0, 36.0, 37.0, 40.0, 65.0, 65.0, 72.0, 93.0, 110.0, 143.0, 152.0, 171.0, 195.0, 206.0, 239.0, 232.0, 259.0, 276.0, 224.0, 204.0, 183.0, 162.0, 120.0, 128.0, 101.0, 73.0, 91.0, 56.0, 50.0, 33.0, 29.0, 24.0, 26.0, 26.0, 10.0, 8.0, 12.0, 13.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.25, -15.69677734375, -15.1435546875, -14.59033203125, -14.037109375, -13.48388671875, -12.9306640625, -12.37744140625, -11.82421875, -11.27099609375, -10.7177734375, -10.16455078125, -9.611328125, -9.05810546875, -8.5048828125, -7.95166015625, -7.3984375, -6.84521484375, -6.2919921875, -5.73876953125, -5.185546875, -4.63232421875, -4.0791015625, -3.52587890625, -2.97265625, -2.41943359375, -1.8662109375, -1.31298828125, -0.759765625, -0.20654296875, 0.3466796875, 0.89990234375, 1.453125, 2.00634765625, 2.5595703125, 3.11279296875, 3.666015625, 4.21923828125, 4.7724609375, 5.32568359375, 5.87890625, 6.43212890625, 6.9853515625, 7.53857421875, 8.091796875, 8.64501953125, 9.1982421875, 9.75146484375, 10.3046875, 10.85791015625, 11.4111328125, 11.96435546875, 12.517578125, 13.07080078125, 13.6240234375, 14.17724609375, 14.73046875, 15.28369140625, 15.8369140625, 16.39013671875, 16.943359375, 17.49658203125, 18.0498046875, 18.60302734375, 19.15625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 8.0, 5.0, 16.0, 20.0, 14.0, 11.0, 25.0, 30.0, 35.0, 30.0, 42.0, 39.0, 36.0, 47.0, 49.0, 46.0, 41.0, 52.0, 57.0, 47.0, 59.0, 43.0, 31.0, 29.0, 30.0, 24.0, 22.0, 16.0, 21.0, 15.0, 14.0, 15.0, 5.0, 4.0, 8.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.07200622558594, -41.729984283447266, -40.38795852661133, -39.045936584472656, -37.703914642333984, -36.36189270019531, -35.019866943359375, -33.6778450012207, -32.33582305908203, -30.993799209594727, -29.651777267456055, -28.30975341796875, -26.967731475830078, -25.625707626342773, -24.28368377685547, -22.941661834716797, -21.59963607788086, -20.257612228393555, -18.915590286254883, -17.573566436767578, -16.231544494628906, -14.889520645141602, -13.547496795654297, -12.205473899841309, -10.86345100402832, -9.521428108215332, -8.179405212402344, -6.837381362915039, -5.495358467102051, -4.1533355712890625, -2.811311721801758, -1.4692888259887695, -0.12726593017578125, 1.2147572040557861, 2.5567803382873535, 3.8988037109375, 5.240826606750488, 6.582849502563477, 7.924873352050781, 9.26689624786377, 10.608919143676758, 11.950942039489746, 13.292964935302734, 14.634988784790039, 15.977011680603027, 17.319034576416016, 18.66105842590332, 20.003082275390625, 21.345104217529297, 22.6871280670166, 24.029150009155273, 25.371173858642578, 26.71319580078125, 28.055219650268555, 29.39724349975586, 30.73926544189453, 32.08129119873047, 33.42331314086914, 34.76533889770508, 36.10736083984375, 37.44938278198242, 38.791404724121094, 40.13343048095703, 41.4754524230957, 42.817474365234375]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 7.0, 13.0, 11.0, 16.0, 17.0, 22.0, 16.0, 21.0, 22.0, 32.0, 34.0, 34.0, 39.0, 55.0, 43.0, 41.0, 41.0, 43.0, 41.0, 39.0, 36.0, 43.0, 37.0, 36.0, 31.0, 29.0, 27.0, 31.0, 24.0, 15.0, 8.0, 13.0, 10.0, 12.0, 8.0, 10.0, 6.0, 8.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.21171569824219, -36.03618240356445, -34.86064910888672, -33.685115814208984, -32.50958251953125, -31.33405113220215, -30.158517837524414, -28.982986450195312, -27.807453155517578, -26.631919860839844, -25.45638656616211, -24.280853271484375, -23.105321884155273, -21.92978858947754, -20.754255294799805, -19.578723907470703, -18.403188705444336, -17.2276554107666, -16.052122116088867, -14.87658977508545, -13.701057434082031, -12.525524139404297, -11.349990844726562, -10.174458503723145, -8.99892520904541, -7.823392391204834, -6.647859573364258, -5.472326278686523, -4.296793460845947, -3.121260643005371, -1.9457273483276367, -0.7701950073242188, 0.4053382873535156, 1.5808712244033813, 2.756404161453247, 3.9319372177124023, 5.1074700355529785, 6.283002853393555, 7.458536148071289, 8.634068489074707, 9.809601783752441, 10.985135078430176, 12.160667419433594, 13.336200714111328, 14.511734008789062, 15.68726634979248, 16.86280059814453, 18.038331985473633, 19.213865280151367, 20.3893985748291, 21.564931869506836, 22.740463256835938, 23.915996551513672, 25.091529846191406, 26.26706314086914, 27.442596435546875, 28.61812973022461, 29.793663024902344, 30.969196319580078, 32.14472961425781, 33.32026290893555, 34.49579620361328, 35.67132568359375, 36.846858978271484, 38.02239227294922]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 19.0, 21.0, 43.0, 61.0, 80.0, 147.0, 214.0, 311.0, 518.0, 757.0, 1224.0, 1809.0, 2852.0, 4059.0, 6032.0, 8954.0, 13558.0, 19716.0, 28509.0, 40976.0, 57994.0, 78775.0, 101592.0, 121690.0, 126974.0, 113257.0, 91196.0, 68419.0, 49711.0, 34709.0, 24181.0, 16235.0, 11070.0, 7562.0, 5132.0, 3501.0, 2344.0, 1520.0, 1030.0, 605.0, 438.0, 279.0, 177.0, 96.0, 84.0, 34.0, 28.0, 31.0, 7.0, 10.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.59375, -18.986572265625, -18.37939453125, -17.772216796875, -17.1650390625, -16.557861328125, -15.95068359375, -15.343505859375, -14.736328125, -14.129150390625, -13.52197265625, -12.914794921875, -12.3076171875, -11.700439453125, -11.09326171875, -10.486083984375, -9.87890625, -9.271728515625, -8.66455078125, -8.057373046875, -7.4501953125, -6.843017578125, -6.23583984375, -5.628662109375, -5.021484375, -4.414306640625, -3.80712890625, -3.199951171875, -2.5927734375, -1.985595703125, -1.37841796875, -0.771240234375, -0.1640625, 0.443115234375, 1.05029296875, 1.657470703125, 2.2646484375, 2.871826171875, 3.47900390625, 4.086181640625, 4.693359375, 5.300537109375, 5.90771484375, 6.514892578125, 7.1220703125, 7.729248046875, 8.33642578125, 8.943603515625, 9.55078125, 10.157958984375, 10.76513671875, 11.372314453125, 11.9794921875, 12.586669921875, 13.19384765625, 13.801025390625, 14.408203125, 15.015380859375, 15.62255859375, 16.229736328125, 16.8369140625, 17.444091796875, 18.05126953125, 18.658447265625, 19.265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 10.0, 5.0, 2.0, 9.0, 16.0, 13.0, 18.0, 19.0, 9.0, 27.0, 19.0, 31.0, 34.0, 34.0, 39.0, 52.0, 41.0, 42.0, 49.0, 34.0, 42.0, 41.0, 34.0, 31.0, 42.0, 28.0, 36.0, 33.0, 37.0, 28.0, 22.0, 20.0, 19.0, 19.0, 10.0, 17.0, 9.0, 9.0, 4.0, 3.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.1787109375, -31.076171875, -29.9736328125, -28.87109375, -27.7685546875, -26.666015625, -25.5634765625, -24.4609375, -23.3583984375, -22.255859375, -21.1533203125, -20.05078125, -18.9482421875, -17.845703125, -16.7431640625, -15.640625, -14.5380859375, -13.435546875, -12.3330078125, -11.23046875, -10.1279296875, -9.025390625, -7.9228515625, -6.8203125, -5.7177734375, -4.615234375, -3.5126953125, -2.41015625, -1.3076171875, -0.205078125, 0.8974609375, 2.0, 3.1025390625, 4.205078125, 5.3076171875, 6.41015625, 7.5126953125, 8.615234375, 9.7177734375, 10.8203125, 11.9228515625, 13.025390625, 14.1279296875, 15.23046875, 16.3330078125, 17.435546875, 18.5380859375, 19.640625, 20.7431640625, 21.845703125, 22.9482421875, 24.05078125, 25.1533203125, 26.255859375, 27.3583984375, 28.4609375, 29.5634765625, 30.666015625, 31.7685546875, 32.87109375, 33.9736328125, 35.076171875, 36.1787109375, 37.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 6.0, 8.0, 11.0, 20.0, 17.0, 33.0, 62.0, 90.0, 156.0, 233.0, 372.0, 505.0, 849.0, 1423.0, 2293.0, 3850.0, 6659.0, 11993.0, 24140.0, 157020.0, 770624.0, 33396.0, 15163.0, 8097.0, 4563.0, 2552.0, 1603.0, 1014.0, 644.0, 375.0, 262.0, 168.0, 123.0, 76.0, 49.0, 39.0, 23.0, 13.0, 10.0, 8.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -45.7236328125, -44.041015625, -42.3583984375, -40.67578125, -38.9931640625, -37.310546875, -35.6279296875, -33.9453125, -32.2626953125, -30.580078125, -28.8974609375, -27.21484375, -25.5322265625, -23.849609375, -22.1669921875, -20.484375, -18.8017578125, -17.119140625, -15.4365234375, -13.75390625, -12.0712890625, -10.388671875, -8.7060546875, -7.0234375, -5.3408203125, -3.658203125, -1.9755859375, -0.29296875, 1.3896484375, 3.072265625, 4.7548828125, 6.4375, 8.1201171875, 9.802734375, 11.4853515625, 13.16796875, 14.8505859375, 16.533203125, 18.2158203125, 19.8984375, 21.5810546875, 23.263671875, 24.9462890625, 26.62890625, 28.3115234375, 29.994140625, 31.6767578125, 33.359375, 35.0419921875, 36.724609375, 38.4072265625, 40.08984375, 41.7724609375, 43.455078125, 45.1376953125, 46.8203125, 48.5029296875, 50.185546875, 51.8681640625, 53.55078125, 55.2333984375, 56.916015625, 58.5986328125, 60.28125]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 4.0, 4.0, 6.0, 12.0, 13.0, 22.0, 25.0, 17.0, 28.0, 40.0, 41.0, 29.0, 40.0, 40.0, 60.0, 41.0, 61.0, 36.0, 42.0, 46.0, 54.0, 36.0, 43.0, 38.0, 36.0, 29.0, 21.0, 27.0, 18.0, 25.0, 12.0, 13.0, 9.0, 5.0, 4.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.21875, -31.0625, -29.90625, -28.75, -27.59375, -26.4375, -25.28125, -24.125, -22.96875, -21.8125, -20.65625, -19.5, -18.34375, -17.1875, -16.03125, -14.875, -13.71875, -12.5625, -11.40625, -10.25, -9.09375, -7.9375, -6.78125, -5.625, -4.46875, -3.3125, -2.15625, -1.0, 0.15625, 1.3125, 2.46875, 3.625, 4.78125, 5.9375, 7.09375, 8.25, 9.40625, 10.5625, 11.71875, 12.875, 14.03125, 15.1875, 16.34375, 17.5, 18.65625, 19.8125, 20.96875, 22.125, 23.28125, 24.4375, 25.59375, 26.75, 27.90625, 29.0625, 30.21875, 31.375, 32.53125, 33.6875, 34.84375, 36.0, 37.15625, 38.3125, 39.46875, 40.625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 3.0, 14.0, 8.0, 18.0, 23.0, 24.0, 34.0, 47.0, 51.0, 80.0, 121.0, 190.0, 311.0, 523.0, 921.0, 1622.0, 3272.0, 6696.0, 15026.0, 41884.0, 871756.0, 70167.0, 18833.0, 8177.0, 3855.0, 2039.0, 1061.0, 645.0, 374.0, 228.0, 166.0, 99.0, 62.0, 56.0, 38.0, 36.0, 18.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.522705078125, -12.10009765625, -11.677490234375, -11.2548828125, -10.832275390625, -10.40966796875, -9.987060546875, -9.564453125, -9.141845703125, -8.71923828125, -8.296630859375, -7.8740234375, -7.451416015625, -7.02880859375, -6.606201171875, -6.18359375, -5.760986328125, -5.33837890625, -4.915771484375, -4.4931640625, -4.070556640625, -3.64794921875, -3.225341796875, -2.802734375, -2.380126953125, -1.95751953125, -1.534912109375, -1.1123046875, -0.689697265625, -0.26708984375, 0.155517578125, 0.578125, 1.000732421875, 1.42333984375, 1.845947265625, 2.2685546875, 2.691162109375, 3.11376953125, 3.536376953125, 3.958984375, 4.381591796875, 4.80419921875, 5.226806640625, 5.6494140625, 6.072021484375, 6.49462890625, 6.917236328125, 7.33984375, 7.762451171875, 8.18505859375, 8.607666015625, 9.0302734375, 9.452880859375, 9.87548828125, 10.298095703125, 10.720703125, 11.143310546875, 11.56591796875, 11.988525390625, 12.4111328125, 12.833740234375, 13.25634765625, 13.678955078125, 14.1015625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 7.0, 4.0, 7.0, 3.0, 2.0, 6.0, 7.0, 8.0, 8.0, 5.0, 17.0, 19.0, 30.0, 41.0, 63.0, 64.0, 97.0, 91.0, 126.0, 86.0, 72.0, 53.0, 45.0, 28.0, 20.0, 21.0, 19.0, 11.0, 5.0, 9.0, 7.0, 7.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015010833740234375, -0.0014482289552688599, -0.0013953745365142822, -0.0013425201177597046, -0.001289665699005127, -0.0012368112802505493, -0.0011839568614959717, -0.001131102442741394, -0.0010782480239868164, -0.0010253936052322388, -0.0009725391864776611, -0.0009196847677230835, -0.0008668303489685059, -0.0008139759302139282, -0.0007611215114593506, -0.000708267092704773, -0.0006554126739501953, -0.0006025582551956177, -0.00054970383644104, -0.0004968494176864624, -0.00044399499893188477, -0.00039114058017730713, -0.0003382861614227295, -0.00028543174266815186, -0.00023257732391357422, -0.00017972290515899658, -0.00012686848640441895, -7.401406764984131e-05, -2.1159648895263672e-05, 3.1694769859313965e-05, 8.45491886138916e-05, 0.00013740360736846924, 0.00019025802612304688, 0.0002431124448776245, 0.00029596686363220215, 0.0003488212823867798, 0.0004016757011413574, 0.00045453011989593506, 0.0005073845386505127, 0.0005602389574050903, 0.000613093376159668, 0.0006659477949142456, 0.0007188022136688232, 0.0007716566324234009, 0.0008245110511779785, 0.0008773654699325562, 0.0009302198886871338, 0.0009830743074417114, 0.001035928726196289, 0.0010887831449508667, 0.0011416375637054443, 0.001194491982460022, 0.0012473464012145996, 0.0013002008199691772, 0.0013530552387237549, 0.0014059096574783325, 0.0014587640762329102, 0.0015116184949874878, 0.0015644729137420654, 0.001617327332496643, 0.0016701817512512207, 0.0017230361700057983, 0.001775890588760376, 0.0018287450075149536, 0.0018815994262695312]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 9.0, 14.0, 22.0, 25.0, 27.0, 37.0, 69.0, 87.0, 131.0, 145.0, 251.0, 364.0, 653.0, 937.0, 1596.0, 2798.0, 5413.0, 11576.0, 27677.0, 69170.0, 169132.0, 305637.0, 252204.0, 117053.0, 46951.0, 18698.0, 8132.0, 3970.0, 2218.0, 1268.0, 770.0, 481.0, 318.0, 206.0, 145.0, 98.0, 77.0, 67.0, 32.0, 31.0, 18.0, 14.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-8.609375, -8.3385009765625, -8.067626953125, -7.7967529296875, -7.52587890625, -7.2550048828125, -6.984130859375, -6.7132568359375, -6.4423828125, -6.1715087890625, -5.900634765625, -5.6297607421875, -5.35888671875, -5.0880126953125, -4.817138671875, -4.5462646484375, -4.275390625, -4.0045166015625, -3.733642578125, -3.4627685546875, -3.19189453125, -2.9210205078125, -2.650146484375, -2.3792724609375, -2.1083984375, -1.8375244140625, -1.566650390625, -1.2957763671875, -1.02490234375, -0.7540283203125, -0.483154296875, -0.2122802734375, 0.05859375, 0.3294677734375, 0.600341796875, 0.8712158203125, 1.14208984375, 1.4129638671875, 1.683837890625, 1.9547119140625, 2.2255859375, 2.4964599609375, 2.767333984375, 3.0382080078125, 3.30908203125, 3.5799560546875, 3.850830078125, 4.1217041015625, 4.392578125, 4.6634521484375, 4.934326171875, 5.2052001953125, 5.47607421875, 5.7469482421875, 6.017822265625, 6.2886962890625, 6.5595703125, 6.8304443359375, 7.101318359375, 7.3721923828125, 7.64306640625, 7.9139404296875, 8.184814453125, 8.4556884765625, 8.7265625]}, "gradients/decoder.bert.encoder.layer.23.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 14.0, 7.0, 17.0, 11.0, 26.0, 29.0, 39.0, 43.0, 43.0, 59.0, 67.0, 76.0, 65.0, 77.0, 71.0, 64.0, 60.0, 37.0, 44.0, 46.0, 18.0, 15.0, 13.0, 7.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.5625, -2.487884521484375, -2.41326904296875, -2.338653564453125, -2.2640380859375, -2.189422607421875, -2.11480712890625, -2.040191650390625, -1.965576171875, -1.890960693359375, -1.81634521484375, -1.741729736328125, -1.6671142578125, -1.592498779296875, -1.51788330078125, -1.443267822265625, -1.36865234375, -1.294036865234375, -1.21942138671875, -1.144805908203125, -1.0701904296875, -0.995574951171875, -0.92095947265625, -0.846343994140625, -0.771728515625, -0.697113037109375, -0.62249755859375, -0.547882080078125, -0.4732666015625, -0.398651123046875, -0.32403564453125, -0.249420166015625, -0.1748046875, -0.100189208984375, -0.02557373046875, 0.049041748046875, 0.1236572265625, 0.198272705078125, 0.27288818359375, 0.347503662109375, 0.422119140625, 0.496734619140625, 0.57135009765625, 0.645965576171875, 0.7205810546875, 0.795196533203125, 0.86981201171875, 0.944427490234375, 1.01904296875, 1.093658447265625, 1.16827392578125, 1.242889404296875, 1.3175048828125, 1.392120361328125, 1.46673583984375, 1.541351318359375, 1.615966796875, 1.690582275390625, 1.76519775390625, 1.839813232421875, 1.9144287109375, 1.989044189453125, 2.06365966796875, 2.138275146484375, 2.212890625]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 7.0, 12.0, 6.0, 17.0, 17.0, 18.0, 32.0, 31.0, 35.0, 43.0, 44.0, 51.0, 46.0, 44.0, 55.0, 62.0, 59.0, 59.0, 63.0, 63.0, 30.0, 37.0, 22.0, 32.0, 28.0, 17.0, 9.0, 16.0, 15.0, 10.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6795768737793, -42.33344268798828, -40.987308502197266, -39.64117431640625, -38.295040130615234, -36.94890594482422, -35.60277557373047, -34.25663757324219, -32.91050720214844, -31.564373016357422, -30.218238830566406, -28.87210464477539, -27.525970458984375, -26.17983627319336, -24.833703994750977, -23.48756980895996, -22.141433715820312, -20.795299530029297, -19.44916534423828, -18.103031158447266, -16.75689697265625, -15.41076374053955, -14.064630508422852, -12.718496322631836, -11.37236213684082, -10.026227951049805, -8.680093765258789, -7.33396053314209, -5.987826347351074, -4.641692161560059, -3.2955589294433594, -1.9494247436523438, -0.6032943725585938, 0.7428395748138428, 2.0889735221862793, 3.4351072311401367, 4.781241416931152, 6.127375602722168, 7.473508834838867, 8.819643020629883, 10.165777206420898, 11.511911392211914, 12.85804557800293, 14.204178810119629, 15.550312995910645, 16.896446228027344, 18.24258041381836, 19.588714599609375, 20.93484878540039, 22.280982971191406, 23.627117156982422, 24.973251342773438, 26.319385528564453, 27.66551971435547, 29.01165199279785, 30.357786178588867, 31.703920364379883, 33.050052642822266, 34.39618682861328, 35.7423210144043, 37.08845520019531, 38.43458938598633, 39.780723571777344, 41.12685775756836, 42.472991943359375]}, "gradients/decoder.bert.encoder.layer.23.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 5.0, 12.0, 8.0, 14.0, 15.0, 22.0, 14.0, 17.0, 23.0, 23.0, 26.0, 36.0, 45.0, 37.0, 50.0, 45.0, 44.0, 37.0, 40.0, 50.0, 38.0, 36.0, 37.0, 31.0, 38.0, 37.0, 35.0, 24.0, 31.0, 22.0, 13.0, 11.0, 10.0, 10.0, 10.0, 13.0, 10.0, 11.0, 2.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.06751251220703, -32.019248962402344, -30.970985412597656, -29.92272186279297, -28.87445831298828, -27.826194763183594, -26.77793312072754, -25.72966957092285, -24.681406021118164, -23.633142471313477, -22.58487892150879, -21.5366153717041, -20.488353729248047, -19.44009017944336, -18.391826629638672, -17.343563079833984, -16.295299530029297, -15.24703598022461, -14.198772430419922, -13.15050983428955, -12.102246284484863, -11.053982734680176, -10.005720138549805, -8.957456588745117, -7.90919303894043, -6.860929489135742, -5.812666416168213, -4.764403343200684, -3.716139793395996, -2.6678762435913086, -1.6196131706237793, -0.57135009765625, 0.4769134521484375, 1.525176763534546, 2.5734400749206543, 3.6217033863067627, 4.669966697692871, 5.718230247497559, 6.766493320465088, 7.814756393432617, 8.863019943237305, 9.911283493041992, 10.95954704284668, 12.00780963897705, 13.056073188781738, 14.104336738586426, 15.152599334716797, 16.200862884521484, 17.249126434326172, 18.29738998413086, 19.345653533935547, 20.393917083740234, 21.442180633544922, 22.49044418334961, 23.538705825805664, 24.58696937561035, 25.63523292541504, 26.683496475219727, 27.731760025024414, 28.7800235748291, 29.828285217285156, 30.876548767089844, 31.92481231689453, 32.97307586669922, 34.021339416503906]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 10.0, 7.0, 9.0, 26.0, 36.0, 65.0, 84.0, 150.0, 266.0, 435.0, 626.0, 1034.0, 1545.0, 2758.0, 4381.0, 7177.0, 11724.0, 19783.0, 32302.0, 52482.0, 82212.0, 119950.0, 153634.0, 160014.0, 134926.0, 97701.0, 63941.0, 39833.0, 24007.0, 14620.0, 8879.0, 5327.0, 3328.0, 2001.0, 1187.0, 825.0, 426.0, 293.0, 215.0, 116.0, 97.0, 47.0, 29.0, 17.0, 18.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.353515625, -43.80078125, -42.248046875, -40.6953125, -39.142578125, -37.58984375, -36.037109375, -34.484375, -32.931640625, -31.37890625, -29.826171875, -28.2734375, -26.720703125, -25.16796875, -23.615234375, -22.0625, -20.509765625, -18.95703125, -17.404296875, -15.8515625, -14.298828125, -12.74609375, -11.193359375, -9.640625, -8.087890625, -6.53515625, -4.982421875, -3.4296875, -1.876953125, -0.32421875, 1.228515625, 2.78125, 4.333984375, 5.88671875, 7.439453125, 8.9921875, 10.544921875, 12.09765625, 13.650390625, 15.203125, 16.755859375, 18.30859375, 19.861328125, 21.4140625, 22.966796875, 24.51953125, 26.072265625, 27.625, 29.177734375, 30.73046875, 32.283203125, 33.8359375, 35.388671875, 36.94140625, 38.494140625, 40.046875, 41.599609375, 43.15234375, 44.705078125, 46.2578125, 47.810546875, 49.36328125, 50.916015625, 52.46875]}, "gradients/decoder.bert.encoder.layer.23.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 5.0, 19.0, 23.0, 18.0, 24.0, 24.0, 22.0, 31.0, 48.0, 39.0, 42.0, 49.0, 32.0, 40.0, 55.0, 44.0, 33.0, 44.0, 42.0, 33.0, 40.0, 31.0, 40.0, 31.0, 27.0, 21.0, 24.0, 13.0, 14.0, 11.0, 10.0, 11.0, 12.0, 4.0, 4.0, 9.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.125, -34.06884765625, -33.0126953125, -31.95654296875, -30.900390625, -29.84423828125, -28.7880859375, -27.73193359375, -26.67578125, -25.61962890625, -24.5634765625, -23.50732421875, -22.451171875, -21.39501953125, -20.3388671875, -19.28271484375, -18.2265625, -17.17041015625, -16.1142578125, -15.05810546875, -14.001953125, -12.94580078125, -11.8896484375, -10.83349609375, -9.77734375, -8.72119140625, -7.6650390625, -6.60888671875, -5.552734375, -4.49658203125, -3.4404296875, -2.38427734375, -1.328125, -0.27197265625, 0.7841796875, 1.84033203125, 2.896484375, 3.95263671875, 5.0087890625, 6.06494140625, 7.12109375, 8.17724609375, 9.2333984375, 10.28955078125, 11.345703125, 12.40185546875, 13.4580078125, 14.51416015625, 15.5703125, 16.62646484375, 17.6826171875, 18.73876953125, 19.794921875, 20.85107421875, 21.9072265625, 22.96337890625, 24.01953125, 25.07568359375, 26.1318359375, 27.18798828125, 28.244140625, 29.30029296875, 30.3564453125, 31.41259765625, 32.46875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 11.0, 22.0, 22.0, 26.0, 55.0, 74.0, 140.0, 205.0, 331.0, 444.0, 694.0, 1046.0, 1694.0, 2612.0, 4080.0, 6458.0, 10088.0, 15876.0, 24345.0, 36531.0, 53850.0, 74753.0, 98237.0, 119230.0, 127979.0, 120742.0, 101367.0, 78924.0, 56674.0, 39229.0, 25906.0, 16806.0, 10826.0, 6882.0, 4419.0, 2897.0, 1827.0, 1155.0, 699.0, 485.0, 337.0, 202.0, 122.0, 87.0, 51.0, 34.0, 25.0, 18.0, 7.0, 6.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-38.46875, -37.25048828125, -36.0322265625, -34.81396484375, -33.595703125, -32.37744140625, -31.1591796875, -29.94091796875, -28.72265625, -27.50439453125, -26.2861328125, -25.06787109375, -23.849609375, -22.63134765625, -21.4130859375, -20.19482421875, -18.9765625, -17.75830078125, -16.5400390625, -15.32177734375, -14.103515625, -12.88525390625, -11.6669921875, -10.44873046875, -9.23046875, -8.01220703125, -6.7939453125, -5.57568359375, -4.357421875, -3.13916015625, -1.9208984375, -0.70263671875, 0.515625, 1.73388671875, 2.9521484375, 4.17041015625, 5.388671875, 6.60693359375, 7.8251953125, 9.04345703125, 10.26171875, 11.47998046875, 12.6982421875, 13.91650390625, 15.134765625, 16.35302734375, 17.5712890625, 18.78955078125, 20.0078125, 21.22607421875, 22.4443359375, 23.66259765625, 24.880859375, 26.09912109375, 27.3173828125, 28.53564453125, 29.75390625, 30.97216796875, 32.1904296875, 33.40869140625, 34.626953125, 35.84521484375, 37.0634765625, 38.28173828125, 39.5]}, "gradients/decoder.bert.encoder.layer.23.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 7.0, 4.0, 4.0, 8.0, 18.0, 17.0, 19.0, 15.0, 22.0, 30.0, 23.0, 30.0, 41.0, 34.0, 38.0, 38.0, 23.0, 49.0, 40.0, 44.0, 37.0, 49.0, 41.0, 43.0, 38.0, 40.0, 33.0, 34.0, 22.0, 27.0, 34.0, 22.0, 20.0, 6.0, 15.0, 7.0, 5.0, 6.0, 6.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.59375, -20.906982421875, -20.22021484375, -19.533447265625, -18.8466796875, -18.159912109375, -17.47314453125, -16.786376953125, -16.099609375, -15.412841796875, -14.72607421875, -14.039306640625, -13.3525390625, -12.665771484375, -11.97900390625, -11.292236328125, -10.60546875, -9.918701171875, -9.23193359375, -8.545166015625, -7.8583984375, -7.171630859375, -6.48486328125, -5.798095703125, -5.111328125, -4.424560546875, -3.73779296875, -3.051025390625, -2.3642578125, -1.677490234375, -0.99072265625, -0.303955078125, 0.3828125, 1.069580078125, 1.75634765625, 2.443115234375, 3.1298828125, 3.816650390625, 4.50341796875, 5.190185546875, 5.876953125, 6.563720703125, 7.25048828125, 7.937255859375, 8.6240234375, 9.310791015625, 9.99755859375, 10.684326171875, 11.37109375, 12.057861328125, 12.74462890625, 13.431396484375, 14.1181640625, 14.804931640625, 15.49169921875, 16.178466796875, 16.865234375, 17.552001953125, 18.23876953125, 18.925537109375, 19.6123046875, 20.299072265625, 20.98583984375, 21.672607421875, 22.359375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 9.0, 10.0, 28.0, 35.0, 54.0, 58.0, 92.0, 121.0, 148.0, 250.0, 298.0, 426.0, 634.0, 845.0, 1316.0, 1972.0, 3060.0, 4913.0, 8636.0, 15645.0, 30174.0, 63290.0, 132167.0, 237114.0, 249854.0, 148872.0, 71605.0, 34504.0, 17297.0, 9475.0, 5503.0, 3328.0, 2136.0, 1469.0, 926.0, 640.0, 463.0, 309.0, 258.0, 188.0, 108.0, 86.0, 71.0, 57.0, 31.0, 21.0, 20.0, 15.0, 11.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-27.84375, -27.002197265625, -26.16064453125, -25.319091796875, -24.4775390625, -23.635986328125, -22.79443359375, -21.952880859375, -21.111328125, -20.269775390625, -19.42822265625, -18.586669921875, -17.7451171875, -16.903564453125, -16.06201171875, -15.220458984375, -14.37890625, -13.537353515625, -12.69580078125, -11.854248046875, -11.0126953125, -10.171142578125, -9.32958984375, -8.488037109375, -7.646484375, -6.804931640625, -5.96337890625, -5.121826171875, -4.2802734375, -3.438720703125, -2.59716796875, -1.755615234375, -0.9140625, -0.072509765625, 0.76904296875, 1.610595703125, 2.4521484375, 3.293701171875, 4.13525390625, 4.976806640625, 5.818359375, 6.659912109375, 7.50146484375, 8.343017578125, 9.1845703125, 10.026123046875, 10.86767578125, 11.709228515625, 12.55078125, 13.392333984375, 14.23388671875, 15.075439453125, 15.9169921875, 16.758544921875, 17.60009765625, 18.441650390625, 19.283203125, 20.124755859375, 20.96630859375, 21.807861328125, 22.6494140625, 23.490966796875, 24.33251953125, 25.174072265625, 26.015625]}, "gradients/decoder.bert.encoder.layer.23.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 8.0, 18.0, 13.0, 29.0, 30.0, 65.0, 81.0, 116.0, 144.0, 139.0, 92.0, 82.0, 57.0, 32.0, 19.0, 24.0, 14.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00426483154296875, -0.004131019115447998, -0.003997206687927246, -0.003863394260406494, -0.003729581832885742, -0.0035957694053649902, -0.0034619569778442383, -0.0033281445503234863, -0.0031943321228027344, -0.0030605196952819824, -0.0029267072677612305, -0.0027928948402404785, -0.0026590824127197266, -0.0025252699851989746, -0.0023914575576782227, -0.0022576451301574707, -0.0021238327026367188, -0.001990020275115967, -0.0018562078475952148, -0.0017223954200744629, -0.001588582992553711, -0.001454770565032959, -0.001320958137512207, -0.001187145709991455, -0.0010533332824707031, -0.0009195208549499512, -0.0007857084274291992, -0.0006518959999084473, -0.0005180835723876953, -0.00038427114486694336, -0.0002504587173461914, -0.00011664628982543945, 1.71661376953125e-05, 0.00015097856521606445, 0.0002847909927368164, 0.00041860342025756836, 0.0005524158477783203, 0.0006862282752990723, 0.0008200407028198242, 0.0009538531303405762, 0.0010876655578613281, 0.00122147798538208, 0.001355290412902832, 0.001489102840423584, 0.001622915267944336, 0.0017567276954650879, 0.0018905401229858398, 0.002024352550506592, 0.0021581649780273438, 0.0022919774055480957, 0.0024257898330688477, 0.0025596022605895996, 0.0026934146881103516, 0.0028272271156311035, 0.0029610395431518555, 0.0030948519706726074, 0.0032286643981933594, 0.0033624768257141113, 0.0034962892532348633, 0.0036301016807556152, 0.003763914108276367, 0.003897726535797119, 0.004031538963317871, 0.004165351390838623, 0.004299163818359375]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 12.0, 21.0, 21.0, 22.0, 32.0, 74.0, 95.0, 139.0, 203.0, 286.0, 487.0, 715.0, 1245.0, 1940.0, 3362.0, 6063.0, 11646.0, 22713.0, 47580.0, 98558.0, 182236.0, 247010.0, 200390.0, 113167.0, 54637.0, 26401.0, 13086.0, 6899.0, 3773.0, 2164.0, 1277.0, 775.0, 478.0, 321.0, 232.0, 142.0, 114.0, 68.0, 44.0, 45.0, 27.0, 19.0, 15.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0], "bins": [-24.65625, -23.963623046875, -23.27099609375, -22.578369140625, -21.8857421875, -21.193115234375, -20.50048828125, -19.807861328125, -19.115234375, -18.422607421875, -17.72998046875, -17.037353515625, -16.3447265625, -15.652099609375, -14.95947265625, -14.266845703125, -13.57421875, -12.881591796875, -12.18896484375, -11.496337890625, -10.8037109375, -10.111083984375, -9.41845703125, -8.725830078125, -8.033203125, -7.340576171875, -6.64794921875, -5.955322265625, -5.2626953125, -4.570068359375, -3.87744140625, -3.184814453125, -2.4921875, -1.799560546875, -1.10693359375, -0.414306640625, 0.2783203125, 0.970947265625, 1.66357421875, 2.356201171875, 3.048828125, 3.741455078125, 4.43408203125, 5.126708984375, 5.8193359375, 6.511962890625, 7.20458984375, 7.897216796875, 8.58984375, 9.282470703125, 9.97509765625, 10.667724609375, 11.3603515625, 12.052978515625, 12.74560546875, 13.438232421875, 14.130859375, 14.823486328125, 15.51611328125, 16.208740234375, 16.9013671875, 17.593994140625, 18.28662109375, 18.979248046875, 19.671875]}, "gradients/decoder.bert.encoder.layer.23.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 11.0, 14.0, 20.0, 19.0, 34.0, 33.0, 44.0, 48.0, 69.0, 52.0, 82.0, 62.0, 61.0, 64.0, 62.0, 59.0, 52.0, 32.0, 33.0, 30.0, 20.0, 17.0, 13.0, 16.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.515625, -8.289306640625, -8.06298828125, -7.836669921875, -7.6103515625, -7.384033203125, -7.15771484375, -6.931396484375, -6.705078125, -6.478759765625, -6.25244140625, -6.026123046875, -5.7998046875, -5.573486328125, -5.34716796875, -5.120849609375, -4.89453125, -4.668212890625, -4.44189453125, -4.215576171875, -3.9892578125, -3.762939453125, -3.53662109375, -3.310302734375, -3.083984375, -2.857666015625, -2.63134765625, -2.405029296875, -2.1787109375, -1.952392578125, -1.72607421875, -1.499755859375, -1.2734375, -1.047119140625, -0.82080078125, -0.594482421875, -0.3681640625, -0.141845703125, 0.08447265625, 0.310791015625, 0.537109375, 0.763427734375, 0.98974609375, 1.216064453125, 1.4423828125, 1.668701171875, 1.89501953125, 2.121337890625, 2.34765625, 2.573974609375, 2.80029296875, 3.026611328125, 3.2529296875, 3.479248046875, 3.70556640625, 3.931884765625, 4.158203125, 4.384521484375, 4.61083984375, 4.837158203125, 5.0634765625, 5.289794921875, 5.51611328125, 5.742431640625, 5.96875]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 8.0, 13.0, 15.0, 16.0, 23.0, 27.0, 32.0, 38.0, 41.0, 34.0, 45.0, 40.0, 62.0, 62.0, 43.0, 44.0, 47.0, 50.0, 56.0, 41.0, 37.0, 28.0, 31.0, 18.0, 21.0, 15.0, 18.0, 18.0, 18.0, 8.0, 7.0, 9.0, 8.0, 3.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.633331298828125, -33.47809600830078, -32.32286071777344, -31.167621612548828, -30.012386322021484, -28.85715103149414, -27.701913833618164, -26.546676635742188, -25.391441345214844, -24.2362060546875, -23.080968856811523, -21.925731658935547, -20.770496368408203, -19.61526107788086, -18.460023880004883, -17.304786682128906, -16.149551391601562, -14.994315147399902, -13.839078903198242, -12.683842658996582, -11.528606414794922, -10.373370170593262, -9.218133926391602, -8.062897682189941, -6.907661437988281, -5.752425193786621, -4.597188949584961, -3.441952705383301, -2.2867164611816406, -1.1314802169799805, 0.023756027221679688, 1.1789922714233398, 2.3342247009277344, 3.4894609451293945, 4.644697189331055, 5.799933433532715, 6.955169677734375, 8.110405921936035, 9.265642166137695, 10.420878410339355, 11.576114654541016, 12.731350898742676, 13.886587142944336, 15.041823387145996, 16.197059631347656, 17.352294921875, 18.507532119750977, 19.662769317626953, 20.818004608154297, 21.97323989868164, 23.128477096557617, 24.283714294433594, 25.438949584960938, 26.59418487548828, 27.749422073364258, 28.904659271240234, 30.059894561767578, 31.215129852294922, 32.37036895751953, 33.525604248046875, 34.68083953857422, 35.83607482910156, 36.991310119628906, 38.146549224853516, 39.30178451538086]}, "gradients/decoder.bert.encoder.layer.22.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 4.0, 2.0, 5.0, 3.0, 5.0, 4.0, 14.0, 12.0, 5.0, 11.0, 17.0, 21.0, 28.0, 28.0, 34.0, 25.0, 43.0, 46.0, 37.0, 38.0, 45.0, 43.0, 44.0, 34.0, 45.0, 34.0, 43.0, 39.0, 46.0, 39.0, 30.0, 28.0, 14.0, 28.0, 19.0, 15.0, 13.0, 14.0, 9.0, 14.0, 7.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.706998825073242, -30.668437957763672, -29.6298770904541, -28.59131622314453, -27.552757263183594, -26.514196395874023, -25.475635528564453, -24.437074661254883, -23.398513793945312, -22.359952926635742, -21.321392059326172, -20.282833099365234, -19.244272232055664, -18.205711364746094, -17.167150497436523, -16.128589630126953, -15.090030670166016, -14.051469802856445, -13.012909889221191, -11.974349021911621, -10.935789108276367, -9.897228240966797, -8.858667373657227, -7.8201069831848145, -6.781546592712402, -5.74298620223999, -4.704425811767578, -3.665864944458008, -2.6273045539855957, -1.5887441635131836, -0.5501832962036133, 0.48837709426879883, 1.5269393920898438, 2.565499782562256, 3.604060411453247, 4.642621040344238, 5.68118143081665, 6.7197418212890625, 7.758302688598633, 8.796863555908203, 9.835423469543457, 10.873984336853027, 11.912544250488281, 12.951105117797852, 13.989665985107422, 15.028225898742676, 16.066787719726562, 17.1053466796875, 18.14390754699707, 19.18246841430664, 20.22102928161621, 21.25959014892578, 22.29814910888672, 23.33670997619629, 24.37527084350586, 25.41383171081543, 26.452392578125, 27.49095344543457, 28.52951431274414, 29.568073272705078, 30.60663414001465, 31.64519500732422, 32.683753967285156, 33.72231674194336, 34.7608757019043]}, "gradients/decoder.bert.encoder.layer.22.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 17.0, 23.0, 39.0, 47.0, 63.0, 121.0, 213.0, 325.0, 594.0, 895.0, 1604.0, 2829.0, 5014.0, 9416.0, 18376.0, 36398.0, 73236.0, 155542.0, 342569.0, 757604.0, 1179749.0, 857405.0, 400112.0, 179642.0, 85275.0, 41617.0, 20869.0, 10897.0, 5859.0, 3313.0, 1841.0, 1096.0, 645.0, 404.0, 233.0, 135.0, 90.0, 64.0, 35.0, 32.0, 15.0, 15.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.21875, -47.66064453125, -46.1025390625, -44.54443359375, -42.986328125, -41.42822265625, -39.8701171875, -38.31201171875, -36.75390625, -35.19580078125, -33.6376953125, -32.07958984375, -30.521484375, -28.96337890625, -27.4052734375, -25.84716796875, -24.2890625, -22.73095703125, -21.1728515625, -19.61474609375, -18.056640625, -16.49853515625, -14.9404296875, -13.38232421875, -11.82421875, -10.26611328125, -8.7080078125, -7.14990234375, -5.591796875, -4.03369140625, -2.4755859375, -0.91748046875, 0.640625, 2.19873046875, 3.7568359375, 5.31494140625, 6.873046875, 8.43115234375, 9.9892578125, 11.54736328125, 13.10546875, 14.66357421875, 16.2216796875, 17.77978515625, 19.337890625, 20.89599609375, 22.4541015625, 24.01220703125, 25.5703125, 27.12841796875, 28.6865234375, 30.24462890625, 31.802734375, 33.36083984375, 34.9189453125, 36.47705078125, 38.03515625, 39.59326171875, 41.1513671875, 42.70947265625, 44.267578125, 45.82568359375, 47.3837890625, 48.94189453125, 50.5]}, "gradients/decoder.bert.encoder.layer.22.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 3.0, 8.0, 11.0, 8.0, 10.0, 7.0, 14.0, 14.0, 23.0, 20.0, 29.0, 30.0, 24.0, 31.0, 45.0, 38.0, 40.0, 43.0, 45.0, 40.0, 39.0, 35.0, 44.0, 40.0, 44.0, 46.0, 35.0, 35.0, 30.0, 21.0, 17.0, 19.0, 22.0, 13.0, 17.0, 11.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.484375, -21.7109375, -20.9375, -20.1640625, -19.390625, -18.6171875, -17.84375, -17.0703125, -16.296875, -15.5234375, -14.75, -13.9765625, -13.203125, -12.4296875, -11.65625, -10.8828125, -10.109375, -9.3359375, -8.5625, -7.7890625, -7.015625, -6.2421875, -5.46875, -4.6953125, -3.921875, -3.1484375, -2.375, -1.6015625, -0.828125, -0.0546875, 0.71875, 1.4921875, 2.265625, 3.0390625, 3.8125, 4.5859375, 5.359375, 6.1328125, 6.90625, 7.6796875, 8.453125, 9.2265625, 10.0, 10.7734375, 11.546875, 12.3203125, 13.09375, 13.8671875, 14.640625, 15.4140625, 16.1875, 16.9609375, 17.734375, 18.5078125, 19.28125, 20.0546875, 20.828125, 21.6015625, 22.375, 23.1484375, 23.921875, 24.6953125, 25.46875, 26.2421875, 27.015625]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 10.0, 20.0, 33.0, 38.0, 66.0, 95.0, 144.0, 234.0, 389.0, 560.0, 828.0, 1441.0, 2280.0, 3597.0, 5825.0, 9619.0, 15725.0, 26692.0, 45326.0, 77868.0, 135858.0, 237061.0, 407247.0, 657065.0, 834209.0, 690841.0, 435566.0, 254270.0, 146333.0, 83795.0, 48738.0, 28605.0, 16974.0, 10215.0, 6262.0, 3863.0, 2273.0, 1558.0, 956.0, 644.0, 384.0, 255.0, 144.0, 132.0, 79.0, 56.0, 33.0, 18.0, 10.0, 17.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-31.234375, -30.244873046875, -29.25537109375, -28.265869140625, -27.2763671875, -26.286865234375, -25.29736328125, -24.307861328125, -23.318359375, -22.328857421875, -21.33935546875, -20.349853515625, -19.3603515625, -18.370849609375, -17.38134765625, -16.391845703125, -15.40234375, -14.412841796875, -13.42333984375, -12.433837890625, -11.4443359375, -10.454833984375, -9.46533203125, -8.475830078125, -7.486328125, -6.496826171875, -5.50732421875, -4.517822265625, -3.5283203125, -2.538818359375, -1.54931640625, -0.559814453125, 0.4296875, 1.419189453125, 2.40869140625, 3.398193359375, 4.3876953125, 5.377197265625, 6.36669921875, 7.356201171875, 8.345703125, 9.335205078125, 10.32470703125, 11.314208984375, 12.3037109375, 13.293212890625, 14.28271484375, 15.272216796875, 16.26171875, 17.251220703125, 18.24072265625, 19.230224609375, 20.2197265625, 21.209228515625, 22.19873046875, 23.188232421875, 24.177734375, 25.167236328125, 26.15673828125, 27.146240234375, 28.1357421875, 29.125244140625, 30.11474609375, 31.104248046875, 32.09375]}, "gradients/decoder.bert.encoder.layer.22.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 9.0, 7.0, 17.0, 19.0, 20.0, 42.0, 51.0, 54.0, 62.0, 79.0, 96.0, 132.0, 154.0, 209.0, 240.0, 303.0, 299.0, 334.0, 322.0, 293.0, 245.0, 221.0, 191.0, 140.0, 112.0, 89.0, 70.0, 54.0, 53.0, 47.0, 21.0, 19.0, 19.0, 16.0, 8.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.6328125, -15.19384765625, -14.7548828125, -14.31591796875, -13.876953125, -13.43798828125, -12.9990234375, -12.56005859375, -12.12109375, -11.68212890625, -11.2431640625, -10.80419921875, -10.365234375, -9.92626953125, -9.4873046875, -9.04833984375, -8.609375, -8.17041015625, -7.7314453125, -7.29248046875, -6.853515625, -6.41455078125, -5.9755859375, -5.53662109375, -5.09765625, -4.65869140625, -4.2197265625, -3.78076171875, -3.341796875, -2.90283203125, -2.4638671875, -2.02490234375, -1.5859375, -1.14697265625, -0.7080078125, -0.26904296875, 0.169921875, 0.60888671875, 1.0478515625, 1.48681640625, 1.92578125, 2.36474609375, 2.8037109375, 3.24267578125, 3.681640625, 4.12060546875, 4.5595703125, 4.99853515625, 5.4375, 5.87646484375, 6.3154296875, 6.75439453125, 7.193359375, 7.63232421875, 8.0712890625, 8.51025390625, 8.94921875, 9.38818359375, 9.8271484375, 10.26611328125, 10.705078125, 11.14404296875, 11.5830078125, 12.02197265625, 12.4609375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 4.0, 11.0, 9.0, 22.0, 22.0, 32.0, 27.0, 37.0, 43.0, 49.0, 49.0, 55.0, 49.0, 54.0, 37.0, 61.0, 58.0, 44.0, 50.0, 42.0, 35.0, 30.0, 22.0, 22.0, 24.0, 21.0, 11.0, 12.0, 8.0, 11.0, 10.0, 9.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.513519287109375, -31.45552635192871, -30.397533416748047, -29.339542388916016, -28.28154945373535, -27.223556518554688, -26.165565490722656, -25.107572555541992, -24.049579620361328, -22.991586685180664, -21.93359375, -20.87560272216797, -19.817609786987305, -18.75961685180664, -17.70162582397461, -16.643632888793945, -15.585639953613281, -14.527647018432617, -13.46965503692627, -12.411663055419922, -11.353670120239258, -10.295677185058594, -9.237685203552246, -8.179693222045898, -7.121700286865234, -6.0637078285217285, -5.005715370178223, -3.947722911834717, -2.889730453491211, -1.831737995147705, -0.7737455368041992, 0.28424692153930664, 1.3422393798828125, 2.4002318382263184, 3.458224296569824, 4.51621675491333, 5.574209213256836, 6.632201671600342, 7.690194129943848, 8.748186111450195, 9.80617904663086, 10.864171981811523, 11.922163963317871, 12.980155944824219, 14.038148880004883, 15.096141815185547, 16.154132843017578, 17.212125778198242, 18.270118713378906, 19.32811164855957, 20.386104583740234, 21.444095611572266, 22.50208854675293, 23.560081481933594, 24.618072509765625, 25.67606544494629, 26.734058380126953, 27.792051315307617, 28.85004425048828, 29.908035278320312, 30.966028213500977, 32.02402114868164, 33.08201217651367, 34.14000701904297, 35.197998046875]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 9.0, 11.0, 10.0, 9.0, 15.0, 20.0, 20.0, 21.0, 25.0, 36.0, 23.0, 34.0, 44.0, 61.0, 41.0, 64.0, 49.0, 58.0, 49.0, 41.0, 45.0, 44.0, 37.0, 36.0, 27.0, 34.0, 21.0, 19.0, 18.0, 16.0, 8.0, 12.0, 9.0, 7.0, 9.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.375486373901367, -27.36140251159668, -26.347320556640625, -25.333236694335938, -24.31915283203125, -23.305070877075195, -22.290987014770508, -21.276905059814453, -20.262821197509766, -19.248737335205078, -18.234655380249023, -17.220571517944336, -16.20648956298828, -15.192405700683594, -14.178321838378906, -13.164238929748535, -12.150156021118164, -11.136073112487793, -10.121990203857422, -9.107906341552734, -8.093823432922363, -7.079740524291992, -6.065657138824463, -5.051573753356934, -4.0374908447265625, -3.0234076976776123, -2.009324550628662, -0.9952414035797119, 0.01884174346923828, 1.0329246520996094, 2.0470080375671387, 3.061091423034668, 4.075172424316406, 5.089255332946777, 6.103338718414307, 7.117422103881836, 8.131505012512207, 9.145587921142578, 10.159671783447266, 11.173754692077637, 12.187837600708008, 13.201920509338379, 14.21600341796875, 15.230087280273438, 16.244171142578125, 17.25825309753418, 18.272336959838867, 19.286418914794922, 20.30050277709961, 21.314586639404297, 22.32866859436035, 23.34275245666504, 24.356834411621094, 25.37091827392578, 26.38500213623047, 27.399085998535156, 28.41316795349121, 29.4272518157959, 30.441333770751953, 31.45541763305664, 32.46950149536133, 33.48358154296875, 34.49766540527344, 35.511749267578125, 36.52583312988281]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 11.0, 19.0, 30.0, 46.0, 73.0, 104.0, 175.0, 248.0, 413.0, 663.0, 983.0, 1461.0, 2387.0, 3757.0, 5858.0, 8732.0, 13332.0, 19894.0, 28808.0, 41133.0, 56461.0, 74338.0, 92917.0, 108226.0, 116060.0, 109573.0, 94669.0, 76198.0, 58117.0, 42635.0, 30058.0, 20673.0, 14024.0, 9170.0, 6191.0, 3905.0, 2564.0, 1742.0, 1007.0, 674.0, 409.0, 269.0, 201.0, 118.0, 67.0, 60.0, 36.0, 27.0, 10.0, 12.0, 5.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-16.453125, -15.94775390625, -15.4423828125, -14.93701171875, -14.431640625, -13.92626953125, -13.4208984375, -12.91552734375, -12.41015625, -11.90478515625, -11.3994140625, -10.89404296875, -10.388671875, -9.88330078125, -9.3779296875, -8.87255859375, -8.3671875, -7.86181640625, -7.3564453125, -6.85107421875, -6.345703125, -5.84033203125, -5.3349609375, -4.82958984375, -4.32421875, -3.81884765625, -3.3134765625, -2.80810546875, -2.302734375, -1.79736328125, -1.2919921875, -0.78662109375, -0.28125, 0.22412109375, 0.7294921875, 1.23486328125, 1.740234375, 2.24560546875, 2.7509765625, 3.25634765625, 3.76171875, 4.26708984375, 4.7724609375, 5.27783203125, 5.783203125, 6.28857421875, 6.7939453125, 7.29931640625, 7.8046875, 8.31005859375, 8.8154296875, 9.32080078125, 9.826171875, 10.33154296875, 10.8369140625, 11.34228515625, 11.84765625, 12.35302734375, 12.8583984375, 13.36376953125, 13.869140625, 14.37451171875, 14.8798828125, 15.38525390625, 15.890625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 11.0, 3.0, 8.0, 9.0, 9.0, 17.0, 17.0, 21.0, 19.0, 16.0, 25.0, 28.0, 33.0, 33.0, 47.0, 38.0, 48.0, 53.0, 48.0, 48.0, 40.0, 42.0, 47.0, 49.0, 43.0, 44.0, 29.0, 22.0, 23.0, 20.0, 23.0, 16.0, 15.0, 15.0, 8.0, 5.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.375, -21.609375, -20.84375, -20.078125, -19.3125, -18.546875, -17.78125, -17.015625, -16.25, -15.484375, -14.71875, -13.953125, -13.1875, -12.421875, -11.65625, -10.890625, -10.125, -9.359375, -8.59375, -7.828125, -7.0625, -6.296875, -5.53125, -4.765625, -4.0, -3.234375, -2.46875, -1.703125, -0.9375, -0.171875, 0.59375, 1.359375, 2.125, 2.890625, 3.65625, 4.421875, 5.1875, 5.953125, 6.71875, 7.484375, 8.25, 9.015625, 9.78125, 10.546875, 11.3125, 12.078125, 12.84375, 13.609375, 14.375, 15.140625, 15.90625, 16.671875, 17.4375, 18.203125, 18.96875, 19.734375, 20.5, 21.265625, 22.03125, 22.796875, 23.5625, 24.328125, 25.09375, 25.859375, 26.625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 6.0, 3.0, 8.0, 16.0, 20.0, 23.0, 32.0, 47.0, 65.0, 103.0, 152.0, 189.0, 308.0, 422.0, 617.0, 918.0, 1594.0, 2143.0, 3373.0, 5210.0, 8223.0, 13000.0, 22547.0, 87186.0, 804089.0, 46583.0, 19393.0, 11493.0, 7163.0, 4642.0, 2945.0, 1981.0, 1297.0, 855.0, 613.0, 399.0, 261.0, 194.0, 125.0, 103.0, 70.0, 34.0, 28.0, 30.0, 16.0, 14.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.84375, -50.2421875, -48.640625, -47.0390625, -45.4375, -43.8359375, -42.234375, -40.6328125, -39.03125, -37.4296875, -35.828125, -34.2265625, -32.625, -31.0234375, -29.421875, -27.8203125, -26.21875, -24.6171875, -23.015625, -21.4140625, -19.8125, -18.2109375, -16.609375, -15.0078125, -13.40625, -11.8046875, -10.203125, -8.6015625, -7.0, -5.3984375, -3.796875, -2.1953125, -0.59375, 1.0078125, 2.609375, 4.2109375, 5.8125, 7.4140625, 9.015625, 10.6171875, 12.21875, 13.8203125, 15.421875, 17.0234375, 18.625, 20.2265625, 21.828125, 23.4296875, 25.03125, 26.6328125, 28.234375, 29.8359375, 31.4375, 33.0390625, 34.640625, 36.2421875, 37.84375, 39.4453125, 41.046875, 42.6484375, 44.25, 45.8515625, 47.453125, 49.0546875, 50.65625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 3.0, 7.0, 6.0, 5.0, 10.0, 6.0, 11.0, 14.0, 23.0, 25.0, 31.0, 35.0, 41.0, 46.0, 43.0, 47.0, 53.0, 58.0, 55.0, 63.0, 44.0, 47.0, 48.0, 38.0, 35.0, 20.0, 26.0, 31.0, 22.0, 20.0, 19.0, 13.0, 8.0, 9.0, 9.0, 3.0, 8.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-47.65625, -46.3984375, -45.140625, -43.8828125, -42.625, -41.3671875, -40.109375, -38.8515625, -37.59375, -36.3359375, -35.078125, -33.8203125, -32.5625, -31.3046875, -30.046875, -28.7890625, -27.53125, -26.2734375, -25.015625, -23.7578125, -22.5, -21.2421875, -19.984375, -18.7265625, -17.46875, -16.2109375, -14.953125, -13.6953125, -12.4375, -11.1796875, -9.921875, -8.6640625, -7.40625, -6.1484375, -4.890625, -3.6328125, -2.375, -1.1171875, 0.140625, 1.3984375, 2.65625, 3.9140625, 5.171875, 6.4296875, 7.6875, 8.9453125, 10.203125, 11.4609375, 12.71875, 13.9765625, 15.234375, 16.4921875, 17.75, 19.0078125, 20.265625, 21.5234375, 22.78125, 24.0390625, 25.296875, 26.5546875, 27.8125, 29.0703125, 30.328125, 31.5859375, 32.84375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 5.0, 10.0, 12.0, 17.0, 18.0, 31.0, 32.0, 54.0, 69.0, 93.0, 165.0, 234.0, 369.0, 581.0, 930.0, 1781.0, 3296.0, 7160.0, 18895.0, 124629.0, 837984.0, 31502.0, 10398.0, 4657.0, 2320.0, 1254.0, 708.0, 481.0, 284.0, 182.0, 129.0, 89.0, 44.0, 43.0, 32.0, 18.0, 16.0, 4.0, 6.0, 6.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-32.25, -31.333984375, -30.41796875, -29.501953125, -28.5859375, -27.669921875, -26.75390625, -25.837890625, -24.921875, -24.005859375, -23.08984375, -22.173828125, -21.2578125, -20.341796875, -19.42578125, -18.509765625, -17.59375, -16.677734375, -15.76171875, -14.845703125, -13.9296875, -13.013671875, -12.09765625, -11.181640625, -10.265625, -9.349609375, -8.43359375, -7.517578125, -6.6015625, -5.685546875, -4.76953125, -3.853515625, -2.9375, -2.021484375, -1.10546875, -0.189453125, 0.7265625, 1.642578125, 2.55859375, 3.474609375, 4.390625, 5.306640625, 6.22265625, 7.138671875, 8.0546875, 8.970703125, 9.88671875, 10.802734375, 11.71875, 12.634765625, 13.55078125, 14.466796875, 15.3828125, 16.298828125, 17.21484375, 18.130859375, 19.046875, 19.962890625, 20.87890625, 21.794921875, 22.7109375, 23.626953125, 24.54296875, 25.458984375, 26.375]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 15.0, 37.0, 38.0, 33.0, 58.0, 61.0, 80.0, 104.0, 117.0, 90.0, 55.0, 53.0, 38.0, 43.0, 31.0, 27.0, 10.0, 12.0, 13.0, 8.0, 6.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006221771240234375, -0.006039679050445557, -0.005857586860656738, -0.00567549467086792, -0.0054934024810791016, -0.005311310291290283, -0.005129218101501465, -0.0049471259117126465, -0.004765033721923828, -0.00458294153213501, -0.004400849342346191, -0.004218757152557373, -0.004036664962768555, -0.0038545727729797363, -0.003672480583190918, -0.0034903883934020996, -0.0033082962036132812, -0.003126204013824463, -0.0029441118240356445, -0.002762019634246826, -0.002579927444458008, -0.0023978352546691895, -0.002215743064880371, -0.0020336508750915527, -0.0018515586853027344, -0.001669466495513916, -0.0014873743057250977, -0.0013052821159362793, -0.001123189926147461, -0.0009410977363586426, -0.0007590055465698242, -0.0005769133567810059, -0.0003948211669921875, -0.00021272897720336914, -3.063678741455078e-05, 0.00015145540237426758, 0.00033354759216308594, 0.0005156397819519043, 0.0006977319717407227, 0.000879824161529541, 0.0010619163513183594, 0.0012440085411071777, 0.001426100730895996, 0.0016081929206848145, 0.0017902851104736328, 0.001972377300262451, 0.0021544694900512695, 0.002336561679840088, 0.0025186538696289062, 0.0027007460594177246, 0.002882838249206543, 0.0030649304389953613, 0.0032470226287841797, 0.003429114818572998, 0.0036112070083618164, 0.0037932991981506348, 0.003975391387939453, 0.0041574835777282715, 0.00433957576751709, 0.004521667957305908, 0.0047037601470947266, 0.004885852336883545, 0.005067944526672363, 0.005250036716461182, 0.00543212890625]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 11.0, 20.0, 12.0, 27.0, 42.0, 65.0, 121.0, 124.0, 190.0, 287.0, 409.0, 519.0, 810.0, 1174.0, 1634.0, 2608.0, 3965.0, 6219.0, 10402.0, 18369.0, 34876.0, 70600.0, 151308.0, 278254.0, 234171.0, 112728.0, 53422.0, 27331.0, 14805.0, 8623.0, 5292.0, 3303.0, 2115.0, 1517.0, 994.0, 676.0, 488.0, 319.0, 202.0, 167.0, 111.0, 72.0, 44.0, 45.0, 23.0, 13.0, 17.0, 11.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0], "bins": [-5.0625, -4.908203125, -4.75390625, -4.599609375, -4.4453125, -4.291015625, -4.13671875, -3.982421875, -3.828125, -3.673828125, -3.51953125, -3.365234375, -3.2109375, -3.056640625, -2.90234375, -2.748046875, -2.59375, -2.439453125, -2.28515625, -2.130859375, -1.9765625, -1.822265625, -1.66796875, -1.513671875, -1.359375, -1.205078125, -1.05078125, -0.896484375, -0.7421875, -0.587890625, -0.43359375, -0.279296875, -0.125, 0.029296875, 0.18359375, 0.337890625, 0.4921875, 0.646484375, 0.80078125, 0.955078125, 1.109375, 1.263671875, 1.41796875, 1.572265625, 1.7265625, 1.880859375, 2.03515625, 2.189453125, 2.34375, 2.498046875, 2.65234375, 2.806640625, 2.9609375, 3.115234375, 3.26953125, 3.423828125, 3.578125, 3.732421875, 3.88671875, 4.041015625, 4.1953125, 4.349609375, 4.50390625, 4.658203125, 4.8125]}, "gradients/decoder.bert.encoder.layer.22.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 12.0, 12.0, 13.0, 16.0, 21.0, 16.0, 32.0, 37.0, 33.0, 54.0, 61.0, 72.0, 65.0, 55.0, 60.0, 54.0, 61.0, 44.0, 47.0, 41.0, 37.0, 15.0, 23.0, 17.0, 14.0, 16.0, 16.0, 16.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4208984375, -1.376434326171875, -1.33197021484375, -1.287506103515625, -1.2430419921875, -1.198577880859375, -1.15411376953125, -1.109649658203125, -1.065185546875, -1.020721435546875, -0.97625732421875, -0.931793212890625, -0.8873291015625, -0.842864990234375, -0.79840087890625, -0.753936767578125, -0.70947265625, -0.665008544921875, -0.62054443359375, -0.576080322265625, -0.5316162109375, -0.487152099609375, -0.44268798828125, -0.398223876953125, -0.353759765625, -0.309295654296875, -0.26483154296875, -0.220367431640625, -0.1759033203125, -0.131439208984375, -0.08697509765625, -0.042510986328125, 0.001953125, 0.046417236328125, 0.09088134765625, 0.135345458984375, 0.1798095703125, 0.224273681640625, 0.26873779296875, 0.313201904296875, 0.357666015625, 0.402130126953125, 0.44659423828125, 0.491058349609375, 0.5355224609375, 0.579986572265625, 0.62445068359375, 0.668914794921875, 0.71337890625, 0.757843017578125, 0.80230712890625, 0.846771240234375, 0.8912353515625, 0.935699462890625, 0.98016357421875, 1.024627685546875, 1.069091796875, 1.113555908203125, 1.15802001953125, 1.202484130859375, 1.2469482421875, 1.291412353515625, 1.33587646484375, 1.380340576171875, 1.4248046875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 3.0, 3.0, 4.0, 7.0, 10.0, 12.0, 12.0, 24.0, 18.0, 18.0, 30.0, 32.0, 25.0, 31.0, 41.0, 37.0, 36.0, 44.0, 42.0, 53.0, 58.0, 49.0, 46.0, 53.0, 39.0, 34.0, 35.0, 20.0, 24.0, 17.0, 18.0, 20.0, 21.0, 9.0, 17.0, 9.0, 6.0, 11.0, 7.0, 4.0, 4.0, 4.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-22.74522590637207, -22.057628631591797, -21.370033264160156, -20.682435989379883, -19.994840621948242, -19.30724334716797, -18.619647979736328, -17.932050704956055, -17.24445343017578, -16.556856155395508, -15.869260787963867, -15.181663513183594, -14.494067192077637, -13.80647087097168, -13.118874549865723, -12.431278228759766, -11.743681907653809, -11.056085586547852, -10.368489265441895, -9.680892944335938, -8.993295669555664, -8.305699348449707, -7.61810302734375, -6.930506229400635, -6.242909908294678, -5.555313587188721, -4.8677167892456055, -4.180120468139648, -3.4925239086151123, -2.804927349090576, -2.117331027984619, -1.429734230041504, -0.7421379089355469, -0.05454140901565552, 0.6330550909042358, 1.3206515312194824, 2.0082480907440186, 2.6958446502685547, 3.3834409713745117, 4.071037769317627, 4.758634090423584, 5.446230411529541, 6.133827209472656, 6.821423530578613, 7.50901985168457, 8.196617126464844, 8.884212493896484, 9.571809768676758, 10.259406089782715, 10.947002410888672, 11.634598731994629, 12.322195053100586, 13.00979232788086, 13.697388648986816, 14.384984970092773, 15.072582244873047, 15.760177612304688, 16.44777488708496, 17.1353702545166, 17.822967529296875, 18.510562896728516, 19.19816017150879, 19.885757446289062, 20.573352813720703, 21.260950088500977]}, "gradients/decoder.bert.encoder.layer.22.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 3.0, 9.0, 9.0, 15.0, 10.0, 19.0, 16.0, 15.0, 28.0, 27.0, 26.0, 25.0, 44.0, 40.0, 56.0, 55.0, 45.0, 56.0, 56.0, 47.0, 47.0, 48.0, 50.0, 33.0, 35.0, 29.0, 31.0, 22.0, 18.0, 8.0, 18.0, 14.0, 14.0, 3.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.978113174438477, -21.186697006225586, -20.395280838012695, -19.603862762451172, -18.81244659423828, -18.02103042602539, -17.2296142578125, -16.43819808959961, -15.646780014038086, -14.855363845825195, -14.063946723937988, -13.272530555725098, -12.48111343383789, -11.689697265625, -10.89828109741211, -10.106863975524902, -9.315447807312012, -8.524031639099121, -7.732614517211914, -6.941198348999023, -6.149781227111816, -5.358365058898926, -4.566948413848877, -3.775531768798828, -2.9841151237487793, -2.1926984786987305, -1.4012819528579712, -0.6098654270172119, 0.18155121803283691, 0.9729678630828857, 1.7643842697143555, 2.5558009147644043, 3.347217559814453, 4.138634204864502, 4.930050849914551, 5.721467018127441, 6.512884140014648, 7.304300308227539, 8.09571647644043, 8.887133598327637, 9.678550720214844, 10.469966888427734, 11.261384010314941, 12.052800178527832, 12.844217300415039, 13.63563346862793, 14.42704963684082, 15.218466758728027, 16.009883880615234, 16.801300048828125, 17.592716217041016, 18.38413429260254, 19.17555046081543, 19.96696662902832, 20.75838279724121, 21.549800872802734, 22.341215133666992, 23.132631301879883, 23.924047470092773, 24.715465545654297, 25.506881713867188, 26.298297882080078, 27.08971405029297, 27.88113021850586, 28.672548294067383]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 10.0, 9.0, 12.0, 29.0, 46.0, 81.0, 154.0, 200.0, 317.0, 478.0, 782.0, 1330.0, 2203.0, 3617.0, 6190.0, 10600.0, 18706.0, 32420.0, 56630.0, 94623.0, 145399.0, 182610.0, 174167.0, 127292.0, 80172.0, 46965.0, 26696.0, 15235.0, 8767.0, 5090.0, 2962.0, 1837.0, 1113.0, 706.0, 407.0, 266.0, 154.0, 102.0, 61.0, 48.0, 28.0, 13.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-25.453125, -24.677734375, -23.90234375, -23.126953125, -22.3515625, -21.576171875, -20.80078125, -20.025390625, -19.25, -18.474609375, -17.69921875, -16.923828125, -16.1484375, -15.373046875, -14.59765625, -13.822265625, -13.046875, -12.271484375, -11.49609375, -10.720703125, -9.9453125, -9.169921875, -8.39453125, -7.619140625, -6.84375, -6.068359375, -5.29296875, -4.517578125, -3.7421875, -2.966796875, -2.19140625, -1.416015625, -0.640625, 0.134765625, 0.91015625, 1.685546875, 2.4609375, 3.236328125, 4.01171875, 4.787109375, 5.5625, 6.337890625, 7.11328125, 7.888671875, 8.6640625, 9.439453125, 10.21484375, 10.990234375, 11.765625, 12.541015625, 13.31640625, 14.091796875, 14.8671875, 15.642578125, 16.41796875, 17.193359375, 17.96875, 18.744140625, 19.51953125, 20.294921875, 21.0703125, 21.845703125, 22.62109375, 23.396484375, 24.171875]}, "gradients/decoder.bert.encoder.layer.22.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 8.0, 9.0, 12.0, 14.0, 13.0, 12.0, 17.0, 24.0, 28.0, 26.0, 32.0, 38.0, 38.0, 42.0, 55.0, 43.0, 62.0, 47.0, 50.0, 49.0, 45.0, 48.0, 47.0, 41.0, 25.0, 29.0, 31.0, 29.0, 11.0, 12.0, 12.0, 11.0, 14.0, 6.0, 6.0, 1.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.62109375, -17.9140625, -17.20703125, -16.5, -15.79296875, -15.0859375, -14.37890625, -13.671875, -12.96484375, -12.2578125, -11.55078125, -10.84375, -10.13671875, -9.4296875, -8.72265625, -8.015625, -7.30859375, -6.6015625, -5.89453125, -5.1875, -4.48046875, -3.7734375, -3.06640625, -2.359375, -1.65234375, -0.9453125, -0.23828125, 0.46875, 1.17578125, 1.8828125, 2.58984375, 3.296875, 4.00390625, 4.7109375, 5.41796875, 6.125, 6.83203125, 7.5390625, 8.24609375, 8.953125, 9.66015625, 10.3671875, 11.07421875, 11.78125, 12.48828125, 13.1953125, 13.90234375, 14.609375, 15.31640625, 16.0234375, 16.73046875, 17.4375, 18.14453125, 18.8515625, 19.55859375, 20.265625, 20.97265625, 21.6796875, 22.38671875, 23.09375, 23.80078125, 24.5078125, 25.21484375, 25.921875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 5.0, 7.0, 13.0, 25.0, 21.0, 30.0, 58.0, 65.0, 124.0, 161.0, 243.0, 379.0, 579.0, 881.0, 1368.0, 2143.0, 3465.0, 5558.0, 9051.0, 14691.0, 25013.0, 41479.0, 68713.0, 107776.0, 152215.0, 172837.0, 153377.0, 110547.0, 70126.0, 42529.0, 25337.0, 15040.0, 9124.0, 5682.0, 3516.0, 2210.0, 1507.0, 874.0, 653.0, 376.0, 266.0, 172.0, 116.0, 75.0, 43.0, 37.0, 25.0, 9.0, 11.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.9677734375, -21.248046875, -20.5283203125, -19.80859375, -19.0888671875, -18.369140625, -17.6494140625, -16.9296875, -16.2099609375, -15.490234375, -14.7705078125, -14.05078125, -13.3310546875, -12.611328125, -11.8916015625, -11.171875, -10.4521484375, -9.732421875, -9.0126953125, -8.29296875, -7.5732421875, -6.853515625, -6.1337890625, -5.4140625, -4.6943359375, -3.974609375, -3.2548828125, -2.53515625, -1.8154296875, -1.095703125, -0.3759765625, 0.34375, 1.0634765625, 1.783203125, 2.5029296875, 3.22265625, 3.9423828125, 4.662109375, 5.3818359375, 6.1015625, 6.8212890625, 7.541015625, 8.2607421875, 8.98046875, 9.7001953125, 10.419921875, 11.1396484375, 11.859375, 12.5791015625, 13.298828125, 14.0185546875, 14.73828125, 15.4580078125, 16.177734375, 16.8974609375, 17.6171875, 18.3369140625, 19.056640625, 19.7763671875, 20.49609375, 21.2158203125, 21.935546875, 22.6552734375, 23.375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 11.0, 9.0, 14.0, 10.0, 18.0, 17.0, 18.0, 24.0, 31.0, 35.0, 33.0, 28.0, 27.0, 25.0, 33.0, 51.0, 38.0, 45.0, 45.0, 45.0, 39.0, 39.0, 41.0, 39.0, 33.0, 30.0, 25.0, 37.0, 26.0, 23.0, 16.0, 16.0, 9.0, 9.0, 13.0, 5.0, 7.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.3125, -12.9288330078125, -12.545166015625, -12.1614990234375, -11.77783203125, -11.3941650390625, -11.010498046875, -10.6268310546875, -10.2431640625, -9.8594970703125, -9.475830078125, -9.0921630859375, -8.70849609375, -8.3248291015625, -7.941162109375, -7.5574951171875, -7.173828125, -6.7901611328125, -6.406494140625, -6.0228271484375, -5.63916015625, -5.2554931640625, -4.871826171875, -4.4881591796875, -4.1044921875, -3.7208251953125, -3.337158203125, -2.9534912109375, -2.56982421875, -2.1861572265625, -1.802490234375, -1.4188232421875, -1.03515625, -0.6514892578125, -0.267822265625, 0.1158447265625, 0.49951171875, 0.8831787109375, 1.266845703125, 1.6505126953125, 2.0341796875, 2.4178466796875, 2.801513671875, 3.1851806640625, 3.56884765625, 3.9525146484375, 4.336181640625, 4.7198486328125, 5.103515625, 5.4871826171875, 5.870849609375, 6.2545166015625, 6.63818359375, 7.0218505859375, 7.405517578125, 7.7891845703125, 8.1728515625, 8.5565185546875, 8.940185546875, 9.3238525390625, 9.70751953125, 10.0911865234375, 10.474853515625, 10.8585205078125, 11.2421875]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 13.0, 12.0, 27.0, 59.0, 73.0, 116.0, 171.0, 312.0, 489.0, 851.0, 1506.0, 2725.0, 5612.0, 11750.0, 26949.0, 63640.0, 147311.0, 279906.0, 267112.0, 135746.0, 57281.0, 24796.0, 10887.0, 5201.0, 2632.0, 1386.0, 773.0, 438.0, 274.0, 185.0, 105.0, 77.0, 48.0, 25.0, 18.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0], "bins": [-22.0, -21.404541015625, -20.80908203125, -20.213623046875, -19.6181640625, -19.022705078125, -18.42724609375, -17.831787109375, -17.236328125, -16.640869140625, -16.04541015625, -15.449951171875, -14.8544921875, -14.259033203125, -13.66357421875, -13.068115234375, -12.47265625, -11.877197265625, -11.28173828125, -10.686279296875, -10.0908203125, -9.495361328125, -8.89990234375, -8.304443359375, -7.708984375, -7.113525390625, -6.51806640625, -5.922607421875, -5.3271484375, -4.731689453125, -4.13623046875, -3.540771484375, -2.9453125, -2.349853515625, -1.75439453125, -1.158935546875, -0.5634765625, 0.031982421875, 0.62744140625, 1.222900390625, 1.818359375, 2.413818359375, 3.00927734375, 3.604736328125, 4.2001953125, 4.795654296875, 5.39111328125, 5.986572265625, 6.58203125, 7.177490234375, 7.77294921875, 8.368408203125, 8.9638671875, 9.559326171875, 10.15478515625, 10.750244140625, 11.345703125, 11.941162109375, 12.53662109375, 13.132080078125, 13.7275390625, 14.322998046875, 14.91845703125, 15.513916015625, 16.109375]}, "gradients/decoder.bert.encoder.layer.22.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 6.0, 6.0, 9.0, 4.0, 19.0, 15.0, 15.0, 20.0, 30.0, 22.0, 31.0, 34.0, 60.0, 48.0, 54.0, 57.0, 61.0, 52.0, 73.0, 44.0, 61.0, 57.0, 41.0, 24.0, 27.0, 20.0, 21.0, 13.0, 14.0, 5.0, 8.0, 9.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001247406005859375, -0.0012114793062210083, -0.0011755526065826416, -0.001139625906944275, -0.0011036992073059082, -0.0010677725076675415, -0.0010318458080291748, -0.000995919108390808, -0.0009599924087524414, -0.0009240657091140747, -0.000888139009475708, -0.0008522123098373413, -0.0008162856101989746, -0.0007803589105606079, -0.0007444322109222412, -0.0007085055112838745, -0.0006725788116455078, -0.0006366521120071411, -0.0006007254123687744, -0.0005647987127304077, -0.000528872013092041, -0.0004929453134536743, -0.0004570186138153076, -0.0004210919141769409, -0.0003851652145385742, -0.0003492385149002075, -0.0003133118152618408, -0.0002773851156234741, -0.00024145841598510742, -0.00020553171634674072, -0.00016960501670837402, -0.00013367831707000732, -9.775161743164062e-05, -6.182491779327393e-05, -2.5898218154907227e-05, 1.0028481483459473e-05, 4.595518112182617e-05, 8.188188076019287e-05, 0.00011780858039855957, 0.00015373528003692627, 0.00018966197967529297, 0.00022558867931365967, 0.00026151537895202637, 0.00029744207859039307, 0.00033336877822875977, 0.00036929547786712646, 0.00040522217750549316, 0.00044114887714385986, 0.00047707557678222656, 0.0005130022764205933, 0.00054892897605896, 0.0005848556756973267, 0.0006207823753356934, 0.0006567090749740601, 0.0006926357746124268, 0.0007285624742507935, 0.0007644891738891602, 0.0008004158735275269, 0.0008363425731658936, 0.0008722692728042603, 0.000908195972442627, 0.0009441226720809937, 0.0009800493717193604, 0.001015976071357727, 0.0010519027709960938]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 10.0, 6.0, 20.0, 17.0, 28.0, 49.0, 58.0, 69.0, 129.0, 160.0, 243.0, 366.0, 521.0, 701.0, 1102.0, 1540.0, 2556.0, 3864.0, 6431.0, 10888.0, 18612.0, 31528.0, 53958.0, 90389.0, 137580.0, 178413.0, 174479.0, 129889.0, 82915.0, 49614.0, 28934.0, 16885.0, 9912.0, 5928.0, 3632.0, 2308.0, 1559.0, 1000.0, 680.0, 463.0, 353.0, 227.0, 150.0, 138.0, 86.0, 50.0, 48.0, 17.0, 18.0, 11.0, 13.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.7265625, -10.3905029296875, -10.054443359375, -9.7183837890625, -9.38232421875, -9.0462646484375, -8.710205078125, -8.3741455078125, -8.0380859375, -7.7020263671875, -7.365966796875, -7.0299072265625, -6.69384765625, -6.3577880859375, -6.021728515625, -5.6856689453125, -5.349609375, -5.0135498046875, -4.677490234375, -4.3414306640625, -4.00537109375, -3.6693115234375, -3.333251953125, -2.9971923828125, -2.6611328125, -2.3250732421875, -1.989013671875, -1.6529541015625, -1.31689453125, -0.9808349609375, -0.644775390625, -0.3087158203125, 0.02734375, 0.3634033203125, 0.699462890625, 1.0355224609375, 1.37158203125, 1.7076416015625, 2.043701171875, 2.3797607421875, 2.7158203125, 3.0518798828125, 3.387939453125, 3.7239990234375, 4.06005859375, 4.3961181640625, 4.732177734375, 5.0682373046875, 5.404296875, 5.7403564453125, 6.076416015625, 6.4124755859375, 6.74853515625, 7.0845947265625, 7.420654296875, 7.7567138671875, 8.0927734375, 8.4288330078125, 8.764892578125, 9.1009521484375, 9.43701171875, 9.7730712890625, 10.109130859375, 10.4451904296875, 10.78125]}, "gradients/decoder.bert.encoder.layer.22.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 6.0, 7.0, 10.0, 11.0, 23.0, 37.0, 46.0, 45.0, 57.0, 73.0, 70.0, 84.0, 76.0, 77.0, 61.0, 63.0, 50.0, 53.0, 34.0, 29.0, 17.0, 15.0, 17.0, 7.0, 5.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.281005859375, -5.11279296875, -4.944580078125, -4.7763671875, -4.608154296875, -4.43994140625, -4.271728515625, -4.103515625, -3.935302734375, -3.76708984375, -3.598876953125, -3.4306640625, -3.262451171875, -3.09423828125, -2.926025390625, -2.7578125, -2.589599609375, -2.42138671875, -2.253173828125, -2.0849609375, -1.916748046875, -1.74853515625, -1.580322265625, -1.412109375, -1.243896484375, -1.07568359375, -0.907470703125, -0.7392578125, -0.571044921875, -0.40283203125, -0.234619140625, -0.06640625, 0.101806640625, 0.27001953125, 0.438232421875, 0.6064453125, 0.774658203125, 0.94287109375, 1.111083984375, 1.279296875, 1.447509765625, 1.61572265625, 1.783935546875, 1.9521484375, 2.120361328125, 2.28857421875, 2.456787109375, 2.625, 2.793212890625, 2.96142578125, 3.129638671875, 3.2978515625, 3.466064453125, 3.63427734375, 3.802490234375, 3.970703125, 4.138916015625, 4.30712890625, 4.475341796875, 4.6435546875, 4.811767578125, 4.97998046875, 5.148193359375, 5.31640625]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 11.0, 9.0, 8.0, 9.0, 10.0, 8.0, 22.0, 16.0, 24.0, 27.0, 25.0, 26.0, 28.0, 31.0, 29.0, 41.0, 42.0, 43.0, 61.0, 34.0, 38.0, 57.0, 33.0, 41.0, 28.0, 30.0, 24.0, 38.0, 30.0, 22.0, 17.0, 18.0, 15.0, 18.0, 10.0, 10.0, 11.0, 9.0, 5.0, 6.0, 5.0, 3.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-17.20762825012207, -16.64251708984375, -16.07740592956543, -15.512295722961426, -14.947185516357422, -14.382074356079102, -13.816963195800781, -13.251852989196777, -12.686742782592773, -12.121631622314453, -11.55652141571045, -10.991410255432129, -10.426300048828125, -9.861188888549805, -9.296077728271484, -8.73096752166748, -8.16585636138916, -7.600745677947998, -7.035634994506836, -6.470523834228516, -5.905413627624512, -5.340302467346191, -4.775191783905029, -4.210081100463867, -3.644970417022705, -3.079859733581543, -2.514749050140381, -1.9496381282806396, -1.3845274448394775, -0.8194167613983154, -0.2543058395385742, 0.3108048439025879, 0.87591552734375, 1.441026210784912, 2.006136894226074, 2.5712478160858154, 3.1363584995269775, 3.7014691829681396, 4.266580104827881, 4.831690788269043, 5.396801471710205, 5.961912155151367, 6.527022838592529, 7.092133522033691, 7.657244682312012, 8.222354888916016, 8.787466049194336, 9.352577209472656, 9.91768741607666, 10.48279857635498, 11.047908782958984, 11.613019943237305, 12.178130149841309, 12.743241310119629, 13.308351516723633, 13.873462677001953, 14.438573837280273, 15.003684997558594, 15.568795204162598, 16.1339054107666, 16.699016571044922, 17.264127731323242, 17.829238891601562, 18.39434814453125, 18.95945930480957]}, "gradients/decoder.bert.encoder.layer.21.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 2.0, 13.0, 13.0, 14.0, 14.0, 24.0, 21.0, 20.0, 19.0, 42.0, 37.0, 46.0, 41.0, 53.0, 50.0, 43.0, 36.0, 50.0, 38.0, 43.0, 52.0, 32.0, 37.0, 39.0, 26.0, 28.0, 35.0, 20.0, 18.0, 15.0, 13.0, 12.0, 9.0, 1.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-22.352792739868164, -21.680479049682617, -21.008163452148438, -20.33584976196289, -19.66353416442871, -18.991220474243164, -18.318904876708984, -17.646591186523438, -16.97427749633789, -16.301963806152344, -15.629648208618164, -14.957334518432617, -14.285019874572754, -13.61270523071289, -12.940390586853027, -12.268075942993164, -11.5957612991333, -10.923446655273438, -10.251132011413574, -9.578817367553711, -8.906503677368164, -8.2341890335083, -7.5618743896484375, -6.889560222625732, -6.217245578765869, -5.544930934906006, -4.872616767883301, -4.2003021240234375, -3.5279877185821533, -2.855673313140869, -2.183358669281006, -1.5110445022583008, -0.8387298583984375, -0.16641539335250854, 0.5058990716934204, 1.1782135963439941, 1.8505280017852783, 2.5228424072265625, 3.195157051086426, 3.867471218109131, 4.539785861968994, 5.212100505828857, 5.8844146728515625, 6.556729316711426, 7.229043960571289, 7.901358127593994, 8.573673248291016, 9.245986938476562, 9.918301582336426, 10.590616226196289, 11.262930870056152, 11.935245513916016, 12.607559204101562, 13.279873847961426, 13.952188491821289, 14.624502182006836, 15.296817779541016, 15.969132423400879, 16.641447067260742, 17.31376075744629, 17.98607635498047, 18.658390045166016, 19.330703735351562, 20.003019332885742, 20.67533302307129]}, "gradients/decoder.bert.encoder.layer.21.output.dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 5.0, 11.0, 24.0, 26.0, 52.0, 70.0, 90.0, 152.0, 242.0, 293.0, 512.0, 748.0, 1169.0, 1998.0, 3155.0, 5156.0, 8613.0, 14795.0, 25667.0, 47165.0, 89235.0, 180639.0, 393046.0, 773413.0, 1025428.0, 796832.0, 419607.0, 196073.0, 94633.0, 49915.0, 26986.0, 15454.0, 9007.0, 5427.0, 3273.0, 1977.0, 1198.0, 780.0, 486.0, 308.0, 182.0, 125.0, 85.0, 71.0, 44.0, 32.0, 24.0, 9.0, 16.0, 10.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0], "bins": [-17.953125, -17.3837890625, -16.814453125, -16.2451171875, -15.67578125, -15.1064453125, -14.537109375, -13.9677734375, -13.3984375, -12.8291015625, -12.259765625, -11.6904296875, -11.12109375, -10.5517578125, -9.982421875, -9.4130859375, -8.84375, -8.2744140625, -7.705078125, -7.1357421875, -6.56640625, -5.9970703125, -5.427734375, -4.8583984375, -4.2890625, -3.7197265625, -3.150390625, -2.5810546875, -2.01171875, -1.4423828125, -0.873046875, -0.3037109375, 0.265625, 0.8349609375, 1.404296875, 1.9736328125, 2.54296875, 3.1123046875, 3.681640625, 4.2509765625, 4.8203125, 5.3896484375, 5.958984375, 6.5283203125, 7.09765625, 7.6669921875, 8.236328125, 8.8056640625, 9.375, 9.9443359375, 10.513671875, 11.0830078125, 11.65234375, 12.2216796875, 12.791015625, 13.3603515625, 13.9296875, 14.4990234375, 15.068359375, 15.6376953125, 16.20703125, 16.7763671875, 17.345703125, 17.9150390625, 18.484375]}, "gradients/decoder.bert.encoder.layer.21.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 12.0, 9.0, 16.0, 18.0, 14.0, 18.0, 25.0, 31.0, 44.0, 36.0, 50.0, 39.0, 61.0, 56.0, 55.0, 34.0, 46.0, 59.0, 40.0, 52.0, 36.0, 42.0, 31.0, 26.0, 30.0, 25.0, 12.0, 18.0, 14.0, 12.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.071044921875, -15.51708984375, -14.963134765625, -14.4091796875, -13.855224609375, -13.30126953125, -12.747314453125, -12.193359375, -11.639404296875, -11.08544921875, -10.531494140625, -9.9775390625, -9.423583984375, -8.86962890625, -8.315673828125, -7.76171875, -7.207763671875, -6.65380859375, -6.099853515625, -5.5458984375, -4.991943359375, -4.43798828125, -3.884033203125, -3.330078125, -2.776123046875, -2.22216796875, -1.668212890625, -1.1142578125, -0.560302734375, -0.00634765625, 0.547607421875, 1.1015625, 1.655517578125, 2.20947265625, 2.763427734375, 3.3173828125, 3.871337890625, 4.42529296875, 4.979248046875, 5.533203125, 6.087158203125, 6.64111328125, 7.195068359375, 7.7490234375, 8.302978515625, 8.85693359375, 9.410888671875, 9.96484375, 10.518798828125, 11.07275390625, 11.626708984375, 12.1806640625, 12.734619140625, 13.28857421875, 13.842529296875, 14.396484375, 14.950439453125, 15.50439453125, 16.058349609375, 16.6123046875, 17.166259765625, 17.72021484375, 18.274169921875, 18.828125]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 7.0, 9.0, 16.0, 22.0, 29.0, 39.0, 62.0, 90.0, 166.0, 225.0, 365.0, 519.0, 783.0, 1131.0, 1688.0, 2735.0, 3928.0, 6195.0, 9583.0, 15369.0, 24140.0, 38971.0, 63281.0, 104201.0, 172145.0, 284770.0, 460346.0, 685588.0, 769707.0, 586512.0, 374505.0, 228442.0, 138198.0, 83148.0, 51046.0, 31477.0, 19457.0, 12462.0, 7913.0, 4969.0, 3449.0, 2211.0, 1451.0, 973.0, 670.0, 454.0, 280.0, 174.0, 132.0, 88.0, 63.0, 26.0, 32.0, 22.0, 13.0, 10.0, 2.0, 4.0, 1.0, 2.0], "bins": [-14.8984375, -14.4368896484375, -13.975341796875, -13.5137939453125, -13.05224609375, -12.5906982421875, -12.129150390625, -11.6676025390625, -11.2060546875, -10.7445068359375, -10.282958984375, -9.8214111328125, -9.35986328125, -8.8983154296875, -8.436767578125, -7.9752197265625, -7.513671875, -7.0521240234375, -6.590576171875, -6.1290283203125, -5.66748046875, -5.2059326171875, -4.744384765625, -4.2828369140625, -3.8212890625, -3.3597412109375, -2.898193359375, -2.4366455078125, -1.97509765625, -1.5135498046875, -1.052001953125, -0.5904541015625, -0.12890625, 0.3326416015625, 0.794189453125, 1.2557373046875, 1.71728515625, 2.1788330078125, 2.640380859375, 3.1019287109375, 3.5634765625, 4.0250244140625, 4.486572265625, 4.9481201171875, 5.40966796875, 5.8712158203125, 6.332763671875, 6.7943115234375, 7.255859375, 7.7174072265625, 8.178955078125, 8.6405029296875, 9.10205078125, 9.5635986328125, 10.025146484375, 10.4866943359375, 10.9482421875, 11.4097900390625, 11.871337890625, 12.3328857421875, 12.79443359375, 13.2559814453125, 13.717529296875, 14.1790771484375, 14.640625]}, "gradients/decoder.bert.encoder.layer.21.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 7.0, 8.0, 15.0, 22.0, 37.0, 30.0, 51.0, 52.0, 68.0, 92.0, 88.0, 124.0, 157.0, 169.0, 206.0, 207.0, 254.0, 280.0, 265.0, 266.0, 264.0, 220.0, 218.0, 168.0, 143.0, 122.0, 135.0, 87.0, 66.0, 45.0, 38.0, 27.0, 31.0, 17.0, 17.0, 10.0, 9.0, 12.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 4.0], "bins": [-7.32421875, -7.1240234375, -6.923828125, -6.7236328125, -6.5234375, -6.3232421875, -6.123046875, -5.9228515625, -5.72265625, -5.5224609375, -5.322265625, -5.1220703125, -4.921875, -4.7216796875, -4.521484375, -4.3212890625, -4.12109375, -3.9208984375, -3.720703125, -3.5205078125, -3.3203125, -3.1201171875, -2.919921875, -2.7197265625, -2.51953125, -2.3193359375, -2.119140625, -1.9189453125, -1.71875, -1.5185546875, -1.318359375, -1.1181640625, -0.91796875, -0.7177734375, -0.517578125, -0.3173828125, -0.1171875, 0.0830078125, 0.283203125, 0.4833984375, 0.68359375, 0.8837890625, 1.083984375, 1.2841796875, 1.484375, 1.6845703125, 1.884765625, 2.0849609375, 2.28515625, 2.4853515625, 2.685546875, 2.8857421875, 3.0859375, 3.2861328125, 3.486328125, 3.6865234375, 3.88671875, 4.0869140625, 4.287109375, 4.4873046875, 4.6875, 4.8876953125, 5.087890625, 5.2880859375, 5.48828125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 7.0, 4.0, 7.0, 6.0, 18.0, 10.0, 13.0, 21.0, 16.0, 25.0, 21.0, 36.0, 37.0, 36.0, 48.0, 43.0, 62.0, 50.0, 50.0, 49.0, 47.0, 50.0, 43.0, 45.0, 38.0, 33.0, 38.0, 25.0, 24.0, 12.0, 24.0, 14.0, 12.0, 6.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0], "bins": [-18.966812133789062, -18.42782211303711, -17.888830184936523, -17.34984016418457, -16.810850143432617, -16.27185821533203, -15.732868194580078, -15.193878173828125, -14.654887199401855, -14.115896224975586, -13.576906204223633, -13.037915229797363, -12.498924255371094, -11.95993423461914, -11.420943260192871, -10.881952285766602, -10.342962265014648, -9.803971290588379, -9.264981269836426, -8.725990295410156, -8.187000274658203, -7.648009300231934, -7.109018325805664, -6.570027828216553, -6.031037330627441, -5.49204683303833, -4.953056335449219, -4.414065361022949, -3.875074863433838, -3.3360843658447266, -2.797093629837036, -2.2581028938293457, -1.7191104888916016, -1.1801198720932007, -0.6411292552947998, -0.10213863849639893, 0.43685197830200195, 0.9758424758911133, 1.5148332118988037, 2.053823947906494, 2.5928144454956055, 3.131804943084717, 3.6707956790924072, 4.209786415100098, 4.748776912689209, 5.28776741027832, 5.82675838470459, 6.365748882293701, 6.9047393798828125, 7.443729877471924, 7.982720375061035, 8.521711349487305, 9.060701370239258, 9.599692344665527, 10.138683319091797, 10.67767333984375, 11.21666431427002, 11.755655288696289, 12.294645309448242, 12.833636283874512, 13.372627258300781, 13.911617279052734, 14.450608253479004, 14.989599227905273, 15.528589248657227]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 7.0, 11.0, 13.0, 7.0, 7.0, 12.0, 15.0, 29.0, 21.0, 27.0, 25.0, 32.0, 31.0, 36.0, 40.0, 56.0, 37.0, 44.0, 39.0, 28.0, 35.0, 44.0, 36.0, 44.0, 34.0, 26.0, 27.0, 36.0, 28.0, 18.0, 28.0, 16.0, 24.0, 10.0, 13.0, 9.0, 6.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.486700057983398, -14.01639461517334, -13.546089172363281, -13.075783729553223, -12.605478286743164, -12.135173797607422, -11.664867401123047, -11.194562911987305, -10.724257469177246, -10.253952026367188, -9.783646583557129, -9.31334114074707, -8.843035697937012, -8.372730255126953, -7.902425289154053, -7.432120323181152, -6.9618144035339355, -6.491508960723877, -6.021203517913818, -5.550898551940918, -5.080593109130859, -4.610287666320801, -4.139982223510742, -3.6696770191192627, -3.199371576309204, -2.7290661334991455, -2.258760929107666, -1.7884554862976074, -1.3181501626968384, -0.8478448390960693, -0.37753939628601074, 0.09276580810546875, 0.5630712509155273, 1.0333765745162964, 1.5036818981170654, 1.973987340927124, 2.4442925453186035, 2.914597988128662, 3.3849034309387207, 3.8552086353302, 4.32551383972168, 4.795819282531738, 5.266124725341797, 5.7364301681518555, 6.206735134124756, 6.6770405769348145, 7.147346019744873, 7.617650985717773, 8.087957382202148, 8.558262825012207, 9.028568267822266, 9.498873710632324, 9.969179153442383, 10.439483642578125, 10.9097900390625, 11.380094528198242, 11.8503999710083, 12.32070541381836, 12.791010856628418, 13.261316299438477, 13.731621742248535, 14.201927185058594, 14.672231674194336, 15.142537117004395, 15.612842559814453]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 9.0, 9.0, 14.0, 17.0, 37.0, 47.0, 73.0, 90.0, 128.0, 235.0, 351.0, 488.0, 704.0, 1026.0, 1531.0, 2329.0, 3397.0, 4955.0, 7190.0, 10510.0, 15307.0, 22284.0, 32208.0, 46645.0, 68102.0, 97434.0, 130269.0, 148200.0, 132756.0, 99201.0, 69726.0, 48239.0, 32846.0, 22666.0, 15681.0, 10738.0, 7372.0, 4915.0, 3421.0, 2386.0, 1616.0, 1093.0, 763.0, 499.0, 325.0, 214.0, 170.0, 117.0, 71.0, 53.0, 41.0, 20.0, 14.0, 16.0, 7.0, 8.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-9.8046875, -9.47265625, -9.140625, -8.80859375, -8.4765625, -8.14453125, -7.8125, -7.48046875, -7.1484375, -6.81640625, -6.484375, -6.15234375, -5.8203125, -5.48828125, -5.15625, -4.82421875, -4.4921875, -4.16015625, -3.828125, -3.49609375, -3.1640625, -2.83203125, -2.5, -2.16796875, -1.8359375, -1.50390625, -1.171875, -0.83984375, -0.5078125, -0.17578125, 0.15625, 0.48828125, 0.8203125, 1.15234375, 1.484375, 1.81640625, 2.1484375, 2.48046875, 2.8125, 3.14453125, 3.4765625, 3.80859375, 4.140625, 4.47265625, 4.8046875, 5.13671875, 5.46875, 5.80078125, 6.1328125, 6.46484375, 6.796875, 7.12890625, 7.4609375, 7.79296875, 8.125, 8.45703125, 8.7890625, 9.12109375, 9.453125, 9.78515625, 10.1171875, 10.44921875, 10.78125, 11.11328125, 11.4453125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 7.0, 9.0, 11.0, 12.0, 10.0, 11.0, 19.0, 17.0, 16.0, 31.0, 34.0, 24.0, 28.0, 39.0, 38.0, 39.0, 44.0, 36.0, 38.0, 47.0, 36.0, 38.0, 44.0, 39.0, 32.0, 32.0, 33.0, 30.0, 35.0, 15.0, 22.0, 17.0, 22.0, 16.0, 8.0, 15.0, 7.0, 9.0, 7.0, 2.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3359375, -13.8780517578125, -13.420166015625, -12.9622802734375, -12.50439453125, -12.0465087890625, -11.588623046875, -11.1307373046875, -10.6728515625, -10.2149658203125, -9.757080078125, -9.2991943359375, -8.84130859375, -8.3834228515625, -7.925537109375, -7.4676513671875, -7.009765625, -6.5518798828125, -6.093994140625, -5.6361083984375, -5.17822265625, -4.7203369140625, -4.262451171875, -3.8045654296875, -3.3466796875, -2.8887939453125, -2.430908203125, -1.9730224609375, -1.51513671875, -1.0572509765625, -0.599365234375, -0.1414794921875, 0.31640625, 0.7742919921875, 1.232177734375, 1.6900634765625, 2.14794921875, 2.6058349609375, 3.063720703125, 3.5216064453125, 3.9794921875, 4.4373779296875, 4.895263671875, 5.3531494140625, 5.81103515625, 6.2689208984375, 6.726806640625, 7.1846923828125, 7.642578125, 8.1004638671875, 8.558349609375, 9.0162353515625, 9.47412109375, 9.9320068359375, 10.389892578125, 10.8477783203125, 11.3056640625, 11.7635498046875, 12.221435546875, 12.6793212890625, 13.13720703125, 13.5950927734375, 14.052978515625, 14.5108642578125, 14.96875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 14.0, 16.0, 27.0, 36.0, 46.0, 79.0, 87.0, 143.0, 185.0, 277.0, 398.0, 591.0, 894.0, 1408.0, 2235.0, 3553.0, 5878.0, 10156.0, 18988.0, 50498.0, 854299.0, 53733.0, 18714.0, 9996.0, 5898.0, 3657.0, 2219.0, 1472.0, 965.0, 656.0, 425.0, 316.0, 200.0, 156.0, 101.0, 53.0, 48.0, 54.0, 36.0, 20.0, 14.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.671875, -21.876708984375, -21.08154296875, -20.286376953125, -19.4912109375, -18.696044921875, -17.90087890625, -17.105712890625, -16.310546875, -15.515380859375, -14.72021484375, -13.925048828125, -13.1298828125, -12.334716796875, -11.53955078125, -10.744384765625, -9.94921875, -9.154052734375, -8.35888671875, -7.563720703125, -6.7685546875, -5.973388671875, -5.17822265625, -4.383056640625, -3.587890625, -2.792724609375, -1.99755859375, -1.202392578125, -0.4072265625, 0.387939453125, 1.18310546875, 1.978271484375, 2.7734375, 3.568603515625, 4.36376953125, 5.158935546875, 5.9541015625, 6.749267578125, 7.54443359375, 8.339599609375, 9.134765625, 9.929931640625, 10.72509765625, 11.520263671875, 12.3154296875, 13.110595703125, 13.90576171875, 14.700927734375, 15.49609375, 16.291259765625, 17.08642578125, 17.881591796875, 18.6767578125, 19.471923828125, 20.26708984375, 21.062255859375, 21.857421875, 22.652587890625, 23.44775390625, 24.242919921875, 25.0380859375, 25.833251953125, 26.62841796875, 27.423583984375, 28.21875]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 4.0, 4.0, 8.0, 8.0, 13.0, 13.0, 14.0, 21.0, 19.0, 27.0, 27.0, 42.0, 39.0, 38.0, 42.0, 56.0, 53.0, 53.0, 50.0, 46.0, 52.0, 57.0, 42.0, 43.0, 47.0, 34.0, 30.0, 23.0, 13.0, 12.0, 18.0, 9.0, 9.0, 7.0, 7.0, 6.0, 5.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.0, -17.43115234375, -16.8623046875, -16.29345703125, -15.724609375, -15.15576171875, -14.5869140625, -14.01806640625, -13.44921875, -12.88037109375, -12.3115234375, -11.74267578125, -11.173828125, -10.60498046875, -10.0361328125, -9.46728515625, -8.8984375, -8.32958984375, -7.7607421875, -7.19189453125, -6.623046875, -6.05419921875, -5.4853515625, -4.91650390625, -4.34765625, -3.77880859375, -3.2099609375, -2.64111328125, -2.072265625, -1.50341796875, -0.9345703125, -0.36572265625, 0.203125, 0.77197265625, 1.3408203125, 1.90966796875, 2.478515625, 3.04736328125, 3.6162109375, 4.18505859375, 4.75390625, 5.32275390625, 5.8916015625, 6.46044921875, 7.029296875, 7.59814453125, 8.1669921875, 8.73583984375, 9.3046875, 9.87353515625, 10.4423828125, 11.01123046875, 11.580078125, 12.14892578125, 12.7177734375, 13.28662109375, 13.85546875, 14.42431640625, 14.9931640625, 15.56201171875, 16.130859375, 16.69970703125, 17.2685546875, 17.83740234375, 18.40625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 11.0, 11.0, 12.0, 23.0, 24.0, 28.0, 28.0, 46.0, 63.0, 92.0, 142.0, 172.0, 305.0, 454.0, 691.0, 1103.0, 1891.0, 3433.0, 6872.0, 15940.0, 60170.0, 888292.0, 41538.0, 13352.0, 6096.0, 3053.0, 1688.0, 1044.0, 650.0, 423.0, 267.0, 166.0, 130.0, 89.0, 55.0, 52.0, 41.0, 28.0, 19.0, 13.0, 8.0, 7.0, 14.0, 6.0, 3.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.3984375, -14.9080810546875, -14.417724609375, -13.9273681640625, -13.43701171875, -12.9466552734375, -12.456298828125, -11.9659423828125, -11.4755859375, -10.9852294921875, -10.494873046875, -10.0045166015625, -9.51416015625, -9.0238037109375, -8.533447265625, -8.0430908203125, -7.552734375, -7.0623779296875, -6.572021484375, -6.0816650390625, -5.59130859375, -5.1009521484375, -4.610595703125, -4.1202392578125, -3.6298828125, -3.1395263671875, -2.649169921875, -2.1588134765625, -1.66845703125, -1.1781005859375, -0.687744140625, -0.1973876953125, 0.29296875, 0.7833251953125, 1.273681640625, 1.7640380859375, 2.25439453125, 2.7447509765625, 3.235107421875, 3.7254638671875, 4.2158203125, 4.7061767578125, 5.196533203125, 5.6868896484375, 6.17724609375, 6.6676025390625, 7.157958984375, 7.6483154296875, 8.138671875, 8.6290283203125, 9.119384765625, 9.6097412109375, 10.10009765625, 10.5904541015625, 11.080810546875, 11.5711669921875, 12.0615234375, 12.5518798828125, 13.042236328125, 13.5325927734375, 14.02294921875, 14.5133056640625, 15.003662109375, 15.4940185546875, 15.984375]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 9.0, 8.0, 16.0, 10.0, 28.0, 36.0, 47.0, 88.0, 175.0, 214.0, 107.0, 80.0, 41.0, 29.0, 29.0, 18.0, 11.0, 12.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002223968505859375, -0.0021390914916992188, -0.0020542144775390625, -0.0019693374633789062, -0.00188446044921875, -0.0017995834350585938, -0.0017147064208984375, -0.0016298294067382812, -0.001544952392578125, -0.0014600753784179688, -0.0013751983642578125, -0.0012903213500976562, -0.0012054443359375, -0.0011205673217773438, -0.0010356903076171875, -0.0009508132934570312, -0.000865936279296875, -0.0007810592651367188, -0.0006961822509765625, -0.0006113052368164062, -0.00052642822265625, -0.00044155120849609375, -0.0003566741943359375, -0.00027179718017578125, -0.000186920166015625, -0.00010204315185546875, -1.71661376953125e-05, 6.771087646484375e-05, 0.000152587890625, 0.00023746490478515625, 0.0003223419189453125, 0.00040721893310546875, 0.000492095947265625, 0.0005769729614257812, 0.0006618499755859375, 0.0007467269897460938, 0.00083160400390625, 0.0009164810180664062, 0.0010013580322265625, 0.0010862350463867188, 0.001171112060546875, 0.0012559890747070312, 0.0013408660888671875, 0.0014257431030273438, 0.0015106201171875, 0.0015954971313476562, 0.0016803741455078125, 0.0017652511596679688, 0.001850128173828125, 0.0019350051879882812, 0.0020198822021484375, 0.0021047592163085938, 0.00218963623046875, 0.0022745132446289062, 0.0023593902587890625, 0.0024442672729492188, 0.002529144287109375, 0.0026140213012695312, 0.0026988983154296875, 0.0027837753295898438, 0.00286865234375, 0.0029535293579101562, 0.0030384063720703125, 0.0031232833862304688, 0.003208160400390625]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 14.0, 17.0, 28.0, 32.0, 34.0, 54.0, 89.0, 118.0, 160.0, 265.0, 342.0, 429.0, 605.0, 900.0, 1232.0, 1807.0, 2649.0, 4121.0, 6540.0, 10740.0, 18590.0, 33307.0, 65210.0, 126984.0, 211091.0, 230390.0, 153297.0, 80485.0, 41694.0, 22050.0, 12769.0, 7662.0, 4801.0, 3057.0, 2113.0, 1393.0, 981.0, 692.0, 515.0, 349.0, 274.0, 181.0, 124.0, 91.0, 70.0, 61.0, 35.0, 28.0, 15.0, 15.0, 13.0, 6.0, 12.0, 1.0, 5.0, 3.0, 2.0], "bins": [-3.314453125, -3.211395263671875, -3.10833740234375, -3.005279541015625, -2.9022216796875, -2.799163818359375, -2.69610595703125, -2.593048095703125, -2.489990234375, -2.386932373046875, -2.28387451171875, -2.180816650390625, -2.0777587890625, -1.974700927734375, -1.87164306640625, -1.768585205078125, -1.66552734375, -1.562469482421875, -1.45941162109375, -1.356353759765625, -1.2532958984375, -1.150238037109375, -1.04718017578125, -0.944122314453125, -0.841064453125, -0.738006591796875, -0.63494873046875, -0.531890869140625, -0.4288330078125, -0.325775146484375, -0.22271728515625, -0.119659423828125, -0.0166015625, 0.086456298828125, 0.18951416015625, 0.292572021484375, 0.3956298828125, 0.498687744140625, 0.60174560546875, 0.704803466796875, 0.807861328125, 0.910919189453125, 1.01397705078125, 1.117034912109375, 1.2200927734375, 1.323150634765625, 1.42620849609375, 1.529266357421875, 1.63232421875, 1.735382080078125, 1.83843994140625, 1.941497802734375, 2.0445556640625, 2.147613525390625, 2.25067138671875, 2.353729248046875, 2.456787109375, 2.559844970703125, 2.66290283203125, 2.765960693359375, 2.8690185546875, 2.972076416015625, 3.07513427734375, 3.178192138671875, 3.28125]}, "gradients/decoder.bert.encoder.layer.21.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 5.0, 3.0, 6.0, 8.0, 4.0, 5.0, 6.0, 9.0, 19.0, 22.0, 23.0, 32.0, 43.0, 42.0, 73.0, 79.0, 91.0, 69.0, 90.0, 63.0, 53.0, 60.0, 38.0, 38.0, 28.0, 23.0, 13.0, 10.0, 8.0, 3.0, 6.0, 7.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.52734375, -1.479949951171875, -1.43255615234375, -1.385162353515625, -1.3377685546875, -1.290374755859375, -1.24298095703125, -1.195587158203125, -1.148193359375, -1.100799560546875, -1.05340576171875, -1.006011962890625, -0.9586181640625, -0.911224365234375, -0.86383056640625, -0.816436767578125, -0.76904296875, -0.721649169921875, -0.67425537109375, -0.626861572265625, -0.5794677734375, -0.532073974609375, -0.48468017578125, -0.437286376953125, -0.389892578125, -0.342498779296875, -0.29510498046875, -0.247711181640625, -0.2003173828125, -0.152923583984375, -0.10552978515625, -0.058135986328125, -0.0107421875, 0.036651611328125, 0.08404541015625, 0.131439208984375, 0.1788330078125, 0.226226806640625, 0.27362060546875, 0.321014404296875, 0.368408203125, 0.415802001953125, 0.46319580078125, 0.510589599609375, 0.5579833984375, 0.605377197265625, 0.65277099609375, 0.700164794921875, 0.74755859375, 0.794952392578125, 0.84234619140625, 0.889739990234375, 0.9371337890625, 0.984527587890625, 1.03192138671875, 1.079315185546875, 1.126708984375, 1.174102783203125, 1.22149658203125, 1.268890380859375, 1.3162841796875, 1.363677978515625, 1.41107177734375, 1.458465576171875, 1.505859375]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 7.0, 6.0, 8.0, 15.0, 17.0, 19.0, 19.0, 23.0, 27.0, 35.0, 41.0, 38.0, 42.0, 45.0, 54.0, 49.0, 50.0, 60.0, 60.0, 56.0, 42.0, 60.0, 35.0, 38.0, 31.0, 16.0, 21.0, 12.0, 11.0, 10.0, 8.0, 5.0, 14.0, 6.0, 4.0, 0.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.22270965576172, -16.706270217895508, -16.189830780029297, -15.673391342163086, -15.156951904296875, -14.640512466430664, -14.124073028564453, -13.607633590698242, -13.091194152832031, -12.57475471496582, -12.05831527709961, -11.541875839233398, -11.025436401367188, -10.508996963500977, -9.992557525634766, -9.476118087768555, -8.959678649902344, -8.443239212036133, -7.926799774169922, -7.410360336303711, -6.8939208984375, -6.377481460571289, -5.861042022705078, -5.344602584838867, -4.828163146972656, -4.311723709106445, -3.7952842712402344, -3.2788448333740234, -2.7624053955078125, -2.2459659576416016, -1.7295265197753906, -1.2130870819091797, -0.6966495513916016, -0.18021011352539062, 0.3362293243408203, 0.8526687622070312, 1.3691082000732422, 1.8855476379394531, 2.401987075805664, 2.918426513671875, 3.434865951538086, 3.951305389404297, 4.467744827270508, 4.984184265136719, 5.50062370300293, 6.017063140869141, 6.533502578735352, 7.0499420166015625, 7.566381454467773, 8.082820892333984, 8.599260330200195, 9.115699768066406, 9.632139205932617, 10.148578643798828, 10.665018081665039, 11.18145751953125, 11.697896957397461, 12.214336395263672, 12.730775833129883, 13.247215270996094, 13.763654708862305, 14.280094146728516, 14.796533584594727, 15.312973022460938, 15.829412460327148]}, "gradients/decoder.bert.encoder.layer.21.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 7.0, 10.0, 6.0, 12.0, 6.0, 8.0, 8.0, 12.0, 22.0, 29.0, 18.0, 22.0, 30.0, 30.0, 38.0, 32.0, 37.0, 43.0, 50.0, 23.0, 45.0, 40.0, 39.0, 38.0, 35.0, 35.0, 35.0, 33.0, 27.0, 23.0, 32.0, 16.0, 35.0, 23.0, 10.0, 17.0, 12.0, 9.0, 9.0, 6.0, 5.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.771490097045898, -12.355425834655762, -11.939361572265625, -11.523297309875488, -11.107233047485352, -10.691168785095215, -10.275104522705078, -9.859040260314941, -9.442975997924805, -9.026911735534668, -8.610847473144531, -8.194783210754395, -7.778718948364258, -7.362654685974121, -6.946590423583984, -6.530526161193848, -6.114461898803711, -5.698397636413574, -5.2823333740234375, -4.866269111633301, -4.450204849243164, -4.034140586853027, -3.6180763244628906, -3.202012062072754, -2.785947799682617, -2.3698835372924805, -1.9538192749023438, -1.537755012512207, -1.1216907501220703, -0.7056264877319336, -0.2895622253417969, 0.12650203704833984, 0.5425653457641602, 0.9586296081542969, 1.3746938705444336, 1.7907581329345703, 2.206822395324707, 2.6228866577148438, 3.0389509201049805, 3.455015182495117, 3.871079444885254, 4.287143707275391, 4.703207969665527, 5.119272232055664, 5.535336494445801, 5.9514007568359375, 6.367465019226074, 6.783529281616211, 7.199593544006348, 7.615657806396484, 8.031722068786621, 8.447786331176758, 8.863850593566895, 9.279914855957031, 9.695979118347168, 10.112043380737305, 10.528107643127441, 10.944171905517578, 11.360236167907715, 11.776300430297852, 12.192364692687988, 12.608428955078125, 13.024493217468262, 13.440557479858398, 13.856621742248535]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 0.0, 3.0, 8.0, 9.0, 12.0, 23.0, 38.0, 60.0, 80.0, 153.0, 228.0, 364.0, 660.0, 1044.0, 1751.0, 3089.0, 5168.0, 9233.0, 16151.0, 27865.0, 48017.0, 79250.0, 121427.0, 163342.0, 174091.0, 145343.0, 100483.0, 63089.0, 37077.0, 21446.0, 12103.0, 7078.0, 4114.0, 2308.0, 1295.0, 876.0, 472.0, 324.0, 175.0, 108.0, 72.0, 59.0, 26.0, 14.0, 17.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.484375, -12.98974609375, -12.4951171875, -12.00048828125, -11.505859375, -11.01123046875, -10.5166015625, -10.02197265625, -9.52734375, -9.03271484375, -8.5380859375, -8.04345703125, -7.548828125, -7.05419921875, -6.5595703125, -6.06494140625, -5.5703125, -5.07568359375, -4.5810546875, -4.08642578125, -3.591796875, -3.09716796875, -2.6025390625, -2.10791015625, -1.61328125, -1.11865234375, -0.6240234375, -0.12939453125, 0.365234375, 0.85986328125, 1.3544921875, 1.84912109375, 2.34375, 2.83837890625, 3.3330078125, 3.82763671875, 4.322265625, 4.81689453125, 5.3115234375, 5.80615234375, 6.30078125, 6.79541015625, 7.2900390625, 7.78466796875, 8.279296875, 8.77392578125, 9.2685546875, 9.76318359375, 10.2578125, 10.75244140625, 11.2470703125, 11.74169921875, 12.236328125, 12.73095703125, 13.2255859375, 13.72021484375, 14.21484375, 14.70947265625, 15.2041015625, 15.69873046875, 16.193359375, 16.68798828125, 17.1826171875, 17.67724609375, 18.171875]}, "gradients/decoder.bert.encoder.layer.21.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 6.0, 5.0, 5.0, 8.0, 11.0, 13.0, 4.0, 18.0, 14.0, 14.0, 19.0, 23.0, 22.0, 29.0, 25.0, 24.0, 36.0, 41.0, 28.0, 44.0, 40.0, 33.0, 43.0, 42.0, 42.0, 25.0, 33.0, 27.0, 46.0, 39.0, 28.0, 29.0, 21.0, 15.0, 22.0, 19.0, 21.0, 18.0, 18.0, 8.0, 10.0, 7.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-12.4765625, -12.1031494140625, -11.729736328125, -11.3563232421875, -10.98291015625, -10.6094970703125, -10.236083984375, -9.8626708984375, -9.4892578125, -9.1158447265625, -8.742431640625, -8.3690185546875, -7.99560546875, -7.6221923828125, -7.248779296875, -6.8753662109375, -6.501953125, -6.1285400390625, -5.755126953125, -5.3817138671875, -5.00830078125, -4.6348876953125, -4.261474609375, -3.8880615234375, -3.5146484375, -3.1412353515625, -2.767822265625, -2.3944091796875, -2.02099609375, -1.6475830078125, -1.274169921875, -0.9007568359375, -0.52734375, -0.1539306640625, 0.219482421875, 0.5928955078125, 0.96630859375, 1.3397216796875, 1.713134765625, 2.0865478515625, 2.4599609375, 2.8333740234375, 3.206787109375, 3.5802001953125, 3.95361328125, 4.3270263671875, 4.700439453125, 5.0738525390625, 5.447265625, 5.8206787109375, 6.194091796875, 6.5675048828125, 6.94091796875, 7.3143310546875, 7.687744140625, 8.0611572265625, 8.4345703125, 8.8079833984375, 9.181396484375, 9.5548095703125, 9.92822265625, 10.3016357421875, 10.675048828125, 11.0484619140625, 11.421875]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 12.0, 21.0, 24.0, 29.0, 54.0, 72.0, 146.0, 223.0, 344.0, 578.0, 942.0, 1480.0, 2492.0, 4107.0, 6770.0, 11415.0, 19324.0, 32226.0, 54068.0, 85931.0, 127850.0, 162405.0, 165220.0, 134550.0, 92333.0, 58305.0, 35281.0, 20948.0, 12530.0, 7534.0, 4431.0, 2666.0, 1584.0, 1043.0, 571.0, 341.0, 240.0, 164.0, 108.0, 57.0, 38.0, 38.0, 22.0, 14.0, 6.0, 7.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.921875, -14.4708251953125, -14.019775390625, -13.5687255859375, -13.11767578125, -12.6666259765625, -12.215576171875, -11.7645263671875, -11.3134765625, -10.8624267578125, -10.411376953125, -9.9603271484375, -9.50927734375, -9.0582275390625, -8.607177734375, -8.1561279296875, -7.705078125, -7.2540283203125, -6.802978515625, -6.3519287109375, -5.90087890625, -5.4498291015625, -4.998779296875, -4.5477294921875, -4.0966796875, -3.6456298828125, -3.194580078125, -2.7435302734375, -2.29248046875, -1.8414306640625, -1.390380859375, -0.9393310546875, -0.48828125, -0.0372314453125, 0.413818359375, 0.8648681640625, 1.31591796875, 1.7669677734375, 2.218017578125, 2.6690673828125, 3.1201171875, 3.5711669921875, 4.022216796875, 4.4732666015625, 4.92431640625, 5.3753662109375, 5.826416015625, 6.2774658203125, 6.728515625, 7.1795654296875, 7.630615234375, 8.0816650390625, 8.53271484375, 8.9837646484375, 9.434814453125, 9.8858642578125, 10.3369140625, 10.7879638671875, 11.239013671875, 11.6900634765625, 12.14111328125, 12.5921630859375, 13.043212890625, 13.4942626953125, 13.9453125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 6.0, 14.0, 8.0, 18.0, 15.0, 14.0, 13.0, 20.0, 25.0, 29.0, 32.0, 33.0, 37.0, 52.0, 48.0, 38.0, 37.0, 56.0, 54.0, 50.0, 58.0, 37.0, 33.0, 42.0, 28.0, 43.0, 24.0, 20.0, 25.0, 14.0, 11.0, 18.0, 6.0, 11.0, 6.0, 4.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9921875, -7.6903076171875, -7.388427734375, -7.0865478515625, -6.78466796875, -6.4827880859375, -6.180908203125, -5.8790283203125, -5.5771484375, -5.2752685546875, -4.973388671875, -4.6715087890625, -4.36962890625, -4.0677490234375, -3.765869140625, -3.4639892578125, -3.162109375, -2.8602294921875, -2.558349609375, -2.2564697265625, -1.95458984375, -1.6527099609375, -1.350830078125, -1.0489501953125, -0.7470703125, -0.4451904296875, -0.143310546875, 0.1585693359375, 0.46044921875, 0.7623291015625, 1.064208984375, 1.3660888671875, 1.66796875, 1.9698486328125, 2.271728515625, 2.5736083984375, 2.87548828125, 3.1773681640625, 3.479248046875, 3.7811279296875, 4.0830078125, 4.3848876953125, 4.686767578125, 4.9886474609375, 5.29052734375, 5.5924072265625, 5.894287109375, 6.1961669921875, 6.498046875, 6.7999267578125, 7.101806640625, 7.4036865234375, 7.70556640625, 8.0074462890625, 8.309326171875, 8.6112060546875, 8.9130859375, 9.2149658203125, 9.516845703125, 9.8187255859375, 10.12060546875, 10.4224853515625, 10.724365234375, 11.0262451171875, 11.328125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.weight": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 8.0, 12.0, 15.0, 17.0, 21.0, 31.0, 48.0, 60.0, 74.0, 103.0, 179.0, 269.0, 335.0, 479.0, 690.0, 1107.0, 1812.0, 2843.0, 4511.0, 7439.0, 12676.0, 21903.0, 37863.0, 67909.0, 117003.0, 178375.0, 202819.0, 158671.0, 97953.0, 55968.0, 31479.0, 18152.0, 10554.0, 6411.0, 3826.0, 2406.0, 1538.0, 967.0, 615.0, 440.0, 289.0, 201.0, 140.0, 104.0, 57.0, 55.0, 41.0, 26.0, 13.0, 16.0, 7.0, 6.0, 7.0, 4.0, 3.0, 3.0, 2.0], "bins": [-10.6640625, -10.3441162109375, -10.024169921875, -9.7042236328125, -9.38427734375, -9.0643310546875, -8.744384765625, -8.4244384765625, -8.1044921875, -7.7845458984375, -7.464599609375, -7.1446533203125, -6.82470703125, -6.5047607421875, -6.184814453125, -5.8648681640625, -5.544921875, -5.2249755859375, -4.905029296875, -4.5850830078125, -4.26513671875, -3.9451904296875, -3.625244140625, -3.3052978515625, -2.9853515625, -2.6654052734375, -2.345458984375, -2.0255126953125, -1.70556640625, -1.3856201171875, -1.065673828125, -0.7457275390625, -0.42578125, -0.1058349609375, 0.214111328125, 0.5340576171875, 0.85400390625, 1.1739501953125, 1.493896484375, 1.8138427734375, 2.1337890625, 2.4537353515625, 2.773681640625, 3.0936279296875, 3.41357421875, 3.7335205078125, 4.053466796875, 4.3734130859375, 4.693359375, 5.0133056640625, 5.333251953125, 5.6531982421875, 5.97314453125, 6.2930908203125, 6.613037109375, 6.9329833984375, 7.2529296875, 7.5728759765625, 7.892822265625, 8.2127685546875, 8.53271484375, 8.8526611328125, 9.172607421875, 9.4925537109375, 9.8125]}, "gradients/decoder.bert.encoder.layer.21.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 15.0, 15.0, 21.0, 23.0, 30.0, 41.0, 51.0, 62.0, 66.0, 62.0, 83.0, 76.0, 74.0, 62.0, 57.0, 53.0, 48.0, 38.0, 28.0, 22.0, 10.0, 11.0, 16.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00102996826171875, -0.000993490219116211, -0.0009570121765136719, -0.0009205341339111328, -0.0008840560913085938, -0.0008475780487060547, -0.0008111000061035156, -0.0007746219635009766, -0.0007381439208984375, -0.0007016658782958984, -0.0006651878356933594, -0.0006287097930908203, -0.0005922317504882812, -0.0005557537078857422, -0.0005192756652832031, -0.00048279762268066406, -0.000446319580078125, -0.00040984153747558594, -0.0003733634948730469, -0.0003368854522705078, -0.00030040740966796875, -0.0002639293670654297, -0.00022745132446289062, -0.00019097328186035156, -0.0001544952392578125, -0.00011801719665527344, -8.153915405273438e-05, -4.506111145019531e-05, -8.58306884765625e-06, 2.7894973754882812e-05, 6.437301635742188e-05, 0.00010085105895996094, 0.0001373291015625, 0.00017380714416503906, 0.00021028518676757812, 0.0002467632293701172, 0.00028324127197265625, 0.0003197193145751953, 0.0003561973571777344, 0.00039267539978027344, 0.0004291534423828125, 0.00046563148498535156, 0.0005021095275878906, 0.0005385875701904297, 0.0005750656127929688, 0.0006115436553955078, 0.0006480216979980469, 0.0006844997406005859, 0.000720977783203125, 0.0007574558258056641, 0.0007939338684082031, 0.0008304119110107422, 0.0008668899536132812, 0.0009033679962158203, 0.0009398460388183594, 0.0009763240814208984, 0.0010128021240234375, 0.0010492801666259766, 0.0010857582092285156, 0.0011222362518310547, 0.0011587142944335938, 0.0011951923370361328, 0.0012316703796386719, 0.001268148422241211, 0.00130462646484375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 12.0, 6.0, 16.0, 29.0, 32.0, 37.0, 64.0, 108.0, 153.0, 295.0, 520.0, 959.0, 1827.0, 3489.0, 7040.0, 14998.0, 33857.0, 79939.0, 183261.0, 296859.0, 231942.0, 108662.0, 45586.0, 20135.0, 9153.0, 4576.0, 2259.0, 1265.0, 618.0, 343.0, 172.0, 101.0, 78.0, 46.0, 25.0, 25.0, 18.0, 18.0, 5.0, 7.0, 10.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.96875, -14.4962158203125, -14.023681640625, -13.5511474609375, -13.07861328125, -12.6060791015625, -12.133544921875, -11.6610107421875, -11.1884765625, -10.7159423828125, -10.243408203125, -9.7708740234375, -9.29833984375, -8.8258056640625, -8.353271484375, -7.8807373046875, -7.408203125, -6.9356689453125, -6.463134765625, -5.9906005859375, -5.51806640625, -5.0455322265625, -4.572998046875, -4.1004638671875, -3.6279296875, -3.1553955078125, -2.682861328125, -2.2103271484375, -1.73779296875, -1.2652587890625, -0.792724609375, -0.3201904296875, 0.15234375, 0.6248779296875, 1.097412109375, 1.5699462890625, 2.04248046875, 2.5150146484375, 2.987548828125, 3.4600830078125, 3.9326171875, 4.4051513671875, 4.877685546875, 5.3502197265625, 5.82275390625, 6.2952880859375, 6.767822265625, 7.2403564453125, 7.712890625, 8.1854248046875, 8.657958984375, 9.1304931640625, 9.60302734375, 10.0755615234375, 10.548095703125, 11.0206298828125, 11.4931640625, 11.9656982421875, 12.438232421875, 12.9107666015625, 13.38330078125, 13.8558349609375, 14.328369140625, 14.8009033203125, 15.2734375]}, "gradients/decoder.bert.encoder.layer.21.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 11.0, 15.0, 14.0, 19.0, 23.0, 28.0, 41.0, 54.0, 41.0, 66.0, 73.0, 62.0, 64.0, 66.0, 64.0, 53.0, 53.0, 43.0, 47.0, 26.0, 21.0, 25.0, 13.0, 20.0, 13.0, 3.0, 7.0, 6.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.203125, -3.07818603515625, -2.9532470703125, -2.82830810546875, -2.703369140625, -2.57843017578125, -2.4534912109375, -2.32855224609375, -2.20361328125, -2.07867431640625, -1.9537353515625, -1.82879638671875, -1.703857421875, -1.57891845703125, -1.4539794921875, -1.32904052734375, -1.2041015625, -1.07916259765625, -0.9542236328125, -0.82928466796875, -0.704345703125, -0.57940673828125, -0.4544677734375, -0.32952880859375, -0.20458984375, -0.07965087890625, 0.0452880859375, 0.17022705078125, 0.295166015625, 0.42010498046875, 0.5450439453125, 0.66998291015625, 0.794921875, 0.91986083984375, 1.0447998046875, 1.16973876953125, 1.294677734375, 1.41961669921875, 1.5445556640625, 1.66949462890625, 1.79443359375, 1.91937255859375, 2.0443115234375, 2.16925048828125, 2.294189453125, 2.41912841796875, 2.5440673828125, 2.66900634765625, 2.7939453125, 2.91888427734375, 3.0438232421875, 3.16876220703125, 3.293701171875, 3.41864013671875, 3.5435791015625, 3.66851806640625, 3.79345703125, 3.91839599609375, 4.0433349609375, 4.16827392578125, 4.293212890625, 4.41815185546875, 4.5430908203125, 4.66802978515625, 4.79296875]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 9.0, 13.0, 12.0, 9.0, 24.0, 22.0, 17.0, 33.0, 20.0, 40.0, 37.0, 45.0, 50.0, 53.0, 71.0, 40.0, 60.0, 54.0, 55.0, 41.0, 48.0, 52.0, 39.0, 37.0, 28.0, 9.0, 15.0, 19.0, 9.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.446269035339355, -14.960251808166504, -14.474233627319336, -13.988216400146484, -13.502198219299316, -13.016180992126465, -12.530162811279297, -12.044145584106445, -11.558127403259277, -11.072110176086426, -10.586091995239258, -10.100074768066406, -9.614056587219238, -9.128039360046387, -8.642021179199219, -8.156003952026367, -7.669986248016357, -7.183968544006348, -6.697950839996338, -6.211933135986328, -5.725915431976318, -5.239897727966309, -4.753880500793457, -4.267862319946289, -3.7818448543548584, -3.2958271503448486, -2.809809446334839, -2.323791980743408, -1.8377741575241089, -1.3517565727233887, -0.8657388687133789, -0.37972116470336914, 0.10629653930664062, 0.5923142433166504, 1.0783319473266602, 1.5643495321273804, 2.0503673553466797, 2.5363848209381104, 3.02240252494812, 3.50842022895813, 3.9944379329681396, 4.48045539855957, 4.96647310256958, 5.45249080657959, 5.9385085105896, 6.424526214599609, 6.910543918609619, 7.396561622619629, 7.882579326629639, 8.368597030639648, 8.8546142578125, 9.340632438659668, 9.82664966583252, 10.312667846679688, 10.798685073852539, 11.284703254699707, 11.770720481872559, 12.25673770904541, 12.742755889892578, 13.22877311706543, 13.714791297912598, 14.20080852508545, 14.686826705932617, 15.172843933105469, 15.658862113952637]}, "gradients/decoder.bert.encoder.layer.20.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 7.0, 6.0, 7.0, 7.0, 11.0, 5.0, 6.0, 18.0, 15.0, 17.0, 20.0, 18.0, 19.0, 17.0, 28.0, 32.0, 31.0, 42.0, 39.0, 33.0, 48.0, 34.0, 43.0, 44.0, 32.0, 33.0, 38.0, 30.0, 38.0, 27.0, 24.0, 26.0, 23.0, 33.0, 20.0, 14.0, 17.0, 15.0, 14.0, 6.0, 11.0, 11.0, 7.0, 2.0, 7.0, 5.0, 6.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-11.707863807678223, -11.32986831665039, -10.951872825622559, -10.57387638092041, -10.195880889892578, -9.817885398864746, -9.439889907836914, -9.061893463134766, -8.683897972106934, -8.305902481079102, -7.927906513214111, -7.549911022186279, -7.171915054321289, -6.793919563293457, -6.415924072265625, -6.037928104400635, -5.659932613372803, -5.281937122344971, -4.9039411544799805, -4.525945663452148, -4.147949695587158, -3.769954204559326, -3.391958475112915, -3.013962745666504, -2.6359670162200928, -2.2579712867736816, -1.8799755573272705, -1.501979947090149, -1.1239842176437378, -0.7459884881973267, -0.3679928779602051, 0.010002851486206055, 0.3879985809326172, 0.7659943103790283, 1.1439900398254395, 1.521985650062561, 1.8999813795089722, 2.2779769897460938, 2.655972719192505, 3.033968448638916, 3.411964178085327, 3.7899599075317383, 4.16795539855957, 4.5459513664245605, 4.923946857452393, 5.301942825317383, 5.679938316345215, 6.057933807373047, 6.435929775238037, 6.813925266265869, 7.191921234130859, 7.569916725158691, 7.947912693023682, 8.325908660888672, 8.703904151916504, 9.081899642944336, 9.459895133972168, 9.837890625, 10.215886116027832, 10.59388256072998, 10.971878051757812, 11.349873542785645, 11.727869033813477, 12.105865478515625, 12.483860969543457]}, "gradients/decoder.bert.encoder.layer.20.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 10.0, 17.0, 23.0, 22.0, 50.0, 89.0, 144.0, 227.0, 328.0, 477.0, 816.0, 1322.0, 2095.0, 3406.0, 5900.0, 10225.0, 18393.0, 33999.0, 65996.0, 135980.0, 309491.0, 673099.0, 1046046.0, 931256.0, 508270.0, 225269.0, 104213.0, 51843.0, 27700.0, 15504.0, 8667.0, 4978.0, 3110.0, 1967.0, 1190.0, 782.0, 458.0, 299.0, 219.0, 141.0, 105.0, 47.0, 43.0, 25.0, 17.0, 9.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-12.5703125, -12.162353515625, -11.75439453125, -11.346435546875, -10.9384765625, -10.530517578125, -10.12255859375, -9.714599609375, -9.306640625, -8.898681640625, -8.49072265625, -8.082763671875, -7.6748046875, -7.266845703125, -6.85888671875, -6.450927734375, -6.04296875, -5.635009765625, -5.22705078125, -4.819091796875, -4.4111328125, -4.003173828125, -3.59521484375, -3.187255859375, -2.779296875, -2.371337890625, -1.96337890625, -1.555419921875, -1.1474609375, -0.739501953125, -0.33154296875, 0.076416015625, 0.484375, 0.892333984375, 1.30029296875, 1.708251953125, 2.1162109375, 2.524169921875, 2.93212890625, 3.340087890625, 3.748046875, 4.156005859375, 4.56396484375, 4.971923828125, 5.3798828125, 5.787841796875, 6.19580078125, 6.603759765625, 7.01171875, 7.419677734375, 7.82763671875, 8.235595703125, 8.6435546875, 9.051513671875, 9.45947265625, 9.867431640625, 10.275390625, 10.683349609375, 11.09130859375, 11.499267578125, 11.9072265625, 12.315185546875, 12.72314453125, 13.131103515625, 13.5390625]}, "gradients/decoder.bert.encoder.layer.20.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 5.0, 5.0, 9.0, 8.0, 10.0, 12.0, 10.0, 16.0, 18.0, 19.0, 21.0, 21.0, 32.0, 29.0, 31.0, 37.0, 39.0, 42.0, 42.0, 39.0, 44.0, 30.0, 28.0, 41.0, 30.0, 23.0, 37.0, 40.0, 26.0, 24.0, 30.0, 23.0, 17.0, 27.0, 16.0, 22.0, 16.0, 15.0, 10.0, 10.0, 3.0, 7.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0], "bins": [-8.4921875, -8.21337890625, -7.9345703125, -7.65576171875, -7.376953125, -7.09814453125, -6.8193359375, -6.54052734375, -6.26171875, -5.98291015625, -5.7041015625, -5.42529296875, -5.146484375, -4.86767578125, -4.5888671875, -4.31005859375, -4.03125, -3.75244140625, -3.4736328125, -3.19482421875, -2.916015625, -2.63720703125, -2.3583984375, -2.07958984375, -1.80078125, -1.52197265625, -1.2431640625, -0.96435546875, -0.685546875, -0.40673828125, -0.1279296875, 0.15087890625, 0.4296875, 0.70849609375, 0.9873046875, 1.26611328125, 1.544921875, 1.82373046875, 2.1025390625, 2.38134765625, 2.66015625, 2.93896484375, 3.2177734375, 3.49658203125, 3.775390625, 4.05419921875, 4.3330078125, 4.61181640625, 4.890625, 5.16943359375, 5.4482421875, 5.72705078125, 6.005859375, 6.28466796875, 6.5634765625, 6.84228515625, 7.12109375, 7.39990234375, 7.6787109375, 7.95751953125, 8.236328125, 8.51513671875, 8.7939453125, 9.07275390625, 9.3515625]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 8.0, 16.0, 25.0, 35.0, 46.0, 60.0, 112.0, 195.0, 279.0, 425.0, 677.0, 1001.0, 1456.0, 2389.0, 3671.0, 5933.0, 9570.0, 15485.0, 26075.0, 44021.0, 76330.0, 133245.0, 237138.0, 417676.0, 690572.0, 866063.0, 687391.0, 418587.0, 236072.0, 132386.0, 76249.0, 43835.0, 26125.0, 15401.0, 9476.0, 5875.0, 3709.0, 2330.0, 1562.0, 912.0, 694.0, 364.0, 282.0, 196.0, 116.0, 80.0, 52.0, 31.0, 14.0, 18.0, 10.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.984375, -10.6463623046875, -10.308349609375, -9.9703369140625, -9.63232421875, -9.2943115234375, -8.956298828125, -8.6182861328125, -8.2802734375, -7.9422607421875, -7.604248046875, -7.2662353515625, -6.92822265625, -6.5902099609375, -6.252197265625, -5.9141845703125, -5.576171875, -5.2381591796875, -4.900146484375, -4.5621337890625, -4.22412109375, -3.8861083984375, -3.548095703125, -3.2100830078125, -2.8720703125, -2.5340576171875, -2.196044921875, -1.8580322265625, -1.52001953125, -1.1820068359375, -0.843994140625, -0.5059814453125, -0.16796875, 0.1700439453125, 0.508056640625, 0.8460693359375, 1.18408203125, 1.5220947265625, 1.860107421875, 2.1981201171875, 2.5361328125, 2.8741455078125, 3.212158203125, 3.5501708984375, 3.88818359375, 4.2261962890625, 4.564208984375, 4.9022216796875, 5.240234375, 5.5782470703125, 5.916259765625, 6.2542724609375, 6.59228515625, 6.9302978515625, 7.268310546875, 7.6063232421875, 7.9443359375, 8.2823486328125, 8.620361328125, 8.9583740234375, 9.29638671875, 9.6343994140625, 9.972412109375, 10.3104248046875, 10.6484375]}, "gradients/decoder.bert.encoder.layer.20.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 7.0, 11.0, 15.0, 18.0, 24.0, 24.0, 41.0, 42.0, 48.0, 59.0, 72.0, 89.0, 110.0, 147.0, 174.0, 233.0, 222.0, 253.0, 293.0, 284.0, 283.0, 258.0, 258.0, 210.0, 173.0, 133.0, 110.0, 93.0, 77.0, 69.0, 46.0, 47.0, 26.0, 29.0, 23.0, 14.0, 13.0, 9.0, 10.0, 6.0, 2.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.171875, -4.0390625, -3.90625, -3.7734375, -3.640625, -3.5078125, -3.375, -3.2421875, -3.109375, -2.9765625, -2.84375, -2.7109375, -2.578125, -2.4453125, -2.3125, -2.1796875, -2.046875, -1.9140625, -1.78125, -1.6484375, -1.515625, -1.3828125, -1.25, -1.1171875, -0.984375, -0.8515625, -0.71875, -0.5859375, -0.453125, -0.3203125, -0.1875, -0.0546875, 0.078125, 0.2109375, 0.34375, 0.4765625, 0.609375, 0.7421875, 0.875, 1.0078125, 1.140625, 1.2734375, 1.40625, 1.5390625, 1.671875, 1.8046875, 1.9375, 2.0703125, 2.203125, 2.3359375, 2.46875, 2.6015625, 2.734375, 2.8671875, 3.0, 3.1328125, 3.265625, 3.3984375, 3.53125, 3.6640625, 3.796875, 3.9296875, 4.0625, 4.1953125]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 3.0, 6.0, 9.0, 2.0, 13.0, 16.0, 17.0, 19.0, 26.0, 31.0, 40.0, 49.0, 47.0, 50.0, 51.0, 54.0, 48.0, 53.0, 65.0, 54.0, 61.0, 44.0, 48.0, 39.0, 28.0, 20.0, 17.0, 17.0, 15.0, 16.0, 7.0, 2.0, 7.0, 4.0, 3.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.015341758728027, -11.61558723449707, -11.21583366394043, -10.816080093383789, -10.416325569152832, -10.016571044921875, -9.616817474365234, -9.217063903808594, -8.817309379577637, -8.41755485534668, -8.017801284790039, -7.61804723739624, -7.218293190002441, -6.818539142608643, -6.418785095214844, -6.019031047821045, -5.619277000427246, -5.219522953033447, -4.819768905639648, -4.42001485824585, -4.020260810852051, -3.620506763458252, -3.220752716064453, -2.8209986686706543, -2.4212446212768555, -2.0214905738830566, -1.6217365264892578, -1.221982479095459, -0.8222284317016602, -0.42247438430786133, -0.0227203369140625, 0.37703371047973633, 0.7767887115478516, 1.1765427589416504, 1.5762968063354492, 1.976050853729248, 2.375804901123047, 2.7755589485168457, 3.1753129959106445, 3.5750670433044434, 3.974821090698242, 4.374575138092041, 4.77432918548584, 5.174083232879639, 5.5738372802734375, 5.973591327667236, 6.373345375061035, 6.773099422454834, 7.172853469848633, 7.572607517242432, 7.9723615646362305, 8.372116088867188, 8.771869659423828, 9.171623229980469, 9.571377754211426, 9.971132278442383, 10.370885848999023, 10.770639419555664, 11.170393943786621, 11.570148468017578, 11.969902038574219, 12.36965560913086, 12.769410133361816, 13.169164657592773, 13.568918228149414]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 9.0, 8.0, 10.0, 12.0, 9.0, 13.0, 16.0, 16.0, 17.0, 30.0, 32.0, 24.0, 23.0, 29.0, 33.0, 31.0, 34.0, 36.0, 45.0, 48.0, 42.0, 37.0, 50.0, 38.0, 34.0, 38.0, 28.0, 40.0, 27.0, 27.0, 20.0, 17.0, 11.0, 22.0, 18.0, 10.0, 8.0, 12.0, 9.0, 4.0, 6.0, 5.0, 7.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.879922866821289, -9.566076278686523, -9.252229690551758, -8.938384056091309, -8.624537467956543, -8.310690879821777, -7.996844291687012, -7.682998180389404, -7.369152069091797, -7.055305480957031, -6.741459369659424, -6.427612781524658, -6.113766670227051, -5.799920082092285, -5.4860734939575195, -5.172227382659912, -4.8583807945251465, -4.544534206390381, -4.230688095092773, -3.916841506958008, -3.6029953956604004, -3.2891488075256348, -2.9753024578094482, -2.6614561080932617, -2.347609758377075, -2.0337634086608887, -1.7199170589447021, -1.406070590019226, -1.0922242403030396, -0.778377890586853, -0.46453142166137695, -0.15068507194519043, 0.1631612777709961, 0.477007657289505, 0.7908540368080139, 1.1047004461288452, 1.4185467958450317, 1.7323931455612183, 2.0462396144866943, 2.360085964202881, 2.6739323139190674, 2.987778663635254, 3.3016250133514404, 3.615471363067627, 3.9293179512023926, 4.2431640625, 4.557010650634766, 4.870857238769531, 5.184703350067139, 5.498549938201904, 5.812396049499512, 6.126242637634277, 6.440088748931885, 6.75393533706665, 7.067781448364258, 7.381628036499023, 7.695474624633789, 8.009321212768555, 8.32316780090332, 8.63701343536377, 8.950860023498535, 9.2647066116333, 9.578553199768066, 9.892398834228516, 10.206245422363281]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 8.0, 4.0, 11.0, 9.0, 17.0, 24.0, 31.0, 46.0, 81.0, 78.0, 128.0, 190.0, 265.0, 388.0, 600.0, 838.0, 1206.0, 1911.0, 2842.0, 4517.0, 7360.0, 12484.0, 22139.0, 40503.0, 75503.0, 140225.0, 216981.0, 214668.0, 137527.0, 74263.0, 39523.0, 21554.0, 12415.0, 7274.0, 4400.0, 2854.0, 1793.0, 1197.0, 843.0, 596.0, 375.0, 269.0, 185.0, 150.0, 96.0, 60.0, 45.0, 27.0, 16.0, 9.0, 14.0, 8.0, 3.0, 3.0, 5.0, 0.0, 3.0], "bins": [-8.9453125, -8.68206787109375, -8.4188232421875, -8.15557861328125, -7.892333984375, -7.62908935546875, -7.3658447265625, -7.10260009765625, -6.83935546875, -6.57611083984375, -6.3128662109375, -6.04962158203125, -5.786376953125, -5.52313232421875, -5.2598876953125, -4.99664306640625, -4.7333984375, -4.47015380859375, -4.2069091796875, -3.94366455078125, -3.680419921875, -3.41717529296875, -3.1539306640625, -2.89068603515625, -2.62744140625, -2.36419677734375, -2.1009521484375, -1.83770751953125, -1.574462890625, -1.31121826171875, -1.0479736328125, -0.78472900390625, -0.521484375, -0.25823974609375, 0.0050048828125, 0.26824951171875, 0.531494140625, 0.79473876953125, 1.0579833984375, 1.32122802734375, 1.58447265625, 1.84771728515625, 2.1109619140625, 2.37420654296875, 2.637451171875, 2.90069580078125, 3.1639404296875, 3.42718505859375, 3.6904296875, 3.95367431640625, 4.2169189453125, 4.48016357421875, 4.743408203125, 5.00665283203125, 5.2698974609375, 5.53314208984375, 5.79638671875, 6.05963134765625, 6.3228759765625, 6.58612060546875, 6.849365234375, 7.11260986328125, 7.3758544921875, 7.63909912109375, 7.90234375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 6.0, 12.0, 14.0, 9.0, 20.0, 25.0, 23.0, 22.0, 38.0, 28.0, 27.0, 33.0, 34.0, 24.0, 31.0, 40.0, 47.0, 45.0, 42.0, 39.0, 38.0, 40.0, 33.0, 30.0, 30.0, 41.0, 24.0, 22.0, 20.0, 20.0, 15.0, 11.0, 15.0, 9.0, 18.0, 5.0, 12.0, 4.0, 4.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.15625, -8.84033203125, -8.5244140625, -8.20849609375, -7.892578125, -7.57666015625, -7.2607421875, -6.94482421875, -6.62890625, -6.31298828125, -5.9970703125, -5.68115234375, -5.365234375, -5.04931640625, -4.7333984375, -4.41748046875, -4.1015625, -3.78564453125, -3.4697265625, -3.15380859375, -2.837890625, -2.52197265625, -2.2060546875, -1.89013671875, -1.57421875, -1.25830078125, -0.9423828125, -0.62646484375, -0.310546875, 0.00537109375, 0.3212890625, 0.63720703125, 0.953125, 1.26904296875, 1.5849609375, 1.90087890625, 2.216796875, 2.53271484375, 2.8486328125, 3.16455078125, 3.48046875, 3.79638671875, 4.1123046875, 4.42822265625, 4.744140625, 5.06005859375, 5.3759765625, 5.69189453125, 6.0078125, 6.32373046875, 6.6396484375, 6.95556640625, 7.271484375, 7.58740234375, 7.9033203125, 8.21923828125, 8.53515625, 8.85107421875, 9.1669921875, 9.48291015625, 9.798828125, 10.11474609375, 10.4306640625, 10.74658203125, 11.0625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 7.0, 6.0, 9.0, 22.0, 10.0, 21.0, 25.0, 31.0, 41.0, 60.0, 73.0, 103.0, 162.0, 175.0, 284.0, 431.0, 548.0, 793.0, 1197.0, 2018.0, 3035.0, 4972.0, 8559.0, 15898.0, 35763.0, 789560.0, 130880.0, 23698.0, 11969.0, 6812.0, 3943.0, 2543.0, 1575.0, 992.0, 727.0, 458.0, 293.0, 221.0, 165.0, 113.0, 100.0, 69.0, 44.0, 33.0, 29.0, 21.0, 28.0, 14.0, 8.0, 6.0, 8.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.3359375, -11.9478759765625, -11.559814453125, -11.1717529296875, -10.78369140625, -10.3956298828125, -10.007568359375, -9.6195068359375, -9.2314453125, -8.8433837890625, -8.455322265625, -8.0672607421875, -7.67919921875, -7.2911376953125, -6.903076171875, -6.5150146484375, -6.126953125, -5.7388916015625, -5.350830078125, -4.9627685546875, -4.57470703125, -4.1866455078125, -3.798583984375, -3.4105224609375, -3.0224609375, -2.6343994140625, -2.246337890625, -1.8582763671875, -1.47021484375, -1.0821533203125, -0.694091796875, -0.3060302734375, 0.08203125, 0.4700927734375, 0.858154296875, 1.2462158203125, 1.63427734375, 2.0223388671875, 2.410400390625, 2.7984619140625, 3.1865234375, 3.5745849609375, 3.962646484375, 4.3507080078125, 4.73876953125, 5.1268310546875, 5.514892578125, 5.9029541015625, 6.291015625, 6.6790771484375, 7.067138671875, 7.4552001953125, 7.84326171875, 8.2313232421875, 8.619384765625, 9.0074462890625, 9.3955078125, 9.7835693359375, 10.171630859375, 10.5596923828125, 10.94775390625, 11.3358154296875, 11.723876953125, 12.1119384765625, 12.5]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 6.0, 10.0, 4.0, 11.0, 13.0, 14.0, 31.0, 21.0, 30.0, 35.0, 40.0, 34.0, 31.0, 49.0, 41.0, 42.0, 63.0, 48.0, 61.0, 44.0, 38.0, 59.0, 49.0, 31.0, 28.0, 26.0, 23.0, 21.0, 16.0, 15.0, 20.0, 8.0, 4.0, 9.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.784912109375, -8.46826171875, -8.151611328125, -7.8349609375, -7.518310546875, -7.20166015625, -6.885009765625, -6.568359375, -6.251708984375, -5.93505859375, -5.618408203125, -5.3017578125, -4.985107421875, -4.66845703125, -4.351806640625, -4.03515625, -3.718505859375, -3.40185546875, -3.085205078125, -2.7685546875, -2.451904296875, -2.13525390625, -1.818603515625, -1.501953125, -1.185302734375, -0.86865234375, -0.552001953125, -0.2353515625, 0.081298828125, 0.39794921875, 0.714599609375, 1.03125, 1.347900390625, 1.66455078125, 1.981201171875, 2.2978515625, 2.614501953125, 2.93115234375, 3.247802734375, 3.564453125, 3.881103515625, 4.19775390625, 4.514404296875, 4.8310546875, 5.147705078125, 5.46435546875, 5.781005859375, 6.09765625, 6.414306640625, 6.73095703125, 7.047607421875, 7.3642578125, 7.680908203125, 7.99755859375, 8.314208984375, 8.630859375, 8.947509765625, 9.26416015625, 9.580810546875, 9.8974609375, 10.214111328125, 10.53076171875, 10.847412109375, 11.1640625]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 5.0, 5.0, 11.0, 12.0, 14.0, 18.0, 28.0, 28.0, 38.0, 49.0, 90.0, 138.0, 174.0, 269.0, 403.0, 668.0, 1136.0, 1858.0, 3451.0, 7436.0, 19755.0, 379287.0, 596737.0, 20604.0, 7639.0, 3704.0, 1950.0, 1083.0, 695.0, 432.0, 261.0, 165.0, 122.0, 79.0, 65.0, 36.0, 27.0, 22.0, 14.0, 11.0, 8.0, 11.0, 7.0, 5.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.109375, -12.699951171875, -12.29052734375, -11.881103515625, -11.4716796875, -11.062255859375, -10.65283203125, -10.243408203125, -9.833984375, -9.424560546875, -9.01513671875, -8.605712890625, -8.1962890625, -7.786865234375, -7.37744140625, -6.968017578125, -6.55859375, -6.149169921875, -5.73974609375, -5.330322265625, -4.9208984375, -4.511474609375, -4.10205078125, -3.692626953125, -3.283203125, -2.873779296875, -2.46435546875, -2.054931640625, -1.6455078125, -1.236083984375, -0.82666015625, -0.417236328125, -0.0078125, 0.401611328125, 0.81103515625, 1.220458984375, 1.6298828125, 2.039306640625, 2.44873046875, 2.858154296875, 3.267578125, 3.677001953125, 4.08642578125, 4.495849609375, 4.9052734375, 5.314697265625, 5.72412109375, 6.133544921875, 6.54296875, 6.952392578125, 7.36181640625, 7.771240234375, 8.1806640625, 8.590087890625, 8.99951171875, 9.408935546875, 9.818359375, 10.227783203125, 10.63720703125, 11.046630859375, 11.4560546875, 11.865478515625, 12.27490234375, 12.684326171875, 13.09375]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 8.0, 8.0, 14.0, 11.0, 13.0, 16.0, 23.0, 47.0, 70.0, 114.0, 193.0, 159.0, 105.0, 78.0, 40.0, 35.0, 15.0, 18.0, 6.0, 3.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012226104736328125, -0.0011842697858810425, -0.0011459290981292725, -0.0011075884103775024, -0.0010692477226257324, -0.0010309070348739624, -0.0009925663471221924, -0.0009542256593704224, -0.0009158849716186523, -0.0008775442838668823, -0.0008392035961151123, -0.0008008629083633423, -0.0007625222206115723, -0.0007241815328598022, -0.0006858408451080322, -0.0006475001573562622, -0.0006091594696044922, -0.0005708187818527222, -0.0005324780941009521, -0.0004941374063491821, -0.0004557967185974121, -0.0004174560308456421, -0.00037911534309387207, -0.00034077465534210205, -0.00030243396759033203, -0.000264093279838562, -0.000225752592086792, -0.00018741190433502197, -0.00014907121658325195, -0.00011073052883148193, -7.238984107971191e-05, -3.4049153327941895e-05, 4.291534423828125e-06, 4.2632222175598145e-05, 8.097290992736816e-05, 0.00011931359767913818, 0.0001576542854309082, 0.00019599497318267822, 0.00023433566093444824, 0.00027267634868621826, 0.0003110170364379883, 0.0003493577241897583, 0.0003876984119415283, 0.00042603909969329834, 0.00046437978744506836, 0.0005027204751968384, 0.0005410611629486084, 0.0005794018507003784, 0.0006177425384521484, 0.0006560832262039185, 0.0006944239139556885, 0.0007327646017074585, 0.0007711052894592285, 0.0008094459772109985, 0.0008477866649627686, 0.0008861273527145386, 0.0009244680404663086, 0.0009628087282180786, 0.0010011494159698486, 0.0010394901037216187, 0.0010778307914733887, 0.0011161714792251587, 0.0011545121669769287, 0.0011928528547286987, 0.0012311935424804688]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 9.0, 7.0, 8.0, 20.0, 28.0, 36.0, 55.0, 80.0, 102.0, 153.0, 218.0, 298.0, 399.0, 555.0, 821.0, 1256.0, 1787.0, 2864.0, 4583.0, 7712.0, 13492.0, 24640.0, 48511.0, 106067.0, 233196.0, 293465.0, 159003.0, 70422.0, 34087.0, 18011.0, 10142.0, 5943.0, 3566.0, 2230.0, 1440.0, 1025.0, 675.0, 482.0, 343.0, 236.0, 170.0, 130.0, 97.0, 64.0, 40.0, 36.0, 21.0, 11.0, 10.0, 5.0, 6.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.699737548828125, -2.60064697265625, -2.501556396484375, -2.4024658203125, -2.303375244140625, -2.20428466796875, -2.105194091796875, -2.006103515625, -1.907012939453125, -1.80792236328125, -1.708831787109375, -1.6097412109375, -1.510650634765625, -1.41156005859375, -1.312469482421875, -1.21337890625, -1.114288330078125, -1.01519775390625, -0.916107177734375, -0.8170166015625, -0.717926025390625, -0.61883544921875, -0.519744873046875, -0.420654296875, -0.321563720703125, -0.22247314453125, -0.123382568359375, -0.0242919921875, 0.074798583984375, 0.17388916015625, 0.272979736328125, 0.3720703125, 0.471160888671875, 0.57025146484375, 0.669342041015625, 0.7684326171875, 0.867523193359375, 0.96661376953125, 1.065704345703125, 1.164794921875, 1.263885498046875, 1.36297607421875, 1.462066650390625, 1.5611572265625, 1.660247802734375, 1.75933837890625, 1.858428955078125, 1.95751953125, 2.056610107421875, 2.15570068359375, 2.254791259765625, 2.3538818359375, 2.452972412109375, 2.55206298828125, 2.651153564453125, 2.750244140625, 2.849334716796875, 2.94842529296875, 3.047515869140625, 3.1466064453125, 3.245697021484375, 3.34478759765625, 3.443878173828125, 3.54296875]}, "gradients/decoder.bert.encoder.layer.20.crossattention.self.query.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 4.0, 4.0, 12.0, 9.0, 19.0, 13.0, 10.0, 15.0, 30.0, 38.0, 33.0, 49.0, 58.0, 63.0, 62.0, 68.0, 75.0, 82.0, 53.0, 57.0, 39.0, 29.0, 28.0, 20.0, 23.0, 14.0, 17.0, 9.0, 12.0, 8.0, 14.0, 11.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8900985717773438, -0.8549041748046875, -0.8197097778320312, -0.784515380859375, -0.7493209838867188, -0.7141265869140625, -0.6789321899414062, -0.64373779296875, -0.6085433959960938, -0.5733489990234375, -0.5381546020507812, -0.502960205078125, -0.46776580810546875, -0.4325714111328125, -0.39737701416015625, -0.3621826171875, -0.32698822021484375, -0.2917938232421875, -0.25659942626953125, -0.221405029296875, -0.18621063232421875, -0.1510162353515625, -0.11582183837890625, -0.08062744140625, -0.04543304443359375, -0.0102386474609375, 0.02495574951171875, 0.060150146484375, 0.09534454345703125, 0.1305389404296875, 0.16573333740234375, 0.200927734375, 0.23612213134765625, 0.2713165283203125, 0.30651092529296875, 0.341705322265625, 0.37689971923828125, 0.4120941162109375, 0.44728851318359375, 0.48248291015625, 0.5176773071289062, 0.5528717041015625, 0.5880661010742188, 0.623260498046875, 0.6584548950195312, 0.6936492919921875, 0.7288436889648438, 0.7640380859375, 0.7992324829101562, 0.8344268798828125, 0.8696212768554688, 0.904815673828125, 0.9400100708007812, 0.9752044677734375, 1.0103988647460938, 1.04559326171875, 1.0807876586914062, 1.1159820556640625, 1.1511764526367188, 1.186370849609375, 1.2215652465820312, 1.2567596435546875, 1.2919540405273438, 1.3271484375]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 8.0, 2.0, 8.0, 8.0, 11.0, 17.0, 15.0, 17.0, 26.0, 24.0, 36.0, 53.0, 51.0, 46.0, 47.0, 59.0, 60.0, 58.0, 78.0, 49.0, 46.0, 50.0, 39.0, 43.0, 26.0, 28.0, 20.0, 20.0, 12.0, 6.0, 6.0, 4.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.922833442687988, -12.509087562561035, -12.095340728759766, -11.681594848632812, -11.26784896850586, -10.85410213470459, -10.440356254577637, -10.026609420776367, -9.612863540649414, -9.199117660522461, -8.785370826721191, -8.371624946594238, -7.957878589630127, -7.544132232666016, -7.1303863525390625, -6.716639995574951, -6.30289363861084, -5.8891472816467285, -5.475400924682617, -5.061655044555664, -4.647908687591553, -4.234162330627441, -3.820416212081909, -3.406670093536377, -2.9929237365722656, -2.5791773796081543, -2.165431261062622, -1.7516850233078003, -1.3379387855529785, -0.9241924285888672, -0.510446310043335, -0.09670019149780273, 0.3170452117919922, 0.730791449546814, 1.1445376873016357, 1.5582839250564575, 1.9720301628112793, 2.3857765197753906, 2.799522638320923, 3.213268756866455, 3.6270151138305664, 4.040761470794678, 4.454507827758789, 4.868253707885742, 5.2820000648498535, 5.695746421813965, 6.109492301940918, 6.523238658905029, 6.936985015869141, 7.350731372833252, 7.764477729797363, 8.178223609924316, 8.591970443725586, 9.005716323852539, 9.419462203979492, 9.833208084106445, 10.246954917907715, 10.660700798034668, 11.074447631835938, 11.48819351196289, 11.901939392089844, 12.315686225891113, 12.729432106018066, 13.143178939819336, 13.556924819946289]}, "gradients/decoder.bert.encoder.layer.20.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 4.0, 9.0, 5.0, 8.0, 13.0, 14.0, 9.0, 12.0, 20.0, 20.0, 19.0, 30.0, 32.0, 26.0, 27.0, 36.0, 30.0, 45.0, 43.0, 41.0, 38.0, 48.0, 45.0, 34.0, 35.0, 33.0, 40.0, 42.0, 29.0, 18.0, 37.0, 20.0, 20.0, 17.0, 12.0, 17.0, 10.0, 11.0, 9.0, 6.0, 6.0, 6.0, 7.0, 9.0, 1.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.073317527770996, -9.760954856872559, -9.448593139648438, -9.13623046875, -8.823867797851562, -8.511505126953125, -8.199142456054688, -7.886780738830566, -7.574418067932129, -7.262055397033691, -6.949693202972412, -6.637331008911133, -6.324968338012695, -6.012605667114258, -5.7002434730529785, -5.387881278991699, -5.075518608093262, -4.763155937194824, -4.450793743133545, -4.138431549072266, -3.826068878173828, -3.5137064456939697, -3.2013440132141113, -2.888981580734253, -2.5766191482543945, -2.264256715774536, -1.9518942832946777, -1.6395318508148193, -1.327169418334961, -1.0148069858551025, -0.7024445533752441, -0.39008212089538574, -0.07771873474121094, 0.23464369773864746, 0.5470061302185059, 0.8593685626983643, 1.1717309951782227, 1.484093427658081, 1.7964558601379395, 2.108818292617798, 2.4211807250976562, 2.7335431575775146, 3.045905590057373, 3.3582680225372314, 3.67063045501709, 3.9829928874969482, 4.295355319976807, 4.607717514038086, 4.920080184936523, 5.232442855834961, 5.54480504989624, 5.8571672439575195, 6.169529914855957, 6.4818925857543945, 6.794254779815674, 7.106616973876953, 7.418979644775391, 7.731342315673828, 8.043704986572266, 8.356066703796387, 8.668429374694824, 8.980792045593262, 9.293153762817383, 9.60551643371582, 9.917879104614258]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 9.0, 16.0, 19.0, 29.0, 42.0, 63.0, 84.0, 118.0, 186.0, 274.0, 388.0, 522.0, 813.0, 1199.0, 1883.0, 2841.0, 4458.0, 7076.0, 11175.0, 17817.0, 28384.0, 43826.0, 67402.0, 97318.0, 129125.0, 148063.0, 141008.0, 113324.0, 81025.0, 54312.0, 35021.0, 22294.0, 13719.0, 8761.0, 5547.0, 3554.0, 2232.0, 1471.0, 1001.0, 690.0, 468.0, 308.0, 216.0, 143.0, 96.0, 71.0, 56.0, 25.0, 24.0, 12.0, 17.0, 14.0, 9.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.8828125, -11.5084228515625, -11.134033203125, -10.7596435546875, -10.38525390625, -10.0108642578125, -9.636474609375, -9.2620849609375, -8.8876953125, -8.5133056640625, -8.138916015625, -7.7645263671875, -7.39013671875, -7.0157470703125, -6.641357421875, -6.2669677734375, -5.892578125, -5.5181884765625, -5.143798828125, -4.7694091796875, -4.39501953125, -4.0206298828125, -3.646240234375, -3.2718505859375, -2.8974609375, -2.5230712890625, -2.148681640625, -1.7742919921875, -1.39990234375, -1.0255126953125, -0.651123046875, -0.2767333984375, 0.09765625, 0.4720458984375, 0.846435546875, 1.2208251953125, 1.59521484375, 1.9696044921875, 2.343994140625, 2.7183837890625, 3.0927734375, 3.4671630859375, 3.841552734375, 4.2159423828125, 4.59033203125, 4.9647216796875, 5.339111328125, 5.7135009765625, 6.087890625, 6.4622802734375, 6.836669921875, 7.2110595703125, 7.58544921875, 7.9598388671875, 8.334228515625, 8.7086181640625, 9.0830078125, 9.4573974609375, 9.831787109375, 10.2061767578125, 10.58056640625, 10.9549560546875, 11.329345703125, 11.7037353515625, 12.078125]}, "gradients/decoder.bert.encoder.layer.20.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 9.0, 14.0, 13.0, 17.0, 12.0, 21.0, 25.0, 16.0, 22.0, 22.0, 30.0, 30.0, 39.0, 42.0, 42.0, 36.0, 46.0, 34.0, 43.0, 43.0, 39.0, 42.0, 39.0, 35.0, 34.0, 25.0, 34.0, 31.0, 17.0, 22.0, 16.0, 14.0, 15.0, 15.0, 8.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.6627197265625, -8.372314453125, -8.0819091796875, -7.79150390625, -7.5010986328125, -7.210693359375, -6.9202880859375, -6.6298828125, -6.3394775390625, -6.049072265625, -5.7586669921875, -5.46826171875, -5.1778564453125, -4.887451171875, -4.5970458984375, -4.306640625, -4.0162353515625, -3.725830078125, -3.4354248046875, -3.14501953125, -2.8546142578125, -2.564208984375, -2.2738037109375, -1.9833984375, -1.6929931640625, -1.402587890625, -1.1121826171875, -0.82177734375, -0.5313720703125, -0.240966796875, 0.0494384765625, 0.33984375, 0.6302490234375, 0.920654296875, 1.2110595703125, 1.50146484375, 1.7918701171875, 2.082275390625, 2.3726806640625, 2.6630859375, 2.9534912109375, 3.243896484375, 3.5343017578125, 3.82470703125, 4.1151123046875, 4.405517578125, 4.6959228515625, 4.986328125, 5.2767333984375, 5.567138671875, 5.8575439453125, 6.14794921875, 6.4383544921875, 6.728759765625, 7.0191650390625, 7.3095703125, 7.5999755859375, 7.890380859375, 8.1807861328125, 8.47119140625, 8.7615966796875, 9.052001953125, 9.3424072265625, 9.6328125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 5.0, 5.0, 10.0, 8.0, 27.0, 35.0, 43.0, 56.0, 81.0, 117.0, 203.0, 287.0, 392.0, 578.0, 874.0, 1307.0, 1937.0, 2943.0, 4534.0, 6811.0, 10360.0, 15500.0, 23868.0, 36593.0, 53518.0, 76392.0, 103056.0, 125532.0, 134798.0, 123338.0, 99649.0, 73659.0, 50844.0, 34108.0, 22958.0, 15211.0, 9856.0, 6453.0, 4233.0, 2852.0, 1805.0, 1168.0, 832.0, 517.0, 394.0, 247.0, 164.0, 145.0, 65.0, 63.0, 30.0, 40.0, 20.0, 19.0, 6.0, 11.0, 3.0, 3.0, 4.0, 1.0], "bins": [-10.125, -9.8128662109375, -9.500732421875, -9.1885986328125, -8.87646484375, -8.5643310546875, -8.252197265625, -7.9400634765625, -7.6279296875, -7.3157958984375, -7.003662109375, -6.6915283203125, -6.37939453125, -6.0672607421875, -5.755126953125, -5.4429931640625, -5.130859375, -4.8187255859375, -4.506591796875, -4.1944580078125, -3.88232421875, -3.5701904296875, -3.258056640625, -2.9459228515625, -2.6337890625, -2.3216552734375, -2.009521484375, -1.6973876953125, -1.38525390625, -1.0731201171875, -0.760986328125, -0.4488525390625, -0.13671875, 0.1754150390625, 0.487548828125, 0.7996826171875, 1.11181640625, 1.4239501953125, 1.736083984375, 2.0482177734375, 2.3603515625, 2.6724853515625, 2.984619140625, 3.2967529296875, 3.60888671875, 3.9210205078125, 4.233154296875, 4.5452880859375, 4.857421875, 5.1695556640625, 5.481689453125, 5.7938232421875, 6.10595703125, 6.4180908203125, 6.730224609375, 7.0423583984375, 7.3544921875, 7.6666259765625, 7.978759765625, 8.2908935546875, 8.60302734375, 8.9151611328125, 9.227294921875, 9.5394287109375, 9.8515625]}, "gradients/decoder.bert.encoder.layer.20.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 9.0, 5.0, 6.0, 11.0, 6.0, 11.0, 11.0, 13.0, 25.0, 16.0, 28.0, 25.0, 20.0, 35.0, 32.0, 37.0, 40.0, 42.0, 33.0, 37.0, 33.0, 36.0, 46.0, 49.0, 48.0, 41.0, 34.0, 40.0, 31.0, 33.0, 31.0, 24.0, 18.0, 15.0, 16.0, 7.0, 11.0, 11.0, 10.0, 10.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.94921875, -5.7464599609375, -5.543701171875, -5.3409423828125, -5.13818359375, -4.9354248046875, -4.732666015625, -4.5299072265625, -4.3271484375, -4.1243896484375, -3.921630859375, -3.7188720703125, -3.51611328125, -3.3133544921875, -3.110595703125, -2.9078369140625, -2.705078125, -2.5023193359375, -2.299560546875, -2.0968017578125, -1.89404296875, -1.6912841796875, -1.488525390625, -1.2857666015625, -1.0830078125, -0.8802490234375, -0.677490234375, -0.4747314453125, -0.27197265625, -0.0692138671875, 0.133544921875, 0.3363037109375, 0.5390625, 0.7418212890625, 0.944580078125, 1.1473388671875, 1.35009765625, 1.5528564453125, 1.755615234375, 1.9583740234375, 2.1611328125, 2.3638916015625, 2.566650390625, 2.7694091796875, 2.97216796875, 3.1749267578125, 3.377685546875, 3.5804443359375, 3.783203125, 3.9859619140625, 4.188720703125, 4.3914794921875, 4.59423828125, 4.7969970703125, 4.999755859375, 5.2025146484375, 5.4052734375, 5.6080322265625, 5.810791015625, 6.0135498046875, 6.21630859375, 6.4190673828125, 6.621826171875, 6.8245849609375, 7.02734375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 13.0, 14.0, 17.0, 27.0, 39.0, 64.0, 83.0, 112.0, 157.0, 228.0, 337.0, 489.0, 710.0, 1139.0, 1727.0, 3163.0, 5306.0, 9638.0, 19176.0, 38903.0, 87226.0, 185641.0, 288813.0, 211396.0, 100675.0, 45126.0, 22073.0, 10981.0, 5902.0, 3413.0, 2031.0, 1277.0, 868.0, 580.0, 373.0, 269.0, 170.0, 118.0, 86.0, 58.0, 34.0, 35.0, 16.0, 9.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-12.2734375, -11.872314453125, -11.47119140625, -11.070068359375, -10.6689453125, -10.267822265625, -9.86669921875, -9.465576171875, -9.064453125, -8.663330078125, -8.26220703125, -7.861083984375, -7.4599609375, -7.058837890625, -6.65771484375, -6.256591796875, -5.85546875, -5.454345703125, -5.05322265625, -4.652099609375, -4.2509765625, -3.849853515625, -3.44873046875, -3.047607421875, -2.646484375, -2.245361328125, -1.84423828125, -1.443115234375, -1.0419921875, -0.640869140625, -0.23974609375, 0.161376953125, 0.5625, 0.963623046875, 1.36474609375, 1.765869140625, 2.1669921875, 2.568115234375, 2.96923828125, 3.370361328125, 3.771484375, 4.172607421875, 4.57373046875, 4.974853515625, 5.3759765625, 5.777099609375, 6.17822265625, 6.579345703125, 6.98046875, 7.381591796875, 7.78271484375, 8.183837890625, 8.5849609375, 8.986083984375, 9.38720703125, 9.788330078125, 10.189453125, 10.590576171875, 10.99169921875, 11.392822265625, 11.7939453125, 12.195068359375, 12.59619140625, 12.997314453125, 13.3984375]}, "gradients/decoder.bert.encoder.layer.20.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 10.0, 7.0, 13.0, 17.0, 24.0, 29.0, 43.0, 53.0, 63.0, 100.0, 99.0, 107.0, 93.0, 70.0, 61.0, 74.0, 36.0, 29.0, 24.0, 18.0, 12.0, 10.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015239715576171875, -0.0014796257019042969, -0.0014352798461914062, -0.0013909339904785156, -0.001346588134765625, -0.0013022422790527344, -0.0012578964233398438, -0.0012135505676269531, -0.0011692047119140625, -0.0011248588562011719, -0.0010805130004882812, -0.0010361671447753906, -0.0009918212890625, -0.0009474754333496094, -0.0009031295776367188, -0.0008587837219238281, -0.0008144378662109375, -0.0007700920104980469, -0.0007257461547851562, -0.0006814002990722656, -0.000637054443359375, -0.0005927085876464844, -0.0005483627319335938, -0.0005040168762207031, -0.0004596710205078125, -0.0004153251647949219, -0.00037097930908203125, -0.0003266334533691406, -0.00028228759765625, -0.00023794174194335938, -0.00019359588623046875, -0.00014925003051757812, -0.0001049041748046875, -6.0558319091796875e-05, -1.621246337890625e-05, 2.8133392333984375e-05, 7.2479248046875e-05, 0.00011682510375976562, 0.00016117095947265625, 0.00020551681518554688, 0.0002498626708984375, 0.0002942085266113281, 0.00033855438232421875, 0.0003829002380371094, 0.00042724609375, 0.0004715919494628906, 0.0005159378051757812, 0.0005602836608886719, 0.0006046295166015625, 0.0006489753723144531, 0.0006933212280273438, 0.0007376670837402344, 0.000782012939453125, 0.0008263587951660156, 0.0008707046508789062, 0.0009150505065917969, 0.0009593963623046875, 0.0010037422180175781, 0.0010480880737304688, 0.0010924339294433594, 0.00113677978515625, 0.0011811256408691406, 0.0012254714965820312, 0.0012698173522949219, 0.0013141632080078125]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 12.0, 7.0, 13.0, 35.0, 31.0, 30.0, 68.0, 93.0, 119.0, 180.0, 251.0, 363.0, 635.0, 957.0, 1511.0, 2405.0, 3854.0, 6260.0, 10292.0, 18144.0, 30881.0, 54578.0, 95152.0, 152664.0, 197745.0, 179645.0, 122113.0, 71737.0, 40917.0, 23420.0, 13541.0, 7855.0, 4853.0, 2941.0, 1884.0, 1123.0, 762.0, 479.0, 322.0, 216.0, 138.0, 103.0, 62.0, 54.0, 36.0, 26.0, 14.0, 9.0, 8.0, 6.0, 4.0, 8.0, 4.0, 3.0], "bins": [-8.515625, -8.2705078125, -8.025390625, -7.7802734375, -7.53515625, -7.2900390625, -7.044921875, -6.7998046875, -6.5546875, -6.3095703125, -6.064453125, -5.8193359375, -5.57421875, -5.3291015625, -5.083984375, -4.8388671875, -4.59375, -4.3486328125, -4.103515625, -3.8583984375, -3.61328125, -3.3681640625, -3.123046875, -2.8779296875, -2.6328125, -2.3876953125, -2.142578125, -1.8974609375, -1.65234375, -1.4072265625, -1.162109375, -0.9169921875, -0.671875, -0.4267578125, -0.181640625, 0.0634765625, 0.30859375, 0.5537109375, 0.798828125, 1.0439453125, 1.2890625, 1.5341796875, 1.779296875, 2.0244140625, 2.26953125, 2.5146484375, 2.759765625, 3.0048828125, 3.25, 3.4951171875, 3.740234375, 3.9853515625, 4.23046875, 4.4755859375, 4.720703125, 4.9658203125, 5.2109375, 5.4560546875, 5.701171875, 5.9462890625, 6.19140625, 6.4365234375, 6.681640625, 6.9267578125, 7.171875]}, "gradients/decoder.bert.encoder.layer.20.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 6.0, 4.0, 9.0, 11.0, 7.0, 14.0, 14.0, 11.0, 17.0, 25.0, 36.0, 33.0, 49.0, 44.0, 51.0, 64.0, 70.0, 57.0, 55.0, 49.0, 59.0, 63.0, 43.0, 35.0, 35.0, 29.0, 24.0, 26.0, 10.0, 11.0, 12.0, 4.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.447265625, -3.35089111328125, -3.2545166015625, -3.15814208984375, -3.061767578125, -2.96539306640625, -2.8690185546875, -2.77264404296875, -2.67626953125, -2.57989501953125, -2.4835205078125, -2.38714599609375, -2.290771484375, -2.19439697265625, -2.0980224609375, -2.00164794921875, -1.9052734375, -1.80889892578125, -1.7125244140625, -1.61614990234375, -1.519775390625, -1.42340087890625, -1.3270263671875, -1.23065185546875, -1.13427734375, -1.03790283203125, -0.9415283203125, -0.84515380859375, -0.748779296875, -0.65240478515625, -0.5560302734375, -0.45965576171875, -0.36328125, -0.26690673828125, -0.1705322265625, -0.07415771484375, 0.022216796875, 0.11859130859375, 0.2149658203125, 0.31134033203125, 0.40771484375, 0.50408935546875, 0.6004638671875, 0.69683837890625, 0.793212890625, 0.88958740234375, 0.9859619140625, 1.08233642578125, 1.1787109375, 1.27508544921875, 1.3714599609375, 1.46783447265625, 1.564208984375, 1.66058349609375, 1.7569580078125, 1.85333251953125, 1.94970703125, 2.04608154296875, 2.1424560546875, 2.23883056640625, 2.335205078125, 2.43157958984375, 2.5279541015625, 2.62432861328125, 2.720703125]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 10.0, 3.0, 16.0, 8.0, 26.0, 23.0, 45.0, 33.0, 34.0, 60.0, 53.0, 59.0, 57.0, 48.0, 72.0, 59.0, 51.0, 49.0, 45.0, 42.0, 38.0, 33.0, 25.0, 12.0, 18.0, 22.0, 9.0, 8.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.666426658630371, -12.26688289642334, -11.867339134216309, -11.467795372009277, -11.068251609802246, -10.668707847595215, -10.269164085388184, -9.869620323181152, -9.470076560974121, -9.07053279876709, -8.670989036560059, -8.271445274353027, -7.871901512145996, -7.472357749938965, -7.072813987731934, -6.673270225524902, -6.273726463317871, -5.87418270111084, -5.474638938903809, -5.075095176696777, -4.675551414489746, -4.276007652282715, -3.8764638900756836, -3.4769201278686523, -3.077376365661621, -2.67783260345459, -2.2782888412475586, -1.8787450790405273, -1.479201316833496, -1.0796575546264648, -0.6801137924194336, -0.28057003021240234, 0.1189727783203125, 0.5185165405273438, 0.918060302734375, 1.3176040649414062, 1.7171478271484375, 2.1166915893554688, 2.5162353515625, 2.9157791137695312, 3.3153228759765625, 3.7148666381835938, 4.114410400390625, 4.513954162597656, 4.9134979248046875, 5.313041687011719, 5.71258544921875, 6.112129211425781, 6.5116729736328125, 6.911216735839844, 7.310760498046875, 7.710304260253906, 8.109848022460938, 8.509391784667969, 8.908935546875, 9.308479309082031, 9.708023071289062, 10.107566833496094, 10.507110595703125, 10.906654357910156, 11.306198120117188, 11.705741882324219, 12.10528564453125, 12.504829406738281, 12.904373168945312]}, "gradients/decoder.bert.encoder.layer.19.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 6.0, 3.0, 5.0, 4.0, 11.0, 13.0, 8.0, 7.0, 15.0, 18.0, 16.0, 18.0, 18.0, 26.0, 19.0, 28.0, 37.0, 28.0, 25.0, 40.0, 26.0, 39.0, 37.0, 39.0, 33.0, 34.0, 34.0, 26.0, 24.0, 28.0, 27.0, 34.0, 28.0, 23.0, 23.0, 29.0, 26.0, 25.0, 23.0, 18.0, 12.0, 8.0, 6.0, 10.0, 10.0, 6.0, 5.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-8.129793167114258, -7.8636579513549805, -7.597522735595703, -7.331387519836426, -7.065252304077148, -6.799117088317871, -6.5329813957214355, -6.266846179962158, -6.000710964202881, -5.7345757484436035, -5.468440532684326, -5.202305316925049, -4.936169624328613, -4.670034408569336, -4.403899192810059, -4.137763977050781, -3.871628761291504, -3.6054935455322266, -3.339358329772949, -3.0732228755950928, -2.8070876598358154, -2.540952444076538, -2.2748169898986816, -2.0086817741394043, -1.742546558380127, -1.4764113426208496, -1.2102760076522827, -0.9441407322883606, -0.6780054569244385, -0.41187024116516113, -0.14573490619659424, 0.12040042877197266, 0.38653564453125, 0.6526709198951721, 0.9188061952590942, 1.1849415302276611, 1.4510767459869385, 1.7172119617462158, 1.9833472967147827, 2.2494826316833496, 2.515617847442627, 2.7817530632019043, 3.0478882789611816, 3.314023733139038, 3.5801589488983154, 3.8462941646575928, 4.112429618835449, 4.378564834594727, 4.644700050354004, 4.910835266113281, 5.176970481872559, 5.443105697631836, 5.709240913391113, 5.975376129150391, 6.241511821746826, 6.5076470375061035, 6.773782253265381, 7.039917469024658, 7.3060526847839355, 7.572187900543213, 7.838323593139648, 8.104458808898926, 8.370594024658203, 8.63672924041748, 8.902864456176758]}, "gradients/decoder.bert.encoder.layer.19.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 9.0, 6.0, 13.0, 13.0, 23.0, 26.0, 41.0, 74.0, 122.0, 178.0, 307.0, 485.0, 749.0, 1236.0, 2027.0, 3524.0, 6059.0, 10646.0, 19279.0, 36401.0, 72187.0, 152884.0, 342262.0, 720005.0, 1047133.0, 888923.0, 477114.0, 211551.0, 96541.0, 47124.0, 24735.0, 13425.0, 7711.0, 4479.0, 2626.0, 1620.0, 1055.0, 578.0, 367.0, 265.0, 182.0, 92.0, 67.0, 43.0, 38.0, 25.0, 11.0, 9.0, 7.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.1015625, -8.795166015625, -8.48876953125, -8.182373046875, -7.8759765625, -7.569580078125, -7.26318359375, -6.956787109375, -6.650390625, -6.343994140625, -6.03759765625, -5.731201171875, -5.4248046875, -5.118408203125, -4.81201171875, -4.505615234375, -4.19921875, -3.892822265625, -3.58642578125, -3.280029296875, -2.9736328125, -2.667236328125, -2.36083984375, -2.054443359375, -1.748046875, -1.441650390625, -1.13525390625, -0.828857421875, -0.5224609375, -0.216064453125, 0.09033203125, 0.396728515625, 0.703125, 1.009521484375, 1.31591796875, 1.622314453125, 1.9287109375, 2.235107421875, 2.54150390625, 2.847900390625, 3.154296875, 3.460693359375, 3.76708984375, 4.073486328125, 4.3798828125, 4.686279296875, 4.99267578125, 5.299072265625, 5.60546875, 5.911865234375, 6.21826171875, 6.524658203125, 6.8310546875, 7.137451171875, 7.44384765625, 7.750244140625, 8.056640625, 8.363037109375, 8.66943359375, 8.975830078125, 9.2822265625, 9.588623046875, 9.89501953125, 10.201416015625, 10.5078125]}, "gradients/decoder.bert.encoder.layer.19.output.dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 3.0, 11.0, 5.0, 13.0, 13.0, 15.0, 19.0, 22.0, 22.0, 28.0, 25.0, 29.0, 32.0, 30.0, 29.0, 30.0, 37.0, 28.0, 28.0, 43.0, 42.0, 37.0, 45.0, 43.0, 30.0, 35.0, 31.0, 42.0, 28.0, 32.0, 25.0, 26.0, 24.0, 13.0, 16.0, 15.0, 8.0, 14.0, 7.0, 4.0, 4.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3828125, -6.15673828125, -5.9306640625, -5.70458984375, -5.478515625, -5.25244140625, -5.0263671875, -4.80029296875, -4.57421875, -4.34814453125, -4.1220703125, -3.89599609375, -3.669921875, -3.44384765625, -3.2177734375, -2.99169921875, -2.765625, -2.53955078125, -2.3134765625, -2.08740234375, -1.861328125, -1.63525390625, -1.4091796875, -1.18310546875, -0.95703125, -0.73095703125, -0.5048828125, -0.27880859375, -0.052734375, 0.17333984375, 0.3994140625, 0.62548828125, 0.8515625, 1.07763671875, 1.3037109375, 1.52978515625, 1.755859375, 1.98193359375, 2.2080078125, 2.43408203125, 2.66015625, 2.88623046875, 3.1123046875, 3.33837890625, 3.564453125, 3.79052734375, 4.0166015625, 4.24267578125, 4.46875, 4.69482421875, 4.9208984375, 5.14697265625, 5.373046875, 5.59912109375, 5.8251953125, 6.05126953125, 6.27734375, 6.50341796875, 6.7294921875, 6.95556640625, 7.181640625, 7.40771484375, 7.6337890625, 7.85986328125, 8.0859375]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 10.0, 8.0, 20.0, 40.0, 44.0, 67.0, 104.0, 140.0, 238.0, 373.0, 495.0, 763.0, 1272.0, 1978.0, 3110.0, 4896.0, 8124.0, 13244.0, 22538.0, 38766.0, 67856.0, 122578.0, 223743.0, 405989.0, 691440.0, 898670.0, 719482.0, 429253.0, 236888.0, 129832.0, 71834.0, 40494.0, 23530.0, 14124.0, 8276.0, 5223.0, 3136.0, 2028.0, 1229.0, 857.0, 574.0, 352.0, 239.0, 139.0, 89.0, 62.0, 46.0, 35.0, 25.0, 13.0, 12.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.6171875, -8.3524169921875, -8.087646484375, -7.8228759765625, -7.55810546875, -7.2933349609375, -7.028564453125, -6.7637939453125, -6.4990234375, -6.2342529296875, -5.969482421875, -5.7047119140625, -5.43994140625, -5.1751708984375, -4.910400390625, -4.6456298828125, -4.380859375, -4.1160888671875, -3.851318359375, -3.5865478515625, -3.32177734375, -3.0570068359375, -2.792236328125, -2.5274658203125, -2.2626953125, -1.9979248046875, -1.733154296875, -1.4683837890625, -1.20361328125, -0.9388427734375, -0.674072265625, -0.4093017578125, -0.14453125, 0.1202392578125, 0.385009765625, 0.6497802734375, 0.91455078125, 1.1793212890625, 1.444091796875, 1.7088623046875, 1.9736328125, 2.2384033203125, 2.503173828125, 2.7679443359375, 3.03271484375, 3.2974853515625, 3.562255859375, 3.8270263671875, 4.091796875, 4.3565673828125, 4.621337890625, 4.8861083984375, 5.15087890625, 5.4156494140625, 5.680419921875, 5.9451904296875, 6.2099609375, 6.4747314453125, 6.739501953125, 7.0042724609375, 7.26904296875, 7.5338134765625, 7.798583984375, 8.0633544921875, 8.328125]}, "gradients/decoder.bert.encoder.layer.19.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 4.0, 11.0, 17.0, 23.0, 33.0, 31.0, 40.0, 59.0, 58.0, 87.0, 124.0, 124.0, 190.0, 207.0, 250.0, 299.0, 331.0, 299.0, 244.0, 290.0, 252.0, 220.0, 182.0, 132.0, 127.0, 92.0, 69.0, 56.0, 53.0, 36.0, 31.0, 27.0, 17.0, 13.0, 5.0, 10.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.287109375, -3.17987060546875, -3.0726318359375, -2.96539306640625, -2.858154296875, -2.75091552734375, -2.6436767578125, -2.53643798828125, -2.42919921875, -2.32196044921875, -2.2147216796875, -2.10748291015625, -2.000244140625, -1.89300537109375, -1.7857666015625, -1.67852783203125, -1.5712890625, -1.46405029296875, -1.3568115234375, -1.24957275390625, -1.142333984375, -1.03509521484375, -0.9278564453125, -0.82061767578125, -0.71337890625, -0.60614013671875, -0.4989013671875, -0.39166259765625, -0.284423828125, -0.17718505859375, -0.0699462890625, 0.03729248046875, 0.14453125, 0.25177001953125, 0.3590087890625, 0.46624755859375, 0.573486328125, 0.68072509765625, 0.7879638671875, 0.89520263671875, 1.00244140625, 1.10968017578125, 1.2169189453125, 1.32415771484375, 1.431396484375, 1.53863525390625, 1.6458740234375, 1.75311279296875, 1.8603515625, 1.96759033203125, 2.0748291015625, 2.18206787109375, 2.289306640625, 2.39654541015625, 2.5037841796875, 2.61102294921875, 2.71826171875, 2.82550048828125, 2.9327392578125, 3.03997802734375, 3.147216796875, 3.25445556640625, 3.3616943359375, 3.46893310546875, 3.576171875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 5.0, 5.0, 14.0, 13.0, 10.0, 22.0, 15.0, 21.0, 31.0, 35.0, 49.0, 44.0, 53.0, 64.0, 79.0, 65.0, 70.0, 59.0, 59.0, 42.0, 42.0, 37.0, 31.0, 21.0, 26.0, 25.0, 18.0, 9.0, 9.0, 2.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.875686645507812, -10.540382385253906, -10.205078125, -9.869773864746094, -9.534468650817871, -9.199164390563965, -8.863860130310059, -8.528555870056152, -8.19325065612793, -7.857946395874023, -7.522641658782959, -7.187337398529053, -6.852032661437988, -6.516728401184082, -6.181424140930176, -5.8461198806762695, -5.510815620422363, -5.175511360168457, -4.840206623077393, -4.504902362823486, -4.169597625732422, -3.8342933654785156, -3.4989891052246094, -3.163684606552124, -2.8283801078796387, -2.4930756092071533, -2.157771110534668, -1.8224668502807617, -1.4871623516082764, -1.151857852935791, -0.8165535926818848, -0.4812490940093994, -0.14594459533691406, 0.1893598437309265, 0.5246642827987671, 0.8599686622619629, 1.1952731609344482, 1.5305776596069336, 1.8658819198608398, 2.201186418533325, 2.5364909172058105, 2.871795415878296, 3.2070999145507812, 3.5424041748046875, 3.877708673477173, 4.213013172149658, 4.5483174324035645, 4.883622169494629, 5.218926429748535, 5.554230690002441, 5.889535427093506, 6.224839687347412, 6.560144424438477, 6.895448684692383, 7.230752944946289, 7.566057205200195, 7.90136194229126, 8.236666679382324, 8.57197093963623, 8.907275199890137, 9.242579460144043, 9.577884674072266, 9.913188934326172, 10.248493194580078, 10.583797454833984]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 4.0, 6.0, 10.0, 5.0, 11.0, 13.0, 15.0, 17.0, 21.0, 16.0, 22.0, 26.0, 31.0, 29.0, 33.0, 25.0, 28.0, 27.0, 33.0, 40.0, 31.0, 27.0, 32.0, 29.0, 37.0, 35.0, 27.0, 42.0, 25.0, 28.0, 31.0, 27.0, 23.0, 21.0, 16.0, 23.0, 15.0, 12.0, 12.0, 14.0, 13.0, 7.0, 8.0, 11.0, 8.0, 11.0, 1.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-6.885350704193115, -6.668995380401611, -6.452640533447266, -6.236285209655762, -6.019929885864258, -5.803574562072754, -5.58721923828125, -5.370864391326904, -5.1545090675354, -4.9381537437438965, -4.721798896789551, -4.505443572998047, -4.289088249206543, -4.072732925415039, -3.8563778400421143, -3.6400227546691895, -3.4236674308776855, -3.2073121070861816, -2.990957021713257, -2.774601936340332, -2.558246612548828, -2.341891288757324, -2.1255362033843994, -1.909180998802185, -1.6928257942199707, -1.4764705896377563, -1.260115385055542, -1.0437601804733276, -0.8274049758911133, -0.6110497713088989, -0.39469456672668457, -0.17833936214447021, 0.03801584243774414, 0.2543710470199585, 0.47072625160217285, 0.6870814561843872, 0.9034366607666016, 1.119791865348816, 1.3361470699310303, 1.5525022745132446, 1.768857479095459, 1.9852126836776733, 2.2015678882598877, 2.4179229736328125, 2.6342782974243164, 2.8506336212158203, 3.066988706588745, 3.28334379196167, 3.499699115753174, 3.7160544395446777, 3.9324095249176025, 4.148764610290527, 4.365119934082031, 4.581475257873535, 4.797830581665039, 5.014185428619385, 5.230540752410889, 5.446896076202393, 5.663250923156738, 5.879606246948242, 6.095961570739746, 6.31231689453125, 6.528672218322754, 6.7450270652771, 6.9613823890686035]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 9.0, 5.0, 17.0, 13.0, 27.0, 54.0, 66.0, 100.0, 182.0, 220.0, 347.0, 555.0, 897.0, 1288.0, 1977.0, 3103.0, 4970.0, 7619.0, 12402.0, 19807.0, 31557.0, 50743.0, 80344.0, 121531.0, 160714.0, 167778.0, 134099.0, 92021.0, 58745.0, 35971.0, 22541.0, 14285.0, 8899.0, 5602.0, 3560.0, 2242.0, 1512.0, 933.0, 628.0, 408.0, 252.0, 189.0, 105.0, 64.0, 53.0, 40.0, 27.0, 18.0, 17.0, 9.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.14453125, -3.0435791015625, -2.942626953125, -2.8416748046875, -2.74072265625, -2.6397705078125, -2.538818359375, -2.4378662109375, -2.3369140625, -2.2359619140625, -2.135009765625, -2.0340576171875, -1.93310546875, -1.8321533203125, -1.731201171875, -1.6302490234375, -1.529296875, -1.4283447265625, -1.327392578125, -1.2264404296875, -1.12548828125, -1.0245361328125, -0.923583984375, -0.8226318359375, -0.7216796875, -0.6207275390625, -0.519775390625, -0.4188232421875, -0.31787109375, -0.2169189453125, -0.115966796875, -0.0150146484375, 0.0859375, 0.1868896484375, 0.287841796875, 0.3887939453125, 0.48974609375, 0.5906982421875, 0.691650390625, 0.7926025390625, 0.8935546875, 0.9945068359375, 1.095458984375, 1.1964111328125, 1.29736328125, 1.3983154296875, 1.499267578125, 1.6002197265625, 1.701171875, 1.8021240234375, 1.903076171875, 2.0040283203125, 2.10498046875, 2.2059326171875, 2.306884765625, 2.4078369140625, 2.5087890625, 2.6097412109375, 2.710693359375, 2.8116455078125, 2.91259765625, 3.0135498046875, 3.114501953125, 3.2154541015625, 3.31640625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 10.0, 9.0, 12.0, 9.0, 7.0, 17.0, 14.0, 13.0, 18.0, 21.0, 23.0, 28.0, 33.0, 29.0, 27.0, 30.0, 48.0, 28.0, 46.0, 35.0, 29.0, 39.0, 37.0, 32.0, 36.0, 34.0, 32.0, 22.0, 33.0, 33.0, 24.0, 27.0, 27.0, 18.0, 13.0, 15.0, 9.0, 11.0, 14.0, 7.0, 12.0, 10.0, 5.0, 9.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-7.78515625, -7.54473876953125, -7.3043212890625, -7.06390380859375, -6.823486328125, -6.58306884765625, -6.3426513671875, -6.10223388671875, -5.86181640625, -5.62139892578125, -5.3809814453125, -5.14056396484375, -4.900146484375, -4.65972900390625, -4.4193115234375, -4.17889404296875, -3.9384765625, -3.69805908203125, -3.4576416015625, -3.21722412109375, -2.976806640625, -2.73638916015625, -2.4959716796875, -2.25555419921875, -2.01513671875, -1.77471923828125, -1.5343017578125, -1.29388427734375, -1.053466796875, -0.81304931640625, -0.5726318359375, -0.33221435546875, -0.091796875, 0.14862060546875, 0.3890380859375, 0.62945556640625, 0.869873046875, 1.11029052734375, 1.3507080078125, 1.59112548828125, 1.83154296875, 2.07196044921875, 2.3123779296875, 2.55279541015625, 2.793212890625, 3.03363037109375, 3.2740478515625, 3.51446533203125, 3.7548828125, 3.99530029296875, 4.2357177734375, 4.47613525390625, 4.716552734375, 4.95697021484375, 5.1973876953125, 5.43780517578125, 5.67822265625, 5.91864013671875, 6.1590576171875, 6.39947509765625, 6.639892578125, 6.88031005859375, 7.1207275390625, 7.36114501953125, 7.6015625]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 13.0, 8.0, 15.0, 11.0, 34.0, 41.0, 64.0, 86.0, 129.0, 205.0, 262.0, 413.0, 615.0, 926.0, 1446.0, 2236.0, 3660.0, 5850.0, 10403.0, 19084.0, 45662.0, 841611.0, 65222.0, 21456.0, 11314.0, 6728.0, 3864.0, 2452.0, 1605.0, 1006.0, 644.0, 465.0, 309.0, 237.0, 149.0, 93.0, 84.0, 38.0, 34.0, 28.0, 15.0, 8.0, 10.0, 5.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.7254638671875, -6.505615234375, -6.2857666015625, -6.06591796875, -5.8460693359375, -5.626220703125, -5.4063720703125, -5.1865234375, -4.9666748046875, -4.746826171875, -4.5269775390625, -4.30712890625, -4.0872802734375, -3.867431640625, -3.6475830078125, -3.427734375, -3.2078857421875, -2.988037109375, -2.7681884765625, -2.54833984375, -2.3284912109375, -2.108642578125, -1.8887939453125, -1.6689453125, -1.4490966796875, -1.229248046875, -1.0093994140625, -0.78955078125, -0.5697021484375, -0.349853515625, -0.1300048828125, 0.08984375, 0.3096923828125, 0.529541015625, 0.7493896484375, 0.96923828125, 1.1890869140625, 1.408935546875, 1.6287841796875, 1.8486328125, 2.0684814453125, 2.288330078125, 2.5081787109375, 2.72802734375, 2.9478759765625, 3.167724609375, 3.3875732421875, 3.607421875, 3.8272705078125, 4.047119140625, 4.2669677734375, 4.48681640625, 4.7066650390625, 4.926513671875, 5.1463623046875, 5.3662109375, 5.5860595703125, 5.805908203125, 6.0257568359375, 6.24560546875, 6.4654541015625, 6.685302734375, 6.9051513671875, 7.125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 4.0, 10.0, 8.0, 10.0, 14.0, 16.0, 20.0, 30.0, 36.0, 37.0, 43.0, 43.0, 45.0, 48.0, 59.0, 51.0, 54.0, 64.0, 42.0, 45.0, 47.0, 34.0, 33.0, 35.0, 29.0, 28.0, 16.0, 23.0, 15.0, 16.0, 4.0, 6.0, 10.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-8.4921875, -8.26727294921875, -8.0423583984375, -7.81744384765625, -7.592529296875, -7.36761474609375, -7.1427001953125, -6.91778564453125, -6.69287109375, -6.46795654296875, -6.2430419921875, -6.01812744140625, -5.793212890625, -5.56829833984375, -5.3433837890625, -5.11846923828125, -4.8935546875, -4.66864013671875, -4.4437255859375, -4.21881103515625, -3.993896484375, -3.76898193359375, -3.5440673828125, -3.31915283203125, -3.09423828125, -2.86932373046875, -2.6444091796875, -2.41949462890625, -2.194580078125, -1.96966552734375, -1.7447509765625, -1.51983642578125, -1.294921875, -1.07000732421875, -0.8450927734375, -0.62017822265625, -0.395263671875, -0.17034912109375, 0.0545654296875, 0.27947998046875, 0.50439453125, 0.72930908203125, 0.9542236328125, 1.17913818359375, 1.404052734375, 1.62896728515625, 1.8538818359375, 2.07879638671875, 2.3037109375, 2.52862548828125, 2.7535400390625, 2.97845458984375, 3.203369140625, 3.42828369140625, 3.6531982421875, 3.87811279296875, 4.10302734375, 4.32794189453125, 4.5528564453125, 4.77777099609375, 5.002685546875, 5.22760009765625, 5.4525146484375, 5.67742919921875, 5.90234375]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 7.0, 8.0, 11.0, 18.0, 23.0, 17.0, 37.0, 48.0, 64.0, 108.0, 128.0, 204.0, 366.0, 510.0, 904.0, 1603.0, 2908.0, 5790.0, 13116.0, 39876.0, 898381.0, 54630.0, 15423.0, 6735.0, 3176.0, 1760.0, 946.0, 571.0, 370.0, 257.0, 174.0, 104.0, 65.0, 63.0, 47.0, 25.0, 19.0, 17.0, 8.0, 5.0, 5.0, 2.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.078125, -4.92230224609375, -4.7664794921875, -4.61065673828125, -4.454833984375, -4.29901123046875, -4.1431884765625, -3.98736572265625, -3.83154296875, -3.67572021484375, -3.5198974609375, -3.36407470703125, -3.208251953125, -3.05242919921875, -2.8966064453125, -2.74078369140625, -2.5849609375, -2.42913818359375, -2.2733154296875, -2.11749267578125, -1.961669921875, -1.80584716796875, -1.6500244140625, -1.49420166015625, -1.33837890625, -1.18255615234375, -1.0267333984375, -0.87091064453125, -0.715087890625, -0.55926513671875, -0.4034423828125, -0.24761962890625, -0.091796875, 0.06402587890625, 0.2198486328125, 0.37567138671875, 0.531494140625, 0.68731689453125, 0.8431396484375, 0.99896240234375, 1.15478515625, 1.31060791015625, 1.4664306640625, 1.62225341796875, 1.778076171875, 1.93389892578125, 2.0897216796875, 2.24554443359375, 2.4013671875, 2.55718994140625, 2.7130126953125, 2.86883544921875, 3.024658203125, 3.18048095703125, 3.3363037109375, 3.49212646484375, 3.64794921875, 3.80377197265625, 3.9595947265625, 4.11541748046875, 4.271240234375, 4.42706298828125, 4.5828857421875, 4.73870849609375, 4.89453125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 2.0, 4.0, 12.0, 7.0, 9.0, 12.0, 11.0, 18.0, 29.0, 22.0, 35.0, 53.0, 52.0, 76.0, 102.0, 117.0, 91.0, 78.0, 53.0, 44.0, 38.0, 26.0, 26.0, 15.0, 13.0, 7.0, 9.0, 8.0, 5.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002982616424560547, -0.0002881772816181183, -0.0002780929207801819, -0.0002680085599422455, -0.0002579241991043091, -0.0002478398382663727, -0.00023775547742843628, -0.00022767111659049988, -0.00021758675575256348, -0.00020750239491462708, -0.00019741803407669067, -0.00018733367323875427, -0.00017724931240081787, -0.00016716495156288147, -0.00015708059072494507, -0.00014699622988700867, -0.00013691186904907227, -0.00012682750821113586, -0.00011674314737319946, -0.00010665878653526306, -9.657442569732666e-05, -8.649006485939026e-05, -7.640570402145386e-05, -6.632134318351746e-05, -5.6236982345581055e-05, -4.615262150764465e-05, -3.606826066970825e-05, -2.598389983177185e-05, -1.589953899383545e-05, -5.815178155899048e-06, 4.2691826820373535e-06, 1.4353543519973755e-05, 2.4437904357910156e-05, 3.452226519584656e-05, 4.460662603378296e-05, 5.469098687171936e-05, 6.477534770965576e-05, 7.485970854759216e-05, 8.494406938552856e-05, 9.502843022346497e-05, 0.00010511279106140137, 0.00011519715189933777, 0.00012528151273727417, 0.00013536587357521057, 0.00014545023441314697, 0.00015553459525108337, 0.00016561895608901978, 0.00017570331692695618, 0.00018578767776489258, 0.00019587203860282898, 0.00020595639944076538, 0.00021604076027870178, 0.00022612512111663818, 0.00023620948195457458, 0.000246293842792511, 0.0002563782036304474, 0.0002664625644683838, 0.0002765469253063202, 0.0002866312861442566, 0.000296715646982193, 0.0003068000078201294, 0.0003168843686580658, 0.0003269687294960022, 0.0003370530903339386, 0.000347137451171875]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 12.0, 15.0, 18.0, 25.0, 36.0, 69.0, 80.0, 111.0, 150.0, 219.0, 291.0, 458.0, 672.0, 992.0, 1552.0, 2283.0, 3429.0, 5552.0, 8809.0, 14020.0, 22213.0, 36365.0, 59107.0, 96846.0, 150776.0, 195063.0, 164871.0, 108704.0, 67048.0, 40671.0, 25085.0, 15329.0, 9715.0, 6252.0, 3942.0, 2500.0, 1680.0, 1120.0, 771.0, 483.0, 357.0, 253.0, 163.0, 128.0, 81.0, 74.0, 43.0, 33.0, 33.0, 18.0, 4.0, 9.0, 6.0, 5.0, 6.0, 3.0], "bins": [-1.1845703125, -1.1493377685546875, -1.114105224609375, -1.0788726806640625, -1.04364013671875, -1.0084075927734375, -0.973175048828125, -0.9379425048828125, -0.9027099609375, -0.8674774169921875, -0.832244873046875, -0.7970123291015625, -0.76177978515625, -0.7265472412109375, -0.691314697265625, -0.6560821533203125, -0.620849609375, -0.5856170654296875, -0.550384521484375, -0.5151519775390625, -0.47991943359375, -0.4446868896484375, -0.409454345703125, -0.3742218017578125, -0.3389892578125, -0.3037567138671875, -0.268524169921875, -0.2332916259765625, -0.19805908203125, -0.1628265380859375, -0.127593994140625, -0.0923614501953125, -0.05712890625, -0.0218963623046875, 0.013336181640625, 0.0485687255859375, 0.08380126953125, 0.1190338134765625, 0.154266357421875, 0.1894989013671875, 0.2247314453125, 0.2599639892578125, 0.295196533203125, 0.3304290771484375, 0.36566162109375, 0.4008941650390625, 0.436126708984375, 0.4713592529296875, 0.506591796875, 0.5418243408203125, 0.577056884765625, 0.6122894287109375, 0.64752197265625, 0.6827545166015625, 0.717987060546875, 0.7532196044921875, 0.7884521484375, 0.8236846923828125, 0.858917236328125, 0.8941497802734375, 0.92938232421875, 0.9646148681640625, 0.999847412109375, 1.0350799560546875, 1.0703125]}, "gradients/decoder.bert.encoder.layer.19.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 8.0, 11.0, 16.0, 11.0, 8.0, 20.0, 15.0, 22.0, 36.0, 32.0, 44.0, 34.0, 49.0, 46.0, 50.0, 77.0, 45.0, 51.0, 70.0, 53.0, 50.0, 42.0, 32.0, 24.0, 25.0, 15.0, 18.0, 20.0, 9.0, 7.0, 10.0, 3.0, 10.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4853515625, -0.4700355529785156, -0.45471954345703125, -0.4394035339355469, -0.4240875244140625, -0.4087715148925781, -0.39345550537109375, -0.3781394958496094, -0.362823486328125, -0.3475074768066406, -0.33219146728515625, -0.3168754577636719, -0.3015594482421875, -0.2862434387207031, -0.27092742919921875, -0.2556114196777344, -0.24029541015625, -0.22497940063476562, -0.20966339111328125, -0.19434738159179688, -0.1790313720703125, -0.16371536254882812, -0.14839935302734375, -0.13308334350585938, -0.117767333984375, -0.10245132446289062, -0.08713531494140625, -0.07181930541992188, -0.0565032958984375, -0.041187286376953125, -0.02587127685546875, -0.010555267333984375, 0.0047607421875, 0.020076751708984375, 0.03539276123046875, 0.050708770751953125, 0.0660247802734375, 0.08134078979492188, 0.09665679931640625, 0.11197280883789062, 0.127288818359375, 0.14260482788085938, 0.15792083740234375, 0.17323684692382812, 0.1885528564453125, 0.20386886596679688, 0.21918487548828125, 0.23450088500976562, 0.24981689453125, 0.2651329040527344, 0.28044891357421875, 0.2957649230957031, 0.3110809326171875, 0.3263969421386719, 0.34171295166015625, 0.3570289611816406, 0.372344970703125, 0.3876609802246094, 0.40297698974609375, 0.4182929992675781, 0.4336090087890625, 0.4489250183105469, 0.46424102783203125, 0.4795570373535156, 0.494873046875]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 7.0, 7.0, 6.0, 14.0, 15.0, 10.0, 13.0, 28.0, 27.0, 31.0, 30.0, 61.0, 43.0, 46.0, 62.0, 65.0, 76.0, 60.0, 60.0, 63.0, 36.0, 35.0, 28.0, 30.0, 29.0, 21.0, 23.0, 17.0, 13.0, 9.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.425981521606445, -9.113774299621582, -8.801567077636719, -8.489360809326172, -8.177153587341309, -7.864946365356445, -7.55273962020874, -7.240532875061035, -6.928325653076172, -6.616118431091309, -6.3039116859436035, -5.991704940795898, -5.679497718811035, -5.367290496826172, -5.055083751678467, -4.742877006530762, -4.430669784545898, -4.118462562561035, -3.80625581741333, -3.494048833847046, -3.1818418502807617, -2.8696348667144775, -2.5574278831481934, -2.245220899581909, -1.933013916015625, -1.6208069324493408, -1.3085999488830566, -0.9963929653167725, -0.6841859817504883, -0.3719789981842041, -0.05977201461791992, 0.25243496894836426, 0.5646429061889648, 0.876849889755249, 1.1890568733215332, 1.5012638568878174, 1.8134708404541016, 2.1256778240203857, 2.43788480758667, 2.750091791152954, 3.0622987747192383, 3.3745057582855225, 3.6867127418518066, 3.998919725418091, 4.311126708984375, 4.623333930969238, 4.935540676116943, 5.247747421264648, 5.559954643249512, 5.872161865234375, 6.18436861038208, 6.496575355529785, 6.808782577514648, 7.120989799499512, 7.433196544647217, 7.745403289794922, 8.057610511779785, 8.369817733764648, 8.682024002075195, 8.994231224060059, 9.306438446044922, 9.618645668029785, 9.930852890014648, 10.243059158325195, 10.555266380310059]}, "gradients/decoder.bert.encoder.layer.19.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 7.0, 9.0, 7.0, 5.0, 14.0, 12.0, 14.0, 13.0, 21.0, 20.0, 24.0, 23.0, 29.0, 27.0, 33.0, 25.0, 22.0, 32.0, 39.0, 28.0, 31.0, 34.0, 27.0, 30.0, 37.0, 37.0, 27.0, 33.0, 38.0, 26.0, 33.0, 26.0, 32.0, 16.0, 8.0, 27.0, 26.0, 12.0, 11.0, 10.0, 9.0, 10.0, 14.0, 4.0, 8.0, 9.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0], "bins": [-7.102121829986572, -6.886204719543457, -6.6702880859375, -6.454370975494385, -6.2384538650512695, -6.0225372314453125, -5.806620121002197, -5.590703010559082, -5.374786376953125, -5.15886926651001, -4.942952632904053, -4.7270355224609375, -4.5111188888549805, -4.295201778411865, -4.07928466796875, -3.863367795944214, -3.6474509239196777, -3.4315340518951416, -3.2156171798706055, -2.9997000694274902, -2.783783197402954, -2.567866325378418, -2.3519492149353027, -2.1360323429107666, -1.9201154708862305, -1.7041985988616943, -1.4882816076278687, -1.272364616394043, -1.0564477443695068, -0.8405308723449707, -0.624613881111145, -0.40869688987731934, -0.192779541015625, 0.023137390613555908, 0.23905432224273682, 0.4549712538719177, 0.6708881855010986, 0.8868050575256348, 1.1027220487594604, 1.3186390399932861, 1.5345559120178223, 1.7504727840423584, 1.966389775276184, 2.1823067665100098, 2.398223638534546, 2.614140510559082, 2.8300576210021973, 3.0459744930267334, 3.2618913650512695, 3.4778082370758057, 3.693725109100342, 3.909642219543457, 4.125558853149414, 4.341475963592529, 4.5573930740356445, 4.773309707641602, 4.989226818084717, 5.205143928527832, 5.421060562133789, 5.636977672576904, 5.8528947830200195, 6.068811416625977, 6.284728527069092, 6.500645637512207, 6.716562271118164]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 9.0, 15.0, 26.0, 27.0, 37.0, 56.0, 77.0, 121.0, 204.0, 286.0, 434.0, 665.0, 1041.0, 1601.0, 2494.0, 4024.0, 6595.0, 10616.0, 17652.0, 29350.0, 48412.0, 76788.0, 114663.0, 152910.0, 165167.0, 142097.0, 102252.0, 66240.0, 40547.0, 24700.0, 14893.0, 9165.0, 5739.0, 3488.0, 2197.0, 1370.0, 889.0, 578.0, 376.0, 236.0, 179.0, 110.0, 83.0, 44.0, 37.0, 19.0, 13.0, 13.0, 12.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4921875, -8.22119140625, -7.9501953125, -7.67919921875, -7.408203125, -7.13720703125, -6.8662109375, -6.59521484375, -6.32421875, -6.05322265625, -5.7822265625, -5.51123046875, -5.240234375, -4.96923828125, -4.6982421875, -4.42724609375, -4.15625, -3.88525390625, -3.6142578125, -3.34326171875, -3.072265625, -2.80126953125, -2.5302734375, -2.25927734375, -1.98828125, -1.71728515625, -1.4462890625, -1.17529296875, -0.904296875, -0.63330078125, -0.3623046875, -0.09130859375, 0.1796875, 0.45068359375, 0.7216796875, 0.99267578125, 1.263671875, 1.53466796875, 1.8056640625, 2.07666015625, 2.34765625, 2.61865234375, 2.8896484375, 3.16064453125, 3.431640625, 3.70263671875, 3.9736328125, 4.24462890625, 4.515625, 4.78662109375, 5.0576171875, 5.32861328125, 5.599609375, 5.87060546875, 6.1416015625, 6.41259765625, 6.68359375, 6.95458984375, 7.2255859375, 7.49658203125, 7.767578125, 8.03857421875, 8.3095703125, 8.58056640625, 8.8515625]}, "gradients/decoder.bert.encoder.layer.19.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 3.0, 10.0, 6.0, 9.0, 14.0, 14.0, 11.0, 16.0, 17.0, 24.0, 18.0, 35.0, 25.0, 38.0, 33.0, 28.0, 36.0, 35.0, 40.0, 24.0, 45.0, 33.0, 39.0, 40.0, 36.0, 38.0, 31.0, 39.0, 34.0, 31.0, 26.0, 25.0, 24.0, 12.0, 19.0, 7.0, 15.0, 17.0, 12.0, 5.0, 12.0, 8.0, 4.0, 2.0, 4.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.5, -7.2701416015625, -7.040283203125, -6.8104248046875, -6.58056640625, -6.3507080078125, -6.120849609375, -5.8909912109375, -5.6611328125, -5.4312744140625, -5.201416015625, -4.9715576171875, -4.74169921875, -4.5118408203125, -4.281982421875, -4.0521240234375, -3.822265625, -3.5924072265625, -3.362548828125, -3.1326904296875, -2.90283203125, -2.6729736328125, -2.443115234375, -2.2132568359375, -1.9833984375, -1.7535400390625, -1.523681640625, -1.2938232421875, -1.06396484375, -0.8341064453125, -0.604248046875, -0.3743896484375, -0.14453125, 0.0853271484375, 0.315185546875, 0.5450439453125, 0.77490234375, 1.0047607421875, 1.234619140625, 1.4644775390625, 1.6943359375, 1.9241943359375, 2.154052734375, 2.3839111328125, 2.61376953125, 2.8436279296875, 3.073486328125, 3.3033447265625, 3.533203125, 3.7630615234375, 3.992919921875, 4.2227783203125, 4.45263671875, 4.6824951171875, 4.912353515625, 5.1422119140625, 5.3720703125, 5.6019287109375, 5.831787109375, 6.0616455078125, 6.29150390625, 6.5213623046875, 6.751220703125, 6.9810791015625, 7.2109375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 16.0, 29.0, 31.0, 44.0, 93.0, 131.0, 181.0, 301.0, 467.0, 733.0, 1099.0, 1767.0, 2971.0, 4505.0, 7576.0, 12355.0, 20213.0, 33135.0, 54483.0, 86751.0, 129131.0, 164995.0, 165330.0, 130653.0, 88589.0, 55592.0, 34088.0, 20416.0, 12563.0, 7534.0, 4700.0, 2861.0, 1860.0, 1201.0, 784.0, 486.0, 314.0, 199.0, 122.0, 79.0, 54.0, 36.0, 28.0, 22.0, 11.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34375, -7.09912109375, -6.8544921875, -6.60986328125, -6.365234375, -6.12060546875, -5.8759765625, -5.63134765625, -5.38671875, -5.14208984375, -4.8974609375, -4.65283203125, -4.408203125, -4.16357421875, -3.9189453125, -3.67431640625, -3.4296875, -3.18505859375, -2.9404296875, -2.69580078125, -2.451171875, -2.20654296875, -1.9619140625, -1.71728515625, -1.47265625, -1.22802734375, -0.9833984375, -0.73876953125, -0.494140625, -0.24951171875, -0.0048828125, 0.23974609375, 0.484375, 0.72900390625, 0.9736328125, 1.21826171875, 1.462890625, 1.70751953125, 1.9521484375, 2.19677734375, 2.44140625, 2.68603515625, 2.9306640625, 3.17529296875, 3.419921875, 3.66455078125, 3.9091796875, 4.15380859375, 4.3984375, 4.64306640625, 4.8876953125, 5.13232421875, 5.376953125, 5.62158203125, 5.8662109375, 6.11083984375, 6.35546875, 6.60009765625, 6.8447265625, 7.08935546875, 7.333984375, 7.57861328125, 7.8232421875, 8.06787109375, 8.3125]}, "gradients/decoder.bert.encoder.layer.19.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 11.0, 9.0, 10.0, 18.0, 16.0, 12.0, 14.0, 22.0, 15.0, 40.0, 25.0, 30.0, 39.0, 29.0, 40.0, 40.0, 31.0, 51.0, 37.0, 46.0, 34.0, 44.0, 31.0, 38.0, 34.0, 42.0, 42.0, 27.0, 20.0, 19.0, 21.0, 14.0, 22.0, 12.0, 14.0, 12.0, 4.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.5234375, -5.364501953125, -5.20556640625, -5.046630859375, -4.8876953125, -4.728759765625, -4.56982421875, -4.410888671875, -4.251953125, -4.093017578125, -3.93408203125, -3.775146484375, -3.6162109375, -3.457275390625, -3.29833984375, -3.139404296875, -2.98046875, -2.821533203125, -2.66259765625, -2.503662109375, -2.3447265625, -2.185791015625, -2.02685546875, -1.867919921875, -1.708984375, -1.550048828125, -1.39111328125, -1.232177734375, -1.0732421875, -0.914306640625, -0.75537109375, -0.596435546875, -0.4375, -0.278564453125, -0.11962890625, 0.039306640625, 0.1982421875, 0.357177734375, 0.51611328125, 0.675048828125, 0.833984375, 0.992919921875, 1.15185546875, 1.310791015625, 1.4697265625, 1.628662109375, 1.78759765625, 1.946533203125, 2.10546875, 2.264404296875, 2.42333984375, 2.582275390625, 2.7412109375, 2.900146484375, 3.05908203125, 3.218017578125, 3.376953125, 3.535888671875, 3.69482421875, 3.853759765625, 4.0126953125, 4.171630859375, 4.33056640625, 4.489501953125, 4.6484375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 9.0, 8.0, 15.0, 21.0, 31.0, 51.0, 61.0, 111.0, 196.0, 340.0, 579.0, 1015.0, 1817.0, 3556.0, 7044.0, 15436.0, 36364.0, 95533.0, 252421.0, 352696.0, 171342.0, 62852.0, 25042.0, 10882.0, 5229.0, 2600.0, 1399.0, 789.0, 411.0, 273.0, 149.0, 95.0, 62.0, 34.0, 35.0, 18.0, 16.0, 6.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.15625, -11.675537109375, -11.19482421875, -10.714111328125, -10.2333984375, -9.752685546875, -9.27197265625, -8.791259765625, -8.310546875, -7.829833984375, -7.34912109375, -6.868408203125, -6.3876953125, -5.906982421875, -5.42626953125, -4.945556640625, -4.46484375, -3.984130859375, -3.50341796875, -3.022705078125, -2.5419921875, -2.061279296875, -1.58056640625, -1.099853515625, -0.619140625, -0.138427734375, 0.34228515625, 0.822998046875, 1.3037109375, 1.784423828125, 2.26513671875, 2.745849609375, 3.2265625, 3.707275390625, 4.18798828125, 4.668701171875, 5.1494140625, 5.630126953125, 6.11083984375, 6.591552734375, 7.072265625, 7.552978515625, 8.03369140625, 8.514404296875, 8.9951171875, 9.475830078125, 9.95654296875, 10.437255859375, 10.91796875, 11.398681640625, 11.87939453125, 12.360107421875, 12.8408203125, 13.321533203125, 13.80224609375, 14.282958984375, 14.763671875, 15.244384765625, 15.72509765625, 16.205810546875, 16.6865234375, 17.167236328125, 17.64794921875, 18.128662109375, 18.609375]}, "gradients/decoder.bert.encoder.layer.19.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 8.0, 7.0, 13.0, 17.0, 22.0, 25.0, 39.0, 48.0, 40.0, 61.0, 61.0, 54.0, 74.0, 76.0, 54.0, 70.0, 56.0, 49.0, 42.0, 33.0, 24.0, 24.0, 27.0, 13.0, 13.0, 9.0, 5.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009326934814453125, -0.0009019076824188232, -0.000871121883392334, -0.0008403360843658447, -0.0008095502853393555, -0.0007787644863128662, -0.000747978687286377, -0.0007171928882598877, -0.0006864070892333984, -0.0006556212902069092, -0.0006248354911804199, -0.0005940496921539307, -0.0005632638931274414, -0.0005324780941009521, -0.0005016922950744629, -0.00047090649604797363, -0.0004401206970214844, -0.0004093348979949951, -0.00037854909896850586, -0.0003477632999420166, -0.00031697750091552734, -0.0002861917018890381, -0.00025540590286254883, -0.00022462010383605957, -0.0001938343048095703, -0.00016304850578308105, -0.0001322627067565918, -0.00010147690773010254, -7.069110870361328e-05, -3.9905309677124023e-05, -9.119510650634766e-06, 2.1666288375854492e-05, 5.245208740234375e-05, 8.323788642883301e-05, 0.00011402368545532227, 0.00014480948448181152, 0.00017559528350830078, 0.00020638108253479004, 0.0002371668815612793, 0.00026795268058776855, 0.0002987384796142578, 0.00032952427864074707, 0.00036031007766723633, 0.0003910958766937256, 0.00042188167572021484, 0.0004526674747467041, 0.00048345327377319336, 0.0005142390727996826, 0.0005450248718261719, 0.0005758106708526611, 0.0006065964698791504, 0.0006373822689056396, 0.0006681680679321289, 0.0006989538669586182, 0.0007297396659851074, 0.0007605254650115967, 0.0007913112640380859, 0.0008220970630645752, 0.0008528828620910645, 0.0008836686611175537, 0.000914454460144043, 0.0009452402591705322, 0.0009760260581970215, 0.0010068118572235107, 0.00103759765625]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 6.0, 3.0, 4.0, 6.0, 8.0, 11.0, 19.0, 20.0, 39.0, 39.0, 57.0, 103.0, 152.0, 204.0, 320.0, 474.0, 722.0, 1127.0, 1929.0, 3197.0, 5557.0, 10464.0, 20900.0, 47019.0, 112148.0, 240573.0, 294303.0, 171584.0, 72722.0, 31572.0, 14733.0, 7651.0, 4219.0, 2520.0, 1466.0, 923.0, 604.0, 368.0, 233.0, 175.0, 134.0, 66.0, 45.0, 45.0, 28.0, 19.0, 17.0, 15.0, 6.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.203125, -10.8201904296875, -10.437255859375, -10.0543212890625, -9.67138671875, -9.2884521484375, -8.905517578125, -8.5225830078125, -8.1396484375, -7.7567138671875, -7.373779296875, -6.9908447265625, -6.60791015625, -6.2249755859375, -5.842041015625, -5.4591064453125, -5.076171875, -4.6932373046875, -4.310302734375, -3.9273681640625, -3.54443359375, -3.1614990234375, -2.778564453125, -2.3956298828125, -2.0126953125, -1.6297607421875, -1.246826171875, -0.8638916015625, -0.48095703125, -0.0980224609375, 0.284912109375, 0.6678466796875, 1.05078125, 1.4337158203125, 1.816650390625, 2.1995849609375, 2.58251953125, 2.9654541015625, 3.348388671875, 3.7313232421875, 4.1142578125, 4.4971923828125, 4.880126953125, 5.2630615234375, 5.64599609375, 6.0289306640625, 6.411865234375, 6.7947998046875, 7.177734375, 7.5606689453125, 7.943603515625, 8.3265380859375, 8.70947265625, 9.0924072265625, 9.475341796875, 9.8582763671875, 10.2412109375, 10.6241455078125, 11.007080078125, 11.3900146484375, 11.77294921875, 12.1558837890625, 12.538818359375, 12.9217529296875, 13.3046875]}, "gradients/decoder.bert.encoder.layer.19.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 8.0, 8.0, 10.0, 16.0, 13.0, 18.0, 23.0, 25.0, 35.0, 48.0, 50.0, 65.0, 79.0, 70.0, 72.0, 79.0, 58.0, 53.0, 57.0, 44.0, 31.0, 27.0, 21.0, 22.0, 10.0, 4.0, 7.0, 4.0, 10.0, 4.0, 4.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.86712646484375, -2.7576904296875, -2.64825439453125, -2.538818359375, -2.42938232421875, -2.3199462890625, -2.21051025390625, -2.10107421875, -1.99163818359375, -1.8822021484375, -1.77276611328125, -1.663330078125, -1.55389404296875, -1.4444580078125, -1.33502197265625, -1.2255859375, -1.11614990234375, -1.0067138671875, -0.89727783203125, -0.787841796875, -0.67840576171875, -0.5689697265625, -0.45953369140625, -0.35009765625, -0.24066162109375, -0.1312255859375, -0.02178955078125, 0.087646484375, 0.19708251953125, 0.3065185546875, 0.41595458984375, 0.525390625, 0.63482666015625, 0.7442626953125, 0.85369873046875, 0.963134765625, 1.07257080078125, 1.1820068359375, 1.29144287109375, 1.40087890625, 1.51031494140625, 1.6197509765625, 1.72918701171875, 1.838623046875, 1.94805908203125, 2.0574951171875, 2.16693115234375, 2.2763671875, 2.38580322265625, 2.4952392578125, 2.60467529296875, 2.714111328125, 2.82354736328125, 2.9329833984375, 3.04241943359375, 3.15185546875, 3.26129150390625, 3.3707275390625, 3.48016357421875, 3.589599609375, 3.69903564453125, 3.8084716796875, 3.91790771484375, 4.02734375]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 7.0, 4.0, 10.0, 16.0, 17.0, 24.0, 22.0, 35.0, 36.0, 45.0, 43.0, 57.0, 48.0, 64.0, 69.0, 74.0, 72.0, 50.0, 57.0, 46.0, 31.0, 41.0, 32.0, 22.0, 16.0, 12.0, 12.0, 9.0, 8.0, 7.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.535650253295898, -11.200141906738281, -10.86463451385498, -10.529126167297363, -10.193618774414062, -9.858110427856445, -9.522603034973145, -9.187094688415527, -8.851587295532227, -8.51607894897461, -8.180571556091309, -7.84506368637085, -7.509555816650391, -7.174047946929932, -6.838540077209473, -6.5030317306518555, -6.1675238609313965, -5.8320159912109375, -5.4965081214904785, -5.1610002517700195, -4.8254923820495605, -4.489984512329102, -4.154476165771484, -3.8189685344696045, -3.4834606647491455, -3.1479527950286865, -2.8124449253082275, -2.4769368171691895, -2.1414289474487305, -1.805921196937561, -1.4704132080078125, -1.1349053382873535, -0.7993974685668945, -0.46388956904411316, -0.1283816695213318, 0.20712625980377197, 0.542634129524231, 0.8781419992446899, 1.2136499881744385, 1.5491578578948975, 1.8846657276153564, 2.2201735973358154, 2.5556814670562744, 2.8911895751953125, 3.2266974449157715, 3.5622053146362305, 3.8977131843566895, 4.233221054077148, 4.568728923797607, 4.904236793518066, 5.239744663238525, 5.575252532958984, 5.910760402679443, 6.246268272399902, 6.5817766189575195, 6.91728401184082, 7.2527923583984375, 7.5883002281188965, 7.9238080978393555, 8.259316444396973, 8.594823837280273, 8.93033218383789, 9.265839576721191, 9.601347923278809, 9.93685531616211]}, "gradients/decoder.bert.encoder.layer.18.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 2.0, 8.0, 3.0, 3.0, 8.0, 5.0, 12.0, 2.0, 14.0, 20.0, 17.0, 28.0, 21.0, 21.0, 19.0, 31.0, 23.0, 31.0, 32.0, 30.0, 40.0, 38.0, 40.0, 45.0, 39.0, 30.0, 31.0, 28.0, 44.0, 28.0, 34.0, 29.0, 22.0, 33.0, 20.0, 26.0, 23.0, 12.0, 23.0, 20.0, 15.0, 15.0, 10.0, 3.0, 4.0, 6.0, 6.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.768545150756836, -6.531733989715576, -6.294923305511475, -6.058112144470215, -5.821300983428955, -5.5844902992248535, -5.347679138183594, -5.110868453979492, -4.874057292938232, -4.637246131896973, -4.400435447692871, -4.163624286651611, -3.9268133640289307, -3.69000244140625, -3.4531912803649902, -3.2163803577423096, -2.97956919670105, -2.742758274078369, -2.5059471130371094, -2.2691361904144287, -2.032325267791748, -1.7955142259597778, -1.5587031841278076, -1.321892261505127, -1.0850812196731567, -0.8482702374458313, -0.6114592552185059, -0.37464821338653564, -0.1378372311592102, 0.09897375106811523, 0.33578479290008545, 0.5725957155227661, 0.8094067573547363, 1.0462177991867065, 1.2830287218093872, 1.5198397636413574, 1.756650686264038, 1.9934617280960083, 2.2302727699279785, 2.467083692550659, 2.70389461517334, 2.9407055377960205, 3.1775166988372803, 3.414327621459961, 3.6511385440826416, 3.8879494667053223, 4.124760627746582, 4.361571311950684, 4.598382949829102, 4.835194110870361, 5.072004795074463, 5.308815956115723, 5.545627117156982, 5.782437801361084, 6.019248962402344, 6.256059646606445, 6.492870807647705, 6.729681968688965, 6.966492652893066, 7.203303813934326, 7.440114974975586, 7.6769256591796875, 7.913736820220947, 8.150547981262207, 8.387358665466309]}, "gradients/decoder.bert.encoder.layer.18.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 7.0, 10.0, 25.0, 28.0, 41.0, 63.0, 125.0, 167.0, 300.0, 477.0, 740.0, 1214.0, 1975.0, 3242.0, 5438.0, 9735.0, 17281.0, 32195.0, 62905.0, 129905.0, 285515.0, 625333.0, 1025214.0, 968491.0, 543012.0, 244651.0, 112989.0, 56356.0, 28958.0, 16003.0, 8908.0, 5040.0, 3095.0, 1769.0, 1110.0, 694.0, 453.0, 290.0, 190.0, 114.0, 81.0, 56.0, 35.0, 17.0, 11.0, 9.0, 6.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.287109375, -8.02734375, -7.767578125, -7.5078125, -7.248046875, -6.98828125, -6.728515625, -6.46875, -6.208984375, -5.94921875, -5.689453125, -5.4296875, -5.169921875, -4.91015625, -4.650390625, -4.390625, -4.130859375, -3.87109375, -3.611328125, -3.3515625, -3.091796875, -2.83203125, -2.572265625, -2.3125, -2.052734375, -1.79296875, -1.533203125, -1.2734375, -1.013671875, -0.75390625, -0.494140625, -0.234375, 0.025390625, 0.28515625, 0.544921875, 0.8046875, 1.064453125, 1.32421875, 1.583984375, 1.84375, 2.103515625, 2.36328125, 2.623046875, 2.8828125, 3.142578125, 3.40234375, 3.662109375, 3.921875, 4.181640625, 4.44140625, 4.701171875, 4.9609375, 5.220703125, 5.48046875, 5.740234375, 6.0, 6.259765625, 6.51953125, 6.779296875, 7.0390625, 7.298828125, 7.55859375, 7.818359375, 8.078125]}, "gradients/decoder.bert.encoder.layer.18.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 8.0, 5.0, 11.0, 12.0, 12.0, 21.0, 22.0, 21.0, 23.0, 28.0, 24.0, 26.0, 34.0, 33.0, 40.0, 42.0, 43.0, 47.0, 31.0, 38.0, 45.0, 42.0, 42.0, 37.0, 36.0, 31.0, 26.0, 29.0, 31.0, 27.0, 21.0, 19.0, 14.0, 16.0, 11.0, 8.0, 6.0, 11.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.96697998046875, -4.7894287109375, -4.61187744140625, -4.434326171875, -4.25677490234375, -4.0792236328125, -3.90167236328125, -3.72412109375, -3.54656982421875, -3.3690185546875, -3.19146728515625, -3.013916015625, -2.83636474609375, -2.6588134765625, -2.48126220703125, -2.3037109375, -2.12615966796875, -1.9486083984375, -1.77105712890625, -1.593505859375, -1.41595458984375, -1.2384033203125, -1.06085205078125, -0.88330078125, -0.70574951171875, -0.5281982421875, -0.35064697265625, -0.173095703125, 0.00445556640625, 0.1820068359375, 0.35955810546875, 0.537109375, 0.71466064453125, 0.8922119140625, 1.06976318359375, 1.247314453125, 1.42486572265625, 1.6024169921875, 1.77996826171875, 1.95751953125, 2.13507080078125, 2.3126220703125, 2.49017333984375, 2.667724609375, 2.84527587890625, 3.0228271484375, 3.20037841796875, 3.3779296875, 3.55548095703125, 3.7330322265625, 3.91058349609375, 4.088134765625, 4.26568603515625, 4.4432373046875, 4.62078857421875, 4.79833984375, 4.97589111328125, 5.1534423828125, 5.33099365234375, 5.508544921875, 5.68609619140625, 5.8636474609375, 6.04119873046875, 6.21875]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 13.0, 15.0, 22.0, 32.0, 36.0, 57.0, 101.0, 138.0, 214.0, 352.0, 559.0, 900.0, 1434.0, 2507.0, 4256.0, 7291.0, 13014.0, 23805.0, 43815.0, 83548.0, 162141.0, 312386.0, 571998.0, 874189.0, 869497.0, 570787.0, 309428.0, 160487.0, 83159.0, 43590.0, 23455.0, 12987.0, 7303.0, 4222.0, 2558.0, 1469.0, 881.0, 570.0, 386.0, 211.0, 160.0, 96.0, 56.0, 44.0, 44.0, 23.0, 14.0, 12.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.578125, -7.34844970703125, -7.1187744140625, -6.88909912109375, -6.659423828125, -6.42974853515625, -6.2000732421875, -5.97039794921875, -5.74072265625, -5.51104736328125, -5.2813720703125, -5.05169677734375, -4.822021484375, -4.59234619140625, -4.3626708984375, -4.13299560546875, -3.9033203125, -3.67364501953125, -3.4439697265625, -3.21429443359375, -2.984619140625, -2.75494384765625, -2.5252685546875, -2.29559326171875, -2.06591796875, -1.83624267578125, -1.6065673828125, -1.37689208984375, -1.147216796875, -0.91754150390625, -0.6878662109375, -0.45819091796875, -0.228515625, 0.00115966796875, 0.2308349609375, 0.46051025390625, 0.690185546875, 0.91986083984375, 1.1495361328125, 1.37921142578125, 1.60888671875, 1.83856201171875, 2.0682373046875, 2.29791259765625, 2.527587890625, 2.75726318359375, 2.9869384765625, 3.21661376953125, 3.4462890625, 3.67596435546875, 3.9056396484375, 4.13531494140625, 4.364990234375, 4.59466552734375, 4.8243408203125, 5.05401611328125, 5.28369140625, 5.51336669921875, 5.7430419921875, 5.97271728515625, 6.202392578125, 6.43206787109375, 6.6617431640625, 6.89141845703125, 7.12109375]}, "gradients/decoder.bert.encoder.layer.18.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 5.0, 10.0, 3.0, 11.0, 11.0, 17.0, 16.0, 28.0, 40.0, 39.0, 49.0, 58.0, 77.0, 99.0, 113.0, 138.0, 176.0, 178.0, 208.0, 245.0, 251.0, 256.0, 243.0, 267.0, 237.0, 221.0, 192.0, 149.0, 146.0, 114.0, 90.0, 86.0, 67.0, 50.0, 30.0, 37.0, 27.0, 24.0, 12.0, 17.0, 9.0, 10.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.298828125, -2.222198486328125, -2.14556884765625, -2.068939208984375, -1.9923095703125, -1.915679931640625, -1.83905029296875, -1.762420654296875, -1.685791015625, -1.609161376953125, -1.53253173828125, -1.455902099609375, -1.3792724609375, -1.302642822265625, -1.22601318359375, -1.149383544921875, -1.07275390625, -0.996124267578125, -0.91949462890625, -0.842864990234375, -0.7662353515625, -0.689605712890625, -0.61297607421875, -0.536346435546875, -0.459716796875, -0.383087158203125, -0.30645751953125, -0.229827880859375, -0.1531982421875, -0.076568603515625, 6.103515625e-05, 0.076690673828125, 0.1533203125, 0.229949951171875, 0.30657958984375, 0.383209228515625, 0.4598388671875, 0.536468505859375, 0.61309814453125, 0.689727783203125, 0.766357421875, 0.842987060546875, 0.91961669921875, 0.996246337890625, 1.0728759765625, 1.149505615234375, 1.22613525390625, 1.302764892578125, 1.37939453125, 1.456024169921875, 1.53265380859375, 1.609283447265625, 1.6859130859375, 1.762542724609375, 1.83917236328125, 1.915802001953125, 1.992431640625, 2.069061279296875, 2.14569091796875, 2.222320556640625, 2.2989501953125, 2.375579833984375, 2.45220947265625, 2.528839111328125, 2.60546875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 6.0, 7.0, 13.0, 17.0, 21.0, 29.0, 23.0, 36.0, 37.0, 44.0, 55.0, 55.0, 70.0, 62.0, 65.0, 54.0, 66.0, 61.0, 48.0, 32.0, 33.0, 35.0, 18.0, 25.0, 15.0, 23.0, 8.0, 12.0, 4.0, 5.0, 7.0, 5.0, 2.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.380881309509277, -8.1304931640625, -7.880105495452881, -7.629717826843262, -7.379330158233643, -7.128942489624023, -6.878554344177246, -6.628166675567627, -6.377779006958008, -6.127391338348389, -5.877003192901611, -5.626615524291992, -5.376227855682373, -5.125840187072754, -4.875452041625977, -4.625064373016357, -4.37467622756958, -4.124288558959961, -3.8739006519317627, -3.6235127449035645, -3.3731250762939453, -3.122737169265747, -2.872349262237549, -2.6219615936279297, -2.3715736865997314, -2.121185779571533, -1.870798110961914, -1.6204102039337158, -1.3700224161148071, -1.1196346282958984, -0.8692467212677002, -0.6188589334487915, -0.368471622467041, -0.11808380484580994, 0.13230401277542114, 0.3826918601989746, 0.6330796480178833, 0.883467435836792, 1.1338553428649902, 1.384243130683899, 1.6346309185028076, 1.8850187063217163, 2.135406494140625, 2.3857944011688232, 2.6361823081970215, 2.8865699768066406, 3.136957883834839, 3.387345790863037, 3.6377334594726562, 3.8881213665008545, 4.138509273529053, 4.388896942138672, 4.639284610748291, 4.88967227935791, 5.1400604248046875, 5.390448093414307, 5.640835762023926, 5.891223430633545, 6.141611576080322, 6.391999244689941, 6.6423869132995605, 6.89277458190918, 7.143162727355957, 7.393550395965576, 7.6439385414123535]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 3.0, 8.0, 3.0, 9.0, 12.0, 7.0, 12.0, 14.0, 20.0, 24.0, 31.0, 30.0, 29.0, 25.0, 21.0, 29.0, 36.0, 41.0, 35.0, 45.0, 35.0, 25.0, 33.0, 49.0, 34.0, 31.0, 36.0, 36.0, 23.0, 23.0, 33.0, 28.0, 23.0, 32.0, 22.0, 20.0, 15.0, 15.0, 7.0, 8.0, 8.0, 8.0, 2.0, 7.0, 1.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.365355014801025, -5.178637504577637, -4.99191951751709, -4.805201530456543, -4.618484020233154, -4.431766510009766, -4.245048522949219, -4.058330535888672, -3.871613025665283, -3.6848952770233154, -3.4981775283813477, -3.31145977973938, -3.124742031097412, -2.9380242824554443, -2.7513065338134766, -2.564588785171509, -2.377871036529541, -2.1911532878875732, -2.0044355392456055, -1.8177177906036377, -1.63100004196167, -1.4442822933197021, -1.2575645446777344, -1.0708467960357666, -0.8841290473937988, -0.697411298751831, -0.5106935501098633, -0.3239758014678955, -0.13725805282592773, 0.04945969581604004, 0.2361774444580078, 0.4228951930999756, 0.6096124649047852, 0.7963302135467529, 0.9830479621887207, 1.1697657108306885, 1.3564834594726562, 1.543201208114624, 1.7299189567565918, 1.9166367053985596, 2.1033544540405273, 2.290072202682495, 2.476789951324463, 2.6635076999664307, 2.8502254486083984, 3.036943197250366, 3.223660945892334, 3.4103786945343018, 3.5970964431762695, 3.7838141918182373, 3.970531940460205, 4.157249450683594, 4.343967437744141, 4.5306854248046875, 4.717402935028076, 4.904120445251465, 5.090838432312012, 5.277556419372559, 5.464273929595947, 5.650991439819336, 5.837709426879883, 6.02442741394043, 6.211144924163818, 6.397862434387207, 6.584580421447754]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 14.0, 11.0, 19.0, 27.0, 46.0, 85.0, 110.0, 144.0, 210.0, 340.0, 503.0, 711.0, 1077.0, 1590.0, 2314.0, 3439.0, 4952.0, 7198.0, 10986.0, 15869.0, 23954.0, 35254.0, 51168.0, 73986.0, 101835.0, 129538.0, 140483.0, 125238.0, 97098.0, 69661.0, 48319.0, 33202.0, 22352.0, 14985.0, 10102.0, 6992.0, 4694.0, 3210.0, 2181.0, 1457.0, 1038.0, 689.0, 493.0, 326.0, 214.0, 141.0, 109.0, 77.0, 42.0, 33.0, 13.0, 17.0, 8.0, 3.0, 0.0, 0.0, 3.0, 2.0], "bins": [-1.544921875, -1.4972686767578125, -1.449615478515625, -1.4019622802734375, -1.35430908203125, -1.3066558837890625, -1.259002685546875, -1.2113494873046875, -1.1636962890625, -1.1160430908203125, -1.068389892578125, -1.0207366943359375, -0.97308349609375, -0.9254302978515625, -0.877777099609375, -0.8301239013671875, -0.782470703125, -0.7348175048828125, -0.687164306640625, -0.6395111083984375, -0.59185791015625, -0.5442047119140625, -0.496551513671875, -0.4488983154296875, -0.4012451171875, -0.3535919189453125, -0.305938720703125, -0.2582855224609375, -0.21063232421875, -0.1629791259765625, -0.115325927734375, -0.0676727294921875, -0.02001953125, 0.0276336669921875, 0.075286865234375, 0.1229400634765625, 0.17059326171875, 0.2182464599609375, 0.265899658203125, 0.3135528564453125, 0.3612060546875, 0.4088592529296875, 0.456512451171875, 0.5041656494140625, 0.55181884765625, 0.5994720458984375, 0.647125244140625, 0.6947784423828125, 0.742431640625, 0.7900848388671875, 0.837738037109375, 0.8853912353515625, 0.93304443359375, 0.9806976318359375, 1.028350830078125, 1.0760040283203125, 1.1236572265625, 1.1713104248046875, 1.218963623046875, 1.2666168212890625, 1.31427001953125, 1.3619232177734375, 1.409576416015625, 1.4572296142578125, 1.5048828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 6.0, 3.0, 5.0, 11.0, 9.0, 11.0, 15.0, 15.0, 15.0, 24.0, 18.0, 28.0, 36.0, 18.0, 25.0, 30.0, 35.0, 42.0, 42.0, 38.0, 41.0, 29.0, 42.0, 33.0, 42.0, 32.0, 40.0, 28.0, 30.0, 41.0, 19.0, 32.0, 23.0, 27.0, 25.0, 10.0, 14.0, 12.0, 6.0, 12.0, 5.0, 8.0, 10.0, 4.0, 3.0, 1.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0], "bins": [-6.73046875, -6.53253173828125, -6.3345947265625, -6.13665771484375, -5.938720703125, -5.74078369140625, -5.5428466796875, -5.34490966796875, -5.14697265625, -4.94903564453125, -4.7510986328125, -4.55316162109375, -4.355224609375, -4.15728759765625, -3.9593505859375, -3.76141357421875, -3.5634765625, -3.36553955078125, -3.1676025390625, -2.96966552734375, -2.771728515625, -2.57379150390625, -2.3758544921875, -2.17791748046875, -1.97998046875, -1.78204345703125, -1.5841064453125, -1.38616943359375, -1.188232421875, -0.99029541015625, -0.7923583984375, -0.59442138671875, -0.396484375, -0.19854736328125, -0.0006103515625, 0.19732666015625, 0.395263671875, 0.59320068359375, 0.7911376953125, 0.98907470703125, 1.18701171875, 1.38494873046875, 1.5828857421875, 1.78082275390625, 1.978759765625, 2.17669677734375, 2.3746337890625, 2.57257080078125, 2.7705078125, 2.96844482421875, 3.1663818359375, 3.36431884765625, 3.562255859375, 3.76019287109375, 3.9581298828125, 4.15606689453125, 4.35400390625, 4.55194091796875, 4.7498779296875, 4.94781494140625, 5.145751953125, 5.34368896484375, 5.5416259765625, 5.73956298828125, 5.9375]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 4.0, 6.0, 9.0, 17.0, 25.0, 35.0, 48.0, 69.0, 82.0, 139.0, 191.0, 272.0, 399.0, 602.0, 861.0, 1250.0, 1932.0, 3096.0, 5013.0, 8317.0, 15687.0, 35201.0, 765872.0, 153176.0, 24897.0, 12279.0, 6869.0, 4250.0, 2637.0, 1640.0, 1126.0, 804.0, 503.0, 359.0, 243.0, 180.0, 127.0, 83.0, 67.0, 49.0, 34.0, 29.0, 21.0, 14.0, 15.0, 6.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.58203125, -4.43798828125, -4.2939453125, -4.14990234375, -4.005859375, -3.86181640625, -3.7177734375, -3.57373046875, -3.4296875, -3.28564453125, -3.1416015625, -2.99755859375, -2.853515625, -2.70947265625, -2.5654296875, -2.42138671875, -2.27734375, -2.13330078125, -1.9892578125, -1.84521484375, -1.701171875, -1.55712890625, -1.4130859375, -1.26904296875, -1.125, -0.98095703125, -0.8369140625, -0.69287109375, -0.548828125, -0.40478515625, -0.2607421875, -0.11669921875, 0.02734375, 0.17138671875, 0.3154296875, 0.45947265625, 0.603515625, 0.74755859375, 0.8916015625, 1.03564453125, 1.1796875, 1.32373046875, 1.4677734375, 1.61181640625, 1.755859375, 1.89990234375, 2.0439453125, 2.18798828125, 2.33203125, 2.47607421875, 2.6201171875, 2.76416015625, 2.908203125, 3.05224609375, 3.1962890625, 3.34033203125, 3.484375, 3.62841796875, 3.7724609375, 3.91650390625, 4.060546875, 4.20458984375, 4.3486328125, 4.49267578125, 4.63671875]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 19.0, 15.0, 19.0, 20.0, 25.0, 31.0, 28.0, 26.0, 38.0, 48.0, 43.0, 59.0, 47.0, 38.0, 39.0, 51.0, 50.0, 37.0, 44.0, 41.0, 30.0, 32.0, 22.0, 26.0, 20.0, 15.0, 20.0, 19.0, 15.0, 14.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.78515625, -4.6246337890625, -4.464111328125, -4.3035888671875, -4.14306640625, -3.9825439453125, -3.822021484375, -3.6614990234375, -3.5009765625, -3.3404541015625, -3.179931640625, -3.0194091796875, -2.85888671875, -2.6983642578125, -2.537841796875, -2.3773193359375, -2.216796875, -2.0562744140625, -1.895751953125, -1.7352294921875, -1.57470703125, -1.4141845703125, -1.253662109375, -1.0931396484375, -0.9326171875, -0.7720947265625, -0.611572265625, -0.4510498046875, -0.29052734375, -0.1300048828125, 0.030517578125, 0.1910400390625, 0.3515625, 0.5120849609375, 0.672607421875, 0.8331298828125, 0.99365234375, 1.1541748046875, 1.314697265625, 1.4752197265625, 1.6357421875, 1.7962646484375, 1.956787109375, 2.1173095703125, 2.27783203125, 2.4383544921875, 2.598876953125, 2.7593994140625, 2.919921875, 3.0804443359375, 3.240966796875, 3.4014892578125, 3.56201171875, 3.7225341796875, 3.883056640625, 4.0435791015625, 4.2041015625, 4.3646240234375, 4.525146484375, 4.6856689453125, 4.84619140625, 5.0067138671875, 5.167236328125, 5.3277587890625, 5.48828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 6.0, 4.0, 11.0, 15.0, 8.0, 21.0, 27.0, 62.0, 76.0, 114.0, 174.0, 310.0, 588.0, 1168.0, 2704.0, 7048.0, 25005.0, 931472.0, 60389.0, 11932.0, 3936.0, 1636.0, 785.0, 406.0, 253.0, 160.0, 74.0, 62.0, 41.0, 22.0, 14.0, 11.0, 5.0, 6.0, 4.0, 3.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -4.08984375, -3.9609375, -3.83203125, -3.703125, -3.57421875, -3.4453125, -3.31640625, -3.1875, -3.05859375, -2.9296875, -2.80078125, -2.671875, -2.54296875, -2.4140625, -2.28515625, -2.15625, -2.02734375, -1.8984375, -1.76953125, -1.640625, -1.51171875, -1.3828125, -1.25390625, -1.125, -0.99609375, -0.8671875, -0.73828125, -0.609375, -0.48046875, -0.3515625, -0.22265625, -0.09375, 0.03515625, 0.1640625, 0.29296875, 0.421875, 0.55078125, 0.6796875, 0.80859375, 0.9375, 1.06640625, 1.1953125, 1.32421875, 1.453125, 1.58203125, 1.7109375, 1.83984375, 1.96875, 2.09765625, 2.2265625, 2.35546875, 2.484375, 2.61328125, 2.7421875, 2.87109375, 3.0, 3.12890625, 3.2578125, 3.38671875, 3.515625, 3.64453125, 3.7734375, 3.90234375, 4.03125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 10.0, 10.0, 8.0, 9.0, 20.0, 32.0, 40.0, 74.0, 112.0, 172.0, 173.0, 138.0, 77.0, 35.0, 29.0, 22.0, 9.0, 9.0, 11.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023674964904785156, -0.00022937916219234467, -0.00022200867533683777, -0.00021463818848133087, -0.00020726770162582397, -0.00019989721477031708, -0.00019252672791481018, -0.00018515624105930328, -0.0001777857542037964, -0.0001704152673482895, -0.0001630447804927826, -0.0001556742936372757, -0.0001483038067817688, -0.0001409333199262619, -0.000133562833070755, -0.0001261923462152481, -0.00011882185935974121, -0.00011145137250423431, -0.00010408088564872742, -9.671039879322052e-05, -8.933991193771362e-05, -8.196942508220673e-05, -7.459893822669983e-05, -6.722845137119293e-05, -5.9857964515686035e-05, -5.248747766017914e-05, -4.511699080467224e-05, -3.7746503949165344e-05, -3.0376017093658447e-05, -2.300553023815155e-05, -1.5635043382644653e-05, -8.264556527137756e-06, -8.940696716308594e-07, 6.476417183876038e-06, 1.3846904039382935e-05, 2.121739089488983e-05, 2.858787775039673e-05, 3.5958364605903625e-05, 4.332885146141052e-05, 5.069933831691742e-05, 5.8069825172424316e-05, 6.544031202793121e-05, 7.281079888343811e-05, 8.018128573894501e-05, 8.75517725944519e-05, 9.49222594499588e-05, 0.0001022927463054657, 0.0001096632331609726, 0.00011703372001647949, 0.0001244042068719864, 0.00013177469372749329, 0.00013914518058300018, 0.00014651566743850708, 0.00015388615429401398, 0.00016125664114952087, 0.00016862712800502777, 0.00017599761486053467, 0.00018336810171604156, 0.00019073858857154846, 0.00019810907542705536, 0.00020547956228256226, 0.00021285004913806915, 0.00022022053599357605, 0.00022759102284908295, 0.00023496150970458984]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 7.0, 12.0, 14.0, 17.0, 24.0, 30.0, 54.0, 65.0, 108.0, 133.0, 219.0, 339.0, 540.0, 829.0, 1331.0, 2208.0, 3806.0, 7065.0, 12750.0, 25351.0, 51186.0, 107401.0, 227993.0, 293119.0, 161636.0, 75274.0, 36513.0, 18158.0, 9543.0, 5120.0, 2913.0, 1724.0, 1097.0, 650.0, 427.0, 291.0, 177.0, 139.0, 80.0, 62.0, 44.0, 31.0, 17.0, 17.0, 8.0, 8.0, 7.0, 4.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9013671875, -0.87158203125, -0.841796875, -0.81201171875, -0.7822265625, -0.75244140625, -0.72265625, -0.69287109375, -0.6630859375, -0.63330078125, -0.603515625, -0.57373046875, -0.5439453125, -0.51416015625, -0.484375, -0.45458984375, -0.4248046875, -0.39501953125, -0.365234375, -0.33544921875, -0.3056640625, -0.27587890625, -0.24609375, -0.21630859375, -0.1865234375, -0.15673828125, -0.126953125, -0.09716796875, -0.0673828125, -0.03759765625, -0.0078125, 0.02197265625, 0.0517578125, 0.08154296875, 0.111328125, 0.14111328125, 0.1708984375, 0.20068359375, 0.23046875, 0.26025390625, 0.2900390625, 0.31982421875, 0.349609375, 0.37939453125, 0.4091796875, 0.43896484375, 0.46875, 0.49853515625, 0.5283203125, 0.55810546875, 0.587890625, 0.61767578125, 0.6474609375, 0.67724609375, 0.70703125, 0.73681640625, 0.7666015625, 0.79638671875, 0.826171875, 0.85595703125, 0.8857421875, 0.91552734375, 0.9453125, 0.97509765625, 1.0048828125]}, "gradients/decoder.bert.encoder.layer.18.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 6.0, 3.0, 2.0, 9.0, 5.0, 12.0, 15.0, 20.0, 24.0, 14.0, 28.0, 48.0, 87.0, 122.0, 117.0, 114.0, 93.0, 69.0, 38.0, 36.0, 27.0, 24.0, 19.0, 19.0, 8.0, 4.0, 10.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.4370536804199219, -0.42342376708984375, -0.4097938537597656, -0.3961639404296875, -0.3825340270996094, -0.36890411376953125, -0.3552742004394531, -0.341644287109375, -0.3280143737792969, -0.31438446044921875, -0.3007545471191406, -0.2871246337890625, -0.2734947204589844, -0.25986480712890625, -0.24623489379882812, -0.23260498046875, -0.21897506713867188, -0.20534515380859375, -0.19171524047851562, -0.1780853271484375, -0.16445541381835938, -0.15082550048828125, -0.13719558715820312, -0.123565673828125, -0.10993576049804688, -0.09630584716796875, -0.08267593383789062, -0.0690460205078125, -0.055416107177734375, -0.04178619384765625, -0.028156280517578125, -0.0145263671875, -0.000896453857421875, 0.01273345947265625, 0.026363372802734375, 0.0399932861328125, 0.053623199462890625, 0.06725311279296875, 0.08088302612304688, 0.094512939453125, 0.10814285278320312, 0.12177276611328125, 0.13540267944335938, 0.1490325927734375, 0.16266250610351562, 0.17629241943359375, 0.18992233276367188, 0.20355224609375, 0.21718215942382812, 0.23081207275390625, 0.24444198608398438, 0.2580718994140625, 0.2717018127441406, 0.28533172607421875, 0.2989616394042969, 0.312591552734375, 0.3262214660644531, 0.33985137939453125, 0.3534812927246094, 0.3671112060546875, 0.3807411193847656, 0.39437103271484375, 0.4080009460449219, 0.421630859375]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 12.0, 7.0, 16.0, 23.0, 23.0, 23.0, 37.0, 44.0, 40.0, 51.0, 69.0, 70.0, 65.0, 52.0, 73.0, 71.0, 48.0, 39.0, 50.0, 33.0, 24.0, 23.0, 25.0, 14.0, 18.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.509370803833008, -8.254297256469727, -7.9992241859436035, -7.7441511154174805, -7.489077568054199, -7.234004020690918, -6.978930950164795, -6.723857879638672, -6.468784332275391, -6.213710784912109, -5.958637714385986, -5.703564643859863, -5.448491096496582, -5.193417549133301, -4.938344478607178, -4.683271408081055, -4.428197860717773, -4.173124313354492, -3.918051242828369, -3.662977933883667, -3.407904624938965, -3.1528313159942627, -2.8977580070495605, -2.6426846981048584, -2.3876113891601562, -2.132538080215454, -1.877464771270752, -1.6223914623260498, -1.3673181533813477, -1.1122448444366455, -0.8571715354919434, -0.6020982265472412, -0.34702539443969727, -0.09195208549499512, 0.16312122344970703, 0.4181945323944092, 0.6732678413391113, 0.9283411502838135, 1.1834144592285156, 1.4384877681732178, 1.69356107711792, 1.948634386062622, 2.203707695007324, 2.4587810039520264, 2.7138543128967285, 2.9689276218414307, 3.224000930786133, 3.479074239730835, 3.734147548675537, 3.9892208576202393, 4.244294166564941, 4.499367713928223, 4.754440784454346, 5.009513854980469, 5.26458740234375, 5.519660949707031, 5.774734020233154, 6.029807090759277, 6.284880638122559, 6.53995418548584, 6.795027256011963, 7.050100326538086, 7.305173873901367, 7.560247421264648, 7.8153204917907715]}, "gradients/decoder.bert.encoder.layer.18.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 7.0, 4.0, 4.0, 4.0, 6.0, 11.0, 7.0, 12.0, 12.0, 19.0, 20.0, 19.0, 31.0, 36.0, 30.0, 22.0, 31.0, 24.0, 35.0, 45.0, 33.0, 41.0, 27.0, 34.0, 36.0, 44.0, 37.0, 33.0, 35.0, 28.0, 22.0, 32.0, 24.0, 30.0, 22.0, 33.0, 23.0, 13.0, 14.0, 13.0, 13.0, 7.0, 7.0, 8.0, 4.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4951276779174805, -5.30919075012207, -5.12325382232666, -4.937317371368408, -4.751380443572998, -4.565443515777588, -4.379507064819336, -4.193570137023926, -4.007633209228516, -3.8216962814331055, -3.6357595920562744, -3.4498229026794434, -3.263885974884033, -3.077949047088623, -2.892012357711792, -2.706075668334961, -2.520138740539551, -2.3342018127441406, -2.1482651233673096, -1.962328314781189, -1.7763915061950684, -1.5904546976089478, -1.4045178890228271, -1.2185810804367065, -1.032644271850586, -0.8467074632644653, -0.6607706546783447, -0.4748338460922241, -0.2888970375061035, -0.10296022891998291, 0.0829765796661377, 0.2689133882522583, 0.4548501968383789, 0.6407870054244995, 0.8267238140106201, 1.0126606225967407, 1.1985974311828613, 1.384534239768982, 1.5704710483551025, 1.7564078569412231, 1.9423446655273438, 2.128281593322754, 2.314218282699585, 2.500154972076416, 2.686091899871826, 2.8720288276672363, 3.0579655170440674, 3.2439022064208984, 3.4298391342163086, 3.6157760620117188, 3.80171275138855, 3.987649440765381, 4.173586368560791, 4.359523296356201, 4.545459747314453, 4.731396675109863, 4.917333602905273, 5.103270530700684, 5.289207458496094, 5.475143909454346, 5.661080837249756, 5.847017765045166, 6.032954216003418, 6.218891143798828, 6.404828071594238]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 13.0, 24.0, 44.0, 60.0, 85.0, 119.0, 188.0, 322.0, 469.0, 700.0, 1119.0, 1629.0, 2519.0, 3892.0, 6008.0, 9174.0, 14387.0, 21525.0, 33738.0, 50584.0, 73863.0, 102846.0, 128921.0, 140405.0, 129692.0, 103801.0, 75046.0, 50935.0, 33432.0, 22168.0, 14127.0, 9381.0, 6009.0, 3926.0, 2508.0, 1682.0, 1074.0, 714.0, 478.0, 329.0, 206.0, 133.0, 90.0, 56.0, 42.0, 39.0, 20.0, 8.0, 8.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.59765625, -5.42547607421875, -5.2532958984375, -5.08111572265625, -4.908935546875, -4.73675537109375, -4.5645751953125, -4.39239501953125, -4.22021484375, -4.04803466796875, -3.8758544921875, -3.70367431640625, -3.531494140625, -3.35931396484375, -3.1871337890625, -3.01495361328125, -2.8427734375, -2.67059326171875, -2.4984130859375, -2.32623291015625, -2.154052734375, -1.98187255859375, -1.8096923828125, -1.63751220703125, -1.46533203125, -1.29315185546875, -1.1209716796875, -0.94879150390625, -0.776611328125, -0.60443115234375, -0.4322509765625, -0.26007080078125, -0.087890625, 0.08428955078125, 0.2564697265625, 0.42864990234375, 0.600830078125, 0.77301025390625, 0.9451904296875, 1.11737060546875, 1.28955078125, 1.46173095703125, 1.6339111328125, 1.80609130859375, 1.978271484375, 2.15045166015625, 2.3226318359375, 2.49481201171875, 2.6669921875, 2.83917236328125, 3.0113525390625, 3.18353271484375, 3.355712890625, 3.52789306640625, 3.7000732421875, 3.87225341796875, 4.04443359375, 4.21661376953125, 4.3887939453125, 4.56097412109375, 4.733154296875, 4.90533447265625, 5.0775146484375, 5.24969482421875, 5.421875]}, "gradients/decoder.bert.encoder.layer.18.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 3.0, 4.0, 5.0, 3.0, 7.0, 10.0, 13.0, 15.0, 11.0, 23.0, 29.0, 30.0, 29.0, 31.0, 31.0, 42.0, 46.0, 30.0, 37.0, 34.0, 38.0, 37.0, 36.0, 44.0, 37.0, 32.0, 34.0, 40.0, 34.0, 25.0, 30.0, 23.0, 26.0, 20.0, 22.0, 13.0, 17.0, 14.0, 7.0, 8.0, 9.0, 10.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.54296875, -5.3514404296875, -5.159912109375, -4.9683837890625, -4.77685546875, -4.5853271484375, -4.393798828125, -4.2022705078125, -4.0107421875, -3.8192138671875, -3.627685546875, -3.4361572265625, -3.24462890625, -3.0531005859375, -2.861572265625, -2.6700439453125, -2.478515625, -2.2869873046875, -2.095458984375, -1.9039306640625, -1.71240234375, -1.5208740234375, -1.329345703125, -1.1378173828125, -0.9462890625, -0.7547607421875, -0.563232421875, -0.3717041015625, -0.18017578125, 0.0113525390625, 0.202880859375, 0.3944091796875, 0.5859375, 0.7774658203125, 0.968994140625, 1.1605224609375, 1.35205078125, 1.5435791015625, 1.735107421875, 1.9266357421875, 2.1181640625, 2.3096923828125, 2.501220703125, 2.6927490234375, 2.88427734375, 3.0758056640625, 3.267333984375, 3.4588623046875, 3.650390625, 3.8419189453125, 4.033447265625, 4.2249755859375, 4.41650390625, 4.6080322265625, 4.799560546875, 4.9910888671875, 5.1826171875, 5.3741455078125, 5.565673828125, 5.7572021484375, 5.94873046875, 6.1402587890625, 6.331787109375, 6.5233154296875, 6.71484375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 9.0, 7.0, 17.0, 25.0, 26.0, 34.0, 68.0, 105.0, 172.0, 255.0, 427.0, 624.0, 1132.0, 1788.0, 2973.0, 4975.0, 8443.0, 13931.0, 23366.0, 38992.0, 64316.0, 100796.0, 143055.0, 168044.0, 157433.0, 118563.0, 78172.0, 48370.0, 29356.0, 17351.0, 10194.0, 6058.0, 3618.0, 2238.0, 1321.0, 879.0, 521.0, 329.0, 225.0, 116.0, 84.0, 45.0, 49.0, 21.0, 11.0, 5.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.3681640625, -5.193359375, -5.0185546875, -4.84375, -4.6689453125, -4.494140625, -4.3193359375, -4.14453125, -3.9697265625, -3.794921875, -3.6201171875, -3.4453125, -3.2705078125, -3.095703125, -2.9208984375, -2.74609375, -2.5712890625, -2.396484375, -2.2216796875, -2.046875, -1.8720703125, -1.697265625, -1.5224609375, -1.34765625, -1.1728515625, -0.998046875, -0.8232421875, -0.6484375, -0.4736328125, -0.298828125, -0.1240234375, 0.05078125, 0.2255859375, 0.400390625, 0.5751953125, 0.75, 0.9248046875, 1.099609375, 1.2744140625, 1.44921875, 1.6240234375, 1.798828125, 1.9736328125, 2.1484375, 2.3232421875, 2.498046875, 2.6728515625, 2.84765625, 3.0224609375, 3.197265625, 3.3720703125, 3.546875, 3.7216796875, 3.896484375, 4.0712890625, 4.24609375, 4.4208984375, 4.595703125, 4.7705078125, 4.9453125, 5.1201171875, 5.294921875, 5.4697265625, 5.64453125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 6.0, 8.0, 4.0, 9.0, 16.0, 19.0, 19.0, 14.0, 16.0, 28.0, 37.0, 28.0, 37.0, 37.0, 44.0, 43.0, 45.0, 39.0, 36.0, 45.0, 34.0, 40.0, 44.0, 41.0, 37.0, 39.0, 34.0, 32.0, 22.0, 25.0, 28.0, 15.0, 14.0, 14.0, 11.0, 10.0, 10.0, 8.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.5794677734375, -4.440185546875, -4.3009033203125, -4.16162109375, -4.0223388671875, -3.883056640625, -3.7437744140625, -3.6044921875, -3.4652099609375, -3.325927734375, -3.1866455078125, -3.04736328125, -2.9080810546875, -2.768798828125, -2.6295166015625, -2.490234375, -2.3509521484375, -2.211669921875, -2.0723876953125, -1.93310546875, -1.7938232421875, -1.654541015625, -1.5152587890625, -1.3759765625, -1.2366943359375, -1.097412109375, -0.9581298828125, -0.81884765625, -0.6795654296875, -0.540283203125, -0.4010009765625, -0.26171875, -0.1224365234375, 0.016845703125, 0.1561279296875, 0.29541015625, 0.4346923828125, 0.573974609375, 0.7132568359375, 0.8525390625, 0.9918212890625, 1.131103515625, 1.2703857421875, 1.40966796875, 1.5489501953125, 1.688232421875, 1.8275146484375, 1.966796875, 2.1060791015625, 2.245361328125, 2.3846435546875, 2.52392578125, 2.6632080078125, 2.802490234375, 2.9417724609375, 3.0810546875, 3.2203369140625, 3.359619140625, 3.4989013671875, 3.63818359375, 3.7774658203125, 3.916748046875, 4.0560302734375, 4.1953125]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 9.0, 15.0, 15.0, 23.0, 41.0, 55.0, 96.0, 155.0, 226.0, 309.0, 524.0, 925.0, 1578.0, 2840.0, 5515.0, 11137.0, 24638.0, 55484.0, 129480.0, 256659.0, 279352.0, 155041.0, 67460.0, 29344.0, 13382.0, 6448.0, 3367.0, 1790.0, 1029.0, 596.0, 360.0, 234.0, 136.0, 99.0, 63.0, 47.0, 27.0, 18.0, 6.0, 7.0, 10.0, 2.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66796875, -5.45892333984375, -5.2498779296875, -5.04083251953125, -4.831787109375, -4.62274169921875, -4.4136962890625, -4.20465087890625, -3.99560546875, -3.78656005859375, -3.5775146484375, -3.36846923828125, -3.159423828125, -2.95037841796875, -2.7413330078125, -2.53228759765625, -2.3232421875, -2.11419677734375, -1.9051513671875, -1.69610595703125, -1.487060546875, -1.27801513671875, -1.0689697265625, -0.85992431640625, -0.65087890625, -0.44183349609375, -0.2327880859375, -0.02374267578125, 0.185302734375, 0.39434814453125, 0.6033935546875, 0.81243896484375, 1.021484375, 1.23052978515625, 1.4395751953125, 1.64862060546875, 1.857666015625, 2.06671142578125, 2.2757568359375, 2.48480224609375, 2.69384765625, 2.90289306640625, 3.1119384765625, 3.32098388671875, 3.530029296875, 3.73907470703125, 3.9481201171875, 4.15716552734375, 4.3662109375, 4.57525634765625, 4.7843017578125, 4.99334716796875, 5.202392578125, 5.41143798828125, 5.6204833984375, 5.82952880859375, 6.03857421875, 6.24761962890625, 6.4566650390625, 6.66571044921875, 6.874755859375, 7.08380126953125, 7.2928466796875, 7.50189208984375, 7.7109375]}, "gradients/decoder.bert.encoder.layer.18.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 5.0, 8.0, 3.0, 21.0, 14.0, 10.0, 27.0, 33.0, 33.0, 31.0, 44.0, 56.0, 64.0, 60.0, 68.0, 70.0, 66.0, 55.0, 62.0, 44.0, 44.0, 35.0, 33.0, 22.0, 17.0, 19.0, 10.0, 10.0, 8.0, 5.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041675567626953125, -0.0004015490412712097, -0.0003863424062728882, -0.00037113577127456665, -0.0003559291362762451, -0.0003407225012779236, -0.00032551586627960205, -0.0003103092312812805, -0.000295102596282959, -0.00027989596128463745, -0.0002646893262863159, -0.0002494826912879944, -0.00023427605628967285, -0.00021906942129135132, -0.00020386278629302979, -0.00018865615129470825, -0.00017344951629638672, -0.00015824288129806519, -0.00014303624629974365, -0.00012782961130142212, -0.00011262297630310059, -9.741634130477905e-05, -8.220970630645752e-05, -6.700307130813599e-05, -5.179643630981445e-05, -3.658980131149292e-05, -2.1383166313171387e-05, -6.1765313148498535e-06, 9.03010368347168e-06, 2.4236738681793213e-05, 3.9443373680114746e-05, 5.465000867843628e-05, 6.985664367675781e-05, 8.506327867507935e-05, 0.00010026991367340088, 0.00011547654867172241, 0.00013068318367004395, 0.00014588981866836548, 0.000161096453666687, 0.00017630308866500854, 0.00019150972366333008, 0.0002067163586616516, 0.00022192299365997314, 0.00023712962865829468, 0.0002523362636566162, 0.00026754289865493774, 0.0002827495336532593, 0.0002979561686515808, 0.00031316280364990234, 0.0003283694386482239, 0.0003435760736465454, 0.00035878270864486694, 0.0003739893436431885, 0.00038919597864151, 0.00040440261363983154, 0.0004196092486381531, 0.0004348158836364746, 0.00045002251863479614, 0.0004652291536331177, 0.0004804357886314392, 0.0004956424236297607, 0.0005108490586280823, 0.0005260556936264038, 0.0005412623286247253, 0.0005564689636230469]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 1.0, 5.0, 8.0, 5.0, 8.0, 20.0, 22.0, 28.0, 41.0, 79.0, 103.0, 149.0, 213.0, 312.0, 502.0, 708.0, 1220.0, 1899.0, 3073.0, 5131.0, 8952.0, 16131.0, 29022.0, 54822.0, 104114.0, 179691.0, 226630.0, 182494.0, 107502.0, 56600.0, 29833.0, 16107.0, 9292.0, 5182.0, 3165.0, 1922.0, 1251.0, 803.0, 500.0, 317.0, 188.0, 158.0, 132.0, 81.0, 39.0, 44.0, 13.0, 14.0, 10.0, 8.0, 7.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.421875, -5.2601318359375, -5.098388671875, -4.9366455078125, -4.77490234375, -4.6131591796875, -4.451416015625, -4.2896728515625, -4.1279296875, -3.9661865234375, -3.804443359375, -3.6427001953125, -3.48095703125, -3.3192138671875, -3.157470703125, -2.9957275390625, -2.833984375, -2.6722412109375, -2.510498046875, -2.3487548828125, -2.18701171875, -2.0252685546875, -1.863525390625, -1.7017822265625, -1.5400390625, -1.3782958984375, -1.216552734375, -1.0548095703125, -0.89306640625, -0.7313232421875, -0.569580078125, -0.4078369140625, -0.24609375, -0.0843505859375, 0.077392578125, 0.2391357421875, 0.40087890625, 0.5626220703125, 0.724365234375, 0.8861083984375, 1.0478515625, 1.2095947265625, 1.371337890625, 1.5330810546875, 1.69482421875, 1.8565673828125, 2.018310546875, 2.1800537109375, 2.341796875, 2.5035400390625, 2.665283203125, 2.8270263671875, 2.98876953125, 3.1505126953125, 3.312255859375, 3.4739990234375, 3.6357421875, 3.7974853515625, 3.959228515625, 4.1209716796875, 4.28271484375, 4.4444580078125, 4.606201171875, 4.7679443359375, 4.9296875]}, "gradients/decoder.bert.encoder.layer.18.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 9.0, 14.0, 9.0, 15.0, 15.0, 19.0, 17.0, 28.0, 34.0, 33.0, 34.0, 64.0, 73.0, 79.0, 67.0, 63.0, 72.0, 77.0, 57.0, 41.0, 27.0, 21.0, 29.0, 16.0, 18.0, 11.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.38543701171875, -2.3021240234375, -2.21881103515625, -2.135498046875, -2.05218505859375, -1.9688720703125, -1.88555908203125, -1.80224609375, -1.71893310546875, -1.6356201171875, -1.55230712890625, -1.468994140625, -1.38568115234375, -1.3023681640625, -1.21905517578125, -1.1357421875, -1.05242919921875, -0.9691162109375, -0.88580322265625, -0.802490234375, -0.71917724609375, -0.6358642578125, -0.55255126953125, -0.46923828125, -0.38592529296875, -0.3026123046875, -0.21929931640625, -0.135986328125, -0.05267333984375, 0.0306396484375, 0.11395263671875, 0.197265625, 0.28057861328125, 0.3638916015625, 0.44720458984375, 0.530517578125, 0.61383056640625, 0.6971435546875, 0.78045654296875, 0.86376953125, 0.94708251953125, 1.0303955078125, 1.11370849609375, 1.197021484375, 1.28033447265625, 1.3636474609375, 1.44696044921875, 1.5302734375, 1.61358642578125, 1.6968994140625, 1.78021240234375, 1.863525390625, 1.94683837890625, 2.0301513671875, 2.11346435546875, 2.19677734375, 2.28009033203125, 2.3634033203125, 2.44671630859375, 2.530029296875, 2.61334228515625, 2.6966552734375, 2.77996826171875, 2.86328125]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 13.0, 10.0, 6.0, 14.0, 10.0, 19.0, 17.0, 32.0, 35.0, 35.0, 48.0, 60.0, 46.0, 74.0, 56.0, 57.0, 66.0, 58.0, 58.0, 53.0, 37.0, 36.0, 32.0, 28.0, 15.0, 21.0, 10.0, 12.0, 12.0, 0.0, 6.0, 10.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.575044631958008, -7.339587211608887, -7.104129791259766, -6.8686723709106445, -6.633214950561523, -6.397757530212402, -6.162300109863281, -5.92684268951416, -5.691385269165039, -5.455927848815918, -5.220470428466797, -4.985013008117676, -4.749555587768555, -4.514098167419434, -4.2786407470703125, -4.043183326721191, -3.8077259063720703, -3.572268486022949, -3.336811065673828, -3.101353645324707, -2.865896224975586, -2.630438804626465, -2.3949813842773438, -2.1595239639282227, -1.9240665435791016, -1.6886091232299805, -1.4531517028808594, -1.2176942825317383, -0.9822368621826172, -0.7467794418334961, -0.511322021484375, -0.2758646011352539, -0.040407657623291016, 0.19504976272583008, 0.43050718307495117, 0.6659646034240723, 0.9014220237731934, 1.1368794441223145, 1.3723368644714355, 1.6077942848205566, 1.8432517051696777, 2.078709125518799, 2.31416654586792, 2.549623966217041, 2.785081386566162, 3.020538806915283, 3.2559962272644043, 3.4914536476135254, 3.7269110679626465, 3.9623684883117676, 4.197825908660889, 4.43328332901001, 4.668740749359131, 4.904198169708252, 5.139655590057373, 5.375113010406494, 5.610570430755615, 5.846027851104736, 6.081485271453857, 6.3169426918029785, 6.5524001121521, 6.787857532501221, 7.023314952850342, 7.258772373199463, 7.494229793548584]}, "gradients/decoder.bert.encoder.layer.17.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 0.0, 2.0, 2.0, 7.0, 11.0, 8.0, 11.0, 7.0, 15.0, 14.0, 17.0, 17.0, 18.0, 18.0, 30.0, 24.0, 31.0, 29.0, 33.0, 35.0, 38.0, 45.0, 52.0, 45.0, 38.0, 38.0, 33.0, 33.0, 46.0, 29.0, 40.0, 21.0, 42.0, 24.0, 24.0, 21.0, 16.0, 18.0, 9.0, 10.0, 14.0, 7.0, 9.0, 10.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.377585411071777, -6.171494960784912, -5.965404033660889, -5.759313583374023, -5.55322265625, -5.347132205963135, -5.141041278839111, -4.934950828552246, -4.728859901428223, -4.522769451141357, -4.316678524017334, -4.110588073730469, -3.9044971466064453, -3.69840669631958, -3.4923157691955566, -3.2862253189086914, -3.080134630203247, -2.8740439414978027, -2.6679532527923584, -2.461862564086914, -2.2557718753814697, -2.0496811866760254, -1.8435906171798706, -1.6374999284744263, -1.431409239768982, -1.2253185510635376, -1.0192278623580933, -0.8131372332572937, -0.6070465445518494, -0.4009559154510498, -0.19486522674560547, 0.011225461959838867, 0.2173161506652832, 0.42340683937072754, 0.6294975280761719, 0.8355881571769714, 1.0416789054870605, 1.2477694749832153, 1.4538601636886597, 1.659950852394104, 1.8660415410995483, 2.072132110595703, 2.2782227993011475, 2.484313488006592, 2.690404176712036, 2.8964948654174805, 3.102585554122925, 3.308676242828369, 3.5147669315338135, 3.720857620239258, 3.926948308944702, 4.1330389976501465, 4.339129447937012, 4.545220375061035, 4.7513108253479, 4.957401752471924, 5.163492202758789, 5.369582653045654, 5.575673580169678, 5.781764030456543, 5.987854957580566, 6.193945407867432, 6.400036334991455, 6.60612678527832, 6.812217712402344]}, "gradients/decoder.bert.encoder.layer.17.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 5.0, 6.0, 10.0, 12.0, 23.0, 31.0, 45.0, 64.0, 99.0, 172.0, 263.0, 432.0, 763.0, 1329.0, 2203.0, 4114.0, 7551.0, 14057.0, 26835.0, 54393.0, 113600.0, 250912.0, 555324.0, 981052.0, 1027157.0, 617578.0, 282626.0, 127582.0, 60110.0, 30364.0, 15479.0, 8584.0, 4680.0, 2646.0, 1643.0, 1032.0, 568.0, 341.0, 219.0, 124.0, 95.0, 54.0, 34.0, 23.0, 15.0, 14.0, 10.0, 11.0, 6.0, 2.0, 3.0], "bins": [-7.55859375, -7.354736328125, -7.15087890625, -6.947021484375, -6.7431640625, -6.539306640625, -6.33544921875, -6.131591796875, -5.927734375, -5.723876953125, -5.52001953125, -5.316162109375, -5.1123046875, -4.908447265625, -4.70458984375, -4.500732421875, -4.296875, -4.093017578125, -3.88916015625, -3.685302734375, -3.4814453125, -3.277587890625, -3.07373046875, -2.869873046875, -2.666015625, -2.462158203125, -2.25830078125, -2.054443359375, -1.8505859375, -1.646728515625, -1.44287109375, -1.239013671875, -1.03515625, -0.831298828125, -0.62744140625, -0.423583984375, -0.2197265625, -0.015869140625, 0.18798828125, 0.391845703125, 0.595703125, 0.799560546875, 1.00341796875, 1.207275390625, 1.4111328125, 1.614990234375, 1.81884765625, 2.022705078125, 2.2265625, 2.430419921875, 2.63427734375, 2.838134765625, 3.0419921875, 3.245849609375, 3.44970703125, 3.653564453125, 3.857421875, 4.061279296875, 4.26513671875, 4.468994140625, 4.6728515625, 4.876708984375, 5.08056640625, 5.284423828125, 5.48828125]}, "gradients/decoder.bert.encoder.layer.17.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 3.0, 1.0, 3.0, 8.0, 5.0, 10.0, 10.0, 14.0, 15.0, 7.0, 18.0, 16.0, 14.0, 36.0, 31.0, 29.0, 24.0, 28.0, 46.0, 31.0, 38.0, 39.0, 48.0, 57.0, 44.0, 42.0, 32.0, 45.0, 33.0, 28.0, 30.0, 32.0, 31.0, 23.0, 27.0, 19.0, 13.0, 10.0, 11.0, 10.0, 8.0, 12.0, 6.0, 7.0, 6.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.9171142578125, -3.779541015625, -3.6419677734375, -3.50439453125, -3.3668212890625, -3.229248046875, -3.0916748046875, -2.9541015625, -2.8165283203125, -2.678955078125, -2.5413818359375, -2.40380859375, -2.2662353515625, -2.128662109375, -1.9910888671875, -1.853515625, -1.7159423828125, -1.578369140625, -1.4407958984375, -1.30322265625, -1.1656494140625, -1.028076171875, -0.8905029296875, -0.7529296875, -0.6153564453125, -0.477783203125, -0.3402099609375, -0.20263671875, -0.0650634765625, 0.072509765625, 0.2100830078125, 0.34765625, 0.4852294921875, 0.622802734375, 0.7603759765625, 0.89794921875, 1.0355224609375, 1.173095703125, 1.3106689453125, 1.4482421875, 1.5858154296875, 1.723388671875, 1.8609619140625, 1.99853515625, 2.1361083984375, 2.273681640625, 2.4112548828125, 2.548828125, 2.6864013671875, 2.823974609375, 2.9615478515625, 3.09912109375, 3.2366943359375, 3.374267578125, 3.5118408203125, 3.6494140625, 3.7869873046875, 3.924560546875, 4.0621337890625, 4.19970703125, 4.3372802734375, 4.474853515625, 4.6124267578125, 4.75]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 11.0, 12.0, 16.0, 22.0, 47.0, 65.0, 112.0, 177.0, 283.0, 481.0, 867.0, 1513.0, 2632.0, 4895.0, 9265.0, 17573.0, 35404.0, 72164.0, 152932.0, 327481.0, 666678.0, 1048434.0, 908159.0, 495086.0, 233712.0, 109110.0, 52485.0, 26009.0, 13277.0, 6901.0, 3691.0, 2037.0, 1156.0, 628.0, 394.0, 223.0, 133.0, 69.0, 57.0, 39.0, 19.0, 12.0, 9.0, 3.0, 6.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.91217041015625, -5.6993408203125, -5.48651123046875, -5.273681640625, -5.06085205078125, -4.8480224609375, -4.63519287109375, -4.42236328125, -4.20953369140625, -3.9967041015625, -3.78387451171875, -3.571044921875, -3.35821533203125, -3.1453857421875, -2.93255615234375, -2.7197265625, -2.50689697265625, -2.2940673828125, -2.08123779296875, -1.868408203125, -1.65557861328125, -1.4427490234375, -1.22991943359375, -1.01708984375, -0.80426025390625, -0.5914306640625, -0.37860107421875, -0.165771484375, 0.04705810546875, 0.2598876953125, 0.47271728515625, 0.685546875, 0.89837646484375, 1.1112060546875, 1.32403564453125, 1.536865234375, 1.74969482421875, 1.9625244140625, 2.17535400390625, 2.38818359375, 2.60101318359375, 2.8138427734375, 3.02667236328125, 3.239501953125, 3.45233154296875, 3.6651611328125, 3.87799072265625, 4.0908203125, 4.30364990234375, 4.5164794921875, 4.72930908203125, 4.942138671875, 5.15496826171875, 5.3677978515625, 5.58062744140625, 5.79345703125, 6.00628662109375, 6.2191162109375, 6.43194580078125, 6.644775390625, 6.85760498046875, 7.0704345703125, 7.28326416015625, 7.49609375]}, "gradients/decoder.bert.encoder.layer.17.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 8.0, 8.0, 14.0, 24.0, 19.0, 39.0, 33.0, 63.0, 63.0, 96.0, 114.0, 150.0, 167.0, 250.0, 257.0, 262.0, 290.0, 284.0, 308.0, 285.0, 257.0, 231.0, 162.0, 148.0, 135.0, 92.0, 68.0, 45.0, 46.0, 39.0, 31.0, 29.0, 15.0, 11.0, 5.0, 8.0, 6.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.300048828125, -2.22705078125, -2.154052734375, -2.0810546875, -2.008056640625, -1.93505859375, -1.862060546875, -1.7890625, -1.716064453125, -1.64306640625, -1.570068359375, -1.4970703125, -1.424072265625, -1.35107421875, -1.278076171875, -1.205078125, -1.132080078125, -1.05908203125, -0.986083984375, -0.9130859375, -0.840087890625, -0.76708984375, -0.694091796875, -0.62109375, -0.548095703125, -0.47509765625, -0.402099609375, -0.3291015625, -0.256103515625, -0.18310546875, -0.110107421875, -0.037109375, 0.035888671875, 0.10888671875, 0.181884765625, 0.2548828125, 0.327880859375, 0.40087890625, 0.473876953125, 0.546875, 0.619873046875, 0.69287109375, 0.765869140625, 0.8388671875, 0.911865234375, 0.98486328125, 1.057861328125, 1.130859375, 1.203857421875, 1.27685546875, 1.349853515625, 1.4228515625, 1.495849609375, 1.56884765625, 1.641845703125, 1.71484375, 1.787841796875, 1.86083984375, 1.933837890625, 2.0068359375, 2.079833984375, 2.15283203125, 2.225830078125, 2.298828125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 3.0, 7.0, 7.0, 11.0, 16.0, 15.0, 21.0, 25.0, 25.0, 31.0, 42.0, 45.0, 45.0, 40.0, 50.0, 55.0, 54.0, 53.0, 49.0, 51.0, 45.0, 38.0, 38.0, 28.0, 22.0, 28.0, 20.0, 32.0, 17.0, 22.0, 15.0, 5.0, 8.0, 6.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.2724809646606445, -5.1135125160217285, -4.9545440673828125, -4.7955756187438965, -4.6366071701049805, -4.477639198303223, -4.318670749664307, -4.159702301025391, -4.000733852386475, -3.8417654037475586, -3.6827969551086426, -3.5238287448883057, -3.3648602962493896, -3.2058918476104736, -3.0469236373901367, -2.8879551887512207, -2.7289867401123047, -2.5700182914733887, -2.4110498428344727, -2.2520816326141357, -2.0931131839752197, -1.9341447353363037, -1.7751764059066772, -1.6162080764770508, -1.4572396278381348, -1.2982711791992188, -1.1393028497695923, -0.980334460735321, -0.8213660717010498, -0.6623976826667786, -0.5034292936325073, -0.34446096420288086, -0.18549299240112305, -0.026524603366851807, 0.13244378566741943, 0.2914121747016907, 0.4503805637359619, 0.6093489527702332, 0.7683173418045044, 0.9272856712341309, 1.0862541198730469, 1.245222568511963, 1.4041908979415894, 1.5631592273712158, 1.7221276760101318, 1.8810961246490479, 2.0400643348693848, 2.199032783508301, 2.358001232147217, 2.516969680786133, 2.675938129425049, 2.8349063396453857, 2.9938747882843018, 3.1528432369232178, 3.3118114471435547, 3.4707798957824707, 3.6297483444213867, 3.7887167930603027, 3.9476852416992188, 4.106653690338135, 4.265622138977051, 4.424590110778809, 4.583558559417725, 4.742527008056641, 4.901495456695557]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 10.0, 4.0, 7.0, 4.0, 10.0, 12.0, 15.0, 19.0, 21.0, 17.0, 17.0, 30.0, 26.0, 25.0, 29.0, 40.0, 28.0, 40.0, 38.0, 33.0, 45.0, 44.0, 45.0, 29.0, 39.0, 44.0, 45.0, 26.0, 33.0, 28.0, 34.0, 20.0, 15.0, 24.0, 21.0, 12.0, 18.0, 6.0, 7.0, 11.0, 6.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-5.015134334564209, -4.854822158813477, -4.694509506225586, -4.5341973304748535, -4.373885154724121, -4.2135725021362305, -4.053260326385498, -3.8929481506347656, -3.732635736465454, -3.5723233222961426, -3.41201114654541, -3.2516987323760986, -3.091386318206787, -2.9310741424560547, -2.770761728286743, -2.6104493141174316, -2.450137138366699, -2.2898247241973877, -2.1295125484466553, -1.9692001342773438, -1.8088878393173218, -1.6485755443572998, -1.4882631301879883, -1.3279508352279663, -1.1676385402679443, -1.0073262453079224, -0.8470138907432556, -0.6867015361785889, -0.5263892412185669, -0.3660769462585449, -0.20576459169387817, -0.045452237129211426, 0.11486005783081055, 0.2751723825931549, 0.43548470735549927, 0.595797061920166, 0.756109356880188, 0.91642165184021, 1.0767340660095215, 1.2370463609695435, 1.3973586559295654, 1.5576709508895874, 1.7179832458496094, 1.878295660018921, 2.0386080741882324, 2.198920249938965, 2.3592326641082764, 2.519545078277588, 2.6798572540283203, 2.840169668197632, 3.0004818439483643, 3.160794258117676, 3.321106433868408, 3.4814188480377197, 3.6417312622070312, 3.8020434379577637, 3.962355852127075, 4.122668266296387, 4.282980442047119, 4.443292617797852, 4.603605270385742, 4.763917446136475, 4.924229621887207, 5.084542274475098, 5.24485445022583]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 12.0, 9.0, 12.0, 22.0, 39.0, 56.0, 76.0, 160.0, 234.0, 363.0, 563.0, 901.0, 1465.0, 2254.0, 3546.0, 5593.0, 9090.0, 14477.0, 22441.0, 36056.0, 59457.0, 97459.0, 154282.0, 196903.0, 165245.0, 106454.0, 64866.0, 39751.0, 24641.0, 15497.0, 9782.0, 6179.0, 3947.0, 2447.0, 1546.0, 1009.0, 650.0, 368.0, 264.0, 144.0, 122.0, 57.0, 42.0, 26.0, 21.0, 11.0, 8.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.505859375, -1.45965576171875, -1.4134521484375, -1.36724853515625, -1.321044921875, -1.27484130859375, -1.2286376953125, -1.18243408203125, -1.13623046875, -1.09002685546875, -1.0438232421875, -0.99761962890625, -0.951416015625, -0.90521240234375, -0.8590087890625, -0.81280517578125, -0.7666015625, -0.72039794921875, -0.6741943359375, -0.62799072265625, -0.581787109375, -0.53558349609375, -0.4893798828125, -0.44317626953125, -0.39697265625, -0.35076904296875, -0.3045654296875, -0.25836181640625, -0.212158203125, -0.16595458984375, -0.1197509765625, -0.07354736328125, -0.02734375, 0.01885986328125, 0.0650634765625, 0.11126708984375, 0.157470703125, 0.20367431640625, 0.2498779296875, 0.29608154296875, 0.34228515625, 0.38848876953125, 0.4346923828125, 0.48089599609375, 0.527099609375, 0.57330322265625, 0.6195068359375, 0.66571044921875, 0.7119140625, 0.75811767578125, 0.8043212890625, 0.85052490234375, 0.896728515625, 0.94293212890625, 0.9891357421875, 1.03533935546875, 1.08154296875, 1.12774658203125, 1.1739501953125, 1.22015380859375, 1.266357421875, 1.31256103515625, 1.3587646484375, 1.40496826171875, 1.451171875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 5.0, 4.0, 4.0, 9.0, 12.0, 14.0, 16.0, 17.0, 14.0, 18.0, 19.0, 27.0, 25.0, 27.0, 36.0, 22.0, 35.0, 43.0, 30.0, 45.0, 38.0, 44.0, 40.0, 39.0, 45.0, 47.0, 50.0, 26.0, 26.0, 27.0, 27.0, 30.0, 18.0, 23.0, 18.0, 12.0, 12.0, 13.0, 8.0, 6.0, 8.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3515625, -5.181884765625, -5.01220703125, -4.842529296875, -4.6728515625, -4.503173828125, -4.33349609375, -4.163818359375, -3.994140625, -3.824462890625, -3.65478515625, -3.485107421875, -3.3154296875, -3.145751953125, -2.97607421875, -2.806396484375, -2.63671875, -2.467041015625, -2.29736328125, -2.127685546875, -1.9580078125, -1.788330078125, -1.61865234375, -1.448974609375, -1.279296875, -1.109619140625, -0.93994140625, -0.770263671875, -0.6005859375, -0.430908203125, -0.26123046875, -0.091552734375, 0.078125, 0.247802734375, 0.41748046875, 0.587158203125, 0.7568359375, 0.926513671875, 1.09619140625, 1.265869140625, 1.435546875, 1.605224609375, 1.77490234375, 1.944580078125, 2.1142578125, 2.283935546875, 2.45361328125, 2.623291015625, 2.79296875, 2.962646484375, 3.13232421875, 3.302001953125, 3.4716796875, 3.641357421875, 3.81103515625, 3.980712890625, 4.150390625, 4.320068359375, 4.48974609375, 4.659423828125, 4.8291015625, 4.998779296875, 5.16845703125, 5.338134765625, 5.5078125]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 11.0, 13.0, 16.0, 26.0, 25.0, 23.0, 42.0, 54.0, 81.0, 127.0, 171.0, 247.0, 360.0, 479.0, 764.0, 1213.0, 1824.0, 2903.0, 4897.0, 8443.0, 16139.0, 40664.0, 779329.0, 136840.0, 24523.0, 11796.0, 6588.0, 3925.0, 2310.0, 1531.0, 979.0, 626.0, 455.0, 307.0, 219.0, 165.0, 115.0, 80.0, 56.0, 42.0, 38.0, 21.0, 23.0, 18.0, 14.0, 12.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.779296875, -2.69696044921875, -2.6146240234375, -2.53228759765625, -2.449951171875, -2.36761474609375, -2.2852783203125, -2.20294189453125, -2.12060546875, -2.03826904296875, -1.9559326171875, -1.87359619140625, -1.791259765625, -1.70892333984375, -1.6265869140625, -1.54425048828125, -1.4619140625, -1.37957763671875, -1.2972412109375, -1.21490478515625, -1.132568359375, -1.05023193359375, -0.9678955078125, -0.88555908203125, -0.80322265625, -0.72088623046875, -0.6385498046875, -0.55621337890625, -0.473876953125, -0.39154052734375, -0.3092041015625, -0.22686767578125, -0.14453125, -0.06219482421875, 0.0201416015625, 0.10247802734375, 0.184814453125, 0.26715087890625, 0.3494873046875, 0.43182373046875, 0.51416015625, 0.59649658203125, 0.6788330078125, 0.76116943359375, 0.843505859375, 0.92584228515625, 1.0081787109375, 1.09051513671875, 1.1728515625, 1.25518798828125, 1.3375244140625, 1.41986083984375, 1.502197265625, 1.58453369140625, 1.6668701171875, 1.74920654296875, 1.83154296875, 1.91387939453125, 1.9962158203125, 2.07855224609375, 2.160888671875, 2.24322509765625, 2.3255615234375, 2.40789794921875, 2.490234375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 4.0, 9.0, 10.0, 16.0, 12.0, 22.0, 21.0, 30.0, 25.0, 20.0, 34.0, 24.0, 40.0, 36.0, 39.0, 37.0, 38.0, 47.0, 62.0, 51.0, 42.0, 49.0, 45.0, 32.0, 36.0, 26.0, 29.0, 33.0, 24.0, 19.0, 21.0, 11.0, 7.0, 10.0, 6.0, 4.0, 6.0, 4.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.2845458984375, -4.155029296875, -4.0255126953125, -3.89599609375, -3.7664794921875, -3.636962890625, -3.5074462890625, -3.3779296875, -3.2484130859375, -3.118896484375, -2.9893798828125, -2.85986328125, -2.7303466796875, -2.600830078125, -2.4713134765625, -2.341796875, -2.2122802734375, -2.082763671875, -1.9532470703125, -1.82373046875, -1.6942138671875, -1.564697265625, -1.4351806640625, -1.3056640625, -1.1761474609375, -1.046630859375, -0.9171142578125, -0.78759765625, -0.6580810546875, -0.528564453125, -0.3990478515625, -0.26953125, -0.1400146484375, -0.010498046875, 0.1190185546875, 0.24853515625, 0.3780517578125, 0.507568359375, 0.6370849609375, 0.7666015625, 0.8961181640625, 1.025634765625, 1.1551513671875, 1.28466796875, 1.4141845703125, 1.543701171875, 1.6732177734375, 1.802734375, 1.9322509765625, 2.061767578125, 2.1912841796875, 2.32080078125, 2.4503173828125, 2.579833984375, 2.7093505859375, 2.8388671875, 2.9683837890625, 3.097900390625, 3.2274169921875, 3.35693359375, 3.4864501953125, 3.615966796875, 3.7454833984375, 3.875]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 11.0, 4.0, 11.0, 12.0, 21.0, 29.0, 30.0, 54.0, 89.0, 122.0, 213.0, 274.0, 459.0, 741.0, 1093.0, 1814.0, 2993.0, 5206.0, 9811.0, 20261.0, 60863.0, 871769.0, 37539.0, 15947.0, 8226.0, 4347.0, 2562.0, 1485.0, 838.0, 589.0, 400.0, 234.0, 168.0, 113.0, 60.0, 48.0, 40.0, 29.0, 12.0, 20.0, 5.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.048828125, -1.0182952880859375, -0.987762451171875, -0.9572296142578125, -0.92669677734375, -0.8961639404296875, -0.865631103515625, -0.8350982666015625, -0.8045654296875, -0.7740325927734375, -0.743499755859375, -0.7129669189453125, -0.68243408203125, -0.6519012451171875, -0.621368408203125, -0.5908355712890625, -0.560302734375, -0.5297698974609375, -0.499237060546875, -0.4687042236328125, -0.43817138671875, -0.4076385498046875, -0.377105712890625, -0.3465728759765625, -0.3160400390625, -0.2855072021484375, -0.254974365234375, -0.2244415283203125, -0.19390869140625, -0.1633758544921875, -0.132843017578125, -0.1023101806640625, -0.07177734375, -0.0412445068359375, -0.010711669921875, 0.0198211669921875, 0.05035400390625, 0.0808868408203125, 0.111419677734375, 0.1419525146484375, 0.1724853515625, 0.2030181884765625, 0.233551025390625, 0.2640838623046875, 0.29461669921875, 0.3251495361328125, 0.355682373046875, 0.3862152099609375, 0.416748046875, 0.4472808837890625, 0.477813720703125, 0.5083465576171875, 0.53887939453125, 0.5694122314453125, 0.599945068359375, 0.6304779052734375, 0.6610107421875, 0.6915435791015625, 0.722076416015625, 0.7526092529296875, 0.78314208984375, 0.8136749267578125, 0.844207763671875, 0.8747406005859375, 0.9052734375]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 4.0, 20.0, 20.0, 23.0, 25.0, 47.0, 31.0, 42.0, 57.0, 66.0, 74.0, 97.0, 98.0, 79.0, 67.0, 44.0, 49.0, 32.0, 23.0, 26.0, 13.0, 10.0, 12.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.230043411254883e-05, -7.032230496406555e-05, -6.834417581558228e-05, -6.6366046667099e-05, -6.438791751861572e-05, -6.240978837013245e-05, -6.043165922164917e-05, -5.8453530073165894e-05, -5.647540092468262e-05, -5.449727177619934e-05, -5.2519142627716064e-05, -5.054101347923279e-05, -4.856288433074951e-05, -4.6584755182266235e-05, -4.460662603378296e-05, -4.262849688529968e-05, -4.0650367736816406e-05, -3.867223858833313e-05, -3.6694109439849854e-05, -3.471598029136658e-05, -3.27378511428833e-05, -3.0759721994400024e-05, -2.8781592845916748e-05, -2.680346369743347e-05, -2.4825334548950195e-05, -2.284720540046692e-05, -2.0869076251983643e-05, -1.8890947103500366e-05, -1.691281795501709e-05, -1.4934688806533813e-05, -1.2956559658050537e-05, -1.097843050956726e-05, -9.000301361083984e-06, -7.022172212600708e-06, -5.044043064117432e-06, -3.0659139156341553e-06, -1.087784767150879e-06, 8.903443813323975e-07, 2.868473529815674e-06, 4.84660267829895e-06, 6.8247318267822266e-06, 8.802860975265503e-06, 1.078099012374878e-05, 1.2759119272232056e-05, 1.4737248420715332e-05, 1.671537756919861e-05, 1.8693506717681885e-05, 2.067163586616516e-05, 2.2649765014648438e-05, 2.4627894163131714e-05, 2.660602331161499e-05, 2.8584152460098267e-05, 3.056228160858154e-05, 3.254041075706482e-05, 3.4518539905548096e-05, 3.649666905403137e-05, 3.847479820251465e-05, 4.0452927350997925e-05, 4.24310564994812e-05, 4.440918564796448e-05, 4.6387314796447754e-05, 4.836544394493103e-05, 5.034357309341431e-05, 5.232170224189758e-05, 5.429983139038086e-05]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 9.0, 16.0, 15.0, 17.0, 38.0, 43.0, 49.0, 97.0, 185.0, 328.0, 550.0, 960.0, 1830.0, 3415.0, 6944.0, 13551.0, 28670.0, 60807.0, 129134.0, 250156.0, 268851.0, 148465.0, 69563.0, 32799.0, 15724.0, 7827.0, 3877.0, 2055.0, 1086.0, 607.0, 342.0, 194.0, 130.0, 78.0, 50.0, 28.0, 24.0, 9.0, 10.0, 9.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4967193603515625, -0.480743408203125, -0.4647674560546875, -0.44879150390625, -0.4328155517578125, -0.416839599609375, -0.4008636474609375, -0.3848876953125, -0.3689117431640625, -0.352935791015625, -0.3369598388671875, -0.32098388671875, -0.3050079345703125, -0.289031982421875, -0.2730560302734375, -0.257080078125, -0.2411041259765625, -0.225128173828125, -0.2091522216796875, -0.19317626953125, -0.1772003173828125, -0.161224365234375, -0.1452484130859375, -0.1292724609375, -0.1132965087890625, -0.097320556640625, -0.0813446044921875, -0.06536865234375, -0.0493927001953125, -0.033416748046875, -0.0174407958984375, -0.00146484375, 0.0145111083984375, 0.030487060546875, 0.0464630126953125, 0.06243896484375, 0.0784149169921875, 0.094390869140625, 0.1103668212890625, 0.1263427734375, 0.1423187255859375, 0.158294677734375, 0.1742706298828125, 0.19024658203125, 0.2062225341796875, 0.222198486328125, 0.2381744384765625, 0.254150390625, 0.2701263427734375, 0.286102294921875, 0.3020782470703125, 0.31805419921875, 0.3340301513671875, 0.350006103515625, 0.3659820556640625, 0.3819580078125, 0.3979339599609375, 0.413909912109375, 0.4298858642578125, 0.44586181640625, 0.4618377685546875, 0.477813720703125, 0.4937896728515625, 0.509765625]}, "gradients/decoder.bert.encoder.layer.17.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 12.0, 8.0, 17.0, 17.0, 39.0, 34.0, 38.0, 48.0, 70.0, 68.0, 89.0, 75.0, 75.0, 87.0, 73.0, 60.0, 43.0, 22.0, 28.0, 23.0, 13.0, 6.0, 10.0, 11.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-0.2098388671875, -0.2042560577392578, -0.19867324829101562, -0.19309043884277344, -0.18750762939453125, -0.18192481994628906, -0.17634201049804688, -0.1707592010498047, -0.1651763916015625, -0.1595935821533203, -0.15401077270507812, -0.14842796325683594, -0.14284515380859375, -0.13726234436035156, -0.13167953491210938, -0.1260967254638672, -0.120513916015625, -0.11493110656738281, -0.10934829711914062, -0.10376548767089844, -0.09818267822265625, -0.09259986877441406, -0.08701705932617188, -0.08143424987792969, -0.0758514404296875, -0.07026863098144531, -0.06468582153320312, -0.05910301208496094, -0.05352020263671875, -0.04793739318847656, -0.042354583740234375, -0.03677177429199219, -0.03118896484375, -0.025606155395507812, -0.020023345947265625, -0.014440536499023438, -0.00885772705078125, -0.0032749176025390625, 0.002307891845703125, 0.007890701293945312, 0.0134735107421875, 0.019056320190429688, 0.024639129638671875, 0.030221939086914062, 0.03580474853515625, 0.04138755798339844, 0.046970367431640625, 0.05255317687988281, 0.058135986328125, 0.06371879577636719, 0.06930160522460938, 0.07488441467285156, 0.08046722412109375, 0.08605003356933594, 0.09163284301757812, 0.09721565246582031, 0.1027984619140625, 0.10838127136230469, 0.11396408081054688, 0.11954689025878906, 0.12512969970703125, 0.13071250915527344, 0.13629531860351562, 0.1418781280517578, 0.1474609375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 2.0, 8.0, 10.0, 15.0, 19.0, 18.0, 26.0, 22.0, 32.0, 40.0, 54.0, 42.0, 47.0, 48.0, 61.0, 56.0, 56.0, 56.0, 49.0, 46.0, 35.0, 36.0, 24.0, 25.0, 26.0, 24.0, 30.0, 16.0, 17.0, 10.0, 5.0, 13.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.523178577423096, -5.359871864318848, -5.1965651512146, -5.03325891494751, -4.869952201843262, -4.706645488739014, -4.543338775634766, -4.380032539367676, -4.216725826263428, -4.05341911315918, -3.8901126384735107, -3.7268059253692627, -3.5634994506835938, -3.4001927375793457, -3.2368860244750977, -3.0735795497894287, -2.9102728366851807, -2.7469661235809326, -2.5836596488952637, -2.4203529357910156, -2.2570464611053467, -2.0937397480010986, -1.9304331541061401, -1.7671265602111816, -1.6038199663162231, -1.4405133724212646, -1.2772067785263062, -1.1139001846313477, -0.9505935311317444, -0.7872869372367859, -0.6239802837371826, -0.4606736898422241, -0.2973670959472656, -0.13406048715114594, 0.029246121644973755, 0.19255274534225464, 0.35585933923721313, 0.5191659331321716, 0.6824725866317749, 0.8457791805267334, 1.009085774421692, 1.1723923683166504, 1.3356989622116089, 1.4990055561065674, 1.6623122692108154, 1.8256187438964844, 1.9889254570007324, 2.1522321701049805, 2.3155386447906494, 2.4788453578948975, 2.6421518325805664, 2.8054585456848145, 2.9687650203704834, 3.1320717334747314, 3.2953782081604004, 3.4586849212646484, 3.6219916343688965, 3.7852983474731445, 3.9486048221588135, 4.111911296844482, 4.2752180099487305, 4.4385247230529785, 4.601831436157227, 4.765137672424316, 4.9284443855285645]}, "gradients/decoder.bert.encoder.layer.17.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 9.0, 4.0, 5.0, 6.0, 10.0, 11.0, 14.0, 24.0, 19.0, 17.0, 18.0, 28.0, 27.0, 25.0, 33.0, 39.0, 32.0, 34.0, 37.0, 40.0, 40.0, 46.0, 47.0, 30.0, 38.0, 46.0, 38.0, 33.0, 36.0, 25.0, 29.0, 20.0, 16.0, 24.0, 17.0, 14.0, 17.0, 6.0, 7.0, 9.0, 8.0, 3.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.982836723327637, -4.823299407958984, -4.66376256942749, -4.504225254058838, -4.344688415527344, -4.185151100158691, -4.025613784790039, -3.866076946258545, -3.7065396308898926, -3.5470025539398193, -3.387465476989746, -3.2279281616210938, -3.0683910846710205, -2.9088540077209473, -2.749316930770874, -2.589779853820801, -2.4302427768707275, -2.2707056999206543, -2.111168622970581, -1.9516314268112183, -1.7920942306518555, -1.6325571537017822, -1.473020076751709, -1.3134828805923462, -1.153945803642273, -0.9944086670875549, -0.8348715305328369, -0.6753344535827637, -0.5157973170280457, -0.35626018047332764, -0.1967231035232544, -0.0371859073638916, 0.12235116958618164, 0.28188830614089966, 0.4414254128932953, 0.6009625196456909, 0.7604996562004089, 0.920036792755127, 1.0795738697052002, 1.239111065864563, 1.3986481428146362, 1.5581852197647095, 1.7177224159240723, 1.8772594928741455, 2.0367965698242188, 2.196333885192871, 2.3558707237243652, 2.5154080390930176, 2.674945116043091, 2.834482192993164, 2.9940192699432373, 3.1535563468933105, 3.313093662261963, 3.472630739212036, 3.6321678161621094, 3.7917051315307617, 3.951241970062256, 4.110779285430908, 4.270316123962402, 4.429853439331055, 4.589390277862549, 4.748927593231201, 4.908464431762695, 5.068001747131348, 5.2275390625]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 9.0, 19.0, 30.0, 37.0, 69.0, 91.0, 147.0, 166.0, 293.0, 436.0, 675.0, 1011.0, 1577.0, 2447.0, 3633.0, 5691.0, 8898.0, 13709.0, 20948.0, 31653.0, 47290.0, 67888.0, 91961.0, 116406.0, 129122.0, 126939.0, 109260.0, 85095.0, 60657.0, 42179.0, 27765.0, 18248.0, 12246.0, 7693.0, 4997.0, 3171.0, 2053.0, 1373.0, 908.0, 606.0, 396.0, 271.0, 170.0, 119.0, 81.0, 46.0, 26.0, 20.0, 15.0, 7.0, 6.0, 4.0, 2.0, 0.0, 3.0, 2.0], "bins": [-3.712890625, -3.599853515625, -3.48681640625, -3.373779296875, -3.2607421875, -3.147705078125, -3.03466796875, -2.921630859375, -2.80859375, -2.695556640625, -2.58251953125, -2.469482421875, -2.3564453125, -2.243408203125, -2.13037109375, -2.017333984375, -1.904296875, -1.791259765625, -1.67822265625, -1.565185546875, -1.4521484375, -1.339111328125, -1.22607421875, -1.113037109375, -1.0, -0.886962890625, -0.77392578125, -0.660888671875, -0.5478515625, -0.434814453125, -0.32177734375, -0.208740234375, -0.095703125, 0.017333984375, 0.13037109375, 0.243408203125, 0.3564453125, 0.469482421875, 0.58251953125, 0.695556640625, 0.80859375, 0.921630859375, 1.03466796875, 1.147705078125, 1.2607421875, 1.373779296875, 1.48681640625, 1.599853515625, 1.712890625, 1.825927734375, 1.93896484375, 2.052001953125, 2.1650390625, 2.278076171875, 2.39111328125, 2.504150390625, 2.6171875, 2.730224609375, 2.84326171875, 2.956298828125, 3.0693359375, 3.182373046875, 3.29541015625, 3.408447265625, 3.521484375]}, "gradients/decoder.bert.encoder.layer.17.attention.output.dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 8.0, 10.0, 16.0, 10.0, 10.0, 22.0, 23.0, 24.0, 21.0, 32.0, 21.0, 31.0, 34.0, 31.0, 44.0, 46.0, 47.0, 32.0, 39.0, 56.0, 42.0, 36.0, 49.0, 39.0, 39.0, 31.0, 26.0, 20.0, 32.0, 21.0, 19.0, 13.0, 18.0, 5.0, 8.0, 7.0, 5.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.44921875, -5.2750244140625, -5.100830078125, -4.9266357421875, -4.75244140625, -4.5782470703125, -4.404052734375, -4.2298583984375, -4.0556640625, -3.8814697265625, -3.707275390625, -3.5330810546875, -3.35888671875, -3.1846923828125, -3.010498046875, -2.8363037109375, -2.662109375, -2.4879150390625, -2.313720703125, -2.1395263671875, -1.96533203125, -1.7911376953125, -1.616943359375, -1.4427490234375, -1.2685546875, -1.0943603515625, -0.920166015625, -0.7459716796875, -0.57177734375, -0.3975830078125, -0.223388671875, -0.0491943359375, 0.125, 0.2991943359375, 0.473388671875, 0.6475830078125, 0.82177734375, 0.9959716796875, 1.170166015625, 1.3443603515625, 1.5185546875, 1.6927490234375, 1.866943359375, 2.0411376953125, 2.21533203125, 2.3895263671875, 2.563720703125, 2.7379150390625, 2.912109375, 3.0863037109375, 3.260498046875, 3.4346923828125, 3.60888671875, 3.7830810546875, 3.957275390625, 4.1314697265625, 4.3056640625, 4.4798583984375, 4.654052734375, 4.8282470703125, 5.00244140625, 5.1766357421875, 5.350830078125, 5.5250244140625, 5.69921875]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 10.0, 10.0, 17.0, 24.0, 44.0, 64.0, 106.0, 154.0, 255.0, 405.0, 710.0, 1125.0, 1706.0, 2876.0, 4973.0, 8157.0, 14130.0, 24347.0, 41861.0, 68958.0, 107689.0, 147099.0, 167981.0, 153484.0, 115497.0, 75710.0, 45733.0, 26998.0, 15808.0, 9112.0, 5386.0, 3146.0, 1929.0, 1125.0, 742.0, 459.0, 282.0, 142.0, 108.0, 77.0, 47.0, 29.0, 18.0, 11.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.970703125, -3.840911865234375, -3.71112060546875, -3.581329345703125, -3.4515380859375, -3.321746826171875, -3.19195556640625, -3.062164306640625, -2.932373046875, -2.802581787109375, -2.67279052734375, -2.542999267578125, -2.4132080078125, -2.283416748046875, -2.15362548828125, -2.023834228515625, -1.89404296875, -1.764251708984375, -1.63446044921875, -1.504669189453125, -1.3748779296875, -1.245086669921875, -1.11529541015625, -0.985504150390625, -0.855712890625, -0.725921630859375, -0.59613037109375, -0.466339111328125, -0.3365478515625, -0.206756591796875, -0.07696533203125, 0.052825927734375, 0.1826171875, 0.312408447265625, 0.44219970703125, 0.571990966796875, 0.7017822265625, 0.831573486328125, 0.96136474609375, 1.091156005859375, 1.220947265625, 1.350738525390625, 1.48052978515625, 1.610321044921875, 1.7401123046875, 1.869903564453125, 1.99969482421875, 2.129486083984375, 2.25927734375, 2.389068603515625, 2.51885986328125, 2.648651123046875, 2.7784423828125, 2.908233642578125, 3.03802490234375, 3.167816162109375, 3.297607421875, 3.427398681640625, 3.55718994140625, 3.686981201171875, 3.8167724609375, 3.946563720703125, 4.07635498046875, 4.206146240234375, 4.3359375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 12.0, 9.0, 15.0, 20.0, 9.0, 20.0, 22.0, 23.0, 35.0, 34.0, 41.0, 35.0, 41.0, 42.0, 47.0, 30.0, 45.0, 31.0, 46.0, 40.0, 29.0, 43.0, 33.0, 44.0, 33.0, 29.0, 41.0, 18.0, 23.0, 19.0, 13.0, 14.0, 7.0, 7.0, 5.0, 7.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0], "bins": [-4.21875, -4.10357666015625, -3.9884033203125, -3.87322998046875, -3.758056640625, -3.64288330078125, -3.5277099609375, -3.41253662109375, -3.29736328125, -3.18218994140625, -3.0670166015625, -2.95184326171875, -2.836669921875, -2.72149658203125, -2.6063232421875, -2.49114990234375, -2.3759765625, -2.26080322265625, -2.1456298828125, -2.03045654296875, -1.915283203125, -1.80010986328125, -1.6849365234375, -1.56976318359375, -1.45458984375, -1.33941650390625, -1.2242431640625, -1.10906982421875, -0.993896484375, -0.87872314453125, -0.7635498046875, -0.64837646484375, -0.533203125, -0.41802978515625, -0.3028564453125, -0.18768310546875, -0.072509765625, 0.04266357421875, 0.1578369140625, 0.27301025390625, 0.38818359375, 0.50335693359375, 0.6185302734375, 0.73370361328125, 0.848876953125, 0.96405029296875, 1.0792236328125, 1.19439697265625, 1.3095703125, 1.42474365234375, 1.5399169921875, 1.65509033203125, 1.770263671875, 1.88543701171875, 2.0006103515625, 2.11578369140625, 2.23095703125, 2.34613037109375, 2.4613037109375, 2.57647705078125, 2.691650390625, 2.80682373046875, 2.9219970703125, 3.03717041015625, 3.15234375]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 21.0, 11.0, 21.0, 36.0, 62.0, 90.0, 139.0, 200.0, 334.0, 559.0, 918.0, 1443.0, 2535.0, 4650.0, 8566.0, 16714.0, 33900.0, 71808.0, 147502.0, 241923.0, 237495.0, 142613.0, 69330.0, 32823.0, 16024.0, 8211.0, 4371.0, 2496.0, 1434.0, 897.0, 488.0, 295.0, 203.0, 147.0, 91.0, 64.0, 39.0, 32.0, 17.0, 16.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.04779052734375, -3.9080810546875, -3.76837158203125, -3.628662109375, -3.48895263671875, -3.3492431640625, -3.20953369140625, -3.06982421875, -2.93011474609375, -2.7904052734375, -2.65069580078125, -2.510986328125, -2.37127685546875, -2.2315673828125, -2.09185791015625, -1.9521484375, -1.81243896484375, -1.6727294921875, -1.53302001953125, -1.393310546875, -1.25360107421875, -1.1138916015625, -0.97418212890625, -0.83447265625, -0.69476318359375, -0.5550537109375, -0.41534423828125, -0.275634765625, -0.13592529296875, 0.0037841796875, 0.14349365234375, 0.283203125, 0.42291259765625, 0.5626220703125, 0.70233154296875, 0.842041015625, 0.98175048828125, 1.1214599609375, 1.26116943359375, 1.40087890625, 1.54058837890625, 1.6802978515625, 1.82000732421875, 1.959716796875, 2.09942626953125, 2.2391357421875, 2.37884521484375, 2.5185546875, 2.65826416015625, 2.7979736328125, 2.93768310546875, 3.077392578125, 3.21710205078125, 3.3568115234375, 3.49652099609375, 3.63623046875, 3.77593994140625, 3.9156494140625, 4.05535888671875, 4.195068359375, 4.33477783203125, 4.4744873046875, 4.61419677734375, 4.75390625]}, "gradients/decoder.bert.encoder.layer.17.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 3.0, 6.0, 7.0, 8.0, 5.0, 7.0, 13.0, 14.0, 17.0, 26.0, 25.0, 33.0, 46.0, 32.0, 37.0, 32.0, 56.0, 58.0, 48.0, 56.0, 41.0, 50.0, 53.0, 45.0, 38.0, 36.0, 42.0, 25.0, 18.0, 23.0, 14.0, 13.0, 11.0, 14.0, 10.0, 11.0, 6.0, 8.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0], "bins": [-0.0003337860107421875, -0.00032532960176467896, -0.0003168731927871704, -0.00030841678380966187, -0.0002999603748321533, -0.0002915039658546448, -0.00028304755687713623, -0.0002745911478996277, -0.00026613473892211914, -0.0002576783299446106, -0.00024922192096710205, -0.0002407655119895935, -0.00023230910301208496, -0.00022385269403457642, -0.00021539628505706787, -0.00020693987607955933, -0.00019848346710205078, -0.00019002705812454224, -0.0001815706491470337, -0.00017311424016952515, -0.0001646578311920166, -0.00015620142221450806, -0.0001477450132369995, -0.00013928860425949097, -0.00013083219528198242, -0.00012237578630447388, -0.00011391937732696533, -0.00010546296834945679, -9.700655937194824e-05, -8.85501503944397e-05, -8.009374141693115e-05, -7.163733243942261e-05, -6.318092346191406e-05, -5.472451448440552e-05, -4.626810550689697e-05, -3.781169652938843e-05, -2.9355287551879883e-05, -2.0898878574371338e-05, -1.2442469596862793e-05, -3.986060619354248e-06, 4.470348358154297e-06, 1.2926757335662842e-05, 2.1383166313171387e-05, 2.983957529067993e-05, 3.8295984268188477e-05, 4.675239324569702e-05, 5.5208802223205566e-05, 6.366521120071411e-05, 7.212162017822266e-05, 8.05780291557312e-05, 8.903443813323975e-05, 9.749084711074829e-05, 0.00010594725608825684, 0.00011440366506576538, 0.00012286007404327393, 0.00013131648302078247, 0.00013977289199829102, 0.00014822930097579956, 0.0001566857099533081, 0.00016514211893081665, 0.0001735985279083252, 0.00018205493688583374, 0.00019051134586334229, 0.00019896775484085083, 0.00020742416381835938]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 5.0, 4.0, 3.0, 14.0, 11.0, 24.0, 35.0, 38.0, 63.0, 101.0, 146.0, 200.0, 314.0, 418.0, 699.0, 1087.0, 1675.0, 2839.0, 5052.0, 9280.0, 19445.0, 43308.0, 101597.0, 211365.0, 282234.0, 197792.0, 92375.0, 39637.0, 18064.0, 8744.0, 4749.0, 2643.0, 1627.0, 1010.0, 679.0, 429.0, 289.0, 179.0, 122.0, 94.0, 50.0, 34.0, 30.0, 19.0, 12.0, 8.0, 6.0, 5.0, 3.0, 0.0, 4.0, 2.0], "bins": [-5.796875, -5.6378173828125, -5.478759765625, -5.3197021484375, -5.16064453125, -5.0015869140625, -4.842529296875, -4.6834716796875, -4.5244140625, -4.3653564453125, -4.206298828125, -4.0472412109375, -3.88818359375, -3.7291259765625, -3.570068359375, -3.4110107421875, -3.251953125, -3.0928955078125, -2.933837890625, -2.7747802734375, -2.61572265625, -2.4566650390625, -2.297607421875, -2.1385498046875, -1.9794921875, -1.8204345703125, -1.661376953125, -1.5023193359375, -1.34326171875, -1.1842041015625, -1.025146484375, -0.8660888671875, -0.70703125, -0.5479736328125, -0.388916015625, -0.2298583984375, -0.07080078125, 0.0882568359375, 0.247314453125, 0.4063720703125, 0.5654296875, 0.7244873046875, 0.883544921875, 1.0426025390625, 1.20166015625, 1.3607177734375, 1.519775390625, 1.6788330078125, 1.837890625, 1.9969482421875, 2.156005859375, 2.3150634765625, 2.47412109375, 2.6331787109375, 2.792236328125, 2.9512939453125, 3.1103515625, 3.2694091796875, 3.428466796875, 3.5875244140625, 3.74658203125, 3.9056396484375, 4.064697265625, 4.2237548828125, 4.3828125]}, "gradients/decoder.bert.encoder.layer.17.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 3.0, 10.0, 11.0, 6.0, 9.0, 11.0, 11.0, 15.0, 29.0, 36.0, 45.0, 35.0, 42.0, 48.0, 60.0, 62.0, 79.0, 63.0, 54.0, 62.0, 60.0, 42.0, 41.0, 28.0, 16.0, 24.0, 20.0, 20.0, 7.0, 15.0, 6.0, 4.0, 4.0, 5.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.38671875, -1.346282958984375, -1.30584716796875, -1.265411376953125, -1.2249755859375, -1.184539794921875, -1.14410400390625, -1.103668212890625, -1.063232421875, -1.022796630859375, -0.98236083984375, -0.941925048828125, -0.9014892578125, -0.861053466796875, -0.82061767578125, -0.780181884765625, -0.73974609375, -0.699310302734375, -0.65887451171875, -0.618438720703125, -0.5780029296875, -0.537567138671875, -0.49713134765625, -0.456695556640625, -0.416259765625, -0.375823974609375, -0.33538818359375, -0.294952392578125, -0.2545166015625, -0.214080810546875, -0.17364501953125, -0.133209228515625, -0.0927734375, -0.052337646484375, -0.01190185546875, 0.028533935546875, 0.0689697265625, 0.109405517578125, 0.14984130859375, 0.190277099609375, 0.230712890625, 0.271148681640625, 0.31158447265625, 0.352020263671875, 0.3924560546875, 0.432891845703125, 0.47332763671875, 0.513763427734375, 0.55419921875, 0.594635009765625, 0.63507080078125, 0.675506591796875, 0.7159423828125, 0.756378173828125, 0.79681396484375, 0.837249755859375, 0.877685546875, 0.918121337890625, 0.95855712890625, 0.998992919921875, 1.0394287109375, 1.079864501953125, 1.12030029296875, 1.160736083984375, 1.201171875]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 5.0, 1.0, 5.0, 5.0, 11.0, 9.0, 7.0, 11.0, 15.0, 17.0, 24.0, 22.0, 34.0, 42.0, 47.0, 45.0, 37.0, 62.0, 72.0, 60.0, 46.0, 55.0, 43.0, 42.0, 42.0, 36.0, 30.0, 20.0, 40.0, 22.0, 10.0, 10.0, 15.0, 16.0, 9.0, 8.0, 3.0, 8.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.03448486328125, -4.875150203704834, -4.715815544128418, -4.55648136138916, -4.397146701812744, -4.237812042236328, -4.078477382659912, -3.919142723083496, -3.759808301925659, -3.600473642349243, -3.4411392211914062, -3.2818045616149902, -3.122469902038574, -2.9631354808807373, -2.8038008213043213, -2.6444664001464844, -2.4851317405700684, -2.3257970809936523, -2.1664626598358154, -2.0071280002593994, -1.847793459892273, -1.6884589195251465, -1.5291242599487305, -1.369789719581604, -1.2104551792144775, -1.051120638847351, -0.8917860388755798, -0.7324514389038086, -0.5731168985366821, -0.41378235816955566, -0.2544477581977844, -0.09511315822601318, 0.06422138214111328, 0.22355595231056213, 0.382890522480011, 0.5422251224517822, 0.7015596628189087, 0.8608942031860352, 1.0202288627624512, 1.1795634031295776, 1.338897943496704, 1.4982324838638306, 1.657567024230957, 1.816901683807373, 1.9762362241744995, 2.135570764541626, 2.294905424118042, 2.454239845275879, 2.613574504852295, 2.772909164428711, 2.932243585586548, 3.091578245162964, 3.250912666320801, 3.410247325897217, 3.569581985473633, 3.728916645050049, 3.8882510662078857, 4.047585487365723, 4.206920146942139, 4.366254806518555, 4.525589466094971, 4.684924125671387, 4.8442583084106445, 5.0035929679870605, 5.162927627563477]}, "gradients/decoder.bert.encoder.layer.16.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 6.0, 3.0, 6.0, 9.0, 13.0, 14.0, 16.0, 20.0, 20.0, 35.0, 33.0, 32.0, 39.0, 44.0, 31.0, 40.0, 39.0, 33.0, 47.0, 44.0, 37.0, 50.0, 49.0, 41.0, 32.0, 42.0, 40.0, 39.0, 29.0, 22.0, 17.0, 15.0, 20.0, 11.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.929340362548828, -5.738770961761475, -5.548201084136963, -5.357631683349609, -5.167062282562256, -4.976492881774902, -4.785923004150391, -4.595353603363037, -4.404784202575684, -4.21421480178833, -4.023644924163818, -3.833075523376465, -3.6425061225891113, -3.4519364833831787, -3.261366844177246, -3.0707974433898926, -2.880227565765381, -2.6896579265594482, -2.4990885257720947, -2.308518886566162, -2.1179494857788086, -1.927379846572876, -1.7368102073669434, -1.5462406873703003, -1.3556711673736572, -1.1651016473770142, -0.9745320677757263, -0.7839624881744385, -0.5933929681777954, -0.40282344818115234, -0.21225380897521973, -0.02168428897857666, 0.1688847541809082, 0.35945430397987366, 0.5500238537788391, 0.740593433380127, 0.93116295337677, 1.121732473373413, 1.3123021125793457, 1.5028716325759888, 1.6934411525726318, 1.884010672569275, 2.074580192565918, 2.2651498317718506, 2.455719470977783, 2.6462888717651367, 2.8368585109710693, 3.027428150177002, 3.2179975509643555, 3.408567190170288, 3.5991365909576416, 3.789706230163574, 3.9802756309509277, 4.170845031738281, 4.361414909362793, 4.5519843101501465, 4.7425537109375, 4.9331231117248535, 5.123692989349365, 5.314262390136719, 5.504831790924072, 5.695401191711426, 5.8859710693359375, 6.076540470123291, 6.267110347747803]}, "gradients/decoder.bert.encoder.layer.16.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 10.0, 21.0, 24.0, 41.0, 41.0, 82.0, 116.0, 201.0, 284.0, 478.0, 789.0, 1168.0, 2006.0, 3234.0, 5904.0, 10743.0, 19451.0, 37751.0, 75361.0, 158241.0, 348517.0, 719261.0, 1051797.0, 876378.0, 463245.0, 211989.0, 100278.0, 49468.0, 25574.0, 13357.0, 7524.0, 4327.0, 2524.0, 1455.0, 944.0, 588.0, 357.0, 249.0, 151.0, 109.0, 68.0, 51.0, 32.0, 17.0, 22.0, 17.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-5.30859375, -5.14617919921875, -4.9837646484375, -4.82135009765625, -4.658935546875, -4.49652099609375, -4.3341064453125, -4.17169189453125, -4.00927734375, -3.84686279296875, -3.6844482421875, -3.52203369140625, -3.359619140625, -3.19720458984375, -3.0347900390625, -2.87237548828125, -2.7099609375, -2.54754638671875, -2.3851318359375, -2.22271728515625, -2.060302734375, -1.89788818359375, -1.7354736328125, -1.57305908203125, -1.41064453125, -1.24822998046875, -1.0858154296875, -0.92340087890625, -0.760986328125, -0.59857177734375, -0.4361572265625, -0.27374267578125, -0.111328125, 0.05108642578125, 0.2135009765625, 0.37591552734375, 0.538330078125, 0.70074462890625, 0.8631591796875, 1.02557373046875, 1.18798828125, 1.35040283203125, 1.5128173828125, 1.67523193359375, 1.837646484375, 2.00006103515625, 2.1624755859375, 2.32489013671875, 2.4873046875, 2.64971923828125, 2.8121337890625, 2.97454833984375, 3.136962890625, 3.29937744140625, 3.4617919921875, 3.62420654296875, 3.78662109375, 3.94903564453125, 4.1114501953125, 4.27386474609375, 4.436279296875, 4.59869384765625, 4.7611083984375, 4.92352294921875, 5.0859375]}, "gradients/decoder.bert.encoder.layer.16.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 14.0, 17.0, 17.0, 18.0, 24.0, 18.0, 27.0, 39.0, 30.0, 28.0, 39.0, 25.0, 42.0, 41.0, 45.0, 40.0, 53.0, 47.0, 47.0, 43.0, 35.0, 38.0, 34.0, 30.0, 26.0, 36.0, 28.0, 27.0, 17.0, 8.0, 10.0, 9.0, 3.0, 6.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.275390625, -3.153289794921875, -3.03118896484375, -2.909088134765625, -2.7869873046875, -2.664886474609375, -2.54278564453125, -2.420684814453125, -2.298583984375, -2.176483154296875, -2.05438232421875, -1.932281494140625, -1.8101806640625, -1.688079833984375, -1.56597900390625, -1.443878173828125, -1.32177734375, -1.199676513671875, -1.07757568359375, -0.955474853515625, -0.8333740234375, -0.711273193359375, -0.58917236328125, -0.467071533203125, -0.344970703125, -0.222869873046875, -0.10076904296875, 0.021331787109375, 0.1434326171875, 0.265533447265625, 0.38763427734375, 0.509735107421875, 0.6318359375, 0.753936767578125, 0.87603759765625, 0.998138427734375, 1.1202392578125, 1.242340087890625, 1.36444091796875, 1.486541748046875, 1.608642578125, 1.730743408203125, 1.85284423828125, 1.974945068359375, 2.0970458984375, 2.219146728515625, 2.34124755859375, 2.463348388671875, 2.58544921875, 2.707550048828125, 2.82965087890625, 2.951751708984375, 3.0738525390625, 3.195953369140625, 3.31805419921875, 3.440155029296875, 3.562255859375, 3.684356689453125, 3.80645751953125, 3.928558349609375, 4.0506591796875, 4.172760009765625, 4.29486083984375, 4.416961669921875, 4.5390625]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 8.0, 21.0, 30.0, 32.0, 66.0, 104.0, 138.0, 220.0, 315.0, 552.0, 947.0, 1406.0, 2253.0, 3637.0, 5947.0, 9990.0, 16953.0, 29437.0, 52027.0, 95323.0, 175390.0, 326459.0, 577620.0, 852951.0, 828420.0, 543543.0, 303535.0, 162962.0, 87997.0, 48459.0, 27739.0, 15861.0, 9379.0, 5537.0, 3382.0, 2073.0, 1287.0, 822.0, 509.0, 332.0, 220.0, 130.0, 93.0, 70.0, 36.0, 28.0, 14.0, 11.0, 2.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.35455322265625, -4.2091064453125, -4.06365966796875, -3.918212890625, -3.77276611328125, -3.6273193359375, -3.48187255859375, -3.33642578125, -3.19097900390625, -3.0455322265625, -2.90008544921875, -2.754638671875, -2.60919189453125, -2.4637451171875, -2.31829833984375, -2.1728515625, -2.02740478515625, -1.8819580078125, -1.73651123046875, -1.591064453125, -1.44561767578125, -1.3001708984375, -1.15472412109375, -1.00927734375, -0.86383056640625, -0.7183837890625, -0.57293701171875, -0.427490234375, -0.28204345703125, -0.1365966796875, 0.00885009765625, 0.154296875, 0.29974365234375, 0.4451904296875, 0.59063720703125, 0.736083984375, 0.88153076171875, 1.0269775390625, 1.17242431640625, 1.31787109375, 1.46331787109375, 1.6087646484375, 1.75421142578125, 1.899658203125, 2.04510498046875, 2.1905517578125, 2.33599853515625, 2.4814453125, 2.62689208984375, 2.7723388671875, 2.91778564453125, 3.063232421875, 3.20867919921875, 3.3541259765625, 3.49957275390625, 3.64501953125, 3.79046630859375, 3.9359130859375, 4.08135986328125, 4.226806640625, 4.37225341796875, 4.5177001953125, 4.66314697265625, 4.80859375]}, "gradients/decoder.bert.encoder.layer.16.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 16.0, 12.0, 18.0, 25.0, 28.0, 32.0, 42.0, 50.0, 59.0, 60.0, 95.0, 115.0, 135.0, 179.0, 170.0, 209.0, 220.0, 208.0, 284.0, 279.0, 213.0, 253.0, 189.0, 174.0, 163.0, 145.0, 137.0, 93.0, 84.0, 70.0, 55.0, 51.0, 42.0, 35.0, 26.0, 17.0, 18.0, 17.0, 12.0, 13.0, 3.0, 6.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.630859375, -1.5804443359375, -1.530029296875, -1.4796142578125, -1.42919921875, -1.3787841796875, -1.328369140625, -1.2779541015625, -1.2275390625, -1.1771240234375, -1.126708984375, -1.0762939453125, -1.02587890625, -0.9754638671875, -0.925048828125, -0.8746337890625, -0.82421875, -0.7738037109375, -0.723388671875, -0.6729736328125, -0.62255859375, -0.5721435546875, -0.521728515625, -0.4713134765625, -0.4208984375, -0.3704833984375, -0.320068359375, -0.2696533203125, -0.21923828125, -0.1688232421875, -0.118408203125, -0.0679931640625, -0.017578125, 0.0328369140625, 0.083251953125, 0.1336669921875, 0.18408203125, 0.2344970703125, 0.284912109375, 0.3353271484375, 0.3857421875, 0.4361572265625, 0.486572265625, 0.5369873046875, 0.58740234375, 0.6378173828125, 0.688232421875, 0.7386474609375, 0.7890625, 0.8394775390625, 0.889892578125, 0.9403076171875, 0.99072265625, 1.0411376953125, 1.091552734375, 1.1419677734375, 1.1923828125, 1.2427978515625, 1.293212890625, 1.3436279296875, 1.39404296875, 1.4444580078125, 1.494873046875, 1.5452880859375, 1.595703125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 2.0, 6.0, 7.0, 10.0, 9.0, 16.0, 22.0, 17.0, 16.0, 32.0, 29.0, 33.0, 44.0, 46.0, 43.0, 54.0, 54.0, 56.0, 56.0, 61.0, 41.0, 44.0, 48.0, 40.0, 31.0, 29.0, 27.0, 24.0, 17.0, 13.0, 13.0, 8.0, 11.0, 11.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3879594802856445, -4.246031284332275, -4.104103088378906, -3.962175130844116, -3.820246934890747, -3.678318738937378, -3.536390781402588, -3.3944625854492188, -3.2525343894958496, -3.1106061935424805, -2.9686779975891113, -2.8267500400543213, -2.684821844100952, -2.542893648147583, -2.400965690612793, -2.259037494659424, -2.1171092987060547, -1.9751811027526855, -1.833253026008606, -1.6913249492645264, -1.5493967533111572, -1.407468557357788, -1.2655404806137085, -1.123612403869629, -0.9816842079162598, -0.8397560715675354, -0.697827935218811, -0.5558997988700867, -0.4139716625213623, -0.27204352617263794, -0.13011538982391357, 0.011812746524810791, 0.15374135971069336, 0.2956694960594177, 0.4375976324081421, 0.5795257687568665, 0.7214539051055908, 0.8633820414543152, 1.0053101778030396, 1.1472382545471191, 1.2891664505004883, 1.4310946464538574, 1.573022723197937, 1.7149507999420166, 1.8568789958953857, 1.9988071918487549, 2.140735149383545, 2.282663345336914, 2.424591541290283, 2.5665197372436523, 2.7084479331970215, 2.8503758907318115, 2.9923040866851807, 3.13423228263855, 3.27616024017334, 3.418088436126709, 3.560016632080078, 3.7019448280334473, 3.8438730239868164, 3.9858009815216064, 4.127729415893555, 4.269657135009766, 4.411585330963135, 4.553513526916504, 4.695441722869873]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 8.0, 3.0, 4.0, 4.0, 10.0, 7.0, 19.0, 14.0, 27.0, 17.0, 29.0, 32.0, 38.0, 32.0, 38.0, 43.0, 43.0, 39.0, 47.0, 40.0, 51.0, 47.0, 51.0, 38.0, 43.0, 35.0, 37.0, 35.0, 27.0, 25.0, 25.0, 20.0, 16.0, 13.0, 14.0, 15.0, 7.0, 2.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.613129138946533, -4.4596991539001465, -4.306269645690918, -4.152839660644531, -3.9994101524353027, -3.845980167388916, -3.6925504207611084, -3.539120674133301, -3.385690927505493, -3.2322611808776855, -3.078831434249878, -2.9254016876220703, -2.7719717025756836, -2.618542194366455, -2.4651122093200684, -2.3116824626922607, -2.158252716064453, -2.0048229694366455, -1.851393222808838, -1.6979633569717407, -1.544533610343933, -1.3911038637161255, -1.2376739978790283, -1.0842442512512207, -0.9308145046234131, -0.7773847579956055, -0.6239549517631531, -0.47052517533302307, -0.31709539890289307, -0.16366565227508545, -0.010235846042633057, 0.14319396018981934, 0.29662418365478516, 0.45005396008491516, 0.6034837365150452, 0.7569135427474976, 0.9103432893753052, 1.0637730360031128, 1.21720290184021, 1.3706326484680176, 1.5240623950958252, 1.6774921417236328, 1.8309218883514404, 1.9843517541885376, 2.1377816200256348, 2.2912111282348633, 2.44464111328125, 2.5980708599090576, 2.7515006065368652, 2.904930353164673, 3.0583600997924805, 3.211789846420288, 3.3652195930480957, 3.5186495780944824, 3.67207932472229, 3.8255090713500977, 3.9789388179779053, 4.132368564605713, 4.2857985496521, 4.439228057861328, 4.592658042907715, 4.746087551116943, 4.89951753616333, 5.052947044372559, 5.206377029418945]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 14.0, 12.0, 16.0, 30.0, 41.0, 55.0, 99.0, 144.0, 218.0, 299.0, 506.0, 823.0, 1177.0, 1984.0, 3190.0, 5086.0, 8205.0, 13608.0, 22396.0, 37473.0, 64275.0, 114339.0, 198871.0, 229550.0, 146395.0, 81896.0, 46594.0, 27638.0, 16649.0, 10221.0, 6193.0, 3832.0, 2464.0, 1560.0, 976.0, 596.0, 389.0, 237.0, 161.0, 121.0, 72.0, 53.0, 36.0, 17.0, 11.0, 13.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.97412109375, -0.9429092407226562, -0.9116973876953125, -0.8804855346679688, -0.849273681640625, -0.8180618286132812, -0.7868499755859375, -0.7556381225585938, -0.72442626953125, -0.6932144165039062, -0.6620025634765625, -0.6307907104492188, -0.599578857421875, -0.5683670043945312, -0.5371551513671875, -0.5059432983398438, -0.4747314453125, -0.44351959228515625, -0.4123077392578125, -0.38109588623046875, -0.349884033203125, -0.31867218017578125, -0.2874603271484375, -0.25624847412109375, -0.22503662109375, -0.19382476806640625, -0.1626129150390625, -0.13140106201171875, -0.100189208984375, -0.06897735595703125, -0.0377655029296875, -0.00655364990234375, 0.024658203125, 0.05587005615234375, 0.0870819091796875, 0.11829376220703125, 0.149505615234375, 0.18071746826171875, 0.2119293212890625, 0.24314117431640625, 0.27435302734375, 0.30556488037109375, 0.3367767333984375, 0.36798858642578125, 0.399200439453125, 0.43041229248046875, 0.4616241455078125, 0.49283599853515625, 0.5240478515625, 0.5552597045898438, 0.5864715576171875, 0.6176834106445312, 0.648895263671875, 0.6801071166992188, 0.7113189697265625, 0.7425308227539062, 0.77374267578125, 0.8049545288085938, 0.8361663818359375, 0.8673782348632812, 0.898590087890625, 0.9298019409179688, 0.9610137939453125, 0.9922256469726562, 1.0234375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 11.0, 13.0, 14.0, 21.0, 23.0, 26.0, 32.0, 32.0, 31.0, 41.0, 43.0, 41.0, 40.0, 54.0, 45.0, 50.0, 41.0, 48.0, 35.0, 31.0, 47.0, 25.0, 32.0, 24.0, 31.0, 25.0, 27.0, 14.0, 17.0, 15.0, 8.0, 9.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.3070068359375, -4.153076171875, -3.9991455078125, -3.84521484375, -3.6912841796875, -3.537353515625, -3.3834228515625, -3.2294921875, -3.0755615234375, -2.921630859375, -2.7677001953125, -2.61376953125, -2.4598388671875, -2.305908203125, -2.1519775390625, -1.998046875, -1.8441162109375, -1.690185546875, -1.5362548828125, -1.38232421875, -1.2283935546875, -1.074462890625, -0.9205322265625, -0.7666015625, -0.6126708984375, -0.458740234375, -0.3048095703125, -0.15087890625, 0.0030517578125, 0.156982421875, 0.3109130859375, 0.46484375, 0.6187744140625, 0.772705078125, 0.9266357421875, 1.08056640625, 1.2344970703125, 1.388427734375, 1.5423583984375, 1.6962890625, 1.8502197265625, 2.004150390625, 2.1580810546875, 2.31201171875, 2.4659423828125, 2.619873046875, 2.7738037109375, 2.927734375, 3.0816650390625, 3.235595703125, 3.3895263671875, 3.54345703125, 3.6973876953125, 3.851318359375, 4.0052490234375, 4.1591796875, 4.3131103515625, 4.467041015625, 4.6209716796875, 4.77490234375, 4.9288330078125, 5.082763671875, 5.2366943359375, 5.390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 3.0, 5.0, 11.0, 12.0, 20.0, 21.0, 27.0, 41.0, 57.0, 75.0, 101.0, 142.0, 199.0, 354.0, 525.0, 841.0, 1317.0, 2486.0, 4523.0, 9072.0, 21008.0, 96462.0, 834453.0, 45634.0, 15258.0, 7095.0, 3590.0, 2003.0, 1165.0, 717.0, 422.0, 286.0, 197.0, 113.0, 89.0, 60.0, 49.0, 29.0, 27.0, 26.0, 9.0, 12.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0546875, -1.9930419921875, -1.931396484375, -1.8697509765625, -1.80810546875, -1.7464599609375, -1.684814453125, -1.6231689453125, -1.5615234375, -1.4998779296875, -1.438232421875, -1.3765869140625, -1.31494140625, -1.2532958984375, -1.191650390625, -1.1300048828125, -1.068359375, -1.0067138671875, -0.945068359375, -0.8834228515625, -0.82177734375, -0.7601318359375, -0.698486328125, -0.6368408203125, -0.5751953125, -0.5135498046875, -0.451904296875, -0.3902587890625, -0.32861328125, -0.2669677734375, -0.205322265625, -0.1436767578125, -0.08203125, -0.0203857421875, 0.041259765625, 0.1029052734375, 0.16455078125, 0.2261962890625, 0.287841796875, 0.3494873046875, 0.4111328125, 0.4727783203125, 0.534423828125, 0.5960693359375, 0.65771484375, 0.7193603515625, 0.781005859375, 0.8426513671875, 0.904296875, 0.9659423828125, 1.027587890625, 1.0892333984375, 1.15087890625, 1.2125244140625, 1.274169921875, 1.3358154296875, 1.3974609375, 1.4591064453125, 1.520751953125, 1.5823974609375, 1.64404296875, 1.7056884765625, 1.767333984375, 1.8289794921875, 1.890625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 9.0, 8.0, 9.0, 4.0, 5.0, 11.0, 15.0, 13.0, 18.0, 15.0, 21.0, 29.0, 21.0, 26.0, 28.0, 37.0, 35.0, 38.0, 30.0, 35.0, 31.0, 32.0, 36.0, 42.0, 26.0, 48.0, 29.0, 38.0, 28.0, 36.0, 26.0, 22.0, 24.0, 23.0, 21.0, 17.0, 15.0, 16.0, 16.0, 17.0, 10.0, 7.0, 2.0, 12.0, 2.0, 5.0, 6.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-2.783203125, -2.7017822265625, -2.620361328125, -2.5389404296875, -2.45751953125, -2.3760986328125, -2.294677734375, -2.2132568359375, -2.1318359375, -2.0504150390625, -1.968994140625, -1.8875732421875, -1.80615234375, -1.7247314453125, -1.643310546875, -1.5618896484375, -1.48046875, -1.3990478515625, -1.317626953125, -1.2362060546875, -1.15478515625, -1.0733642578125, -0.991943359375, -0.9105224609375, -0.8291015625, -0.7476806640625, -0.666259765625, -0.5848388671875, -0.50341796875, -0.4219970703125, -0.340576171875, -0.2591552734375, -0.177734375, -0.0963134765625, -0.014892578125, 0.0665283203125, 0.14794921875, 0.2293701171875, 0.310791015625, 0.3922119140625, 0.4736328125, 0.5550537109375, 0.636474609375, 0.7178955078125, 0.79931640625, 0.8807373046875, 0.962158203125, 1.0435791015625, 1.125, 1.2064208984375, 1.287841796875, 1.3692626953125, 1.45068359375, 1.5321044921875, 1.613525390625, 1.6949462890625, 1.7763671875, 1.8577880859375, 1.939208984375, 2.0206298828125, 2.10205078125, 2.1834716796875, 2.264892578125, 2.3463134765625, 2.427734375]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 14.0, 20.0, 18.0, 30.0, 50.0, 46.0, 91.0, 139.0, 166.0, 281.0, 399.0, 616.0, 930.0, 1532.0, 2360.0, 3991.0, 6751.0, 12522.0, 25831.0, 239775.0, 689487.0, 29896.0, 14107.0, 7703.0, 4362.0, 2725.0, 1654.0, 998.0, 671.0, 408.0, 292.0, 200.0, 138.0, 91.0, 66.0, 45.0, 43.0, 24.0, 9.0, 19.0, 10.0, 11.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.49609375, -0.480133056640625, -0.46417236328125, -0.448211669921875, -0.4322509765625, -0.416290283203125, -0.40032958984375, -0.384368896484375, -0.368408203125, -0.352447509765625, -0.33648681640625, -0.320526123046875, -0.3045654296875, -0.288604736328125, -0.27264404296875, -0.256683349609375, -0.24072265625, -0.224761962890625, -0.20880126953125, -0.192840576171875, -0.1768798828125, -0.160919189453125, -0.14495849609375, -0.128997802734375, -0.113037109375, -0.097076416015625, -0.08111572265625, -0.065155029296875, -0.0491943359375, -0.033233642578125, -0.01727294921875, -0.001312255859375, 0.0146484375, 0.030609130859375, 0.04656982421875, 0.062530517578125, 0.0784912109375, 0.094451904296875, 0.11041259765625, 0.126373291015625, 0.142333984375, 0.158294677734375, 0.17425537109375, 0.190216064453125, 0.2061767578125, 0.222137451171875, 0.23809814453125, 0.254058837890625, 0.27001953125, 0.285980224609375, 0.30194091796875, 0.317901611328125, 0.3338623046875, 0.349822998046875, 0.36578369140625, 0.381744384765625, 0.397705078125, 0.413665771484375, 0.42962646484375, 0.445587158203125, 0.4615478515625, 0.477508544921875, 0.49346923828125, 0.509429931640625, 0.525390625]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 5.0, 4.0, 16.0, 14.0, 14.0, 22.0, 20.0, 32.0, 28.0, 44.0, 40.0, 60.0, 68.0, 65.0, 62.0, 62.0, 74.0, 65.0, 56.0, 43.0, 33.0, 41.0, 25.0, 22.0, 16.0, 15.0, 9.0, 8.0, 10.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.522634506225586e-05, -3.412831574678421e-05, -3.303028643131256e-05, -3.193225711584091e-05, -3.083422780036926e-05, -2.9736198484897614e-05, -2.8638169169425964e-05, -2.7540139853954315e-05, -2.6442110538482666e-05, -2.5344081223011017e-05, -2.4246051907539368e-05, -2.314802259206772e-05, -2.204999327659607e-05, -2.095196396112442e-05, -1.985393464565277e-05, -1.8755905330181122e-05, -1.7657876014709473e-05, -1.6559846699237823e-05, -1.5461817383766174e-05, -1.4363788068294525e-05, -1.3265758752822876e-05, -1.2167729437351227e-05, -1.1069700121879578e-05, -9.971670806407928e-06, -8.87364149093628e-06, -7.77561217546463e-06, -6.677582859992981e-06, -5.579553544521332e-06, -4.481524229049683e-06, -3.3834949135780334e-06, -2.2854655981063843e-06, -1.1874362826347351e-06, -8.940696716308594e-08, 1.0086223483085632e-06, 2.1066516637802124e-06, 3.2046809792518616e-06, 4.302710294723511e-06, 5.40073961019516e-06, 6.498768925666809e-06, 7.596798241138458e-06, 8.694827556610107e-06, 9.792856872081757e-06, 1.0890886187553406e-05, 1.1988915503025055e-05, 1.3086944818496704e-05, 1.4184974133968353e-05, 1.5283003449440002e-05, 1.638103276491165e-05, 1.74790620803833e-05, 1.857709139585495e-05, 1.96751207113266e-05, 2.0773150026798248e-05, 2.1871179342269897e-05, 2.2969208657741547e-05, 2.4067237973213196e-05, 2.5165267288684845e-05, 2.6263296604156494e-05, 2.7361325919628143e-05, 2.8459355235099792e-05, 2.955738455057144e-05, 3.065541386604309e-05, 3.175344318151474e-05, 3.285147249698639e-05, 3.394950181245804e-05, 3.504753112792969e-05]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 7.0, 12.0, 16.0, 17.0, 28.0, 50.0, 72.0, 115.0, 153.0, 265.0, 389.0, 574.0, 888.0, 1505.0, 2376.0, 3832.0, 6175.0, 10601.0, 18098.0, 33031.0, 64891.0, 132735.0, 243584.0, 247169.0, 136058.0, 65858.0, 34056.0, 18449.0, 10566.0, 6400.0, 3971.0, 2381.0, 1522.0, 948.0, 572.0, 396.0, 279.0, 187.0, 101.0, 74.0, 53.0, 34.0, 24.0, 13.0, 12.0, 8.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.253173828125, -0.24573135375976562, -0.23828887939453125, -0.23084640502929688, -0.2234039306640625, -0.21596145629882812, -0.20851898193359375, -0.20107650756835938, -0.193634033203125, -0.18619155883789062, -0.17874908447265625, -0.17130661010742188, -0.1638641357421875, -0.15642166137695312, -0.14897918701171875, -0.14153671264648438, -0.13409423828125, -0.12665176391601562, -0.11920928955078125, -0.11176681518554688, -0.1043243408203125, -0.09688186645507812, -0.08943939208984375, -0.08199691772460938, -0.074554443359375, -0.06711196899414062, -0.05966949462890625, -0.052227020263671875, -0.0447845458984375, -0.037342071533203125, -0.02989959716796875, -0.022457122802734375, -0.0150146484375, -0.007572174072265625, -0.00012969970703125, 0.007312774658203125, 0.0147552490234375, 0.022197723388671875, 0.02964019775390625, 0.037082672119140625, 0.044525146484375, 0.051967620849609375, 0.05941009521484375, 0.06685256958007812, 0.0742950439453125, 0.08173751831054688, 0.08917999267578125, 0.09662246704101562, 0.10406494140625, 0.11150741577148438, 0.11894989013671875, 0.12639236450195312, 0.1338348388671875, 0.14127731323242188, 0.14871978759765625, 0.15616226196289062, 0.163604736328125, 0.17104721069335938, 0.17848968505859375, 0.18593215942382812, 0.1933746337890625, 0.20081710815429688, 0.20825958251953125, 0.21570205688476562, 0.22314453125]}, "gradients/decoder.bert.encoder.layer.16.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 8.0, 2.0, 5.0, 5.0, 7.0, 4.0, 10.0, 6.0, 8.0, 14.0, 14.0, 11.0, 18.0, 17.0, 34.0, 26.0, 42.0, 54.0, 35.0, 78.0, 94.0, 54.0, 65.0, 82.0, 52.0, 64.0, 34.0, 37.0, 27.0, 18.0, 12.0, 16.0, 3.0, 10.0, 5.0, 8.0, 5.0, 3.0, 5.0, 2.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06451416015625, -0.06237983703613281, -0.060245513916015625, -0.05811119079589844, -0.05597686767578125, -0.05384254455566406, -0.051708221435546875, -0.04957389831542969, -0.0474395751953125, -0.04530525207519531, -0.043170928955078125, -0.04103660583496094, -0.03890228271484375, -0.03676795959472656, -0.034633636474609375, -0.03249931335449219, -0.030364990234375, -0.028230667114257812, -0.026096343994140625, -0.023962020874023438, -0.02182769775390625, -0.019693374633789062, -0.017559051513671875, -0.015424728393554688, -0.0132904052734375, -0.011156082153320312, -0.009021759033203125, -0.0068874359130859375, -0.00475311279296875, -0.0026187896728515625, -0.000484466552734375, 0.0016498565673828125, 0.0037841796875, 0.0059185028076171875, 0.008052825927734375, 0.010187149047851562, 0.01232147216796875, 0.014455795288085938, 0.016590118408203125, 0.018724441528320312, 0.0208587646484375, 0.022993087768554688, 0.025127410888671875, 0.027261734008789062, 0.02939605712890625, 0.03153038024902344, 0.033664703369140625, 0.03579902648925781, 0.037933349609375, 0.04006767272949219, 0.042201995849609375, 0.04433631896972656, 0.04647064208984375, 0.04860496520996094, 0.050739288330078125, 0.05287361145019531, 0.0550079345703125, 0.05714225769042969, 0.059276580810546875, 0.06141090393066406, 0.06354522705078125, 0.06567955017089844, 0.06781387329101562, 0.06994819641113281, 0.07208251953125]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 4.0, 8.0, 6.0, 15.0, 20.0, 16.0, 17.0, 24.0, 28.0, 23.0, 42.0, 51.0, 45.0, 49.0, 56.0, 50.0, 66.0, 63.0, 50.0, 50.0, 48.0, 42.0, 33.0, 31.0, 31.0, 23.0, 16.0, 18.0, 15.0, 13.0, 9.0, 9.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.650997161865234, -4.503167152404785, -4.355337142944336, -4.207507133483887, -4.0596771240234375, -3.9118471145629883, -3.764017343521118, -3.616187334060669, -3.4683573246002197, -3.3205273151397705, -3.1726973056793213, -3.024867296218872, -2.877037525177002, -2.7292075157165527, -2.5813775062561035, -2.4335474967956543, -2.285717487335205, -2.137887477874756, -1.9900574684143066, -1.842227578163147, -1.6943975687026978, -1.5465675592422485, -1.3987376689910889, -1.2509076595306396, -1.1030776500701904, -0.9552476406097412, -0.8074176907539368, -0.6595877408981323, -0.5117577314376831, -0.3639277219772339, -0.21609777212142944, -0.068267822265625, 0.07956171035766602, 0.22739169001579285, 0.3752216696739197, 0.5230516195297241, 0.6708816289901733, 0.8187116384506226, 0.966541588306427, 1.1143715381622314, 1.2622015476226807, 1.4100315570831299, 1.557861566543579, 1.7056914567947388, 1.853521466255188, 2.0013513565063477, 2.149181365966797, 2.297011375427246, 2.4448413848876953, 2.5926713943481445, 2.7405014038085938, 2.888331413269043, 3.036161422729492, 3.1839914321899414, 3.3318212032318115, 3.4796512126922607, 3.62748122215271, 3.775311231613159, 3.9231412410736084, 4.0709710121154785, 4.218801021575928, 4.366631031036377, 4.514461040496826, 4.662291049957275, 4.810121059417725]}, "gradients/decoder.bert.encoder.layer.16.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 7.0, 4.0, 3.0, 5.0, 11.0, 7.0, 17.0, 15.0, 26.0, 19.0, 25.0, 36.0, 36.0, 32.0, 43.0, 37.0, 45.0, 41.0, 47.0, 34.0, 54.0, 49.0, 50.0, 37.0, 46.0, 33.0, 34.0, 37.0, 28.0, 24.0, 25.0, 21.0, 18.0, 13.0, 13.0, 12.0, 9.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5604777336120605, -4.408585071563721, -4.256692409515381, -4.104799270629883, -3.952906608581543, -3.801013946533203, -3.6491212844848633, -3.4972286224365234, -3.3453357219696045, -3.1934430599212646, -3.0415501594543457, -2.889657497406006, -2.737764835357666, -2.585871934890747, -2.4339792728424072, -2.2820863723754883, -2.1301937103271484, -1.978300929069519, -1.8264081478118896, -1.6745154857635498, -1.5226227045059204, -1.370729923248291, -1.2188372611999512, -1.0669444799423218, -0.9150516986846924, -0.763158917427063, -0.6112661957740784, -0.45937344431877136, -0.30748069286346436, -0.15558791160583496, -0.003695189952850342, 0.14819753170013428, 0.30009031295776367, 0.4519830644130707, 0.6038758158683777, 0.7557685375213623, 0.9076613187789917, 1.059554100036621, 1.211446762084961, 1.3633395433425903, 1.5152323246002197, 1.6671251058578491, 1.8190178871154785, 1.9709105491638184, 2.122803211212158, 2.274696111679077, 2.426588773727417, 2.578481674194336, 2.730374336242676, 2.8822669982910156, 3.0341598987579346, 3.1860525608062744, 3.3379454612731934, 3.489838123321533, 3.641730785369873, 3.793623447418213, 3.945516347885132, 4.097409248352051, 4.249301910400391, 4.4011945724487305, 4.55308723449707, 4.70497989654541, 4.856873035430908, 5.008765697479248, 5.160658359527588]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 7.0, 16.0, 31.0, 37.0, 61.0, 83.0, 143.0, 220.0, 350.0, 517.0, 915.0, 1425.0, 2264.0, 3506.0, 5834.0, 9748.0, 16038.0, 26385.0, 42806.0, 67352.0, 98925.0, 132972.0, 152158.0, 144648.0, 117352.0, 83135.0, 54537.0, 34108.0, 20838.0, 12308.0, 7697.0, 4670.0, 2722.0, 1746.0, 1093.0, 697.0, 419.0, 269.0, 184.0, 117.0, 78.0, 47.0, 42.0, 27.0, 13.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.157562255859375, -3.05145263671875, -2.945343017578125, -2.8392333984375, -2.733123779296875, -2.62701416015625, -2.520904541015625, -2.414794921875, -2.308685302734375, -2.20257568359375, -2.096466064453125, -1.9903564453125, -1.884246826171875, -1.77813720703125, -1.672027587890625, -1.56591796875, -1.459808349609375, -1.35369873046875, -1.247589111328125, -1.1414794921875, -1.035369873046875, -0.92926025390625, -0.823150634765625, -0.717041015625, -0.610931396484375, -0.50482177734375, -0.398712158203125, -0.2926025390625, -0.186492919921875, -0.08038330078125, 0.025726318359375, 0.1318359375, 0.237945556640625, 0.34405517578125, 0.450164794921875, 0.5562744140625, 0.662384033203125, 0.76849365234375, 0.874603271484375, 0.980712890625, 1.086822509765625, 1.19293212890625, 1.299041748046875, 1.4051513671875, 1.511260986328125, 1.61737060546875, 1.723480224609375, 1.82958984375, 1.935699462890625, 2.04180908203125, 2.147918701171875, 2.2540283203125, 2.360137939453125, 2.46624755859375, 2.572357177734375, 2.678466796875, 2.784576416015625, 2.89068603515625, 2.996795654296875, 3.1029052734375, 3.209014892578125, 3.31512451171875, 3.421234130859375, 3.52734375]}, "gradients/decoder.bert.encoder.layer.16.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 5.0, 7.0, 11.0, 6.0, 15.0, 19.0, 21.0, 22.0, 25.0, 38.0, 32.0, 42.0, 40.0, 43.0, 48.0, 51.0, 44.0, 63.0, 59.0, 45.0, 39.0, 41.0, 36.0, 33.0, 35.0, 33.0, 35.0, 23.0, 20.0, 14.0, 12.0, 12.0, 7.0, 11.0, 2.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.05987548828125, -4.8931884765625, -4.72650146484375, -4.559814453125, -4.39312744140625, -4.2264404296875, -4.05975341796875, -3.89306640625, -3.72637939453125, -3.5596923828125, -3.39300537109375, -3.226318359375, -3.05963134765625, -2.8929443359375, -2.72625732421875, -2.5595703125, -2.39288330078125, -2.2261962890625, -2.05950927734375, -1.892822265625, -1.72613525390625, -1.5594482421875, -1.39276123046875, -1.22607421875, -1.05938720703125, -0.8927001953125, -0.72601318359375, -0.559326171875, -0.39263916015625, -0.2259521484375, -0.05926513671875, 0.107421875, 0.27410888671875, 0.4407958984375, 0.60748291015625, 0.774169921875, 0.94085693359375, 1.1075439453125, 1.27423095703125, 1.44091796875, 1.60760498046875, 1.7742919921875, 1.94097900390625, 2.107666015625, 2.27435302734375, 2.4410400390625, 2.60772705078125, 2.7744140625, 2.94110107421875, 3.1077880859375, 3.27447509765625, 3.441162109375, 3.60784912109375, 3.7745361328125, 3.94122314453125, 4.10791015625, 4.27459716796875, 4.4412841796875, 4.60797119140625, 4.774658203125, 4.94134521484375, 5.1080322265625, 5.27471923828125, 5.44140625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 15.0, 14.0, 24.0, 36.0, 49.0, 77.0, 143.0, 211.0, 362.0, 530.0, 956.0, 1526.0, 2468.0, 4352.0, 7592.0, 12887.0, 22606.0, 38692.0, 64015.0, 100705.0, 139782.0, 165317.0, 156828.0, 122383.0, 82795.0, 51511.0, 30274.0, 17703.0, 10173.0, 5957.0, 3477.0, 1948.0, 1209.0, 707.0, 423.0, 300.0, 188.0, 110.0, 80.0, 49.0, 22.0, 20.0, 10.0, 12.0, 9.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.552734375, -3.4443359375, -3.3359375, -3.2275390625, -3.119140625, -3.0107421875, -2.90234375, -2.7939453125, -2.685546875, -2.5771484375, -2.46875, -2.3603515625, -2.251953125, -2.1435546875, -2.03515625, -1.9267578125, -1.818359375, -1.7099609375, -1.6015625, -1.4931640625, -1.384765625, -1.2763671875, -1.16796875, -1.0595703125, -0.951171875, -0.8427734375, -0.734375, -0.6259765625, -0.517578125, -0.4091796875, -0.30078125, -0.1923828125, -0.083984375, 0.0244140625, 0.1328125, 0.2412109375, 0.349609375, 0.4580078125, 0.56640625, 0.6748046875, 0.783203125, 0.8916015625, 1.0, 1.1083984375, 1.216796875, 1.3251953125, 1.43359375, 1.5419921875, 1.650390625, 1.7587890625, 1.8671875, 1.9755859375, 2.083984375, 2.1923828125, 2.30078125, 2.4091796875, 2.517578125, 2.6259765625, 2.734375, 2.8427734375, 2.951171875, 3.0595703125, 3.16796875, 3.2763671875, 3.384765625]}, "gradients/decoder.bert.encoder.layer.16.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 5.0, 5.0, 2.0, 15.0, 9.0, 10.0, 20.0, 20.0, 21.0, 23.0, 24.0, 35.0, 33.0, 34.0, 46.0, 23.0, 40.0, 29.0, 46.0, 32.0, 32.0, 33.0, 38.0, 31.0, 24.0, 30.0, 28.0, 39.0, 36.0, 35.0, 16.0, 20.0, 21.0, 20.0, 18.0, 20.0, 7.0, 11.0, 11.0, 7.0, 8.0, 2.0, 6.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.33984375, -2.263916015625, -2.18798828125, -2.112060546875, -2.0361328125, -1.960205078125, -1.88427734375, -1.808349609375, -1.732421875, -1.656494140625, -1.58056640625, -1.504638671875, -1.4287109375, -1.352783203125, -1.27685546875, -1.200927734375, -1.125, -1.049072265625, -0.97314453125, -0.897216796875, -0.8212890625, -0.745361328125, -0.66943359375, -0.593505859375, -0.517578125, -0.441650390625, -0.36572265625, -0.289794921875, -0.2138671875, -0.137939453125, -0.06201171875, 0.013916015625, 0.08984375, 0.165771484375, 0.24169921875, 0.317626953125, 0.3935546875, 0.469482421875, 0.54541015625, 0.621337890625, 0.697265625, 0.773193359375, 0.84912109375, 0.925048828125, 1.0009765625, 1.076904296875, 1.15283203125, 1.228759765625, 1.3046875, 1.380615234375, 1.45654296875, 1.532470703125, 1.6083984375, 1.684326171875, 1.76025390625, 1.836181640625, 1.912109375, 1.988037109375, 2.06396484375, 2.139892578125, 2.2158203125, 2.291748046875, 2.36767578125, 2.443603515625, 2.51953125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 14.0, 21.0, 28.0, 37.0, 52.0, 90.0, 129.0, 214.0, 359.0, 549.0, 869.0, 1566.0, 2329.0, 4053.0, 6729.0, 11796.0, 21134.0, 37254.0, 66320.0, 112334.0, 167187.0, 194875.0, 163849.0, 108750.0, 63877.0, 36208.0, 20008.0, 11364.0, 6648.0, 3852.0, 2305.0, 1332.0, 887.0, 553.0, 321.0, 199.0, 154.0, 95.0, 65.0, 48.0, 23.0, 19.0, 16.0, 10.0, 7.0, 8.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 1.0], "bins": [-2.443359375, -2.36810302734375, -2.2928466796875, -2.21759033203125, -2.142333984375, -2.06707763671875, -1.9918212890625, -1.91656494140625, -1.84130859375, -1.76605224609375, -1.6907958984375, -1.61553955078125, -1.540283203125, -1.46502685546875, -1.3897705078125, -1.31451416015625, -1.2392578125, -1.16400146484375, -1.0887451171875, -1.01348876953125, -0.938232421875, -0.86297607421875, -0.7877197265625, -0.71246337890625, -0.63720703125, -0.56195068359375, -0.4866943359375, -0.41143798828125, -0.336181640625, -0.26092529296875, -0.1856689453125, -0.11041259765625, -0.03515625, 0.04010009765625, 0.1153564453125, 0.19061279296875, 0.265869140625, 0.34112548828125, 0.4163818359375, 0.49163818359375, 0.56689453125, 0.64215087890625, 0.7174072265625, 0.79266357421875, 0.867919921875, 0.94317626953125, 1.0184326171875, 1.09368896484375, 1.1689453125, 1.24420166015625, 1.3194580078125, 1.39471435546875, 1.469970703125, 1.54522705078125, 1.6204833984375, 1.69573974609375, 1.77099609375, 1.84625244140625, 1.9215087890625, 1.99676513671875, 2.072021484375, 2.14727783203125, 2.2225341796875, 2.29779052734375, 2.373046875]}, "gradients/decoder.bert.encoder.layer.16.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 0.0, 8.0, 9.0, 10.0, 9.0, 18.0, 28.0, 26.0, 42.0, 33.0, 55.0, 54.0, 52.0, 50.0, 62.0, 63.0, 54.0, 68.0, 43.0, 50.0, 48.0, 35.0, 23.0, 19.0, 30.0, 25.0, 13.0, 13.0, 10.0, 6.0, 12.0, 8.0, 8.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00021529197692871094, -0.00020779669284820557, -0.0002003014087677002, -0.00019280612468719482, -0.00018531084060668945, -0.00017781555652618408, -0.0001703202724456787, -0.00016282498836517334, -0.00015532970428466797, -0.0001478344202041626, -0.00014033913612365723, -0.00013284385204315186, -0.00012534856796264648, -0.00011785328388214111, -0.00011035799980163574, -0.00010286271572113037, -9.5367431640625e-05, -8.787214756011963e-05, -8.037686347961426e-05, -7.288157939910889e-05, -6.538629531860352e-05, -5.7891011238098145e-05, -5.0395727157592773e-05, -4.29004430770874e-05, -3.540515899658203e-05, -2.790987491607666e-05, -2.041459083557129e-05, -1.2919306755065918e-05, -5.424022674560547e-06, 2.0712614059448242e-06, 9.566545486450195e-06, 1.7061829566955566e-05, 2.4557113647460938e-05, 3.205239772796631e-05, 3.954768180847168e-05, 4.704296588897705e-05, 5.453824996948242e-05, 6.203353404998779e-05, 6.952881813049316e-05, 7.702410221099854e-05, 8.45193862915039e-05, 9.201467037200928e-05, 9.950995445251465e-05, 0.00010700523853302002, 0.00011450052261352539, 0.00012199580669403076, 0.00012949109077453613, 0.0001369863748550415, 0.00014448165893554688, 0.00015197694301605225, 0.00015947222709655762, 0.000166967511177063, 0.00017446279525756836, 0.00018195807933807373, 0.0001894533634185791, 0.00019694864749908447, 0.00020444393157958984, 0.00021193921566009521, 0.00021943449974060059, 0.00022692978382110596, 0.00023442506790161133, 0.0002419203519821167, 0.00024941563606262207, 0.00025691092014312744, 0.0002644062042236328]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.weight": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 2.0, 3.0, 3.0, 6.0, 8.0, 12.0, 17.0, 25.0, 29.0, 34.0, 74.0, 89.0, 132.0, 195.0, 261.0, 402.0, 624.0, 918.0, 1488.0, 2286.0, 3739.0, 6053.0, 9992.0, 17060.0, 29657.0, 51853.0, 87546.0, 137002.0, 180073.0, 177689.0, 134213.0, 85797.0, 49884.0, 29056.0, 16862.0, 9540.0, 5882.0, 3568.0, 2233.0, 1468.0, 930.0, 585.0, 399.0, 270.0, 178.0, 129.0, 89.0, 59.0, 46.0, 31.0, 23.0, 14.0, 13.0, 10.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.328125, -2.25531005859375, -2.1824951171875, -2.10968017578125, -2.036865234375, -1.96405029296875, -1.8912353515625, -1.81842041015625, -1.74560546875, -1.67279052734375, -1.5999755859375, -1.52716064453125, -1.454345703125, -1.38153076171875, -1.3087158203125, -1.23590087890625, -1.1630859375, -1.09027099609375, -1.0174560546875, -0.94464111328125, -0.871826171875, -0.79901123046875, -0.7261962890625, -0.65338134765625, -0.58056640625, -0.50775146484375, -0.4349365234375, -0.36212158203125, -0.289306640625, -0.21649169921875, -0.1436767578125, -0.07086181640625, 0.001953125, 0.07476806640625, 0.1475830078125, 0.22039794921875, 0.293212890625, 0.36602783203125, 0.4388427734375, 0.51165771484375, 0.58447265625, 0.65728759765625, 0.7301025390625, 0.80291748046875, 0.875732421875, 0.94854736328125, 1.0213623046875, 1.09417724609375, 1.1669921875, 1.23980712890625, 1.3126220703125, 1.38543701171875, 1.458251953125, 1.53106689453125, 1.6038818359375, 1.67669677734375, 1.74951171875, 1.82232666015625, 1.8951416015625, 1.96795654296875, 2.040771484375, 2.11358642578125, 2.1864013671875, 2.25921630859375, 2.33203125]}, "gradients/decoder.bert.encoder.layer.16.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 4.0, 6.0, 6.0, 7.0, 6.0, 11.0, 14.0, 13.0, 13.0, 29.0, 19.0, 36.0, 23.0, 41.0, 48.0, 46.0, 47.0, 51.0, 50.0, 48.0, 45.0, 44.0, 60.0, 40.0, 41.0, 36.0, 33.0, 30.0, 30.0, 13.0, 18.0, 19.0, 19.0, 8.0, 7.0, 8.0, 7.0, 6.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6279296875, -0.606201171875, -0.58447265625, -0.562744140625, -0.541015625, -0.519287109375, -0.49755859375, -0.475830078125, -0.4541015625, -0.432373046875, -0.41064453125, -0.388916015625, -0.3671875, -0.345458984375, -0.32373046875, -0.302001953125, -0.2802734375, -0.258544921875, -0.23681640625, -0.215087890625, -0.193359375, -0.171630859375, -0.14990234375, -0.128173828125, -0.1064453125, -0.084716796875, -0.06298828125, -0.041259765625, -0.01953125, 0.002197265625, 0.02392578125, 0.045654296875, 0.0673828125, 0.089111328125, 0.11083984375, 0.132568359375, 0.154296875, 0.176025390625, 0.19775390625, 0.219482421875, 0.2412109375, 0.262939453125, 0.28466796875, 0.306396484375, 0.328125, 0.349853515625, 0.37158203125, 0.393310546875, 0.4150390625, 0.436767578125, 0.45849609375, 0.480224609375, 0.501953125, 0.523681640625, 0.54541015625, 0.567138671875, 0.5888671875, 0.610595703125, 0.63232421875, 0.654052734375, 0.67578125, 0.697509765625, 0.71923828125, 0.740966796875, 0.7626953125]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 13.0, 8.0, 19.0, 5.0, 16.0, 24.0, 25.0, 23.0, 30.0, 28.0, 37.0, 34.0, 54.0, 49.0, 56.0, 60.0, 59.0, 52.0, 57.0, 50.0, 42.0, 46.0, 42.0, 28.0, 27.0, 17.0, 13.0, 12.0, 16.0, 12.0, 8.0, 8.0, 8.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.62278413772583, -4.477611541748047, -4.3324384689331055, -4.187265872955322, -4.042093276977539, -3.8969204425811768, -3.7517476081848145, -3.6065750122070312, -3.461402177810669, -3.3162293434143066, -3.1710567474365234, -3.025883913040161, -2.880711078643799, -2.7355384826660156, -2.5903656482696533, -2.445192813873291, -2.300020217895508, -2.1548473834991455, -2.0096747875213623, -1.864501953125, -1.7193292379379272, -1.5741565227508545, -1.4289836883544922, -1.2838109731674194, -1.1386382579803467, -0.9934655427932739, -0.8482927680015564, -0.7031199932098389, -0.5579472780227661, -0.41277456283569336, -0.26760178804397583, -0.1224290132522583, 0.02274322509765625, 0.1679159700870514, 0.31308871507644653, 0.4582614600658417, 0.6034342050552368, 0.7486069202423096, 0.8937796950340271, 1.0389524698257446, 1.1841251850128174, 1.3292979001998901, 1.474470615386963, 1.6196434497833252, 1.764816164970398, 1.9099888801574707, 2.055161714553833, 2.2003345489501953, 2.3455071449279785, 2.490679979324341, 2.635852575302124, 2.7810254096984863, 2.9261980056762695, 3.071370840072632, 3.216543674468994, 3.3617162704467773, 3.5068891048431396, 3.652061939239502, 3.797234535217285, 3.9424073696136475, 4.08758020401001, 4.232752799987793, 4.377925395965576, 4.523098468780518, 4.668271064758301]}, "gradients/decoder.bert.encoder.layer.15.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 10.0, 6.0, 5.0, 10.0, 4.0, 10.0, 8.0, 20.0, 18.0, 18.0, 17.0, 29.0, 30.0, 30.0, 28.0, 33.0, 36.0, 31.0, 52.0, 47.0, 44.0, 36.0, 38.0, 34.0, 43.0, 45.0, 49.0, 44.0, 30.0, 31.0, 26.0, 24.0, 21.0, 12.0, 23.0, 14.0, 8.0, 11.0, 11.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.436288833618164, -4.295776844024658, -4.155264854431152, -4.0147528648376465, -3.8742411136627197, -3.733729124069214, -3.593217134475708, -3.452705144882202, -3.3121933937072754, -3.1716814041137695, -3.0311694145202637, -2.890657424926758, -2.750145673751831, -2.609633684158325, -2.4691216945648193, -2.3286097049713135, -2.1880977153778076, -2.0475857257843018, -1.9070738554000854, -1.7665618658065796, -1.6260499954223633, -1.4855380058288574, -1.3450260162353516, -1.2045140266418457, -1.0640021562576294, -0.9234902262687683, -0.7829782962799072, -0.6424663066864014, -0.5019543766975403, -0.3614424467086792, -0.22093045711517334, -0.08041852712631226, 0.06009340286254883, 0.2006053477525711, 0.3411172926425934, 0.48162925243377686, 0.6221411824226379, 0.762653112411499, 0.9031651020050049, 1.0436770915985107, 1.184188961982727, 1.324700951576233, 1.4652128219604492, 1.605724811553955, 1.746236801147461, 1.8867486715316772, 2.0272607803344727, 2.1677725315093994, 2.3082845211029053, 2.448796510696411, 2.589308500289917, 2.7298202514648438, 2.8703322410583496, 3.0108442306518555, 3.1513562202453613, 3.291868209838867, 3.432380199432373, 3.572892189025879, 3.7134041786193848, 3.8539161682128906, 3.9944279193878174, 4.134940147399902, 4.27545166015625, 4.415963649749756, 4.556475639343262]}, "gradients/decoder.bert.encoder.layer.15.output.dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 6.0, 13.0, 17.0, 16.0, 23.0, 34.0, 35.0, 59.0, 97.0, 97.0, 172.0, 276.0, 362.0, 626.0, 906.0, 1376.0, 2305.0, 3566.0, 6194.0, 10581.0, 19192.0, 36073.0, 70033.0, 142788.0, 308416.0, 649365.0, 1036560.0, 935023.0, 508756.0, 231103.0, 108813.0, 54278.0, 28962.0, 15667.0, 8942.0, 5265.0, 3067.0, 1959.0, 1171.0, 749.0, 444.0, 294.0, 200.0, 122.0, 86.0, 68.0, 27.0, 33.0, 22.0, 14.0, 16.0, 4.0, 3.0, 4.0, 4.0, 3.0], "bins": [-4.91015625, -4.7691650390625, -4.628173828125, -4.4871826171875, -4.34619140625, -4.2052001953125, -4.064208984375, -3.9232177734375, -3.7822265625, -3.6412353515625, -3.500244140625, -3.3592529296875, -3.21826171875, -3.0772705078125, -2.936279296875, -2.7952880859375, -2.654296875, -2.5133056640625, -2.372314453125, -2.2313232421875, -2.09033203125, -1.9493408203125, -1.808349609375, -1.6673583984375, -1.5263671875, -1.3853759765625, -1.244384765625, -1.1033935546875, -0.96240234375, -0.8214111328125, -0.680419921875, -0.5394287109375, -0.3984375, -0.2574462890625, -0.116455078125, 0.0245361328125, 0.16552734375, 0.3065185546875, 0.447509765625, 0.5885009765625, 0.7294921875, 0.8704833984375, 1.011474609375, 1.1524658203125, 1.29345703125, 1.4344482421875, 1.575439453125, 1.7164306640625, 1.857421875, 1.9984130859375, 2.139404296875, 2.2803955078125, 2.42138671875, 2.5623779296875, 2.703369140625, 2.8443603515625, 2.9853515625, 3.1263427734375, 3.267333984375, 3.4083251953125, 3.54931640625, 3.6903076171875, 3.831298828125, 3.9722900390625, 4.11328125]}, "gradients/decoder.bert.encoder.layer.15.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 4.0, 7.0, 10.0, 9.0, 12.0, 16.0, 18.0, 14.0, 20.0, 24.0, 37.0, 21.0, 33.0, 26.0, 41.0, 29.0, 45.0, 36.0, 48.0, 43.0, 34.0, 43.0, 50.0, 37.0, 39.0, 29.0, 36.0, 32.0, 36.0, 15.0, 21.0, 23.0, 21.0, 13.0, 20.0, 12.0, 10.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.900390625, -2.80963134765625, -2.7188720703125, -2.62811279296875, -2.537353515625, -2.44659423828125, -2.3558349609375, -2.26507568359375, -2.17431640625, -2.08355712890625, -1.9927978515625, -1.90203857421875, -1.811279296875, -1.72052001953125, -1.6297607421875, -1.53900146484375, -1.4482421875, -1.35748291015625, -1.2667236328125, -1.17596435546875, -1.085205078125, -0.99444580078125, -0.9036865234375, -0.81292724609375, -0.72216796875, -0.63140869140625, -0.5406494140625, -0.44989013671875, -0.359130859375, -0.26837158203125, -0.1776123046875, -0.08685302734375, 0.00390625, 0.09466552734375, 0.1854248046875, 0.27618408203125, 0.366943359375, 0.45770263671875, 0.5484619140625, 0.63922119140625, 0.72998046875, 0.82073974609375, 0.9114990234375, 1.00225830078125, 1.093017578125, 1.18377685546875, 1.2745361328125, 1.36529541015625, 1.4560546875, 1.54681396484375, 1.6375732421875, 1.72833251953125, 1.819091796875, 1.90985107421875, 2.0006103515625, 2.09136962890625, 2.18212890625, 2.27288818359375, 2.3636474609375, 2.45440673828125, 2.545166015625, 2.63592529296875, 2.7266845703125, 2.81744384765625, 2.908203125]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 13.0, 15.0, 18.0, 31.0, 38.0, 60.0, 107.0, 142.0, 216.0, 355.0, 527.0, 825.0, 1352.0, 2203.0, 3662.0, 6057.0, 10577.0, 18454.0, 32916.0, 60866.0, 116394.0, 230098.0, 449685.0, 798183.0, 983465.0, 698195.0, 375836.0, 190721.0, 97123.0, 50759.0, 27680.0, 15450.0, 8953.0, 5234.0, 3049.0, 1822.0, 1157.0, 771.0, 442.0, 308.0, 186.0, 110.0, 71.0, 58.0, 35.0, 20.0, 20.0, 9.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-4.890625, -4.748291015625, -4.60595703125, -4.463623046875, -4.3212890625, -4.178955078125, -4.03662109375, -3.894287109375, -3.751953125, -3.609619140625, -3.46728515625, -3.324951171875, -3.1826171875, -3.040283203125, -2.89794921875, -2.755615234375, -2.61328125, -2.470947265625, -2.32861328125, -2.186279296875, -2.0439453125, -1.901611328125, -1.75927734375, -1.616943359375, -1.474609375, -1.332275390625, -1.18994140625, -1.047607421875, -0.9052734375, -0.762939453125, -0.62060546875, -0.478271484375, -0.3359375, -0.193603515625, -0.05126953125, 0.091064453125, 0.2333984375, 0.375732421875, 0.51806640625, 0.660400390625, 0.802734375, 0.945068359375, 1.08740234375, 1.229736328125, 1.3720703125, 1.514404296875, 1.65673828125, 1.799072265625, 1.94140625, 2.083740234375, 2.22607421875, 2.368408203125, 2.5107421875, 2.653076171875, 2.79541015625, 2.937744140625, 3.080078125, 3.222412109375, 3.36474609375, 3.507080078125, 3.6494140625, 3.791748046875, 3.93408203125, 4.076416015625, 4.21875]}, "gradients/decoder.bert.encoder.layer.15.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 10.0, 15.0, 18.0, 33.0, 31.0, 38.0, 48.0, 66.0, 79.0, 85.0, 136.0, 153.0, 171.0, 189.0, 253.0, 283.0, 311.0, 311.0, 250.0, 259.0, 206.0, 207.0, 171.0, 132.0, 131.0, 102.0, 87.0, 45.0, 64.0, 47.0, 34.0, 22.0, 19.0, 20.0, 16.0, 6.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7607421875, -1.711456298828125, -1.66217041015625, -1.612884521484375, -1.5635986328125, -1.514312744140625, -1.46502685546875, -1.415740966796875, -1.366455078125, -1.317169189453125, -1.26788330078125, -1.218597412109375, -1.1693115234375, -1.120025634765625, -1.07073974609375, -1.021453857421875, -0.97216796875, -0.922882080078125, -0.87359619140625, -0.824310302734375, -0.7750244140625, -0.725738525390625, -0.67645263671875, -0.627166748046875, -0.577880859375, -0.528594970703125, -0.47930908203125, -0.430023193359375, -0.3807373046875, -0.331451416015625, -0.28216552734375, -0.232879638671875, -0.18359375, -0.134307861328125, -0.08502197265625, -0.035736083984375, 0.0135498046875, 0.062835693359375, 0.11212158203125, 0.161407470703125, 0.210693359375, 0.259979248046875, 0.30926513671875, 0.358551025390625, 0.4078369140625, 0.457122802734375, 0.50640869140625, 0.555694580078125, 0.60498046875, 0.654266357421875, 0.70355224609375, 0.752838134765625, 0.8021240234375, 0.851409912109375, 0.90069580078125, 0.949981689453125, 0.999267578125, 1.048553466796875, 1.09783935546875, 1.147125244140625, 1.1964111328125, 1.245697021484375, 1.29498291015625, 1.344268798828125, 1.3935546875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 9.0, 11.0, 17.0, 15.0, 17.0, 16.0, 31.0, 34.0, 46.0, 44.0, 58.0, 58.0, 73.0, 69.0, 69.0, 70.0, 65.0, 50.0, 45.0, 36.0, 41.0, 23.0, 21.0, 9.0, 12.0, 15.0, 10.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6409735679626465, -4.479150772094727, -4.317328453063965, -4.155505657196045, -3.993682861328125, -3.831860303878784, -3.6700377464294434, -3.5082149505615234, -3.3463921546936035, -3.1845695972442627, -3.0227468013763428, -2.860924243927002, -2.699101448059082, -2.537278890609741, -2.3754563331604004, -2.2136335372924805, -2.0518109798431396, -1.8899883031845093, -1.728165626525879, -1.566343069076538, -1.4045202732086182, -1.2426977157592773, -1.080875039100647, -0.9190523624420166, -0.7572296857833862, -0.5954070091247559, -0.4335843622684479, -0.2717617154121399, -0.10993903875350952, 0.05188363790512085, 0.21370625495910645, 0.3755289316177368, 0.5373516082763672, 0.6991742849349976, 0.8609969615936279, 1.0228195190429688, 1.1846423149108887, 1.3464648723602295, 1.5082875490188599, 1.6701102256774902, 1.8319329023361206, 1.993755578994751, 2.155578136444092, 2.3174009323120117, 2.4792234897613525, 2.6410462856292725, 2.8028688430786133, 2.964691638946533, 3.126514196395874, 3.288336753845215, 3.4501595497131348, 3.6119821071624756, 3.7738049030303955, 3.9356274604797363, 4.097450256347656, 4.259272575378418, 4.421095371246338, 4.582918167114258, 4.7447404861450195, 4.9065632820129395, 5.068386077880859, 5.230208873748779, 5.392031192779541, 5.553853988647461, 5.715676784515381]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 5.0, 10.0, 9.0, 12.0, 27.0, 22.0, 15.0, 15.0, 32.0, 41.0, 37.0, 38.0, 40.0, 46.0, 48.0, 49.0, 48.0, 40.0, 46.0, 46.0, 48.0, 46.0, 26.0, 28.0, 37.0, 31.0, 20.0, 22.0, 25.0, 19.0, 13.0, 14.0, 5.0, 5.0, 7.0, 6.0, 1.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.124532222747803, -3.994530200958252, -3.864528179168701, -3.7345261573791504, -3.6045241355895996, -3.474522113800049, -3.344520330429077, -3.2145183086395264, -3.0845162868499756, -2.954514265060425, -2.824512243270874, -2.6945102214813232, -2.5645084381103516, -2.434506416320801, -2.30450439453125, -2.174502372741699, -2.0445003509521484, -1.9144983291625977, -1.7844963073730469, -1.6544944047927856, -1.5244923830032349, -1.394490361213684, -1.2644884586334229, -1.134486436843872, -1.0044844150543213, -0.8744823932647705, -0.7444804310798645, -0.6144784688949585, -0.4844764471054077, -0.35447442531585693, -0.22447246313095093, -0.09447050094604492, 0.035531044006347656, 0.16553303599357605, 0.29553502798080444, 0.42553701996803284, 0.5555390119552612, 0.685541033744812, 0.815542995929718, 0.945544958114624, 1.0755469799041748, 1.2055490016937256, 1.3355510234832764, 1.4655529260635376, 1.5955549478530884, 1.7255569696426392, 1.8555588722229004, 1.9855608940124512, 2.115562915802002, 2.2455649375915527, 2.3755669593811035, 2.5055689811706543, 2.635571002960205, 2.765573024749756, 2.8955748081207275, 3.0255768299102783, 3.155578851699829, 3.28558087348938, 3.4155828952789307, 3.5455849170684814, 3.675586700439453, 3.805588722229004, 3.9355907440185547, 4.0655927658081055, 4.195594787597656]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 4.0, 5.0, 4.0, 8.0, 11.0, 25.0, 19.0, 35.0, 51.0, 66.0, 82.0, 117.0, 183.0, 251.0, 347.0, 423.0, 688.0, 949.0, 1385.0, 1965.0, 2956.0, 4411.0, 6537.0, 10010.0, 15489.0, 25015.0, 40474.0, 66490.0, 110043.0, 171175.0, 199124.0, 148767.0, 91829.0, 55319.0, 33828.0, 20852.0, 13203.0, 8575.0, 5729.0, 3785.0, 2515.0, 1771.0, 1218.0, 806.0, 614.0, 415.0, 255.0, 211.0, 157.0, 112.0, 88.0, 52.0, 39.0, 26.0, 19.0, 11.0, 11.0, 4.0, 5.0, 4.0, 4.0, 3.0], "bins": [-0.56982421875, -0.5521926879882812, -0.5345611572265625, -0.5169296264648438, -0.499298095703125, -0.48166656494140625, -0.4640350341796875, -0.44640350341796875, -0.42877197265625, -0.41114044189453125, -0.3935089111328125, -0.37587738037109375, -0.358245849609375, -0.34061431884765625, -0.3229827880859375, -0.30535125732421875, -0.2877197265625, -0.27008819580078125, -0.2524566650390625, -0.23482513427734375, -0.217193603515625, -0.19956207275390625, -0.1819305419921875, -0.16429901123046875, -0.14666748046875, -0.12903594970703125, -0.1114044189453125, -0.09377288818359375, -0.076141357421875, -0.05850982666015625, -0.0408782958984375, -0.02324676513671875, -0.005615234375, 0.01201629638671875, 0.0296478271484375, 0.04727935791015625, 0.064910888671875, 0.08254241943359375, 0.1001739501953125, 0.11780548095703125, 0.13543701171875, 0.15306854248046875, 0.1707000732421875, 0.18833160400390625, 0.205963134765625, 0.22359466552734375, 0.2412261962890625, 0.25885772705078125, 0.2764892578125, 0.29412078857421875, 0.3117523193359375, 0.32938385009765625, 0.347015380859375, 0.36464691162109375, 0.3822784423828125, 0.39990997314453125, 0.41754150390625, 0.43517303466796875, 0.4528045654296875, 0.47043609619140625, 0.488067626953125, 0.5056991577148438, 0.5233306884765625, 0.5409622192382812, 0.55859375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 4.0, 11.0, 13.0, 11.0, 13.0, 20.0, 16.0, 20.0, 25.0, 29.0, 34.0, 33.0, 47.0, 43.0, 37.0, 34.0, 44.0, 53.0, 47.0, 42.0, 40.0, 50.0, 38.0, 30.0, 28.0, 28.0, 31.0, 33.0, 21.0, 22.0, 16.0, 16.0, 16.0, 4.0, 6.0, 10.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.390625, -4.26104736328125, -4.1314697265625, -4.00189208984375, -3.872314453125, -3.74273681640625, -3.6131591796875, -3.48358154296875, -3.35400390625, -3.22442626953125, -3.0948486328125, -2.96527099609375, -2.835693359375, -2.70611572265625, -2.5765380859375, -2.44696044921875, -2.3173828125, -2.18780517578125, -2.0582275390625, -1.92864990234375, -1.799072265625, -1.66949462890625, -1.5399169921875, -1.41033935546875, -1.28076171875, -1.15118408203125, -1.0216064453125, -0.89202880859375, -0.762451171875, -0.63287353515625, -0.5032958984375, -0.37371826171875, -0.244140625, -0.11456298828125, 0.0150146484375, 0.14459228515625, 0.274169921875, 0.40374755859375, 0.5333251953125, 0.66290283203125, 0.79248046875, 0.92205810546875, 1.0516357421875, 1.18121337890625, 1.310791015625, 1.44036865234375, 1.5699462890625, 1.69952392578125, 1.8291015625, 1.95867919921875, 2.0882568359375, 2.21783447265625, 2.347412109375, 2.47698974609375, 2.6065673828125, 2.73614501953125, 2.86572265625, 2.99530029296875, 3.1248779296875, 3.25445556640625, 3.384033203125, 3.51361083984375, 3.6431884765625, 3.77276611328125, 3.90234375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 4.0, 10.0, 12.0, 8.0, 8.0, 33.0, 38.0, 81.0, 76.0, 142.0, 171.0, 353.0, 529.0, 901.0, 1660.0, 3173.0, 6395.0, 14765.0, 47387.0, 848985.0, 87991.0, 19356.0, 7966.0, 3851.0, 1899.0, 1085.0, 639.0, 379.0, 197.0, 126.0, 108.0, 60.0, 44.0, 40.0, 20.0, 22.0, 14.0, 9.0, 8.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.609375, -1.556854248046875, -1.50433349609375, -1.451812744140625, -1.3992919921875, -1.346771240234375, -1.29425048828125, -1.241729736328125, -1.189208984375, -1.136688232421875, -1.08416748046875, -1.031646728515625, -0.9791259765625, -0.926605224609375, -0.87408447265625, -0.821563720703125, -0.76904296875, -0.716522216796875, -0.66400146484375, -0.611480712890625, -0.5589599609375, -0.506439208984375, -0.45391845703125, -0.401397705078125, -0.348876953125, -0.296356201171875, -0.24383544921875, -0.191314697265625, -0.1387939453125, -0.086273193359375, -0.03375244140625, 0.018768310546875, 0.0712890625, 0.123809814453125, 0.17633056640625, 0.228851318359375, 0.2813720703125, 0.333892822265625, 0.38641357421875, 0.438934326171875, 0.491455078125, 0.543975830078125, 0.59649658203125, 0.649017333984375, 0.7015380859375, 0.754058837890625, 0.80657958984375, 0.859100341796875, 0.91162109375, 0.964141845703125, 1.01666259765625, 1.069183349609375, 1.1217041015625, 1.174224853515625, 1.22674560546875, 1.279266357421875, 1.331787109375, 1.384307861328125, 1.43682861328125, 1.489349365234375, 1.5418701171875, 1.594390869140625, 1.64691162109375, 1.699432373046875, 1.751953125]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 9.0, 7.0, 13.0, 15.0, 18.0, 19.0, 23.0, 20.0, 22.0, 24.0, 39.0, 38.0, 34.0, 30.0, 52.0, 32.0, 35.0, 38.0, 33.0, 42.0, 33.0, 44.0, 39.0, 30.0, 32.0, 33.0, 28.0, 23.0, 22.0, 31.0, 18.0, 21.0, 18.0, 10.0, 9.0, 17.0, 8.0, 9.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.212890625, -2.136627197265625, -2.06036376953125, -1.984100341796875, -1.9078369140625, -1.831573486328125, -1.75531005859375, -1.679046630859375, -1.602783203125, -1.526519775390625, -1.45025634765625, -1.373992919921875, -1.2977294921875, -1.221466064453125, -1.14520263671875, -1.068939208984375, -0.99267578125, -0.916412353515625, -0.84014892578125, -0.763885498046875, -0.6876220703125, -0.611358642578125, -0.53509521484375, -0.458831787109375, -0.382568359375, -0.306304931640625, -0.23004150390625, -0.153778076171875, -0.0775146484375, -0.001251220703125, 0.07501220703125, 0.151275634765625, 0.2275390625, 0.303802490234375, 0.38006591796875, 0.456329345703125, 0.5325927734375, 0.608856201171875, 0.68511962890625, 0.761383056640625, 0.837646484375, 0.913909912109375, 0.99017333984375, 1.066436767578125, 1.1427001953125, 1.218963623046875, 1.29522705078125, 1.371490478515625, 1.44775390625, 1.524017333984375, 1.60028076171875, 1.676544189453125, 1.7528076171875, 1.829071044921875, 1.90533447265625, 1.981597900390625, 2.057861328125, 2.134124755859375, 2.21038818359375, 2.286651611328125, 2.3629150390625, 2.439178466796875, 2.51544189453125, 2.591705322265625, 2.66796875]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 5.0, 9.0, 15.0, 25.0, 17.0, 33.0, 47.0, 51.0, 88.0, 110.0, 178.0, 242.0, 336.0, 542.0, 803.0, 1272.0, 1918.0, 3123.0, 5080.0, 8787.0, 15442.0, 31680.0, 767926.0, 153628.0, 24711.0, 12955.0, 7453.0, 4264.0, 2635.0, 1752.0, 1130.0, 709.0, 501.0, 309.0, 229.0, 158.0, 124.0, 70.0, 57.0, 37.0, 30.0, 18.0, 15.0, 15.0, 7.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.28173828125, -0.27260589599609375, -0.2634735107421875, -0.25434112548828125, -0.245208740234375, -0.23607635498046875, -0.2269439697265625, -0.21781158447265625, -0.20867919921875, -0.19954681396484375, -0.1904144287109375, -0.18128204345703125, -0.172149658203125, -0.16301727294921875, -0.1538848876953125, -0.14475250244140625, -0.1356201171875, -0.12648773193359375, -0.1173553466796875, -0.10822296142578125, -0.099090576171875, -0.08995819091796875, -0.0808258056640625, -0.07169342041015625, -0.06256103515625, -0.05342864990234375, -0.0442962646484375, -0.03516387939453125, -0.026031494140625, -0.01689910888671875, -0.0077667236328125, 0.00136566162109375, 0.010498046875, 0.01963043212890625, 0.0287628173828125, 0.03789520263671875, 0.047027587890625, 0.05615997314453125, 0.0652923583984375, 0.07442474365234375, 0.08355712890625, 0.09268951416015625, 0.1018218994140625, 0.11095428466796875, 0.120086669921875, 0.12921905517578125, 0.1383514404296875, 0.14748382568359375, 0.1566162109375, 0.16574859619140625, 0.1748809814453125, 0.18401336669921875, 0.193145751953125, 0.20227813720703125, 0.2114105224609375, 0.22054290771484375, 0.22967529296875, 0.23880767822265625, 0.2479400634765625, 0.25707244873046875, 0.266204833984375, 0.27533721923828125, 0.2844696044921875, 0.29360198974609375, 0.302734375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 7.0, 12.0, 20.0, 13.0, 22.0, 14.0, 22.0, 19.0, 26.0, 40.0, 27.0, 39.0, 52.0, 42.0, 35.0, 44.0, 51.0, 54.0, 54.0, 48.0, 42.0, 39.0, 27.0, 36.0, 34.0, 24.0, 21.0, 26.0, 19.0, 12.0, 12.0, 15.0, 9.0, 4.0, 3.0, 3.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4960765838623047e-05, -1.4374032616615295e-05, -1.3787299394607544e-05, -1.3200566172599792e-05, -1.2613832950592041e-05, -1.202709972858429e-05, -1.1440366506576538e-05, -1.0853633284568787e-05, -1.0266900062561035e-05, -9.680166840553284e-06, -9.093433618545532e-06, -8.50670039653778e-06, -7.91996717453003e-06, -7.333233952522278e-06, -6.746500730514526e-06, -6.159767508506775e-06, -5.5730342864990234e-06, -4.986301064491272e-06, -4.3995678424835205e-06, -3.812834620475769e-06, -3.2261013984680176e-06, -2.639368176460266e-06, -2.0526349544525146e-06, -1.4659017324447632e-06, -8.791685104370117e-07, -2.9243528842926025e-07, 2.942979335784912e-07, 8.810311555862427e-07, 1.4677643775939941e-06, 2.0544975996017456e-06, 2.641230821609497e-06, 3.2279640436172485e-06, 3.814697265625e-06, 4.4014304876327515e-06, 4.988163709640503e-06, 5.574896931648254e-06, 6.161630153656006e-06, 6.748363375663757e-06, 7.335096597671509e-06, 7.92182981967926e-06, 8.508563041687012e-06, 9.095296263694763e-06, 9.682029485702515e-06, 1.0268762707710266e-05, 1.0855495929718018e-05, 1.1442229151725769e-05, 1.202896237373352e-05, 1.2615695595741272e-05, 1.3202428817749023e-05, 1.3789162039756775e-05, 1.4375895261764526e-05, 1.4962628483772278e-05, 1.554936170578003e-05, 1.613609492778778e-05, 1.6722828149795532e-05, 1.7309561371803284e-05, 1.7896294593811035e-05, 1.8483027815818787e-05, 1.9069761037826538e-05, 1.965649425983429e-05, 2.024322748184204e-05, 2.0829960703849792e-05, 2.1416693925857544e-05, 2.2003427147865295e-05, 2.2590160369873047e-05]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 8.0, 12.0, 16.0, 29.0, 38.0, 45.0, 65.0, 83.0, 87.0, 171.0, 257.0, 392.0, 643.0, 998.0, 1807.0, 3264.0, 6018.0, 11587.0, 23527.0, 49211.0, 106267.0, 219268.0, 287063.0, 177467.0, 82346.0, 38489.0, 18572.0, 9217.0, 4936.0, 2659.0, 1499.0, 863.0, 519.0, 340.0, 210.0, 165.0, 134.0, 62.0, 64.0, 32.0, 24.0, 19.0, 25.0, 11.0, 6.0, 11.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1639404296875, -0.15887069702148438, -0.15380096435546875, -0.14873123168945312, -0.1436614990234375, -0.13859176635742188, -0.13352203369140625, -0.12845230102539062, -0.123382568359375, -0.11831283569335938, -0.11324310302734375, -0.10817337036132812, -0.1031036376953125, -0.09803390502929688, -0.09296417236328125, -0.08789443969726562, -0.08282470703125, -0.07775497436523438, -0.07268524169921875, -0.06761550903320312, -0.0625457763671875, -0.057476043701171875, -0.05240631103515625, -0.047336578369140625, -0.042266845703125, -0.037197113037109375, -0.03212738037109375, -0.027057647705078125, -0.0219879150390625, -0.016918182373046875, -0.01184844970703125, -0.006778717041015625, -0.001708984375, 0.003360748291015625, 0.00843048095703125, 0.013500213623046875, 0.0185699462890625, 0.023639678955078125, 0.02870941162109375, 0.033779144287109375, 0.038848876953125, 0.043918609619140625, 0.04898834228515625, 0.054058074951171875, 0.0591278076171875, 0.06419754028320312, 0.06926727294921875, 0.07433700561523438, 0.07940673828125, 0.08447647094726562, 0.08954620361328125, 0.09461593627929688, 0.0996856689453125, 0.10475540161132812, 0.10982513427734375, 0.11489486694335938, 0.119964599609375, 0.12503433227539062, 0.13010406494140625, 0.13517379760742188, 0.1402435302734375, 0.14531326293945312, 0.15038299560546875, 0.15545272827148438, 0.1605224609375]}, "gradients/decoder.bert.encoder.layer.15.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 14.0, 16.0, 25.0, 21.0, 35.0, 58.0, 74.0, 93.0, 103.0, 96.0, 79.0, 81.0, 70.0, 37.0, 38.0, 34.0, 26.0, 16.0, 9.0, 7.0, 9.0, 10.0, 5.0, 2.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06365966796875, -0.061743736267089844, -0.05982780456542969, -0.05791187286376953, -0.055995941162109375, -0.05408000946044922, -0.05216407775878906, -0.050248146057128906, -0.04833221435546875, -0.046416282653808594, -0.04450035095214844, -0.04258441925048828, -0.040668487548828125, -0.03875255584716797, -0.03683662414550781, -0.034920692443847656, -0.0330047607421875, -0.031088829040527344, -0.029172897338867188, -0.02725696563720703, -0.025341033935546875, -0.02342510223388672, -0.021509170532226562, -0.019593238830566406, -0.01767730712890625, -0.015761375427246094, -0.013845443725585938, -0.011929512023925781, -0.010013580322265625, -0.008097648620605469, -0.0061817169189453125, -0.004265785217285156, -0.002349853515625, -0.00043392181396484375, 0.0014820098876953125, 0.0033979415893554688, 0.005313873291015625, 0.007229804992675781, 0.009145736694335938, 0.011061668395996094, 0.01297760009765625, 0.014893531799316406, 0.016809463500976562, 0.01872539520263672, 0.020641326904296875, 0.02255725860595703, 0.024473190307617188, 0.026389122009277344, 0.0283050537109375, 0.030220985412597656, 0.03213691711425781, 0.03405284881591797, 0.035968780517578125, 0.03788471221923828, 0.03980064392089844, 0.041716575622558594, 0.04363250732421875, 0.045548439025878906, 0.04746437072753906, 0.04938030242919922, 0.051296234130859375, 0.05321216583251953, 0.05512809753417969, 0.057044029235839844, 0.0589599609375]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 6.0, 9.0, 5.0, 7.0, 10.0, 19.0, 15.0, 17.0, 14.0, 27.0, 31.0, 44.0, 45.0, 50.0, 61.0, 68.0, 63.0, 77.0, 61.0, 67.0, 69.0, 32.0, 41.0, 33.0, 35.0, 26.0, 11.0, 12.0, 13.0, 12.0, 9.0, 1.0, 6.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.431341171264648, -4.272763252258301, -4.114185810089111, -3.9556081295013428, -3.797030448913574, -3.6384525299072266, -3.479874849319458, -3.3212971687316895, -3.162719488143921, -3.0041418075561523, -2.845564126968384, -2.6869864463806152, -2.5284085273742676, -2.369831085205078, -2.2112531661987305, -2.052675485610962, -1.8940978050231934, -1.7355201244354248, -1.5769424438476562, -1.4183646440505981, -1.2597869634628296, -1.101209282875061, -0.9426315426826477, -0.7840538024902344, -0.6254761219024658, -0.4668984115123749, -0.30832070112228394, -0.149742990732193, 0.00883471965789795, 0.1674124002456665, 0.32599014043807983, 0.48456788063049316, 0.6431460380554199, 0.8017237186431885, 0.9603014588356018, 1.1188791990280151, 1.2774568796157837, 1.4360345602035522, 1.5946123600006104, 1.753190040588379, 1.9117677211761475, 2.070345401763916, 2.2289230823516846, 2.387500762939453, 2.546078681945801, 2.7046561241149902, 2.863234043121338, 3.0218117237091064, 3.180389404296875, 3.3389670848846436, 3.497544765472412, 3.6561224460601807, 3.814700126647949, 3.973278045654297, 4.131855487823486, 4.290433406829834, 4.449010848999023, 4.607588768005371, 4.7661662101745605, 4.924744129180908, 5.083321571350098, 5.241899490356445, 5.400476932525635, 5.559054851531982, 5.71763277053833]}, "gradients/decoder.bert.encoder.layer.15.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 5.0, 10.0, 10.0, 12.0, 25.0, 23.0, 16.0, 14.0, 33.0, 44.0, 34.0, 44.0, 35.0, 47.0, 50.0, 47.0, 47.0, 38.0, 46.0, 47.0, 52.0, 41.0, 29.0, 32.0, 33.0, 30.0, 23.0, 18.0, 28.0, 18.0, 14.0, 10.0, 5.0, 5.0, 8.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.104467391967773, -3.9746875762939453, -3.844907760620117, -3.715127944946289, -3.585348129272461, -3.455568313598633, -3.3257882595062256, -3.1960084438323975, -3.0662286281585693, -2.936448812484741, -2.806668996810913, -2.676889181137085, -2.5471091270446777, -2.4173293113708496, -2.2875494956970215, -2.1577696800231934, -2.0279898643493652, -1.898210048675537, -1.768430233001709, -1.6386502981185913, -1.5088704824447632, -1.379090666770935, -1.2493107318878174, -1.1195309162139893, -0.9897511005401611, -0.859971284866333, -0.7301914095878601, -0.6004115343093872, -0.4706317186355591, -0.34085190296173096, -0.21107202768325806, -0.08129215240478516, 0.048487186431884766, 0.17826703190803528, 0.3080468773841858, 0.4378267228603363, 0.5676065683364868, 0.6973863840103149, 0.8271662592887878, 0.9569461345672607, 1.0867259502410889, 1.216505765914917, 1.3462855815887451, 1.4760655164718628, 1.605845332145691, 1.735625147819519, 1.8654050827026367, 1.9951848983764648, 2.124964714050293, 2.254744529724121, 2.384524345397949, 2.5143041610717773, 2.6440839767456055, 2.7738637924194336, 2.903643846511841, 3.033423662185669, 3.163203477859497, 3.292983293533325, 3.4227631092071533, 3.5525429248809814, 3.6823229789733887, 3.812102794647217, 3.941882610321045, 4.071662425994873, 4.201442241668701]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 15.0, 13.0, 27.0, 39.0, 48.0, 111.0, 169.0, 321.0, 594.0, 1062.0, 2006.0, 3840.0, 7515.0, 14831.0, 29882.0, 58313.0, 106094.0, 166314.0, 203366.0, 183045.0, 124605.0, 71340.0, 36758.0, 18746.0, 9374.0, 4769.0, 2430.0, 1275.0, 703.0, 424.0, 224.0, 125.0, 59.0, 45.0, 25.0, 15.0, 9.0, 9.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3359375, -4.198974609375, -4.06201171875, -3.925048828125, -3.7880859375, -3.651123046875, -3.51416015625, -3.377197265625, -3.240234375, -3.103271484375, -2.96630859375, -2.829345703125, -2.6923828125, -2.555419921875, -2.41845703125, -2.281494140625, -2.14453125, -2.007568359375, -1.87060546875, -1.733642578125, -1.5966796875, -1.459716796875, -1.32275390625, -1.185791015625, -1.048828125, -0.911865234375, -0.77490234375, -0.637939453125, -0.5009765625, -0.364013671875, -0.22705078125, -0.090087890625, 0.046875, 0.183837890625, 0.32080078125, 0.457763671875, 0.5947265625, 0.731689453125, 0.86865234375, 1.005615234375, 1.142578125, 1.279541015625, 1.41650390625, 1.553466796875, 1.6904296875, 1.827392578125, 1.96435546875, 2.101318359375, 2.23828125, 2.375244140625, 2.51220703125, 2.649169921875, 2.7861328125, 2.923095703125, 3.06005859375, 3.197021484375, 3.333984375, 3.470947265625, 3.60791015625, 3.744873046875, 3.8818359375, 4.018798828125, 4.15576171875, 4.292724609375, 4.4296875]}, "gradients/decoder.bert.encoder.layer.15.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 13.0, 13.0, 14.0, 20.0, 16.0, 16.0, 29.0, 31.0, 25.0, 29.0, 44.0, 38.0, 37.0, 37.0, 40.0, 54.0, 40.0, 48.0, 45.0, 48.0, 40.0, 45.0, 39.0, 43.0, 32.0, 26.0, 15.0, 17.0, 7.0, 18.0, 11.0, 14.0, 8.0, 5.0, 4.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.9765625, -3.84832763671875, -3.7200927734375, -3.59185791015625, -3.463623046875, -3.33538818359375, -3.2071533203125, -3.07891845703125, -2.95068359375, -2.82244873046875, -2.6942138671875, -2.56597900390625, -2.437744140625, -2.30950927734375, -2.1812744140625, -2.05303955078125, -1.9248046875, -1.79656982421875, -1.6683349609375, -1.54010009765625, -1.411865234375, -1.28363037109375, -1.1553955078125, -1.02716064453125, -0.89892578125, -0.77069091796875, -0.6424560546875, -0.51422119140625, -0.385986328125, -0.25775146484375, -0.1295166015625, -0.00128173828125, 0.126953125, 0.25518798828125, 0.3834228515625, 0.51165771484375, 0.639892578125, 0.76812744140625, 0.8963623046875, 1.02459716796875, 1.15283203125, 1.28106689453125, 1.4093017578125, 1.53753662109375, 1.665771484375, 1.79400634765625, 1.9222412109375, 2.05047607421875, 2.1787109375, 2.30694580078125, 2.4351806640625, 2.56341552734375, 2.691650390625, 2.81988525390625, 2.9481201171875, 3.07635498046875, 3.20458984375, 3.33282470703125, 3.4610595703125, 3.58929443359375, 3.717529296875, 3.84576416015625, 3.9739990234375, 4.10223388671875, 4.23046875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 14.0, 4.0, 13.0, 15.0, 25.0, 42.0, 60.0, 89.0, 139.0, 278.0, 424.0, 735.0, 1293.0, 2369.0, 4316.0, 7919.0, 14908.0, 27964.0, 50975.0, 88945.0, 141476.0, 184797.0, 184115.0, 139950.0, 88171.0, 50343.0, 27217.0, 14465.0, 7866.0, 4239.0, 2291.0, 1294.0, 754.0, 377.0, 232.0, 162.0, 100.0, 59.0, 46.0, 32.0, 17.0, 7.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-4.3125, -4.18560791015625, -4.0587158203125, -3.93182373046875, -3.804931640625, -3.67803955078125, -3.5511474609375, -3.42425537109375, -3.29736328125, -3.17047119140625, -3.0435791015625, -2.91668701171875, -2.789794921875, -2.66290283203125, -2.5360107421875, -2.40911865234375, -2.2822265625, -2.15533447265625, -2.0284423828125, -1.90155029296875, -1.774658203125, -1.64776611328125, -1.5208740234375, -1.39398193359375, -1.26708984375, -1.14019775390625, -1.0133056640625, -0.88641357421875, -0.759521484375, -0.63262939453125, -0.5057373046875, -0.37884521484375, -0.251953125, -0.12506103515625, 0.0018310546875, 0.12872314453125, 0.255615234375, 0.38250732421875, 0.5093994140625, 0.63629150390625, 0.76318359375, 0.89007568359375, 1.0169677734375, 1.14385986328125, 1.270751953125, 1.39764404296875, 1.5245361328125, 1.65142822265625, 1.7783203125, 1.90521240234375, 2.0321044921875, 2.15899658203125, 2.285888671875, 2.41278076171875, 2.5396728515625, 2.66656494140625, 2.79345703125, 2.92034912109375, 3.0472412109375, 3.17413330078125, 3.301025390625, 3.42791748046875, 3.5548095703125, 3.68170166015625, 3.80859375]}, "gradients/decoder.bert.encoder.layer.15.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 11.0, 12.0, 16.0, 13.0, 17.0, 19.0, 29.0, 24.0, 30.0, 32.0, 33.0, 41.0, 33.0, 48.0, 55.0, 56.0, 44.0, 40.0, 43.0, 42.0, 35.0, 31.0, 28.0, 35.0, 25.0, 31.0, 27.0, 22.0, 21.0, 6.0, 21.0, 7.0, 10.0, 8.0, 4.0, 8.0, 4.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.1575927734375, -2.080810546875, -2.0040283203125, -1.92724609375, -1.8504638671875, -1.773681640625, -1.6968994140625, -1.6201171875, -1.5433349609375, -1.466552734375, -1.3897705078125, -1.31298828125, -1.2362060546875, -1.159423828125, -1.0826416015625, -1.005859375, -0.9290771484375, -0.852294921875, -0.7755126953125, -0.69873046875, -0.6219482421875, -0.545166015625, -0.4683837890625, -0.3916015625, -0.3148193359375, -0.238037109375, -0.1612548828125, -0.08447265625, -0.0076904296875, 0.069091796875, 0.1458740234375, 0.22265625, 0.2994384765625, 0.376220703125, 0.4530029296875, 0.52978515625, 0.6065673828125, 0.683349609375, 0.7601318359375, 0.8369140625, 0.9136962890625, 0.990478515625, 1.0672607421875, 1.14404296875, 1.2208251953125, 1.297607421875, 1.3743896484375, 1.451171875, 1.5279541015625, 1.604736328125, 1.6815185546875, 1.75830078125, 1.8350830078125, 1.911865234375, 1.9886474609375, 2.0654296875, 2.1422119140625, 2.218994140625, 2.2957763671875, 2.37255859375, 2.4493408203125, 2.526123046875, 2.6029052734375, 2.6796875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 6.0, 10.0, 19.0, 18.0, 40.0, 44.0, 74.0, 109.0, 134.0, 202.0, 323.0, 469.0, 731.0, 1123.0, 1733.0, 2723.0, 4219.0, 6601.0, 10396.0, 16551.0, 26063.0, 40742.0, 62680.0, 90710.0, 121396.0, 143818.0, 141938.0, 119207.0, 88102.0, 59615.0, 39626.0, 24963.0, 16318.0, 10092.0, 6386.0, 4036.0, 2600.0, 1605.0, 1075.0, 688.0, 428.0, 300.0, 201.0, 137.0, 89.0, 64.0, 62.0, 28.0, 21.0, 8.0, 12.0, 4.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.421875, -1.37738037109375, -1.3328857421875, -1.28839111328125, -1.243896484375, -1.19940185546875, -1.1549072265625, -1.11041259765625, -1.06591796875, -1.02142333984375, -0.9769287109375, -0.93243408203125, -0.887939453125, -0.84344482421875, -0.7989501953125, -0.75445556640625, -0.7099609375, -0.66546630859375, -0.6209716796875, -0.57647705078125, -0.531982421875, -0.48748779296875, -0.4429931640625, -0.39849853515625, -0.35400390625, -0.30950927734375, -0.2650146484375, -0.22052001953125, -0.176025390625, -0.13153076171875, -0.0870361328125, -0.04254150390625, 0.001953125, 0.04644775390625, 0.0909423828125, 0.13543701171875, 0.179931640625, 0.22442626953125, 0.2689208984375, 0.31341552734375, 0.35791015625, 0.40240478515625, 0.4468994140625, 0.49139404296875, 0.535888671875, 0.58038330078125, 0.6248779296875, 0.66937255859375, 0.7138671875, 0.75836181640625, 0.8028564453125, 0.84735107421875, 0.891845703125, 0.93634033203125, 0.9808349609375, 1.02532958984375, 1.06982421875, 1.11431884765625, 1.1588134765625, 1.20330810546875, 1.247802734375, 1.29229736328125, 1.3367919921875, 1.38128662109375, 1.42578125]}, "gradients/decoder.bert.encoder.layer.15.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 10.0, 4.0, 8.0, 8.0, 7.0, 10.0, 14.0, 22.0, 20.0, 23.0, 33.0, 39.0, 47.0, 42.0, 57.0, 71.0, 52.0, 61.0, 60.0, 56.0, 60.0, 54.0, 36.0, 36.0, 25.0, 32.0, 22.0, 17.0, 16.0, 15.0, 9.0, 6.0, 2.0, 7.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001773834228515625, -0.00017171725630760193, -0.00016605108976364136, -0.00016038492321968079, -0.00015471875667572021, -0.00014905259013175964, -0.00014338642358779907, -0.0001377202570438385, -0.00013205409049987793, -0.00012638792395591736, -0.00012072175741195679, -0.00011505559086799622, -0.00010938942432403564, -0.00010372325778007507, -9.80570912361145e-05, -9.239092469215393e-05, -8.672475814819336e-05, -8.105859160423279e-05, -7.539242506027222e-05, -6.972625851631165e-05, -6.406009197235107e-05, -5.83939254283905e-05, -5.272775888442993e-05, -4.706159234046936e-05, -4.139542579650879e-05, -3.572925925254822e-05, -3.0063092708587646e-05, -2.4396926164627075e-05, -1.8730759620666504e-05, -1.3064593076705933e-05, -7.398426532745361e-06, -1.73225998878479e-06, 3.933906555175781e-06, 9.600073099136353e-06, 1.5266239643096924e-05, 2.0932406187057495e-05, 2.6598572731018066e-05, 3.226473927497864e-05, 3.793090581893921e-05, 4.359707236289978e-05, 4.926323890686035e-05, 5.492940545082092e-05, 6.0595571994781494e-05, 6.626173853874207e-05, 7.192790508270264e-05, 7.759407162666321e-05, 8.326023817062378e-05, 8.892640471458435e-05, 9.459257125854492e-05, 0.00010025873780250549, 0.00010592490434646606, 0.00011159107089042664, 0.00011725723743438721, 0.00012292340397834778, 0.00012858957052230835, 0.00013425573706626892, 0.0001399219036102295, 0.00014558807015419006, 0.00015125423669815063, 0.0001569204032421112, 0.00016258656978607178, 0.00016825273633003235, 0.00017391890287399292, 0.0001795850694179535, 0.00018525123596191406]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 23.0, 26.0, 28.0, 57.0, 82.0, 132.0, 204.0, 296.0, 497.0, 764.0, 1243.0, 1963.0, 3149.0, 5061.0, 8195.0, 13557.0, 22240.0, 36454.0, 57793.0, 88343.0, 123760.0, 150267.0, 152716.0, 128470.0, 92292.0, 61159.0, 38349.0, 23870.0, 14374.0, 8817.0, 5347.0, 3349.0, 2027.0, 1337.0, 787.0, 528.0, 325.0, 220.0, 141.0, 100.0, 64.0, 52.0, 23.0, 17.0, 14.0, 9.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.5341796875, -1.4877777099609375, -1.441375732421875, -1.3949737548828125, -1.34857177734375, -1.3021697998046875, -1.255767822265625, -1.2093658447265625, -1.1629638671875, -1.1165618896484375, -1.070159912109375, -1.0237579345703125, -0.97735595703125, -0.9309539794921875, -0.884552001953125, -0.8381500244140625, -0.791748046875, -0.7453460693359375, -0.698944091796875, -0.6525421142578125, -0.60614013671875, -0.5597381591796875, -0.513336181640625, -0.4669342041015625, -0.4205322265625, -0.3741302490234375, -0.327728271484375, -0.2813262939453125, -0.23492431640625, -0.1885223388671875, -0.142120361328125, -0.0957183837890625, -0.04931640625, -0.0029144287109375, 0.043487548828125, 0.0898895263671875, 0.13629150390625, 0.1826934814453125, 0.229095458984375, 0.2754974365234375, 0.3218994140625, 0.3683013916015625, 0.414703369140625, 0.4611053466796875, 0.50750732421875, 0.5539093017578125, 0.600311279296875, 0.6467132568359375, 0.693115234375, 0.7395172119140625, 0.785919189453125, 0.8323211669921875, 0.87872314453125, 0.9251251220703125, 0.971527099609375, 1.0179290771484375, 1.0643310546875, 1.1107330322265625, 1.157135009765625, 1.2035369873046875, 1.24993896484375, 1.2963409423828125, 1.342742919921875, 1.3891448974609375, 1.435546875]}, "gradients/decoder.bert.encoder.layer.15.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 8.0, 4.0, 10.0, 7.0, 8.0, 21.0, 12.0, 20.0, 28.0, 29.0, 36.0, 38.0, 49.0, 50.0, 49.0, 53.0, 58.0, 49.0, 45.0, 45.0, 51.0, 52.0, 49.0, 32.0, 35.0, 21.0, 22.0, 15.0, 24.0, 6.0, 15.0, 7.0, 13.0, 9.0, 4.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.57568359375, -0.5580520629882812, -0.5404205322265625, -0.5227890014648438, -0.505157470703125, -0.48752593994140625, -0.4698944091796875, -0.45226287841796875, -0.43463134765625, -0.41699981689453125, -0.3993682861328125, -0.38173675537109375, -0.364105224609375, -0.34647369384765625, -0.3288421630859375, -0.31121063232421875, -0.2935791015625, -0.27594757080078125, -0.2583160400390625, -0.24068450927734375, -0.223052978515625, -0.20542144775390625, -0.1877899169921875, -0.17015838623046875, -0.15252685546875, -0.13489532470703125, -0.1172637939453125, -0.09963226318359375, -0.082000732421875, -0.06436920166015625, -0.0467376708984375, -0.02910614013671875, -0.011474609375, 0.00615692138671875, 0.0237884521484375, 0.04141998291015625, 0.059051513671875, 0.07668304443359375, 0.0943145751953125, 0.11194610595703125, 0.12957763671875, 0.14720916748046875, 0.1648406982421875, 0.18247222900390625, 0.200103759765625, 0.21773529052734375, 0.2353668212890625, 0.25299835205078125, 0.2706298828125, 0.28826141357421875, 0.3058929443359375, 0.32352447509765625, 0.341156005859375, 0.35878753662109375, 0.3764190673828125, 0.39405059814453125, 0.41168212890625, 0.42931365966796875, 0.4469451904296875, 0.46457672119140625, 0.482208251953125, 0.49983978271484375, 0.5174713134765625, 0.5351028442382812, 0.552734375]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 3.0, 6.0, 6.0, 6.0, 7.0, 17.0, 22.0, 27.0, 27.0, 43.0, 47.0, 53.0, 56.0, 63.0, 54.0, 80.0, 68.0, 74.0, 62.0, 49.0, 36.0, 44.0, 35.0, 29.0, 13.0, 13.0, 22.0, 8.0, 7.0, 3.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.682610988616943, -4.518340110778809, -4.354068756103516, -4.189797878265381, -4.025526523590088, -3.861255407333374, -3.69698429107666, -3.5327134132385254, -3.3684420585632324, -3.2041709423065186, -3.0398998260498047, -2.875628709793091, -2.711357593536377, -2.547086477279663, -2.382815361022949, -2.2185444831848145, -2.0542733669281006, -1.8900022506713867, -1.7257311344146729, -1.561460018157959, -1.3971889019012451, -1.2329177856445312, -1.068646788597107, -0.9043756723403931, -0.7401045560836792, -0.5758334398269653, -0.41156235337257385, -0.24729126691818237, -0.0830201506614685, 0.08125096559524536, 0.24552202224731445, 0.4097931385040283, 0.5740642547607422, 0.738335371017456, 0.9026064872741699, 1.0668776035308838, 1.2311487197875977, 1.3954198360443115, 1.5596908330917358, 1.7239619493484497, 1.8882330656051636, 2.052504062652588, 2.2167751789093018, 2.3810462951660156, 2.5453174114227295, 2.7095885276794434, 2.8738596439361572, 3.038130760192871, 3.202401876449585, 3.366672992706299, 3.5309441089630127, 3.6952152252197266, 3.8594863414764404, 4.023757457733154, 4.188028335571289, 4.352299690246582, 4.516570568084717, 4.680841445922852, 4.8451128005981445, 5.009383678436279, 5.173655033111572, 5.337925910949707, 5.502197265625, 5.666468143463135, 5.830739498138428]}, "gradients/decoder.bert.encoder.layer.14.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 7.0, 10.0, 17.0, 16.0, 19.0, 25.0, 28.0, 31.0, 35.0, 37.0, 50.0, 46.0, 45.0, 55.0, 48.0, 38.0, 45.0, 58.0, 48.0, 45.0, 54.0, 37.0, 32.0, 31.0, 24.0, 28.0, 26.0, 17.0, 6.0, 7.0, 10.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.908332824707031, -4.764987945556641, -4.621642589569092, -4.478297233581543, -4.334952354431152, -4.191607475280762, -4.048262119293213, -3.904917001724243, -3.7615718841552734, -3.6182267665863037, -3.474881649017334, -3.3315365314483643, -3.1881914138793945, -3.044846296310425, -2.901501178741455, -2.7581560611724854, -2.6148109436035156, -2.471465826034546, -2.328120708465576, -2.1847755908966064, -2.0414304733276367, -1.898085355758667, -1.7547402381896973, -1.6113951206207275, -1.4680500030517578, -1.324704885482788, -1.1813597679138184, -1.0380146503448486, -0.8946695327758789, -0.7513244152069092, -0.6079792976379395, -0.4646341800689697, -0.3212890625, -0.17794394493103027, -0.03459882736206055, 0.10874629020690918, 0.2520914077758789, 0.39543652534484863, 0.5387816429138184, 0.6821267604827881, 0.8254718780517578, 0.9688169956207275, 1.1121621131896973, 1.255507230758667, 1.3988523483276367, 1.5421974658966064, 1.6855425834655762, 1.828887701034546, 1.9722328186035156, 2.1155779361724854, 2.258923053741455, 2.402268171310425, 2.5456132888793945, 2.6889584064483643, 2.832303524017334, 2.9756486415863037, 3.1189937591552734, 3.262338876724243, 3.405683994293213, 3.5490291118621826, 3.6923742294311523, 3.835719347000122, 3.979064464569092, 4.122409820556641, 4.265754699707031]}, "gradients/decoder.bert.encoder.layer.14.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 8.0, 13.0, 13.0, 10.0, 23.0, 32.0, 41.0, 54.0, 84.0, 109.0, 145.0, 271.0, 376.0, 600.0, 926.0, 1446.0, 2499.0, 4088.0, 6929.0, 12124.0, 22281.0, 42288.0, 85819.0, 187338.0, 433477.0, 911232.0, 1151379.0, 726460.0, 319728.0, 140733.0, 66534.0, 34056.0, 18281.0, 10062.0, 5916.0, 3422.0, 2027.0, 1276.0, 834.0, 506.0, 298.0, 179.0, 134.0, 85.0, 57.0, 37.0, 20.0, 23.0, 9.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.58984375, -4.45208740234375, -4.3143310546875, -4.17657470703125, -4.038818359375, -3.90106201171875, -3.7633056640625, -3.62554931640625, -3.48779296875, -3.35003662109375, -3.2122802734375, -3.07452392578125, -2.936767578125, -2.79901123046875, -2.6612548828125, -2.52349853515625, -2.3857421875, -2.24798583984375, -2.1102294921875, -1.97247314453125, -1.834716796875, -1.69696044921875, -1.5592041015625, -1.42144775390625, -1.28369140625, -1.14593505859375, -1.0081787109375, -0.87042236328125, -0.732666015625, -0.59490966796875, -0.4571533203125, -0.31939697265625, -0.181640625, -0.04388427734375, 0.0938720703125, 0.23162841796875, 0.369384765625, 0.50714111328125, 0.6448974609375, 0.78265380859375, 0.92041015625, 1.05816650390625, 1.1959228515625, 1.33367919921875, 1.471435546875, 1.60919189453125, 1.7469482421875, 1.88470458984375, 2.0224609375, 2.16021728515625, 2.2979736328125, 2.43572998046875, 2.573486328125, 2.71124267578125, 2.8489990234375, 2.98675537109375, 3.12451171875, 3.26226806640625, 3.4000244140625, 3.53778076171875, 3.675537109375, 3.81329345703125, 3.9510498046875, 4.08880615234375, 4.2265625]}, "gradients/decoder.bert.encoder.layer.14.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 12.0, 8.0, 8.0, 11.0, 11.0, 20.0, 22.0, 25.0, 25.0, 30.0, 32.0, 31.0, 45.0, 50.0, 48.0, 48.0, 53.0, 40.0, 53.0, 48.0, 47.0, 38.0, 36.0, 41.0, 35.0, 34.0, 29.0, 28.0, 21.0, 22.0, 16.0, 8.0, 5.0, 4.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.41796875, -3.3232421875, -3.228515625, -3.1337890625, -3.0390625, -2.9443359375, -2.849609375, -2.7548828125, -2.66015625, -2.5654296875, -2.470703125, -2.3759765625, -2.28125, -2.1865234375, -2.091796875, -1.9970703125, -1.90234375, -1.8076171875, -1.712890625, -1.6181640625, -1.5234375, -1.4287109375, -1.333984375, -1.2392578125, -1.14453125, -1.0498046875, -0.955078125, -0.8603515625, -0.765625, -0.6708984375, -0.576171875, -0.4814453125, -0.38671875, -0.2919921875, -0.197265625, -0.1025390625, -0.0078125, 0.0869140625, 0.181640625, 0.2763671875, 0.37109375, 0.4658203125, 0.560546875, 0.6552734375, 0.75, 0.8447265625, 0.939453125, 1.0341796875, 1.12890625, 1.2236328125, 1.318359375, 1.4130859375, 1.5078125, 1.6025390625, 1.697265625, 1.7919921875, 1.88671875, 1.9814453125, 2.076171875, 2.1708984375, 2.265625, 2.3603515625, 2.455078125, 2.5498046875, 2.64453125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 13.0, 24.0, 41.0, 68.0, 128.0, 177.0, 226.0, 429.0, 670.0, 1192.0, 1990.0, 3261.0, 6086.0, 11142.0, 21417.0, 42274.0, 88009.0, 193106.0, 434460.0, 916579.0, 1175838.0, 703373.0, 316401.0, 142712.0, 66227.0, 32104.0, 16350.0, 8527.0, 4900.0, 2674.0, 1596.0, 871.0, 497.0, 331.0, 204.0, 141.0, 91.0, 59.0, 28.0, 29.0, 8.0, 7.0, 9.0, 2.0, 0.0, 5.0, 0.0, 2.0, 1.0], "bins": [-5.6328125, -5.4732666015625, -5.313720703125, -5.1541748046875, -4.99462890625, -4.8350830078125, -4.675537109375, -4.5159912109375, -4.3564453125, -4.1968994140625, -4.037353515625, -3.8778076171875, -3.71826171875, -3.5587158203125, -3.399169921875, -3.2396240234375, -3.080078125, -2.9205322265625, -2.760986328125, -2.6014404296875, -2.44189453125, -2.2823486328125, -2.122802734375, -1.9632568359375, -1.8037109375, -1.6441650390625, -1.484619140625, -1.3250732421875, -1.16552734375, -1.0059814453125, -0.846435546875, -0.6868896484375, -0.52734375, -0.3677978515625, -0.208251953125, -0.0487060546875, 0.11083984375, 0.2703857421875, 0.429931640625, 0.5894775390625, 0.7490234375, 0.9085693359375, 1.068115234375, 1.2276611328125, 1.38720703125, 1.5467529296875, 1.706298828125, 1.8658447265625, 2.025390625, 2.1849365234375, 2.344482421875, 2.5040283203125, 2.66357421875, 2.8231201171875, 2.982666015625, 3.1422119140625, 3.3017578125, 3.4613037109375, 3.620849609375, 3.7803955078125, 3.93994140625, 4.0994873046875, 4.259033203125, 4.4185791015625, 4.578125]}, "gradients/decoder.bert.encoder.layer.14.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 18.0, 13.0, 12.0, 25.0, 24.0, 49.0, 49.0, 61.0, 72.0, 96.0, 145.0, 142.0, 165.0, 209.0, 231.0, 254.0, 261.0, 267.0, 253.0, 295.0, 230.0, 258.0, 180.0, 146.0, 111.0, 91.0, 89.0, 58.0, 67.0, 35.0, 36.0, 19.0, 31.0, 17.0, 9.0, 10.0, 7.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.328125, -1.2847747802734375, -1.241424560546875, -1.1980743408203125, -1.15472412109375, -1.1113739013671875, -1.068023681640625, -1.0246734619140625, -0.9813232421875, -0.9379730224609375, -0.894622802734375, -0.8512725830078125, -0.80792236328125, -0.7645721435546875, -0.721221923828125, -0.6778717041015625, -0.634521484375, -0.5911712646484375, -0.547821044921875, -0.5044708251953125, -0.46112060546875, -0.4177703857421875, -0.374420166015625, -0.3310699462890625, -0.2877197265625, -0.2443695068359375, -0.201019287109375, -0.1576690673828125, -0.11431884765625, -0.0709686279296875, -0.027618408203125, 0.0157318115234375, 0.05908203125, 0.1024322509765625, 0.145782470703125, 0.1891326904296875, 0.23248291015625, 0.2758331298828125, 0.319183349609375, 0.3625335693359375, 0.4058837890625, 0.4492340087890625, 0.492584228515625, 0.5359344482421875, 0.57928466796875, 0.6226348876953125, 0.665985107421875, 0.7093353271484375, 0.752685546875, 0.7960357666015625, 0.839385986328125, 0.8827362060546875, 0.92608642578125, 0.9694366455078125, 1.012786865234375, 1.0561370849609375, 1.0994873046875, 1.1428375244140625, 1.186187744140625, 1.2295379638671875, 1.27288818359375, 1.3162384033203125, 1.359588623046875, 1.4029388427734375, 1.4462890625]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 4.0, 1.0, 6.0, 9.0, 5.0, 7.0, 12.0, 16.0, 20.0, 42.0, 42.0, 56.0, 43.0, 67.0, 65.0, 72.0, 78.0, 74.0, 63.0, 69.0, 41.0, 43.0, 39.0, 26.0, 27.0, 15.0, 12.0, 11.0, 9.0, 8.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.32554817199707, -4.1618146896362305, -3.9980812072753906, -3.83434796333313, -3.67061448097229, -3.50688099861145, -3.3431477546691895, -3.1794142723083496, -3.0156807899475098, -2.85194730758667, -2.68821382522583, -2.5244805812835693, -2.3607470989227295, -2.1970136165618896, -2.033280372619629, -1.869546890258789, -1.7058134078979492, -1.5420799255371094, -1.378346562385559, -1.2146131992340088, -1.050879716873169, -0.8871462941169739, -0.7234128713607788, -0.5596795082092285, -0.39594602584838867, -0.2322126030921936, -0.06847918033599854, 0.09525424242019653, 0.2589876651763916, 0.42272108793258667, 0.5864545106887817, 0.750187873840332, 0.9139208793640137, 1.0776543617248535, 1.2413877248764038, 1.405121088027954, 1.568854570388794, 1.7325880527496338, 1.896321415901184, 2.0600547790527344, 2.223788261413574, 2.387521743774414, 2.551255226135254, 2.7149884700775146, 2.8787219524383545, 3.0424554347991943, 3.206188678741455, 3.369922161102295, 3.5336556434631348, 3.6973891258239746, 3.8611226081848145, 4.024856090545654, 4.188589096069336, 4.352322578430176, 4.516056060791016, 4.6797895431518555, 4.843523025512695, 5.007256507873535, 5.170989990234375, 5.334723472595215, 5.498456954956055, 5.662189960479736, 5.825923442840576, 5.989656925201416, 6.153390407562256]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 6.0, 3.0, 4.0, 6.0, 10.0, 10.0, 8.0, 15.0, 21.0, 12.0, 26.0, 27.0, 30.0, 25.0, 29.0, 30.0, 34.0, 40.0, 61.0, 60.0, 48.0, 51.0, 46.0, 46.0, 42.0, 50.0, 20.0, 33.0, 32.0, 34.0, 28.0, 23.0, 24.0, 18.0, 9.0, 19.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.472722291946411, -3.3598921298980713, -3.2470619678497314, -3.1342320442199707, -3.021401882171631, -2.908571720123291, -2.795741558074951, -2.6829113960266113, -2.5700814723968506, -2.4572513103485107, -2.344421148300171, -2.23159122467041, -2.1187610626220703, -2.0059309005737305, -1.8931007385253906, -1.7802706956863403, -1.6674405336380005, -1.5546103715896606, -1.4417803287506104, -1.3289501667022705, -1.2161201238632202, -1.1032899618148804, -0.9904598593711853, -0.8776297569274902, -0.7647996544837952, -0.6519695520401001, -0.539139449596405, -0.4263093173503876, -0.3134792149066925, -0.20064908266067505, -0.08781898021697998, 0.025011122226715088, 0.13784122467041016, 0.2506713271141052, 0.3635014295578003, 0.47633156180381775, 0.5891616344451904, 0.7019917964935303, 0.8148218989372253, 0.9276520013809204, 1.0404820442199707, 1.1533122062683105, 1.2661422491073608, 1.3789724111557007, 1.491802453994751, 1.6046326160430908, 1.7174627780914307, 1.830292820930481, 1.9431229829788208, 2.055953025817871, 2.168783187866211, 2.281613349914551, 2.3944435119628906, 2.5072736740112305, 2.620103597640991, 2.732933759689331, 2.845763921737671, 2.9585940837860107, 3.0714242458343506, 3.1842541694641113, 3.297084331512451, 3.409914493560791, 3.522744655609131, 3.6355748176574707, 3.7484047412872314]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 12.0, 16.0, 27.0, 32.0, 58.0, 73.0, 125.0, 185.0, 303.0, 435.0, 664.0, 1051.0, 1614.0, 2629.0, 4271.0, 7306.0, 12308.0, 20714.0, 37333.0, 69182.0, 128845.0, 217259.0, 227832.0, 142693.0, 76358.0, 40850.0, 22574.0, 13255.0, 7856.0, 4757.0, 2981.0, 1767.0, 1093.0, 714.0, 503.0, 276.0, 178.0, 137.0, 104.0, 72.0, 30.0, 31.0, 12.0, 13.0, 12.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.56591796875, -0.5497856140136719, -0.5336532592773438, -0.5175209045410156, -0.5013885498046875, -0.4852561950683594, -0.46912384033203125, -0.4529914855957031, -0.436859130859375, -0.4207267761230469, -0.40459442138671875, -0.3884620666503906, -0.3723297119140625, -0.3561973571777344, -0.34006500244140625, -0.3239326477050781, -0.30780029296875, -0.2916679382324219, -0.27553558349609375, -0.2594032287597656, -0.2432708740234375, -0.22713851928710938, -0.21100616455078125, -0.19487380981445312, -0.178741455078125, -0.16260910034179688, -0.14647674560546875, -0.13034439086914062, -0.1142120361328125, -0.09807968139648438, -0.08194732666015625, -0.06581497192382812, -0.0496826171875, -0.033550262451171875, -0.01741790771484375, -0.001285552978515625, 0.0148468017578125, 0.030979156494140625, 0.04711151123046875, 0.06324386596679688, 0.079376220703125, 0.09550857543945312, 0.11164093017578125, 0.12777328491210938, 0.1439056396484375, 0.16003799438476562, 0.17617034912109375, 0.19230270385742188, 0.20843505859375, 0.22456741333007812, 0.24069976806640625, 0.2568321228027344, 0.2729644775390625, 0.2890968322753906, 0.30522918701171875, 0.3213615417480469, 0.337493896484375, 0.3536262512207031, 0.36975860595703125, 0.3858909606933594, 0.4020233154296875, 0.4181556701660156, 0.43428802490234375, 0.4504203796386719, 0.466552734375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 2.0, 3.0, 9.0, 6.0, 2.0, 9.0, 11.0, 14.0, 18.0, 21.0, 26.0, 29.0, 27.0, 29.0, 40.0, 36.0, 55.0, 35.0, 48.0, 60.0, 46.0, 53.0, 39.0, 49.0, 44.0, 46.0, 24.0, 32.0, 27.0, 28.0, 22.0, 31.0, 23.0, 8.0, 14.0, 12.0, 11.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.2578125, -4.1351318359375, -4.012451171875, -3.8897705078125, -3.76708984375, -3.6444091796875, -3.521728515625, -3.3990478515625, -3.2763671875, -3.1536865234375, -3.031005859375, -2.9083251953125, -2.78564453125, -2.6629638671875, -2.540283203125, -2.4176025390625, -2.294921875, -2.1722412109375, -2.049560546875, -1.9268798828125, -1.80419921875, -1.6815185546875, -1.558837890625, -1.4361572265625, -1.3134765625, -1.1907958984375, -1.068115234375, -0.9454345703125, -0.82275390625, -0.7000732421875, -0.577392578125, -0.4547119140625, -0.33203125, -0.2093505859375, -0.086669921875, 0.0360107421875, 0.15869140625, 0.2813720703125, 0.404052734375, 0.5267333984375, 0.6494140625, 0.7720947265625, 0.894775390625, 1.0174560546875, 1.14013671875, 1.2628173828125, 1.385498046875, 1.5081787109375, 1.630859375, 1.7535400390625, 1.876220703125, 1.9989013671875, 2.12158203125, 2.2442626953125, 2.366943359375, 2.4896240234375, 2.6123046875, 2.7349853515625, 2.857666015625, 2.9803466796875, 3.10302734375, 3.2257080078125, 3.348388671875, 3.4710693359375, 3.59375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 13.0, 10.0, 16.0, 20.0, 28.0, 31.0, 57.0, 68.0, 95.0, 133.0, 200.0, 290.0, 458.0, 743.0, 1165.0, 2081.0, 3832.0, 7469.0, 16828.0, 51456.0, 813687.0, 106768.0, 22475.0, 9614.0, 4722.0, 2413.0, 1375.0, 821.0, 558.0, 361.0, 226.0, 154.0, 112.0, 69.0, 53.0, 36.0, 27.0, 18.0, 16.0, 16.0, 10.0, 5.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.166015625, -1.12799072265625, -1.0899658203125, -1.05194091796875, -1.013916015625, -0.97589111328125, -0.9378662109375, -0.89984130859375, -0.86181640625, -0.82379150390625, -0.7857666015625, -0.74774169921875, -0.709716796875, -0.67169189453125, -0.6336669921875, -0.59564208984375, -0.5576171875, -0.51959228515625, -0.4815673828125, -0.44354248046875, -0.405517578125, -0.36749267578125, -0.3294677734375, -0.29144287109375, -0.25341796875, -0.21539306640625, -0.1773681640625, -0.13934326171875, -0.101318359375, -0.06329345703125, -0.0252685546875, 0.01275634765625, 0.05078125, 0.08880615234375, 0.1268310546875, 0.16485595703125, 0.202880859375, 0.24090576171875, 0.2789306640625, 0.31695556640625, 0.35498046875, 0.39300537109375, 0.4310302734375, 0.46905517578125, 0.507080078125, 0.54510498046875, 0.5831298828125, 0.62115478515625, 0.6591796875, 0.69720458984375, 0.7352294921875, 0.77325439453125, 0.811279296875, 0.84930419921875, 0.8873291015625, 0.92535400390625, 0.96337890625, 1.00140380859375, 1.0394287109375, 1.07745361328125, 1.115478515625, 1.15350341796875, 1.1915283203125, 1.22955322265625, 1.267578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 14.0, 14.0, 9.0, 9.0, 20.0, 22.0, 23.0, 29.0, 25.0, 26.0, 30.0, 39.0, 39.0, 52.0, 40.0, 39.0, 37.0, 44.0, 36.0, 34.0, 42.0, 45.0, 41.0, 28.0, 38.0, 31.0, 26.0, 22.0, 22.0, 17.0, 13.0, 11.0, 12.0, 8.0, 13.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1328125, -2.062286376953125, -1.99176025390625, -1.921234130859375, -1.8507080078125, -1.780181884765625, -1.70965576171875, -1.639129638671875, -1.568603515625, -1.498077392578125, -1.42755126953125, -1.357025146484375, -1.2864990234375, -1.215972900390625, -1.14544677734375, -1.074920654296875, -1.00439453125, -0.933868408203125, -0.86334228515625, -0.792816162109375, -0.7222900390625, -0.651763916015625, -0.58123779296875, -0.510711669921875, -0.440185546875, -0.369659423828125, -0.29913330078125, -0.228607177734375, -0.1580810546875, -0.087554931640625, -0.01702880859375, 0.053497314453125, 0.1240234375, 0.194549560546875, 0.26507568359375, 0.335601806640625, 0.4061279296875, 0.476654052734375, 0.54718017578125, 0.617706298828125, 0.688232421875, 0.758758544921875, 0.82928466796875, 0.899810791015625, 0.9703369140625, 1.040863037109375, 1.11138916015625, 1.181915283203125, 1.25244140625, 1.322967529296875, 1.39349365234375, 1.464019775390625, 1.5345458984375, 1.605072021484375, 1.67559814453125, 1.746124267578125, 1.816650390625, 1.887176513671875, 1.95770263671875, 2.028228759765625, 2.0987548828125, 2.169281005859375, 2.23980712890625, 2.310333251953125, 2.380859375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 11.0, 17.0, 14.0, 31.0, 48.0, 73.0, 105.0, 190.0, 312.0, 492.0, 925.0, 1602.0, 3037.0, 5779.0, 11562.0, 26057.0, 426919.0, 520002.0, 26730.0, 11889.0, 5861.0, 3064.0, 1602.0, 922.0, 525.0, 312.0, 186.0, 119.0, 47.0, 48.0, 32.0, 9.0, 9.0, 8.0, 5.0, 3.0, 6.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303466796875, -0.292633056640625, -0.28179931640625, -0.270965576171875, -0.2601318359375, -0.249298095703125, -0.23846435546875, -0.227630615234375, -0.216796875, -0.205963134765625, -0.19512939453125, -0.184295654296875, -0.1734619140625, -0.162628173828125, -0.15179443359375, -0.140960693359375, -0.130126953125, -0.119293212890625, -0.10845947265625, -0.097625732421875, -0.0867919921875, -0.075958251953125, -0.06512451171875, -0.054290771484375, -0.04345703125, -0.032623291015625, -0.02178955078125, -0.010955810546875, -0.0001220703125, 0.010711669921875, 0.02154541015625, 0.032379150390625, 0.043212890625, 0.054046630859375, 0.06488037109375, 0.075714111328125, 0.0865478515625, 0.097381591796875, 0.10821533203125, 0.119049072265625, 0.1298828125, 0.140716552734375, 0.15155029296875, 0.162384033203125, 0.1732177734375, 0.184051513671875, 0.19488525390625, 0.205718994140625, 0.216552734375, 0.227386474609375, 0.23822021484375, 0.249053955078125, 0.2598876953125, 0.270721435546875, 0.28155517578125, 0.292388916015625, 0.30322265625, 0.314056396484375, 0.32489013671875, 0.335723876953125, 0.3465576171875, 0.357391357421875, 0.36822509765625, 0.379058837890625, 0.389892578125]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 7.0, 7.0, 16.0, 18.0, 21.0, 23.0, 25.0, 32.0, 32.0, 40.0, 43.0, 39.0, 48.0, 42.0, 48.0, 41.0, 54.0, 50.0, 47.0, 48.0, 43.0, 32.0, 41.0, 20.0, 28.0, 26.0, 25.0, 15.0, 17.0, 14.0, 12.0, 3.0, 9.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.8034130334854126e-05, -1.7352402210235596e-05, -1.6670674085617065e-05, -1.5988945960998535e-05, -1.5307217836380005e-05, -1.4625489711761475e-05, -1.3943761587142944e-05, -1.3262033462524414e-05, -1.2580305337905884e-05, -1.1898577213287354e-05, -1.1216849088668823e-05, -1.0535120964050293e-05, -9.853392839431763e-06, -9.171664714813232e-06, -8.489936590194702e-06, -7.808208465576172e-06, -7.126480340957642e-06, -6.444752216339111e-06, -5.763024091720581e-06, -5.081295967102051e-06, -4.3995678424835205e-06, -3.7178397178649902e-06, -3.03611159324646e-06, -2.3543834686279297e-06, -1.6726553440093994e-06, -9.909272193908691e-07, -3.0919909477233887e-07, 3.725290298461914e-07, 1.0542571544647217e-06, 1.735985279083252e-06, 2.4177134037017822e-06, 3.0994415283203125e-06, 3.7811696529388428e-06, 4.462897777557373e-06, 5.144625902175903e-06, 5.826354026794434e-06, 6.508082151412964e-06, 7.189810276031494e-06, 7.871538400650024e-06, 8.553266525268555e-06, 9.234994649887085e-06, 9.916722774505615e-06, 1.0598450899124146e-05, 1.1280179023742676e-05, 1.1961907148361206e-05, 1.2643635272979736e-05, 1.3325363397598267e-05, 1.4007091522216797e-05, 1.4688819646835327e-05, 1.5370547771453857e-05, 1.6052275896072388e-05, 1.6734004020690918e-05, 1.7415732145309448e-05, 1.809746026992798e-05, 1.877918839454651e-05, 1.946091651916504e-05, 2.014264464378357e-05, 2.08243727684021e-05, 2.150610089302063e-05, 2.218782901763916e-05, 2.286955714225769e-05, 2.355128526687622e-05, 2.423301339149475e-05, 2.491474151611328e-05]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 14.0, 13.0, 16.0, 16.0, 30.0, 46.0, 63.0, 86.0, 126.0, 187.0, 284.0, 459.0, 686.0, 1148.0, 1816.0, 3154.0, 5509.0, 9919.0, 18442.0, 35376.0, 69101.0, 136310.0, 234514.0, 238400.0, 141564.0, 71480.0, 36382.0, 19151.0, 10332.0, 5655.0, 3147.0, 1873.0, 1176.0, 693.0, 487.0, 287.0, 218.0, 120.0, 81.0, 51.0, 54.0, 19.0, 21.0, 17.0, 6.0, 9.0, 7.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.1175537109375, -0.11376476287841797, -0.10997581481933594, -0.1061868667602539, -0.10239791870117188, -0.09860897064208984, -0.09482002258300781, -0.09103107452392578, -0.08724212646484375, -0.08345317840576172, -0.07966423034667969, -0.07587528228759766, -0.07208633422851562, -0.0682973861694336, -0.06450843811035156, -0.06071949005126953, -0.0569305419921875, -0.05314159393310547, -0.04935264587402344, -0.045563697814941406, -0.041774749755859375, -0.037985801696777344, -0.03419685363769531, -0.03040790557861328, -0.02661895751953125, -0.02283000946044922, -0.019041061401367188, -0.015252113342285156, -0.011463165283203125, -0.007674217224121094, -0.0038852691650390625, -9.632110595703125e-05, 0.003692626953125, 0.007481575012207031, 0.011270523071289062, 0.015059471130371094, 0.018848419189453125, 0.022637367248535156, 0.026426315307617188, 0.03021526336669922, 0.03400421142578125, 0.03779315948486328, 0.04158210754394531, 0.045371055603027344, 0.049160003662109375, 0.052948951721191406, 0.05673789978027344, 0.06052684783935547, 0.0643157958984375, 0.06810474395751953, 0.07189369201660156, 0.0756826400756836, 0.07947158813476562, 0.08326053619384766, 0.08704948425292969, 0.09083843231201172, 0.09462738037109375, 0.09841632843017578, 0.10220527648925781, 0.10599422454833984, 0.10978317260742188, 0.1135721206665039, 0.11736106872558594, 0.12115001678466797, 0.12493896484375]}, "gradients/decoder.bert.encoder.layer.14.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 6.0, 5.0, 14.0, 5.0, 17.0, 14.0, 20.0, 22.0, 22.0, 31.0, 35.0, 42.0, 47.0, 61.0, 67.0, 77.0, 97.0, 75.0, 73.0, 68.0, 44.0, 29.0, 20.0, 23.0, 22.0, 18.0, 8.0, 7.0, 5.0, 8.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.050018310546875, -0.04846668243408203, -0.04691505432128906, -0.045363426208496094, -0.043811798095703125, -0.042260169982910156, -0.04070854187011719, -0.03915691375732422, -0.03760528564453125, -0.03605365753173828, -0.03450202941894531, -0.032950401306152344, -0.031398773193359375, -0.029847145080566406, -0.028295516967773438, -0.02674388885498047, -0.0251922607421875, -0.02364063262939453, -0.022089004516601562, -0.020537376403808594, -0.018985748291015625, -0.017434120178222656, -0.015882492065429688, -0.014330863952636719, -0.01277923583984375, -0.011227607727050781, -0.009675979614257812, -0.008124351501464844, -0.006572723388671875, -0.005021095275878906, -0.0034694671630859375, -0.0019178390502929688, -0.0003662109375, 0.0011854171752929688, 0.0027370452880859375, 0.004288673400878906, 0.005840301513671875, 0.007391929626464844, 0.008943557739257812, 0.010495185852050781, 0.01204681396484375, 0.013598442077636719, 0.015150070190429688, 0.016701698303222656, 0.018253326416015625, 0.019804954528808594, 0.021356582641601562, 0.02290821075439453, 0.0244598388671875, 0.02601146697998047, 0.027563095092773438, 0.029114723205566406, 0.030666351318359375, 0.032217979431152344, 0.03376960754394531, 0.03532123565673828, 0.03687286376953125, 0.03842449188232422, 0.03997611999511719, 0.041527748107910156, 0.043079376220703125, 0.044631004333496094, 0.04618263244628906, 0.04773426055908203, 0.049285888671875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 5.0, 8.0, 12.0, 13.0, 17.0, 29.0, 44.0, 44.0, 55.0, 50.0, 69.0, 78.0, 73.0, 72.0, 73.0, 62.0, 55.0, 43.0, 39.0, 36.0, 22.0, 25.0, 9.0, 13.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.401505470275879, -4.237415313720703, -4.073324680328369, -3.9092342853546143, -3.7451438903808594, -3.5810537338256836, -3.4169633388519287, -3.252872943878174, -3.088782548904419, -2.924692153930664, -2.760601758956909, -2.5965113639831543, -2.4324212074279785, -2.2683305740356445, -2.1042404174804688, -1.9401500225067139, -1.776059627532959, -1.611969232559204, -1.4478788375854492, -1.2837885618209839, -1.119698166847229, -0.9556077718734741, -0.791517436504364, -0.6274271011352539, -0.463336706161499, -0.29924634099006653, -0.13515597581863403, 0.028934389352798462, 0.19302475452423096, 0.35711514949798584, 0.521205484867096, 0.685295820236206, 0.8493862152099609, 1.0134766101837158, 1.1775670051574707, 1.341657280921936, 1.505747675895691, 1.6698380708694458, 1.8339283466339111, 1.998018741607666, 2.162109136581421, 2.326199531555176, 2.4902899265289307, 2.6543803215026855, 2.8184704780578613, 2.9825611114501953, 3.146651268005371, 3.310741662979126, 3.474832057952881, 3.6389224529266357, 3.8030128479003906, 3.9671032428741455, 4.1311936378479, 4.295283794403076, 4.45937442779541, 4.623464584350586, 4.787554740905762, 4.9516448974609375, 5.1157355308532715, 5.279825687408447, 5.443916320800781, 5.608006477355957, 5.772097110748291, 5.936187267303467, 6.100277900695801]}, "gradients/decoder.bert.encoder.layer.14.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 5.0, 7.0, 13.0, 7.0, 16.0, 19.0, 11.0, 23.0, 32.0, 25.0, 25.0, 26.0, 32.0, 33.0, 40.0, 57.0, 59.0, 57.0, 41.0, 52.0, 46.0, 38.0, 54.0, 24.0, 30.0, 31.0, 36.0, 26.0, 27.0, 24.0, 18.0, 11.0, 15.0, 12.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4923160076141357, -3.380154609680176, -3.2679929733276367, -3.1558315753936768, -3.0436699390411377, -2.9315085411071777, -2.8193469047546387, -2.7071855068206787, -2.5950241088867188, -2.482862710952759, -2.3707010746002197, -2.2585396766662598, -2.1463780403137207, -2.0342166423797607, -1.9220551252365112, -1.8098936080932617, -1.6977319717407227, -1.5855704545974731, -1.4734089374542236, -1.3612475395202637, -1.2490859031677246, -1.1369245052337646, -1.0247629880905151, -0.9126014709472656, -0.8004399538040161, -0.6882784366607666, -0.5761169195175171, -0.46395546197891235, -0.35179394483566284, -0.23963242769241333, -0.1274709701538086, -0.015309453010559082, 0.09685230255126953, 0.20901380479335785, 0.32117530703544617, 0.4333367943763733, 0.5454983115196228, 0.6576598286628723, 0.769821286201477, 0.8819828033447266, 0.9941443204879761, 1.1063058376312256, 1.218467354774475, 1.3306288719177246, 1.4427902698516846, 1.5549519062042236, 1.6671133041381836, 1.779274821281433, 1.8914363384246826, 2.0035977363586426, 2.1157593727111816, 2.2279207706451416, 2.3400824069976807, 2.4522438049316406, 2.5644054412841797, 2.6765668392181396, 2.7887282371520996, 2.9008896350860596, 3.0130512714385986, 3.1252126693725586, 3.2373743057250977, 3.3495357036590576, 3.4616971015930176, 3.5738587379455566, 3.6860203742980957]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 5.0, 14.0, 16.0, 17.0, 28.0, 45.0, 89.0, 120.0, 159.0, 242.0, 347.0, 547.0, 885.0, 1260.0, 2108.0, 3247.0, 5512.0, 8909.0, 15112.0, 24881.0, 41613.0, 67119.0, 103554.0, 141480.0, 162716.0, 150723.0, 116190.0, 78014.0, 48608.0, 29213.0, 17672.0, 10769.0, 6561.0, 3945.0, 2371.0, 1540.0, 1009.0, 650.0, 431.0, 292.0, 175.0, 113.0, 64.0, 52.0, 38.0, 33.0, 22.0, 21.0, 10.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.798828125, -2.707550048828125, -2.61627197265625, -2.524993896484375, -2.4337158203125, -2.342437744140625, -2.25115966796875, -2.159881591796875, -2.068603515625, -1.977325439453125, -1.88604736328125, -1.794769287109375, -1.7034912109375, -1.612213134765625, -1.52093505859375, -1.429656982421875, -1.33837890625, -1.247100830078125, -1.15582275390625, -1.064544677734375, -0.9732666015625, -0.881988525390625, -0.79071044921875, -0.699432373046875, -0.608154296875, -0.516876220703125, -0.42559814453125, -0.334320068359375, -0.2430419921875, -0.151763916015625, -0.06048583984375, 0.030792236328125, 0.1220703125, 0.213348388671875, 0.30462646484375, 0.395904541015625, 0.4871826171875, 0.578460693359375, 0.66973876953125, 0.761016845703125, 0.852294921875, 0.943572998046875, 1.03485107421875, 1.126129150390625, 1.2174072265625, 1.308685302734375, 1.39996337890625, 1.491241455078125, 1.58251953125, 1.673797607421875, 1.76507568359375, 1.856353759765625, 1.9476318359375, 2.038909912109375, 2.13018798828125, 2.221466064453125, 2.312744140625, 2.404022216796875, 2.49530029296875, 2.586578369140625, 2.6778564453125, 2.769134521484375, 2.86041259765625, 2.951690673828125, 3.04296875]}, "gradients/decoder.bert.encoder.layer.14.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 4.0, 6.0, 6.0, 9.0, 13.0, 17.0, 18.0, 22.0, 27.0, 15.0, 42.0, 35.0, 40.0, 36.0, 38.0, 50.0, 62.0, 42.0, 47.0, 60.0, 50.0, 43.0, 43.0, 37.0, 30.0, 23.0, 33.0, 30.0, 24.0, 18.0, 14.0, 19.0, 18.0, 7.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.955078125, -3.828460693359375, -3.70184326171875, -3.575225830078125, -3.4486083984375, -3.321990966796875, -3.19537353515625, -3.068756103515625, -2.942138671875, -2.815521240234375, -2.68890380859375, -2.562286376953125, -2.4356689453125, -2.309051513671875, -2.18243408203125, -2.055816650390625, -1.92919921875, -1.802581787109375, -1.67596435546875, -1.549346923828125, -1.4227294921875, -1.296112060546875, -1.16949462890625, -1.042877197265625, -0.916259765625, -0.789642333984375, -0.66302490234375, -0.536407470703125, -0.4097900390625, -0.283172607421875, -0.15655517578125, -0.029937744140625, 0.0966796875, 0.223297119140625, 0.34991455078125, 0.476531982421875, 0.6031494140625, 0.729766845703125, 0.85638427734375, 0.983001708984375, 1.109619140625, 1.236236572265625, 1.36285400390625, 1.489471435546875, 1.6160888671875, 1.742706298828125, 1.86932373046875, 1.995941162109375, 2.12255859375, 2.249176025390625, 2.37579345703125, 2.502410888671875, 2.6290283203125, 2.755645751953125, 2.88226318359375, 3.008880615234375, 3.135498046875, 3.262115478515625, 3.38873291015625, 3.515350341796875, 3.6419677734375, 3.768585205078125, 3.89520263671875, 4.021820068359375, 4.1484375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 21.0, 28.0, 42.0, 51.0, 69.0, 98.0, 179.0, 267.0, 398.0, 592.0, 916.0, 1443.0, 2235.0, 3758.0, 5789.0, 9495.0, 15357.0, 25125.0, 41112.0, 65601.0, 99222.0, 135652.0, 157189.0, 149176.0, 117721.0, 81083.0, 52115.0, 32258.0, 19627.0, 11909.0, 7209.0, 4708.0, 2897.0, 1863.0, 1153.0, 732.0, 492.0, 344.0, 211.0, 123.0, 99.0, 64.0, 42.0, 30.0, 12.0, 13.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.814453125, -2.725799560546875, -2.63714599609375, -2.548492431640625, -2.4598388671875, -2.371185302734375, -2.28253173828125, -2.193878173828125, -2.105224609375, -2.016571044921875, -1.92791748046875, -1.839263916015625, -1.7506103515625, -1.661956787109375, -1.57330322265625, -1.484649658203125, -1.39599609375, -1.307342529296875, -1.21868896484375, -1.130035400390625, -1.0413818359375, -0.952728271484375, -0.86407470703125, -0.775421142578125, -0.686767578125, -0.598114013671875, -0.50946044921875, -0.420806884765625, -0.3321533203125, -0.243499755859375, -0.15484619140625, -0.066192626953125, 0.0224609375, 0.111114501953125, 0.19976806640625, 0.288421630859375, 0.3770751953125, 0.465728759765625, 0.55438232421875, 0.643035888671875, 0.731689453125, 0.820343017578125, 0.90899658203125, 0.997650146484375, 1.0863037109375, 1.174957275390625, 1.26361083984375, 1.352264404296875, 1.44091796875, 1.529571533203125, 1.61822509765625, 1.706878662109375, 1.7955322265625, 1.884185791015625, 1.97283935546875, 2.061492919921875, 2.150146484375, 2.238800048828125, 2.32745361328125, 2.416107177734375, 2.5047607421875, 2.593414306640625, 2.68206787109375, 2.770721435546875, 2.859375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 2.0, 8.0, 8.0, 7.0, 12.0, 16.0, 24.0, 19.0, 19.0, 20.0, 22.0, 26.0, 32.0, 23.0, 38.0, 38.0, 33.0, 41.0, 31.0, 45.0, 33.0, 44.0, 37.0, 29.0, 41.0, 34.0, 50.0, 31.0, 34.0, 20.0, 27.0, 15.0, 24.0, 19.0, 15.0, 17.0, 12.0, 3.0, 5.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.830078125, -1.770050048828125, -1.71002197265625, -1.649993896484375, -1.5899658203125, -1.529937744140625, -1.46990966796875, -1.409881591796875, -1.349853515625, -1.289825439453125, -1.22979736328125, -1.169769287109375, -1.1097412109375, -1.049713134765625, -0.98968505859375, -0.929656982421875, -0.86962890625, -0.809600830078125, -0.74957275390625, -0.689544677734375, -0.6295166015625, -0.569488525390625, -0.50946044921875, -0.449432373046875, -0.389404296875, -0.329376220703125, -0.26934814453125, -0.209320068359375, -0.1492919921875, -0.089263916015625, -0.02923583984375, 0.030792236328125, 0.0908203125, 0.150848388671875, 0.21087646484375, 0.270904541015625, 0.3309326171875, 0.390960693359375, 0.45098876953125, 0.511016845703125, 0.571044921875, 0.631072998046875, 0.69110107421875, 0.751129150390625, 0.8111572265625, 0.871185302734375, 0.93121337890625, 0.991241455078125, 1.05126953125, 1.111297607421875, 1.17132568359375, 1.231353759765625, 1.2913818359375, 1.351409912109375, 1.41143798828125, 1.471466064453125, 1.531494140625, 1.591522216796875, 1.65155029296875, 1.711578369140625, 1.7716064453125, 1.831634521484375, 1.89166259765625, 1.951690673828125, 2.01171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 7.0, 3.0, 12.0, 11.0, 21.0, 28.0, 48.0, 66.0, 93.0, 168.0, 227.0, 350.0, 514.0, 843.0, 1307.0, 2023.0, 3198.0, 5226.0, 8751.0, 14563.0, 24495.0, 41743.0, 70061.0, 109414.0, 152868.0, 175323.0, 153386.0, 109991.0, 69810.0, 41901.0, 24688.0, 14550.0, 8752.0, 5347.0, 3128.0, 2023.0, 1270.0, 821.0, 513.0, 343.0, 209.0, 162.0, 99.0, 68.0, 41.0, 30.0, 16.0, 14.0, 11.0, 11.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.4501953125, -1.4041595458984375, -1.358123779296875, -1.3120880126953125, -1.26605224609375, -1.2200164794921875, -1.173980712890625, -1.1279449462890625, -1.0819091796875, -1.0358734130859375, -0.989837646484375, -0.9438018798828125, -0.89776611328125, -0.8517303466796875, -0.805694580078125, -0.7596588134765625, -0.713623046875, -0.6675872802734375, -0.621551513671875, -0.5755157470703125, -0.52947998046875, -0.4834442138671875, -0.437408447265625, -0.3913726806640625, -0.3453369140625, -0.2993011474609375, -0.253265380859375, -0.2072296142578125, -0.16119384765625, -0.1151580810546875, -0.069122314453125, -0.0230865478515625, 0.02294921875, 0.0689849853515625, 0.115020751953125, 0.1610565185546875, 0.20709228515625, 0.2531280517578125, 0.299163818359375, 0.3451995849609375, 0.3912353515625, 0.4372711181640625, 0.483306884765625, 0.5293426513671875, 0.57537841796875, 0.6214141845703125, 0.667449951171875, 0.7134857177734375, 0.759521484375, 0.8055572509765625, 0.851593017578125, 0.8976287841796875, 0.94366455078125, 0.9897003173828125, 1.035736083984375, 1.0817718505859375, 1.1278076171875, 1.1738433837890625, 1.219879150390625, 1.2659149169921875, 1.31195068359375, 1.3579864501953125, 1.404022216796875, 1.4500579833984375, 1.49609375]}, "gradients/decoder.bert.encoder.layer.14.attention.self.key.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 7.0, 10.0, 8.0, 16.0, 16.0, 19.0, 27.0, 24.0, 39.0, 39.0, 26.0, 37.0, 53.0, 61.0, 64.0, 48.0, 51.0, 53.0, 65.0, 54.0, 43.0, 34.0, 30.0, 33.0, 33.0, 21.0, 14.0, 5.0, 11.0, 7.0, 9.0, 5.0, 7.0, 8.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00013637542724609375, -0.00013181939721107483, -0.0001272633671760559, -0.000122707337141037, -0.00011815130710601807, -0.00011359527707099915, -0.00010903924703598022, -0.0001044832170009613, -9.992718696594238e-05, -9.537115693092346e-05, -9.081512689590454e-05, -8.625909686088562e-05, -8.17030668258667e-05, -7.714703679084778e-05, -7.259100675582886e-05, -6.803497672080994e-05, -6.347894668579102e-05, -5.8922916650772095e-05, -5.4366886615753174e-05, -4.981085658073425e-05, -4.525482654571533e-05, -4.069879651069641e-05, -3.614276647567749e-05, -3.158673644065857e-05, -2.703070640563965e-05, -2.2474676370620728e-05, -1.7918646335601807e-05, -1.3362616300582886e-05, -8.806586265563965e-06, -4.250556230545044e-06, 3.0547380447387695e-07, 4.861503839492798e-06, 9.417533874511719e-06, 1.397356390953064e-05, 1.852959394454956e-05, 2.308562397956848e-05, 2.7641654014587402e-05, 3.219768404960632e-05, 3.6753714084625244e-05, 4.1309744119644165e-05, 4.5865774154663086e-05, 5.042180418968201e-05, 5.497783422470093e-05, 5.953386425971985e-05, 6.408989429473877e-05, 6.864592432975769e-05, 7.320195436477661e-05, 7.775798439979553e-05, 8.231401443481445e-05, 8.687004446983337e-05, 9.14260745048523e-05, 9.598210453987122e-05, 0.00010053813457489014, 0.00010509416460990906, 0.00010965019464492798, 0.0001142062246799469, 0.00011876225471496582, 0.00012331828474998474, 0.00012787431478500366, 0.00013243034482002258, 0.0001369863748550415, 0.00014154240489006042, 0.00014609843492507935, 0.00015065446496009827, 0.0001552104949951172]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 5.0, 15.0, 27.0, 29.0, 60.0, 65.0, 98.0, 146.0, 209.0, 360.0, 534.0, 783.0, 1165.0, 1795.0, 2752.0, 4341.0, 6845.0, 11015.0, 17530.0, 27979.0, 44890.0, 69772.0, 102714.0, 137309.0, 155398.0, 143376.0, 110913.0, 75660.0, 49285.0, 30954.0, 19677.0, 11852.0, 7549.0, 4713.0, 3009.0, 1972.0, 1300.0, 805.0, 560.0, 366.0, 240.0, 169.0, 110.0, 68.0, 49.0, 41.0, 22.0, 5.0, 7.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.29296875, -1.2533111572265625, -1.213653564453125, -1.1739959716796875, -1.13433837890625, -1.0946807861328125, -1.055023193359375, -1.0153656005859375, -0.9757080078125, -0.9360504150390625, -0.896392822265625, -0.8567352294921875, -0.81707763671875, -0.7774200439453125, -0.737762451171875, -0.6981048583984375, -0.658447265625, -0.6187896728515625, -0.579132080078125, -0.5394744873046875, -0.49981689453125, -0.4601593017578125, -0.420501708984375, -0.3808441162109375, -0.3411865234375, -0.3015289306640625, -0.261871337890625, -0.2222137451171875, -0.18255615234375, -0.1428985595703125, -0.103240966796875, -0.0635833740234375, -0.02392578125, 0.0157318115234375, 0.055389404296875, 0.0950469970703125, 0.13470458984375, 0.1743621826171875, 0.214019775390625, 0.2536773681640625, 0.2933349609375, 0.3329925537109375, 0.372650146484375, 0.4123077392578125, 0.45196533203125, 0.4916229248046875, 0.531280517578125, 0.5709381103515625, 0.610595703125, 0.6502532958984375, 0.689910888671875, 0.7295684814453125, 0.76922607421875, 0.8088836669921875, 0.848541259765625, 0.8881988525390625, 0.9278564453125, 0.9675140380859375, 1.007171630859375, 1.0468292236328125, 1.08648681640625, 1.1261444091796875, 1.165802001953125, 1.2054595947265625, 1.2451171875]}, "gradients/decoder.bert.encoder.layer.14.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 6.0, 9.0, 11.0, 6.0, 15.0, 10.0, 23.0, 14.0, 25.0, 16.0, 22.0, 24.0, 31.0, 24.0, 30.0, 39.0, 48.0, 36.0, 44.0, 48.0, 45.0, 52.0, 43.0, 42.0, 28.0, 39.0, 35.0, 43.0, 27.0, 27.0, 27.0, 14.0, 15.0, 18.0, 9.0, 13.0, 9.0, 5.0, 5.0, 2.0, 2.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3779296875, -0.36574554443359375, -0.3535614013671875, -0.34137725830078125, -0.329193115234375, -0.31700897216796875, -0.3048248291015625, -0.29264068603515625, -0.28045654296875, -0.26827239990234375, -0.2560882568359375, -0.24390411376953125, -0.231719970703125, -0.21953582763671875, -0.2073516845703125, -0.19516754150390625, -0.1829833984375, -0.17079925537109375, -0.1586151123046875, -0.14643096923828125, -0.134246826171875, -0.12206268310546875, -0.1098785400390625, -0.09769439697265625, -0.08551025390625, -0.07332611083984375, -0.0611419677734375, -0.04895782470703125, -0.036773681640625, -0.02458953857421875, -0.0124053955078125, -0.00022125244140625, 0.011962890625, 0.02414703369140625, 0.0363311767578125, 0.04851531982421875, 0.060699462890625, 0.07288360595703125, 0.0850677490234375, 0.09725189208984375, 0.10943603515625, 0.12162017822265625, 0.1338043212890625, 0.14598846435546875, 0.158172607421875, 0.17035675048828125, 0.1825408935546875, 0.19472503662109375, 0.2069091796875, 0.21909332275390625, 0.2312774658203125, 0.24346160888671875, 0.255645751953125, 0.26782989501953125, 0.2800140380859375, 0.29219818115234375, 0.30438232421875, 0.31656646728515625, 0.3287506103515625, 0.34093475341796875, 0.353118896484375, 0.36530303955078125, 0.3774871826171875, 0.38967132568359375, 0.40185546875]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 5.0, 9.0, 9.0, 13.0, 9.0, 23.0, 27.0, 27.0, 38.0, 50.0, 58.0, 64.0, 84.0, 63.0, 77.0, 76.0, 57.0, 57.0, 51.0, 51.0, 39.0, 28.0, 18.0, 16.0, 16.0, 5.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.052423477172852, -3.884748935699463, -3.717074394226074, -3.5493998527526855, -3.381725311279297, -3.214050769805908, -3.0463764667510986, -2.87870192527771, -2.7110273838043213, -2.5433528423309326, -2.375678300857544, -2.2080039978027344, -2.0403294563293457, -1.8726547956466675, -1.7049803733825684, -1.5373058319091797, -1.369631290435791, -1.2019567489624023, -1.0342822074890137, -0.8666077852249146, -0.6989332437515259, -0.5312587022781372, -0.3635842800140381, -0.19590973854064941, -0.028235197067260742, 0.13943931460380554, 0.3071138262748718, 0.4747883081436157, 0.6424628496170044, 0.8101373910903931, 0.9778118133544922, 1.1454863548278809, 1.3131604194641113, 1.4808349609375, 1.6485095024108887, 1.8161839246749878, 1.9838584661483765, 2.1515331268310547, 2.3192074298858643, 2.486881971359253, 2.6545565128326416, 2.8222310543060303, 2.989905595779419, 3.1575798988342285, 3.325254440307617, 3.492928981781006, 3.6606035232543945, 3.828278064727783, 3.995952606201172, 4.1636271476745605, 4.331301689147949, 4.498976230621338, 4.666650772094727, 4.834325313568115, 5.001999855041504, 5.169673919677734, 5.337348937988281, 5.50502347946167, 5.672698020935059, 5.840372562408447, 6.008047103881836, 6.175721645355225, 6.343396186828613, 6.511070251464844, 6.678744792938232]}, "gradients/decoder.bert.encoder.layer.13.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 6.0, 9.0, 15.0, 11.0, 17.0, 17.0, 21.0, 26.0, 36.0, 20.0, 28.0, 42.0, 39.0, 48.0, 41.0, 47.0, 41.0, 53.0, 42.0, 39.0, 46.0, 38.0, 30.0, 49.0, 33.0, 33.0, 33.0, 26.0, 20.0, 17.0, 14.0, 13.0, 11.0, 4.0, 9.0, 3.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.283984661102295, -3.1750056743621826, -3.066026449203491, -2.957047462463379, -2.8480682373046875, -2.739089250564575, -2.630110263824463, -2.5211310386657715, -2.412152051925659, -2.303173065185547, -2.1941938400268555, -2.085214853286743, -1.9762357473373413, -1.8672566413879395, -1.7582776546478271, -1.6492985486984253, -1.5403194427490234, -1.4313403367996216, -1.3223612308502197, -1.2133822441101074, -1.1044031381607056, -0.9954240322113037, -0.8864449858665466, -0.7774659395217896, -0.6684868335723877, -0.5595077276229858, -0.45052868127822876, -0.3415496051311493, -0.23257052898406982, -0.12359142303466797, -0.014612376689910889, 0.09436666965484619, 0.20334577560424805, 0.3123248517513275, 0.421303927898407, 0.5302829742431641, 0.6392620801925659, 0.7482411861419678, 0.8572202324867249, 0.9661992788314819, 1.0751783847808838, 1.1841574907302856, 1.2931365966796875, 1.4021155834197998, 1.5110946893692017, 1.6200737953186035, 1.7290527820587158, 1.8380318880081177, 1.9470109939575195, 2.055989980697632, 2.1649692058563232, 2.2739481925964355, 2.382927417755127, 2.4919064044952393, 2.6008853912353516, 2.709864616394043, 2.8188436031341553, 2.9278225898742676, 3.036801815032959, 3.1457808017730713, 3.2547597885131836, 3.363739013671875, 3.4727180004119873, 3.5816969871520996, 3.690676212310791]}, "gradients/decoder.bert.encoder.layer.13.output.dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 23.0, 35.0, 55.0, 66.0, 117.0, 156.0, 282.0, 431.0, 659.0, 1008.0, 1658.0, 2756.0, 4457.0, 7922.0, 14438.0, 26289.0, 52670.0, 109433.0, 247390.0, 581787.0, 1089495.0, 1058603.0, 547382.0, 232953.0, 104091.0, 50201.0, 25895.0, 14270.0, 7955.0, 4599.0, 2742.0, 1632.0, 1032.0, 697.0, 372.0, 263.0, 153.0, 98.0, 70.0, 44.0, 30.0, 19.0, 13.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1328125, -3.99932861328125, -3.8658447265625, -3.73236083984375, -3.598876953125, -3.46539306640625, -3.3319091796875, -3.19842529296875, -3.06494140625, -2.93145751953125, -2.7979736328125, -2.66448974609375, -2.531005859375, -2.39752197265625, -2.2640380859375, -2.13055419921875, -1.9970703125, -1.86358642578125, -1.7301025390625, -1.59661865234375, -1.463134765625, -1.32965087890625, -1.1961669921875, -1.06268310546875, -0.92919921875, -0.79571533203125, -0.6622314453125, -0.52874755859375, -0.395263671875, -0.26177978515625, -0.1282958984375, 0.00518798828125, 0.138671875, 0.27215576171875, 0.4056396484375, 0.53912353515625, 0.672607421875, 0.80609130859375, 0.9395751953125, 1.07305908203125, 1.20654296875, 1.34002685546875, 1.4735107421875, 1.60699462890625, 1.740478515625, 1.87396240234375, 2.0074462890625, 2.14093017578125, 2.2744140625, 2.40789794921875, 2.5413818359375, 2.67486572265625, 2.808349609375, 2.94183349609375, 3.0753173828125, 3.20880126953125, 3.34228515625, 3.47576904296875, 3.6092529296875, 3.74273681640625, 3.876220703125, 4.00970458984375, 4.1431884765625, 4.27667236328125, 4.41015625]}, "gradients/decoder.bert.encoder.layer.13.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 2.0, 7.0, 8.0, 8.0, 10.0, 9.0, 19.0, 34.0, 28.0, 32.0, 29.0, 34.0, 45.0, 44.0, 50.0, 50.0, 51.0, 44.0, 47.0, 49.0, 44.0, 41.0, 37.0, 50.0, 41.0, 30.0, 26.0, 21.0, 23.0, 17.0, 16.0, 15.0, 5.0, 7.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.822265625, -2.735595703125, -2.64892578125, -2.562255859375, -2.4755859375, -2.388916015625, -2.30224609375, -2.215576171875, -2.12890625, -2.042236328125, -1.95556640625, -1.868896484375, -1.7822265625, -1.695556640625, -1.60888671875, -1.522216796875, -1.435546875, -1.348876953125, -1.26220703125, -1.175537109375, -1.0888671875, -1.002197265625, -0.91552734375, -0.828857421875, -0.7421875, -0.655517578125, -0.56884765625, -0.482177734375, -0.3955078125, -0.308837890625, -0.22216796875, -0.135498046875, -0.048828125, 0.037841796875, 0.12451171875, 0.211181640625, 0.2978515625, 0.384521484375, 0.47119140625, 0.557861328125, 0.64453125, 0.731201171875, 0.81787109375, 0.904541015625, 0.9912109375, 1.077880859375, 1.16455078125, 1.251220703125, 1.337890625, 1.424560546875, 1.51123046875, 1.597900390625, 1.6845703125, 1.771240234375, 1.85791015625, 1.944580078125, 2.03125, 2.117919921875, 2.20458984375, 2.291259765625, 2.3779296875, 2.464599609375, 2.55126953125, 2.637939453125, 2.724609375]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 9.0, 12.0, 24.0, 29.0, 54.0, 70.0, 105.0, 170.0, 271.0, 472.0, 754.0, 1330.0, 2234.0, 3892.0, 7243.0, 13458.0, 25037.0, 49942.0, 102516.0, 215123.0, 461634.0, 908566.0, 1104904.0, 675027.0, 322403.0, 150352.0, 72403.0, 35694.0, 18600.0, 9641.0, 5211.0, 2932.0, 1683.0, 966.0, 601.0, 342.0, 212.0, 141.0, 87.0, 56.0, 32.0, 18.0, 14.0, 9.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5390625, -4.39385986328125, -4.2486572265625, -4.10345458984375, -3.958251953125, -3.81304931640625, -3.6678466796875, -3.52264404296875, -3.37744140625, -3.23223876953125, -3.0870361328125, -2.94183349609375, -2.796630859375, -2.65142822265625, -2.5062255859375, -2.36102294921875, -2.2158203125, -2.07061767578125, -1.9254150390625, -1.78021240234375, -1.635009765625, -1.48980712890625, -1.3446044921875, -1.19940185546875, -1.05419921875, -0.90899658203125, -0.7637939453125, -0.61859130859375, -0.473388671875, -0.32818603515625, -0.1829833984375, -0.03778076171875, 0.107421875, 0.25262451171875, 0.3978271484375, 0.54302978515625, 0.688232421875, 0.83343505859375, 0.9786376953125, 1.12384033203125, 1.26904296875, 1.41424560546875, 1.5594482421875, 1.70465087890625, 1.849853515625, 1.99505615234375, 2.1402587890625, 2.28546142578125, 2.4306640625, 2.57586669921875, 2.7210693359375, 2.86627197265625, 3.011474609375, 3.15667724609375, 3.3018798828125, 3.44708251953125, 3.59228515625, 3.73748779296875, 3.8826904296875, 4.02789306640625, 4.173095703125, 4.31829833984375, 4.4635009765625, 4.60870361328125, 4.75390625]}, "gradients/decoder.bert.encoder.layer.13.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 6.0, 7.0, 6.0, 13.0, 20.0, 23.0, 20.0, 32.0, 46.0, 67.0, 82.0, 111.0, 146.0, 171.0, 187.0, 197.0, 231.0, 277.0, 306.0, 289.0, 277.0, 272.0, 244.0, 231.0, 183.0, 129.0, 109.0, 103.0, 61.0, 53.0, 45.0, 38.0, 14.0, 14.0, 13.0, 14.0, 9.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.341796875, -1.2975921630859375, -1.253387451171875, -1.2091827392578125, -1.16497802734375, -1.1207733154296875, -1.076568603515625, -1.0323638916015625, -0.9881591796875, -0.9439544677734375, -0.899749755859375, -0.8555450439453125, -0.81134033203125, -0.7671356201171875, -0.722930908203125, -0.6787261962890625, -0.634521484375, -0.5903167724609375, -0.546112060546875, -0.5019073486328125, -0.45770263671875, -0.4134979248046875, -0.369293212890625, -0.3250885009765625, -0.2808837890625, -0.2366790771484375, -0.192474365234375, -0.1482696533203125, -0.10406494140625, -0.0598602294921875, -0.015655517578125, 0.0285491943359375, 0.07275390625, 0.1169586181640625, 0.161163330078125, 0.2053680419921875, 0.24957275390625, 0.2937774658203125, 0.337982177734375, 0.3821868896484375, 0.4263916015625, 0.4705963134765625, 0.514801025390625, 0.5590057373046875, 0.60321044921875, 0.6474151611328125, 0.691619873046875, 0.7358245849609375, 0.780029296875, 0.8242340087890625, 0.868438720703125, 0.9126434326171875, 0.95684814453125, 1.0010528564453125, 1.045257568359375, 1.0894622802734375, 1.1336669921875, 1.1778717041015625, 1.222076416015625, 1.2662811279296875, 1.31048583984375, 1.3546905517578125, 1.398895263671875, 1.4430999755859375, 1.4873046875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 11.0, 7.0, 13.0, 20.0, 18.0, 22.0, 26.0, 35.0, 32.0, 40.0, 56.0, 70.0, 79.0, 80.0, 87.0, 60.0, 69.0, 52.0, 43.0, 37.0, 37.0, 17.0, 18.0, 18.0, 10.0, 6.0, 2.0, 7.0, 4.0, 7.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.834712982177734, -4.677600860595703, -4.520488739013672, -4.363376617431641, -4.206264495849609, -4.049152374267578, -3.8920400142669678, -3.7349278926849365, -3.5778157711029053, -3.420703649520874, -3.2635915279388428, -3.1064794063568115, -2.949367046356201, -2.79225492477417, -2.6351428031921387, -2.4780306816101074, -2.320918560028076, -2.163806438446045, -2.0066943168640137, -1.8495820760726929, -1.6924699544906616, -1.5353578329086304, -1.3782455921173096, -1.2211334705352783, -1.064021348953247, -0.9069092273712158, -0.7497970461845398, -0.5926848649978638, -0.4355727434158325, -0.27846062183380127, -0.12134844064712524, 0.03576374053955078, 0.19287586212158203, 0.34998801350593567, 0.5071001648902893, 0.6642123460769653, 0.8213244676589966, 0.9784365892410278, 1.1355488300323486, 1.2926609516143799, 1.4497730731964111, 1.6068851947784424, 1.7639973163604736, 1.9211095571517944, 2.0782217979431152, 2.2353339195251465, 2.3924460411071777, 2.549558162689209, 2.7066702842712402, 2.8637824058532715, 3.0208945274353027, 3.178006649017334, 3.3351187705993652, 3.4922308921813965, 3.649343252182007, 3.806455373764038, 3.9635674953460693, 4.12067985534668, 4.277791976928711, 4.434904098510742, 4.592016220092773, 4.749128341674805, 4.906240463256836, 5.063352584838867, 5.220464706420898]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 7.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 10.0, 20.0, 19.0, 20.0, 20.0, 21.0, 32.0, 21.0, 44.0, 35.0, 55.0, 52.0, 51.0, 63.0, 56.0, 48.0, 53.0, 51.0, 48.0, 33.0, 29.0, 23.0, 28.0, 28.0, 22.0, 16.0, 20.0, 10.0, 14.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4806437492370605, -3.3726115226745605, -3.2645792961120605, -3.1565470695495605, -3.0485148429870605, -2.9404826164245605, -2.8324503898620605, -2.7244184017181396, -2.6163861751556396, -2.5083539485931396, -2.4003217220306396, -2.2922894954681396, -2.1842572689056396, -2.0762252807617188, -1.9681929349899292, -1.8601608276367188, -1.7521284818649292, -1.6440962553024292, -1.5360640287399292, -1.4280319213867188, -1.3199996948242188, -1.2119674682617188, -1.1039352416992188, -0.9959030747413635, -0.8878708481788635, -0.7798386216163635, -0.6718064546585083, -0.5637742280960083, -0.4557420313358307, -0.3477098345756531, -0.23967760801315308, -0.13164544105529785, -0.02361321449279785, 0.08441898971796036, 0.19245119392871857, 0.3004834055900574, 0.408515602350235, 0.5165477991104126, 0.6245800256729126, 0.7326121926307678, 0.8406444191932678, 0.9486766457557678, 1.056708812713623, 1.164741039276123, 1.272773265838623, 1.380805492401123, 1.488837718963623, 1.5968698263168335, 1.7049020528793335, 1.8129342794418335, 1.9209665060043335, 2.028998613357544, 2.137030839920044, 2.245063066482544, 2.353095293045044, 2.461127519607544, 2.569159746170044, 2.677191972732544, 2.785224199295044, 2.893256425857544, 3.001288652420044, 3.109320640563965, 3.217352867126465, 3.325385093688965, 3.433417320251465]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 14.0, 8.0, 20.0, 20.0, 29.0, 28.0, 35.0, 56.0, 71.0, 95.0, 109.0, 151.0, 236.0, 359.0, 543.0, 828.0, 1390.0, 2383.0, 4530.0, 8607.0, 17937.0, 40174.0, 99170.0, 249758.0, 339483.0, 163917.0, 64011.0, 27062.0, 12709.0, 6456.0, 3210.0, 1875.0, 1087.0, 679.0, 405.0, 298.0, 202.0, 147.0, 115.0, 81.0, 47.0, 44.0, 36.0, 35.0, 31.0, 20.0, 15.0, 8.0, 4.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.7783203125, -0.7541961669921875, -0.730072021484375, -0.7059478759765625, -0.68182373046875, -0.6576995849609375, -0.633575439453125, -0.6094512939453125, -0.5853271484375, -0.5612030029296875, -0.537078857421875, -0.5129547119140625, -0.48883056640625, -0.4647064208984375, -0.440582275390625, -0.4164581298828125, -0.392333984375, -0.3682098388671875, -0.344085693359375, -0.3199615478515625, -0.29583740234375, -0.2717132568359375, -0.247589111328125, -0.2234649658203125, -0.1993408203125, -0.1752166748046875, -0.151092529296875, -0.1269683837890625, -0.10284423828125, -0.0787200927734375, -0.054595947265625, -0.0304718017578125, -0.00634765625, 0.0177764892578125, 0.041900634765625, 0.0660247802734375, 0.09014892578125, 0.1142730712890625, 0.138397216796875, 0.1625213623046875, 0.1866455078125, 0.2107696533203125, 0.234893798828125, 0.2590179443359375, 0.28314208984375, 0.3072662353515625, 0.331390380859375, 0.3555145263671875, 0.379638671875, 0.4037628173828125, 0.427886962890625, 0.4520111083984375, 0.47613525390625, 0.5002593994140625, 0.524383544921875, 0.5485076904296875, 0.5726318359375, 0.5967559814453125, 0.620880126953125, 0.6450042724609375, 0.66912841796875, 0.6932525634765625, 0.717376708984375, 0.7415008544921875, 0.765625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 1.0, 8.0, 8.0, 11.0, 14.0, 17.0, 9.0, 23.0, 12.0, 24.0, 32.0, 26.0, 38.0, 33.0, 48.0, 43.0, 40.0, 52.0, 49.0, 60.0, 48.0, 42.0, 45.0, 40.0, 34.0, 29.0, 32.0, 28.0, 24.0, 23.0, 19.0, 18.0, 16.0, 10.0, 8.0, 9.0, 3.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.186279296875, -3.07568359375, -2.965087890625, -2.8544921875, -2.743896484375, -2.63330078125, -2.522705078125, -2.412109375, -2.301513671875, -2.19091796875, -2.080322265625, -1.9697265625, -1.859130859375, -1.74853515625, -1.637939453125, -1.52734375, -1.416748046875, -1.30615234375, -1.195556640625, -1.0849609375, -0.974365234375, -0.86376953125, -0.753173828125, -0.642578125, -0.531982421875, -0.42138671875, -0.310791015625, -0.2001953125, -0.089599609375, 0.02099609375, 0.131591796875, 0.2421875, 0.352783203125, 0.46337890625, 0.573974609375, 0.6845703125, 0.795166015625, 0.90576171875, 1.016357421875, 1.126953125, 1.237548828125, 1.34814453125, 1.458740234375, 1.5693359375, 1.679931640625, 1.79052734375, 1.901123046875, 2.01171875, 2.122314453125, 2.23291015625, 2.343505859375, 2.4541015625, 2.564697265625, 2.67529296875, 2.785888671875, 2.896484375, 3.007080078125, 3.11767578125, 3.228271484375, 3.3388671875, 3.449462890625, 3.56005859375, 3.670654296875, 3.78125]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 7.0, 4.0, 7.0, 7.0, 14.0, 24.0, 32.0, 32.0, 53.0, 60.0, 92.0, 159.0, 238.0, 366.0, 604.0, 1062.0, 2063.0, 4452.0, 10982.0, 36877.0, 874190.0, 88359.0, 16630.0, 6190.0, 2762.0, 1355.0, 703.0, 375.0, 280.0, 162.0, 113.0, 107.0, 52.0, 41.0, 30.0, 18.0, 18.0, 13.0, 7.0, 9.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-1.9404296875, -1.8845062255859375, -1.828582763671875, -1.7726593017578125, -1.71673583984375, -1.6608123779296875, -1.604888916015625, -1.5489654541015625, -1.4930419921875, -1.4371185302734375, -1.381195068359375, -1.3252716064453125, -1.26934814453125, -1.2134246826171875, -1.157501220703125, -1.1015777587890625, -1.045654296875, -0.9897308349609375, -0.933807373046875, -0.8778839111328125, -0.82196044921875, -0.7660369873046875, -0.710113525390625, -0.6541900634765625, -0.5982666015625, -0.5423431396484375, -0.486419677734375, -0.4304962158203125, -0.37457275390625, -0.3186492919921875, -0.262725830078125, -0.2068023681640625, -0.15087890625, -0.0949554443359375, -0.039031982421875, 0.0168914794921875, 0.07281494140625, 0.1287384033203125, 0.184661865234375, 0.2405853271484375, 0.2965087890625, 0.3524322509765625, 0.408355712890625, 0.4642791748046875, 0.52020263671875, 0.5761260986328125, 0.632049560546875, 0.6879730224609375, 0.743896484375, 0.7998199462890625, 0.855743408203125, 0.9116668701171875, 0.96759033203125, 1.0235137939453125, 1.079437255859375, 1.1353607177734375, 1.1912841796875, 1.2472076416015625, 1.303131103515625, 1.3590545654296875, 1.41497802734375, 1.4709014892578125, 1.526824951171875, 1.5827484130859375, 1.638671875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 10.0, 16.0, 10.0, 20.0, 18.0, 21.0, 19.0, 26.0, 32.0, 30.0, 29.0, 35.0, 48.0, 29.0, 39.0, 46.0, 44.0, 40.0, 31.0, 33.0, 40.0, 39.0, 36.0, 39.0, 28.0, 30.0, 25.0, 22.0, 20.0, 23.0, 11.0, 17.0, 9.0, 10.0, 20.0, 7.0, 6.0, 10.0, 10.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.05859375, -1.994293212890625, -1.92999267578125, -1.865692138671875, -1.8013916015625, -1.737091064453125, -1.67279052734375, -1.608489990234375, -1.544189453125, -1.479888916015625, -1.41558837890625, -1.351287841796875, -1.2869873046875, -1.222686767578125, -1.15838623046875, -1.094085693359375, -1.02978515625, -0.965484619140625, -0.90118408203125, -0.836883544921875, -0.7725830078125, -0.708282470703125, -0.64398193359375, -0.579681396484375, -0.515380859375, -0.451080322265625, -0.38677978515625, -0.322479248046875, -0.2581787109375, -0.193878173828125, -0.12957763671875, -0.065277099609375, -0.0009765625, 0.063323974609375, 0.12762451171875, 0.191925048828125, 0.2562255859375, 0.320526123046875, 0.38482666015625, 0.449127197265625, 0.513427734375, 0.577728271484375, 0.64202880859375, 0.706329345703125, 0.7706298828125, 0.834930419921875, 0.89923095703125, 0.963531494140625, 1.02783203125, 1.092132568359375, 1.15643310546875, 1.220733642578125, 1.2850341796875, 1.349334716796875, 1.41363525390625, 1.477935791015625, 1.542236328125, 1.606536865234375, 1.67083740234375, 1.735137939453125, 1.7994384765625, 1.863739013671875, 1.92803955078125, 1.992340087890625, 2.056640625]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 7.0, 12.0, 12.0, 16.0, 15.0, 20.0, 26.0, 63.0, 52.0, 95.0, 113.0, 197.0, 231.0, 385.0, 574.0, 927.0, 1670.0, 3575.0, 9192.0, 33364.0, 926675.0, 49883.0, 12026.0, 4463.0, 2028.0, 1045.0, 612.0, 362.0, 259.0, 187.0, 119.0, 92.0, 68.0, 48.0, 31.0, 32.0, 16.0, 17.0, 16.0, 9.0, 5.0, 5.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5185546875, -0.502655029296875, -0.48675537109375, -0.470855712890625, -0.4549560546875, -0.439056396484375, -0.42315673828125, -0.407257080078125, -0.391357421875, -0.375457763671875, -0.35955810546875, -0.343658447265625, -0.3277587890625, -0.311859130859375, -0.29595947265625, -0.280059814453125, -0.26416015625, -0.248260498046875, -0.23236083984375, -0.216461181640625, -0.2005615234375, -0.184661865234375, -0.16876220703125, -0.152862548828125, -0.136962890625, -0.121063232421875, -0.10516357421875, -0.089263916015625, -0.0733642578125, -0.057464599609375, -0.04156494140625, -0.025665283203125, -0.009765625, 0.006134033203125, 0.02203369140625, 0.037933349609375, 0.0538330078125, 0.069732666015625, 0.08563232421875, 0.101531982421875, 0.117431640625, 0.133331298828125, 0.14923095703125, 0.165130615234375, 0.1810302734375, 0.196929931640625, 0.21282958984375, 0.228729248046875, 0.24462890625, 0.260528564453125, 0.27642822265625, 0.292327880859375, 0.3082275390625, 0.324127197265625, 0.34002685546875, 0.355926513671875, 0.371826171875, 0.387725830078125, 0.40362548828125, 0.419525146484375, 0.4354248046875, 0.451324462890625, 0.46722412109375, 0.483123779296875, 0.4990234375]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 8.0, 4.0, 4.0, 7.0, 8.0, 13.0, 18.0, 45.0, 51.0, 104.0, 93.0, 119.0, 122.0, 133.0, 89.0, 59.0, 39.0, 34.0, 14.0, 8.0, 4.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.121397018432617e-05, -5.9478916227817535e-05, -5.77438622713089e-05, -5.600880831480026e-05, -5.4273754358291626e-05, -5.253870040178299e-05, -5.080364644527435e-05, -4.9068592488765717e-05, -4.733353853225708e-05, -4.5598484575748444e-05, -4.386343061923981e-05, -4.212837666273117e-05, -4.0393322706222534e-05, -3.86582687497139e-05, -3.692321479320526e-05, -3.5188160836696625e-05, -3.345310688018799e-05, -3.171805292367935e-05, -2.9982998967170715e-05, -2.824794501066208e-05, -2.6512891054153442e-05, -2.4777837097644806e-05, -2.304278314113617e-05, -2.1307729184627533e-05, -1.9572675228118896e-05, -1.783762127161026e-05, -1.6102567315101624e-05, -1.4367513358592987e-05, -1.263245940208435e-05, -1.0897405445575714e-05, -9.162351489067078e-06, -7.427297532558441e-06, -5.692243576049805e-06, -3.957189619541168e-06, -2.2221356630325317e-06, -4.870817065238953e-07, 1.2479722499847412e-06, 2.9830262064933777e-06, 4.718080163002014e-06, 6.453134119510651e-06, 8.188188076019287e-06, 9.923242032527924e-06, 1.165829598903656e-05, 1.3393349945545197e-05, 1.5128403902053833e-05, 1.686345785856247e-05, 1.8598511815071106e-05, 2.0333565771579742e-05, 2.206861972808838e-05, 2.3803673684597015e-05, 2.5538727641105652e-05, 2.727378159761429e-05, 2.9008835554122925e-05, 3.074388951063156e-05, 3.24789434671402e-05, 3.4213997423648834e-05, 3.594905138015747e-05, 3.768410533666611e-05, 3.9419159293174744e-05, 4.115421324968338e-05, 4.2889267206192017e-05, 4.462432116270065e-05, 4.635937511920929e-05, 4.8094429075717926e-05, 4.982948303222656e-05]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 13.0, 10.0, 25.0, 28.0, 34.0, 28.0, 59.0, 71.0, 130.0, 152.0, 226.0, 369.0, 496.0, 759.0, 1211.0, 1935.0, 3012.0, 5158.0, 8925.0, 18448.0, 48265.0, 150867.0, 385524.0, 274337.0, 87507.0, 29962.0, 13149.0, 6915.0, 3954.0, 2472.0, 1538.0, 970.0, 632.0, 447.0, 274.0, 165.0, 127.0, 100.0, 61.0, 50.0, 40.0, 22.0, 24.0, 14.0, 14.0, 9.0, 5.0, 3.0, 6.0, 5.0, 1.0, 4.0, 1.0], "bins": [-0.19580078125, -0.19000244140625, -0.1842041015625, -0.17840576171875, -0.172607421875, -0.16680908203125, -0.1610107421875, -0.15521240234375, -0.1494140625, -0.14361572265625, -0.1378173828125, -0.13201904296875, -0.126220703125, -0.12042236328125, -0.1146240234375, -0.10882568359375, -0.10302734375, -0.09722900390625, -0.0914306640625, -0.08563232421875, -0.079833984375, -0.07403564453125, -0.0682373046875, -0.06243896484375, -0.056640625, -0.05084228515625, -0.0450439453125, -0.03924560546875, -0.033447265625, -0.02764892578125, -0.0218505859375, -0.01605224609375, -0.01025390625, -0.00445556640625, 0.0013427734375, 0.00714111328125, 0.012939453125, 0.01873779296875, 0.0245361328125, 0.03033447265625, 0.0361328125, 0.04193115234375, 0.0477294921875, 0.05352783203125, 0.059326171875, 0.06512451171875, 0.0709228515625, 0.07672119140625, 0.08251953125, 0.08831787109375, 0.0941162109375, 0.09991455078125, 0.105712890625, 0.11151123046875, 0.1173095703125, 0.12310791015625, 0.12890625, 0.13470458984375, 0.1405029296875, 0.14630126953125, 0.152099609375, 0.15789794921875, 0.1636962890625, 0.16949462890625, 0.17529296875]}, "gradients/decoder.bert.encoder.layer.13.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 2.0, 6.0, 11.0, 11.0, 12.0, 10.0, 16.0, 27.0, 36.0, 36.0, 45.0, 68.0, 59.0, 64.0, 71.0, 86.0, 78.0, 79.0, 60.0, 39.0, 22.0, 39.0, 23.0, 20.0, 14.0, 12.0, 11.0, 4.0, 2.0, 8.0, 4.0, 7.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.038665771484375, -0.037572383880615234, -0.03647899627685547, -0.0353856086730957, -0.03429222106933594, -0.03319883346557617, -0.032105445861816406, -0.03101205825805664, -0.029918670654296875, -0.02882528305053711, -0.027731895446777344, -0.026638507843017578, -0.025545120239257812, -0.024451732635498047, -0.02335834503173828, -0.022264957427978516, -0.02117156982421875, -0.020078182220458984, -0.01898479461669922, -0.017891407012939453, -0.016798019409179688, -0.015704631805419922, -0.014611244201660156, -0.01351785659790039, -0.012424468994140625, -0.01133108139038086, -0.010237693786621094, -0.009144306182861328, -0.008050918579101562, -0.006957530975341797, -0.005864143371582031, -0.004770755767822266, -0.0036773681640625, -0.0025839805603027344, -0.0014905929565429688, -0.0003972053527832031, 0.0006961822509765625, 0.0017895698547363281, 0.0028829574584960938, 0.003976345062255859, 0.005069732666015625, 0.006163120269775391, 0.007256507873535156, 0.008349895477294922, 0.009443283081054688, 0.010536670684814453, 0.011630058288574219, 0.012723445892333984, 0.01381683349609375, 0.014910221099853516, 0.01600360870361328, 0.017096996307373047, 0.018190383911132812, 0.019283771514892578, 0.020377159118652344, 0.02147054672241211, 0.022563934326171875, 0.02365732192993164, 0.024750709533691406, 0.025844097137451172, 0.026937484741210938, 0.028030872344970703, 0.02912425994873047, 0.030217647552490234, 0.03131103515625]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 6.0, 11.0, 7.0, 15.0, 23.0, 15.0, 26.0, 27.0, 32.0, 41.0, 34.0, 71.0, 77.0, 74.0, 84.0, 86.0, 59.0, 63.0, 50.0, 40.0, 35.0, 30.0, 19.0, 18.0, 11.0, 7.0, 8.0, 3.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.78282356262207, -4.625185012817383, -4.467546463012695, -4.309907913208008, -4.15226936340332, -3.994630813598633, -3.836992025375366, -3.6793534755706787, -3.521714925765991, -3.3640763759613037, -3.206437826156616, -3.0487992763519287, -2.891160488128662, -2.7335219383239746, -2.575883388519287, -2.4182448387145996, -2.260606288909912, -2.1029677391052246, -1.945329189300537, -1.78769052028656, -1.6300519704818726, -1.472413420677185, -1.314774751663208, -1.1571362018585205, -0.999497652053833, -0.8418591022491455, -0.6842204928398132, -0.526581883430481, -0.36894333362579346, -0.21130478382110596, -0.05366617441177368, 0.1039724349975586, 0.2616105079650879, 0.4192490875720978, 0.5768876671791077, 0.7345262765884399, 0.8921648263931274, 1.049803376197815, 1.207442045211792, 1.3650805950164795, 1.522719144821167, 1.6803576946258545, 1.837996244430542, 1.995634913444519, 2.153273582458496, 2.3109121322631836, 2.468550682067871, 2.6261892318725586, 2.783827781677246, 2.9414663314819336, 3.099104881286621, 3.2567434310913086, 3.414381980895996, 3.5720205307006836, 3.72965931892395, 3.8872978687286377, 4.044936180114746, 4.202574729919434, 4.360213279724121, 4.517851829528809, 4.675490379333496, 4.833128929138184, 4.990767478942871, 5.148406028747559, 5.306045055389404]}, "gradients/decoder.bert.encoder.layer.13.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 8.0, 19.0, 19.0, 20.0, 19.0, 22.0, 29.0, 23.0, 39.0, 44.0, 50.0, 48.0, 52.0, 64.0, 60.0, 44.0, 56.0, 52.0, 43.0, 36.0, 33.0, 21.0, 27.0, 28.0, 24.0, 19.0, 15.0, 14.0, 12.0, 11.0, 9.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.4642462730407715, -3.3566370010375977, -3.2490274906158447, -3.141418218612671, -3.033808946609497, -2.926199436187744, -2.8185901641845703, -2.7109808921813965, -2.6033713817596436, -2.4957621097564697, -2.388152599334717, -2.280543327331543, -2.172934055328369, -2.065324544906616, -1.9577152729034424, -1.850105881690979, -1.7424966096878052, -1.6348872184753418, -1.527277946472168, -1.4196685552597046, -1.3120591640472412, -1.2044498920440674, -1.096840500831604, -0.9892311096191406, -0.881621778011322, -0.7740124464035034, -0.66640305519104, -0.5587937235832214, -0.45118436217308044, -0.34357500076293945, -0.23596566915512085, -0.12835627794265747, -0.020746946334838867, 0.08686240762472153, 0.19447176158428192, 0.3020811080932617, 0.4096904695034027, 0.5172998309135437, 0.6249091625213623, 0.7325185537338257, 0.8401278853416443, 0.9477372169494629, 1.0553466081619263, 1.1629559993743896, 1.2705652713775635, 1.3781746625900269, 1.4857840538024902, 1.593393325805664, 1.7010027170181274, 1.8086121082305908, 1.9162213802337646, 2.0238308906555176, 2.1314401626586914, 2.2390494346618652, 2.346658706665039, 2.454268217086792, 2.561877489089966, 2.6694867610931396, 2.7770962715148926, 2.8847055435180664, 2.9923148155212402, 3.099924325942993, 3.207533597946167, 3.31514310836792, 3.4227523803710938]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 10.0, 14.0, 32.0, 28.0, 55.0, 96.0, 142.0, 189.0, 262.0, 446.0, 712.0, 1207.0, 1970.0, 3230.0, 5543.0, 9686.0, 17087.0, 29882.0, 52272.0, 87158.0, 133918.0, 172855.0, 174677.0, 137208.0, 91173.0, 54783.0, 31489.0, 17655.0, 10122.0, 5863.0, 3356.0, 2044.0, 1204.0, 813.0, 447.0, 313.0, 205.0, 139.0, 93.0, 49.0, 38.0, 23.0, 22.0, 18.0, 10.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-2.96875, -2.8760986328125, -2.783447265625, -2.6907958984375, -2.59814453125, -2.5054931640625, -2.412841796875, -2.3201904296875, -2.2275390625, -2.1348876953125, -2.042236328125, -1.9495849609375, -1.85693359375, -1.7642822265625, -1.671630859375, -1.5789794921875, -1.486328125, -1.3936767578125, -1.301025390625, -1.2083740234375, -1.11572265625, -1.0230712890625, -0.930419921875, -0.8377685546875, -0.7451171875, -0.6524658203125, -0.559814453125, -0.4671630859375, -0.37451171875, -0.2818603515625, -0.189208984375, -0.0965576171875, -0.00390625, 0.0887451171875, 0.181396484375, 0.2740478515625, 0.36669921875, 0.4593505859375, 0.552001953125, 0.6446533203125, 0.7373046875, 0.8299560546875, 0.922607421875, 1.0152587890625, 1.10791015625, 1.2005615234375, 1.293212890625, 1.3858642578125, 1.478515625, 1.5711669921875, 1.663818359375, 1.7564697265625, 1.84912109375, 1.9417724609375, 2.034423828125, 2.1270751953125, 2.2197265625, 2.3123779296875, 2.405029296875, 2.4976806640625, 2.59033203125, 2.6829833984375, 2.775634765625, 2.8682861328125, 2.9609375]}, "gradients/decoder.bert.encoder.layer.13.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 10.0, 18.0, 25.0, 14.0, 31.0, 23.0, 27.0, 37.0, 36.0, 51.0, 51.0, 52.0, 64.0, 58.0, 42.0, 74.0, 44.0, 51.0, 53.0, 46.0, 34.0, 26.0, 23.0, 18.0, 16.0, 15.0, 10.0, 13.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.859375, -4.733367919921875, -4.60736083984375, -4.481353759765625, -4.3553466796875, -4.229339599609375, -4.10333251953125, -3.977325439453125, -3.851318359375, -3.725311279296875, -3.59930419921875, -3.473297119140625, -3.3472900390625, -3.221282958984375, -3.09527587890625, -2.969268798828125, -2.84326171875, -2.717254638671875, -2.59124755859375, -2.465240478515625, -2.3392333984375, -2.213226318359375, -2.08721923828125, -1.961212158203125, -1.835205078125, -1.709197998046875, -1.58319091796875, -1.457183837890625, -1.3311767578125, -1.205169677734375, -1.07916259765625, -0.953155517578125, -0.8271484375, -0.701141357421875, -0.57513427734375, -0.449127197265625, -0.3231201171875, -0.197113037109375, -0.07110595703125, 0.054901123046875, 0.180908203125, 0.306915283203125, 0.43292236328125, 0.558929443359375, 0.6849365234375, 0.810943603515625, 0.93695068359375, 1.062957763671875, 1.18896484375, 1.314971923828125, 1.44097900390625, 1.566986083984375, 1.6929931640625, 1.819000244140625, 1.94500732421875, 2.071014404296875, 2.197021484375, 2.323028564453125, 2.44903564453125, 2.575042724609375, 2.7010498046875, 2.827056884765625, 2.95306396484375, 3.079071044921875, 3.205078125]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 7.0, 15.0, 26.0, 26.0, 33.0, 55.0, 94.0, 129.0, 202.0, 257.0, 441.0, 692.0, 1081.0, 1572.0, 2601.0, 4231.0, 6829.0, 11153.0, 18371.0, 30550.0, 48946.0, 75975.0, 111344.0, 144012.0, 157137.0, 139014.0, 104698.0, 71480.0, 45219.0, 27808.0, 17270.0, 10420.0, 6274.0, 3876.0, 2377.0, 1568.0, 928.0, 643.0, 405.0, 275.0, 179.0, 114.0, 70.0, 47.0, 26.0, 28.0, 17.0, 6.0, 9.0, 6.0, 3.0, 2.0, 3.0, 2.0], "bins": [-2.767578125, -2.687164306640625, -2.60675048828125, -2.526336669921875, -2.4459228515625, -2.365509033203125, -2.28509521484375, -2.204681396484375, -2.124267578125, -2.043853759765625, -1.96343994140625, -1.883026123046875, -1.8026123046875, -1.722198486328125, -1.64178466796875, -1.561370849609375, -1.48095703125, -1.400543212890625, -1.32012939453125, -1.239715576171875, -1.1593017578125, -1.078887939453125, -0.99847412109375, -0.918060302734375, -0.837646484375, -0.757232666015625, -0.67681884765625, -0.596405029296875, -0.5159912109375, -0.435577392578125, -0.35516357421875, -0.274749755859375, -0.1943359375, -0.113922119140625, -0.03350830078125, 0.046905517578125, 0.1273193359375, 0.207733154296875, 0.28814697265625, 0.368560791015625, 0.448974609375, 0.529388427734375, 0.60980224609375, 0.690216064453125, 0.7706298828125, 0.851043701171875, 0.93145751953125, 1.011871337890625, 1.09228515625, 1.172698974609375, 1.25311279296875, 1.333526611328125, 1.4139404296875, 1.494354248046875, 1.57476806640625, 1.655181884765625, 1.735595703125, 1.816009521484375, 1.89642333984375, 1.976837158203125, 2.0572509765625, 2.137664794921875, 2.21807861328125, 2.298492431640625, 2.37890625]}, "gradients/decoder.bert.encoder.layer.13.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 7.0, 7.0, 16.0, 7.0, 15.0, 21.0, 15.0, 22.0, 29.0, 38.0, 32.0, 40.0, 51.0, 47.0, 47.0, 43.0, 38.0, 33.0, 46.0, 39.0, 35.0, 50.0, 37.0, 35.0, 29.0, 28.0, 30.0, 25.0, 18.0, 18.0, 22.0, 10.0, 16.0, 13.0, 6.0, 8.0, 10.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.09765625, -2.03515625, -1.97265625, -1.91015625, -1.84765625, -1.78515625, -1.72265625, -1.66015625, -1.59765625, -1.53515625, -1.47265625, -1.41015625, -1.34765625, -1.28515625, -1.22265625, -1.16015625, -1.09765625, -1.03515625, -0.97265625, -0.91015625, -0.84765625, -0.78515625, -0.72265625, -0.66015625, -0.59765625, -0.53515625, -0.47265625, -0.41015625, -0.34765625, -0.28515625, -0.22265625, -0.16015625, -0.09765625, -0.03515625, 0.02734375, 0.08984375, 0.15234375, 0.21484375, 0.27734375, 0.33984375, 0.40234375, 0.46484375, 0.52734375, 0.58984375, 0.65234375, 0.71484375, 0.77734375, 0.83984375, 0.90234375, 0.96484375, 1.02734375, 1.08984375, 1.15234375, 1.21484375, 1.27734375, 1.33984375, 1.40234375, 1.46484375, 1.52734375, 1.58984375, 1.65234375, 1.71484375, 1.77734375, 1.83984375, 1.90234375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 10.0, 17.0, 24.0, 37.0, 51.0, 81.0, 131.0, 217.0, 366.0, 685.0, 1111.0, 2041.0, 4113.0, 8585.0, 18646.0, 42539.0, 97592.0, 200974.0, 280759.0, 207124.0, 101734.0, 44014.0, 19416.0, 9035.0, 4359.0, 2128.0, 1173.0, 633.0, 373.0, 209.0, 130.0, 78.0, 61.0, 30.0, 26.0, 14.0, 10.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.142578125, -2.0723876953125, -2.002197265625, -1.9320068359375, -1.86181640625, -1.7916259765625, -1.721435546875, -1.6512451171875, -1.5810546875, -1.5108642578125, -1.440673828125, -1.3704833984375, -1.30029296875, -1.2301025390625, -1.159912109375, -1.0897216796875, -1.01953125, -0.9493408203125, -0.879150390625, -0.8089599609375, -0.73876953125, -0.6685791015625, -0.598388671875, -0.5281982421875, -0.4580078125, -0.3878173828125, -0.317626953125, -0.2474365234375, -0.17724609375, -0.1070556640625, -0.036865234375, 0.0333251953125, 0.103515625, 0.1737060546875, 0.243896484375, 0.3140869140625, 0.38427734375, 0.4544677734375, 0.524658203125, 0.5948486328125, 0.6650390625, 0.7352294921875, 0.805419921875, 0.8756103515625, 0.94580078125, 1.0159912109375, 1.086181640625, 1.1563720703125, 1.2265625, 1.2967529296875, 1.366943359375, 1.4371337890625, 1.50732421875, 1.5775146484375, 1.647705078125, 1.7178955078125, 1.7880859375, 1.8582763671875, 1.928466796875, 1.9986572265625, 2.06884765625, 2.1390380859375, 2.209228515625, 2.2794189453125, 2.349609375]}, "gradients/decoder.bert.encoder.layer.13.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 12.0, 11.0, 12.0, 18.0, 18.0, 28.0, 27.0, 46.0, 64.0, 68.0, 79.0, 88.0, 76.0, 84.0, 85.0, 66.0, 58.0, 32.0, 22.0, 19.0, 21.0, 16.0, 7.0, 5.0, 7.0, 4.0, 7.0, 2.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001800060272216797, -0.0001732073724269867, -0.0001664087176322937, -0.0001596100628376007, -0.00015281140804290771, -0.00014601275324821472, -0.00013921409845352173, -0.00013241544365882874, -0.00012561678886413574, -0.00011881813406944275, -0.00011201947927474976, -0.00010522082448005676, -9.842216968536377e-05, -9.162351489067078e-05, -8.482486009597778e-05, -7.802620530128479e-05, -7.12275505065918e-05, -6.44288957118988e-05, -5.763024091720581e-05, -5.083158612251282e-05, -4.4032931327819824e-05, -3.723427653312683e-05, -3.0435621738433838e-05, -2.3636966943740845e-05, -1.683831214904785e-05, -1.0039657354354858e-05, -3.2410025596618652e-06, 3.557652235031128e-06, 1.0356307029724121e-05, 1.7154961824417114e-05, 2.3953616619110107e-05, 3.07522714138031e-05, 3.7550926208496094e-05, 4.434958100318909e-05, 5.114823579788208e-05, 5.794689059257507e-05, 6.474554538726807e-05, 7.154420018196106e-05, 7.834285497665405e-05, 8.514150977134705e-05, 9.194016456604004e-05, 9.873881936073303e-05, 0.00010553747415542603, 0.00011233612895011902, 0.00011913478374481201, 0.000125933438539505, 0.000132732093334198, 0.000139530748128891, 0.00014632940292358398, 0.00015312805771827698, 0.00015992671251296997, 0.00016672536730766296, 0.00017352402210235596, 0.00018032267689704895, 0.00018712133169174194, 0.00019391998648643494, 0.00020071864128112793, 0.00020751729607582092, 0.00021431595087051392, 0.0002211146056652069, 0.0002279132604598999, 0.0002347119152545929, 0.0002415105700492859, 0.0002483092248439789, 0.0002551078796386719]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 6.0, 8.0, 20.0, 19.0, 38.0, 45.0, 75.0, 82.0, 160.0, 222.0, 353.0, 527.0, 765.0, 1255.0, 1955.0, 3157.0, 5178.0, 8687.0, 14951.0, 26557.0, 46598.0, 81086.0, 130774.0, 179551.0, 185499.0, 143306.0, 91479.0, 53192.0, 30187.0, 17263.0, 10032.0, 5924.0, 3446.0, 2191.0, 1447.0, 879.0, 545.0, 391.0, 227.0, 163.0, 94.0, 66.0, 57.0, 40.0, 24.0, 15.0, 15.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.6279296875, -1.581573486328125, -1.53521728515625, -1.488861083984375, -1.4425048828125, -1.396148681640625, -1.34979248046875, -1.303436279296875, -1.257080078125, -1.210723876953125, -1.16436767578125, -1.118011474609375, -1.0716552734375, -1.025299072265625, -0.97894287109375, -0.932586669921875, -0.88623046875, -0.839874267578125, -0.79351806640625, -0.747161865234375, -0.7008056640625, -0.654449462890625, -0.60809326171875, -0.561737060546875, -0.515380859375, -0.469024658203125, -0.42266845703125, -0.376312255859375, -0.3299560546875, -0.283599853515625, -0.23724365234375, -0.190887451171875, -0.14453125, -0.098175048828125, -0.05181884765625, -0.005462646484375, 0.0408935546875, 0.087249755859375, 0.13360595703125, 0.179962158203125, 0.226318359375, 0.272674560546875, 0.31903076171875, 0.365386962890625, 0.4117431640625, 0.458099365234375, 0.50445556640625, 0.550811767578125, 0.59716796875, 0.643524169921875, 0.68988037109375, 0.736236572265625, 0.7825927734375, 0.828948974609375, 0.87530517578125, 0.921661376953125, 0.968017578125, 1.014373779296875, 1.06072998046875, 1.107086181640625, 1.1534423828125, 1.199798583984375, 1.24615478515625, 1.292510986328125, 1.3388671875]}, "gradients/decoder.bert.encoder.layer.13.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 11.0, 18.0, 14.0, 11.0, 25.0, 25.0, 34.0, 55.0, 62.0, 56.0, 69.0, 68.0, 67.0, 69.0, 64.0, 52.0, 54.0, 39.0, 36.0, 28.0, 21.0, 24.0, 20.0, 16.0, 18.0, 7.0, 3.0, 7.0, 5.0, 5.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63037109375, -0.612213134765625, -0.59405517578125, -0.575897216796875, -0.5577392578125, -0.539581298828125, -0.52142333984375, -0.503265380859375, -0.485107421875, -0.466949462890625, -0.44879150390625, -0.430633544921875, -0.4124755859375, -0.394317626953125, -0.37615966796875, -0.358001708984375, -0.33984375, -0.321685791015625, -0.30352783203125, -0.285369873046875, -0.2672119140625, -0.249053955078125, -0.23089599609375, -0.212738037109375, -0.194580078125, -0.176422119140625, -0.15826416015625, -0.140106201171875, -0.1219482421875, -0.103790283203125, -0.08563232421875, -0.067474365234375, -0.04931640625, -0.031158447265625, -0.01300048828125, 0.005157470703125, 0.0233154296875, 0.041473388671875, 0.05963134765625, 0.077789306640625, 0.095947265625, 0.114105224609375, 0.13226318359375, 0.150421142578125, 0.1685791015625, 0.186737060546875, 0.20489501953125, 0.223052978515625, 0.2412109375, 0.259368896484375, 0.27752685546875, 0.295684814453125, 0.3138427734375, 0.332000732421875, 0.35015869140625, 0.368316650390625, 0.386474609375, 0.404632568359375, 0.42279052734375, 0.440948486328125, 0.4591064453125, 0.477264404296875, 0.49542236328125, 0.513580322265625, 0.53173828125]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 15.0, 10.0, 14.0, 17.0, 27.0, 35.0, 36.0, 45.0, 45.0, 52.0, 57.0, 77.0, 61.0, 66.0, 84.0, 61.0, 42.0, 52.0, 40.0, 31.0, 33.0, 16.0, 9.0, 9.0, 6.0, 9.0, 6.0, 10.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.544699192047119, -4.395304203033447, -4.245909690856934, -4.096514701843262, -3.94711971282959, -3.797724723815918, -3.648329973220825, -3.4989352226257324, -3.3495402336120605, -3.2001452445983887, -3.050750494003296, -2.901355743408203, -2.7519607543945312, -2.6025657653808594, -2.4531710147857666, -2.303776264190674, -2.154381275177002, -2.00498628616333, -1.8555915355682373, -1.706196665763855, -1.5568017959594727, -1.4074069261550903, -1.258012056350708, -1.1086171865463257, -0.9592223167419434, -0.809827446937561, -0.6604325771331787, -0.5110377073287964, -0.36164283752441406, -0.21224796772003174, -0.06285309791564941, 0.08654177188873291, 0.23593664169311523, 0.38533151149749756, 0.5347263813018799, 0.6841212511062622, 0.8335161209106445, 0.9829109907150269, 1.1323058605194092, 1.2817007303237915, 1.4310956001281738, 1.5804904699325562, 1.7298853397369385, 1.8792802095413208, 2.028675079345703, 2.178070068359375, 2.3274648189544678, 2.4768595695495605, 2.6262545585632324, 2.7756495475769043, 2.925044298171997, 3.07443904876709, 3.2238340377807617, 3.3732290267944336, 3.5226237773895264, 3.672018527984619, 3.821413516998291, 3.970808506011963, 4.120203018188477, 4.269598007202148, 4.41899299621582, 4.568387985229492, 4.717782974243164, 4.867177486419678, 5.01657247543335]}, "gradients/decoder.bert.encoder.layer.12.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 3.0, 1.0, 0.0, 3.0, 5.0, 8.0, 10.0, 6.0, 20.0, 15.0, 13.0, 22.0, 25.0, 17.0, 31.0, 38.0, 56.0, 41.0, 52.0, 52.0, 49.0, 46.0, 57.0, 60.0, 50.0, 43.0, 37.0, 38.0, 31.0, 30.0, 27.0, 23.0, 27.0, 16.0, 18.0, 12.0, 10.0, 9.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4886584281921387, -3.3750526905059814, -3.261446952819824, -3.147841453552246, -3.034235715866089, -2.9206299781799316, -2.8070244789123535, -2.6934187412261963, -2.579813003540039, -2.466207265853882, -2.3526015281677246, -2.2389960289001465, -2.1253902912139893, -2.011784553527832, -1.8981789350509644, -1.7845733165740967, -1.6709675788879395, -1.5573618412017822, -1.4437562227249146, -1.3301506042480469, -1.2165448665618896, -1.1029391288757324, -0.9893335103988647, -0.8757278323173523, -0.7621221542358398, -0.6485164761543274, -0.5349107980728149, -0.4213051199913025, -0.30769944190979004, -0.1940937638282776, -0.08048808574676514, 0.033117592334747314, 0.14672327041625977, 0.2603289484977722, 0.37393462657928467, 0.4875403046607971, 0.6011459827423096, 0.714751660823822, 0.8283573389053345, 0.9419630169868469, 1.0555686950683594, 1.1691744327545166, 1.2827800512313843, 1.396385669708252, 1.5099914073944092, 1.6235971450805664, 1.737202763557434, 1.8508083820343018, 1.964414119720459, 2.078019857406616, 2.1916255950927734, 2.3052310943603516, 2.418836832046509, 2.532442569732666, 2.646048069000244, 2.7596538066864014, 2.8732595443725586, 2.986865282058716, 3.100471019744873, 3.214076519012451, 3.3276822566986084, 3.4412879943847656, 3.5548934936523438, 3.668499231338501, 3.782104969024658]}, "gradients/decoder.bert.encoder.layer.12.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 8.0, 11.0, 9.0, 14.0, 17.0, 25.0, 35.0, 51.0, 84.0, 121.0, 191.0, 242.0, 405.0, 620.0, 978.0, 1516.0, 2618.0, 4210.0, 7294.0, 12687.0, 22965.0, 43738.0, 87558.0, 189565.0, 440461.0, 930094.0, 1155416.0, 705022.0, 309709.0, 137022.0, 65684.0, 33196.0, 17842.0, 9998.0, 5893.0, 3405.0, 2104.0, 1258.0, 837.0, 500.0, 337.0, 198.0, 128.0, 87.0, 44.0, 35.0, 23.0, 12.0, 9.0, 4.0, 7.0, 2.0, 0.0, 3.0], "bins": [-4.62109375, -4.493743896484375, -4.36639404296875, -4.239044189453125, -4.1116943359375, -3.984344482421875, -3.85699462890625, -3.729644775390625, -3.602294921875, -3.474945068359375, -3.34759521484375, -3.220245361328125, -3.0928955078125, -2.965545654296875, -2.83819580078125, -2.710845947265625, -2.58349609375, -2.456146240234375, -2.32879638671875, -2.201446533203125, -2.0740966796875, -1.946746826171875, -1.81939697265625, -1.692047119140625, -1.564697265625, -1.437347412109375, -1.30999755859375, -1.182647705078125, -1.0552978515625, -0.927947998046875, -0.80059814453125, -0.673248291015625, -0.5458984375, -0.418548583984375, -0.29119873046875, -0.163848876953125, -0.0364990234375, 0.090850830078125, 0.21820068359375, 0.345550537109375, 0.472900390625, 0.600250244140625, 0.72760009765625, 0.854949951171875, 0.9822998046875, 1.109649658203125, 1.23699951171875, 1.364349365234375, 1.49169921875, 1.619049072265625, 1.74639892578125, 1.873748779296875, 2.0010986328125, 2.128448486328125, 2.25579833984375, 2.383148193359375, 2.510498046875, 2.637847900390625, 2.76519775390625, 2.892547607421875, 3.0198974609375, 3.147247314453125, 3.27459716796875, 3.401947021484375, 3.529296875]}, "gradients/decoder.bert.encoder.layer.12.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 6.0, 3.0, 6.0, 12.0, 12.0, 10.0, 17.0, 20.0, 25.0, 27.0, 31.0, 33.0, 29.0, 35.0, 47.0, 44.0, 38.0, 47.0, 45.0, 45.0, 43.0, 53.0, 47.0, 42.0, 52.0, 33.0, 39.0, 30.0, 21.0, 22.0, 20.0, 16.0, 14.0, 6.0, 6.0, 10.0, 7.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158203125, -2.080718994140625, -2.00323486328125, -1.925750732421875, -1.8482666015625, -1.770782470703125, -1.69329833984375, -1.615814208984375, -1.538330078125, -1.460845947265625, -1.38336181640625, -1.305877685546875, -1.2283935546875, -1.150909423828125, -1.07342529296875, -0.995941162109375, -0.91845703125, -0.840972900390625, -0.76348876953125, -0.686004638671875, -0.6085205078125, -0.531036376953125, -0.45355224609375, -0.376068115234375, -0.298583984375, -0.221099853515625, -0.14361572265625, -0.066131591796875, 0.0113525390625, 0.088836669921875, 0.16632080078125, 0.243804931640625, 0.3212890625, 0.398773193359375, 0.47625732421875, 0.553741455078125, 0.6312255859375, 0.708709716796875, 0.78619384765625, 0.863677978515625, 0.941162109375, 1.018646240234375, 1.09613037109375, 1.173614501953125, 1.2510986328125, 1.328582763671875, 1.40606689453125, 1.483551025390625, 1.56103515625, 1.638519287109375, 1.71600341796875, 1.793487548828125, 1.8709716796875, 1.948455810546875, 2.02593994140625, 2.103424072265625, 2.180908203125, 2.258392333984375, 2.33587646484375, 2.413360595703125, 2.4908447265625, 2.568328857421875, 2.64581298828125, 2.723297119140625, 2.80078125]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 12.0, 27.0, 27.0, 32.0, 51.0, 70.0, 147.0, 178.0, 293.0, 450.0, 668.0, 1115.0, 1713.0, 2657.0, 4331.0, 7002.0, 11909.0, 19924.0, 34891.0, 62601.0, 117873.0, 225025.0, 436110.0, 782583.0, 985691.0, 698189.0, 375902.0, 192632.0, 101597.0, 55110.0, 30693.0, 17587.0, 10411.0, 6148.0, 3853.0, 2487.0, 1508.0, 995.0, 622.0, 404.0, 255.0, 185.0, 112.0, 80.0, 39.0, 34.0, 21.0, 13.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.94140625, -3.8197021484375, -3.697998046875, -3.5762939453125, -3.45458984375, -3.3328857421875, -3.211181640625, -3.0894775390625, -2.9677734375, -2.8460693359375, -2.724365234375, -2.6026611328125, -2.48095703125, -2.3592529296875, -2.237548828125, -2.1158447265625, -1.994140625, -1.8724365234375, -1.750732421875, -1.6290283203125, -1.50732421875, -1.3856201171875, -1.263916015625, -1.1422119140625, -1.0205078125, -0.8988037109375, -0.777099609375, -0.6553955078125, -0.53369140625, -0.4119873046875, -0.290283203125, -0.1685791015625, -0.046875, 0.0748291015625, 0.196533203125, 0.3182373046875, 0.43994140625, 0.5616455078125, 0.683349609375, 0.8050537109375, 0.9267578125, 1.0484619140625, 1.170166015625, 1.2918701171875, 1.41357421875, 1.5352783203125, 1.656982421875, 1.7786865234375, 1.900390625, 2.0220947265625, 2.143798828125, 2.2655029296875, 2.38720703125, 2.5089111328125, 2.630615234375, 2.7523193359375, 2.8740234375, 2.9957275390625, 3.117431640625, 3.2391357421875, 3.36083984375, 3.4825439453125, 3.604248046875, 3.7259521484375, 3.84765625]}, "gradients/decoder.bert.encoder.layer.12.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 11.0, 7.0, 16.0, 20.0, 21.0, 33.0, 37.0, 49.0, 62.0, 82.0, 101.0, 110.0, 146.0, 172.0, 230.0, 251.0, 280.0, 266.0, 302.0, 251.0, 258.0, 215.0, 213.0, 166.0, 158.0, 123.0, 89.0, 79.0, 70.0, 51.0, 38.0, 35.0, 22.0, 31.0, 15.0, 11.0, 11.0, 11.0, 2.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.146484375, -1.1075897216796875, -1.068695068359375, -1.0298004150390625, -0.99090576171875, -0.9520111083984375, -0.913116455078125, -0.8742218017578125, -0.8353271484375, -0.7964324951171875, -0.757537841796875, -0.7186431884765625, -0.67974853515625, -0.6408538818359375, -0.601959228515625, -0.5630645751953125, -0.524169921875, -0.4852752685546875, -0.446380615234375, -0.4074859619140625, -0.36859130859375, -0.3296966552734375, -0.290802001953125, -0.2519073486328125, -0.2130126953125, -0.1741180419921875, -0.135223388671875, -0.0963287353515625, -0.05743408203125, -0.0185394287109375, 0.020355224609375, 0.0592498779296875, 0.09814453125, 0.1370391845703125, 0.175933837890625, 0.2148284912109375, 0.25372314453125, 0.2926177978515625, 0.331512451171875, 0.3704071044921875, 0.4093017578125, 0.4481964111328125, 0.487091064453125, 0.5259857177734375, 0.56488037109375, 0.6037750244140625, 0.642669677734375, 0.6815643310546875, 0.720458984375, 0.7593536376953125, 0.798248291015625, 0.8371429443359375, 0.87603759765625, 0.9149322509765625, 0.953826904296875, 0.9927215576171875, 1.0316162109375, 1.0705108642578125, 1.109405517578125, 1.1483001708984375, 1.18719482421875, 1.2260894775390625, 1.264984130859375, 1.3038787841796875, 1.3427734375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 5.0, 3.0, 4.0, 2.0, 1.0, 6.0, 5.0, 16.0, 11.0, 13.0, 18.0, 18.0, 27.0, 27.0, 37.0, 35.0, 50.0, 61.0, 57.0, 62.0, 75.0, 70.0, 63.0, 41.0, 52.0, 34.0, 36.0, 34.0, 19.0, 18.0, 17.0, 23.0, 14.0, 15.0, 4.0, 9.0, 6.0, 6.0, 8.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.879155397415161, -3.7437703609466553, -3.6083853244781494, -3.4730002880096436, -3.3376152515411377, -3.202230215072632, -3.066845417022705, -2.931460380554199, -2.7960753440856934, -2.6606903076171875, -2.5253052711486816, -2.389920234680176, -2.25453519821167, -2.119150161743164, -1.9837652444839478, -1.848380208015442, -1.7129950523376465, -1.5776100158691406, -1.4422249794006348, -1.306839942932129, -1.171454906463623, -1.0360698699951172, -0.9006849527359009, -0.765299916267395, -0.6299148797988892, -0.4945298433303833, -0.35914483666419983, -0.22375982999801636, -0.0883747935295105, 0.04701024293899536, 0.18239521980285645, 0.3177802562713623, 0.45316553115844727, 0.5885505676269531, 0.723935604095459, 0.8593205809593201, 0.9947056174278259, 1.1300907135009766, 1.2654756307601929, 1.4008606672286987, 1.5362457036972046, 1.6716307401657104, 1.8070157766342163, 1.9424006938934326, 2.0777857303619385, 2.2131707668304443, 2.34855580329895, 2.483940839767456, 2.619325876235962, 2.7547109127044678, 2.8900959491729736, 3.0254809856414795, 3.1608660221099854, 3.296251058578491, 3.431635856628418, 3.567020893096924, 3.7024059295654297, 3.8377909660339355, 3.9731760025024414, 4.108561038970947, 4.243946075439453, 4.379331111907959, 4.514716148376465, 4.650101184844971, 4.785486221313477]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 3.0, 6.0, 5.0, 6.0, 10.0, 16.0, 11.0, 19.0, 20.0, 27.0, 27.0, 26.0, 27.0, 35.0, 38.0, 38.0, 35.0, 50.0, 43.0, 43.0, 39.0, 41.0, 41.0, 36.0, 36.0, 33.0, 38.0, 28.0, 32.0, 25.0, 29.0, 27.0, 22.0, 11.0, 7.0, 9.0, 9.0, 9.0, 5.0, 9.0, 5.0, 1.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.609907865524292, -2.525479316711426, -2.4410510063171387, -2.3566224575042725, -2.2721941471099854, -2.187765598297119, -2.103337287902832, -2.018908739089966, -1.9344803094863892, -1.8500518798828125, -1.7656234502792358, -1.6811950206756592, -1.596766471862793, -1.5123381614685059, -1.4279096126556396, -1.343481183052063, -1.2590527534484863, -1.1746243238449097, -1.090195894241333, -1.0057673454284668, -0.9213389754295349, -0.8369105458259583, -0.7524820566177368, -0.6680536270141602, -0.5836251974105835, -0.49919676780700684, -0.4147683084011078, -0.33033984899520874, -0.24591141939163208, -0.16148298978805542, -0.07705450057983398, 0.007373929023742676, 0.09180212020874023, 0.1762305647134781, 0.26065900921821594, 0.345087468624115, 0.42951589822769165, 0.5139443278312683, 0.5983728170394897, 0.6828012466430664, 0.7672296762466431, 0.8516581058502197, 0.9360865354537964, 1.020514965057373, 1.1049435138702393, 1.1893718242645264, 1.2738003730773926, 1.3582288026809692, 1.442657232284546, 1.5270856618881226, 1.6115140914916992, 1.6959426403045654, 1.7803709506988525, 1.8647994995117188, 1.9492279291152954, 2.033656358718872, 2.1180849075317383, 2.2025134563446045, 2.2869417667388916, 2.371370315551758, 2.455798625946045, 2.540227174758911, 2.6246557235717773, 2.7090840339660645, 2.7935123443603516]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 14.0, 21.0, 28.0, 51.0, 78.0, 119.0, 226.0, 343.0, 546.0, 861.0, 1567.0, 2514.0, 4346.0, 7772.0, 14075.0, 27113.0, 55223.0, 113766.0, 215393.0, 263345.0, 169441.0, 84421.0, 41009.0, 20590.0, 10972.0, 5983.0, 3470.0, 2074.0, 1240.0, 781.0, 417.0, 285.0, 184.0, 101.0, 61.0, 42.0, 29.0, 18.0, 10.0, 9.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3681640625, -0.353607177734375, -0.33905029296875, -0.324493408203125, -0.3099365234375, -0.295379638671875, -0.28082275390625, -0.266265869140625, -0.251708984375, -0.237152099609375, -0.22259521484375, -0.208038330078125, -0.1934814453125, -0.178924560546875, -0.16436767578125, -0.149810791015625, -0.13525390625, -0.120697021484375, -0.10614013671875, -0.091583251953125, -0.0770263671875, -0.062469482421875, -0.04791259765625, -0.033355712890625, -0.018798828125, -0.004241943359375, 0.01031494140625, 0.024871826171875, 0.0394287109375, 0.053985595703125, 0.06854248046875, 0.083099365234375, 0.09765625, 0.112213134765625, 0.12677001953125, 0.141326904296875, 0.1558837890625, 0.170440673828125, 0.18499755859375, 0.199554443359375, 0.214111328125, 0.228668212890625, 0.24322509765625, 0.257781982421875, 0.2723388671875, 0.286895751953125, 0.30145263671875, 0.316009521484375, 0.33056640625, 0.345123291015625, 0.35968017578125, 0.374237060546875, 0.3887939453125, 0.403350830078125, 0.41790771484375, 0.432464599609375, 0.447021484375, 0.461578369140625, 0.47613525390625, 0.490692138671875, 0.5052490234375, 0.519805908203125, 0.53436279296875, 0.548919677734375, 0.5634765625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 6.0, 7.0, 10.0, 15.0, 21.0, 14.0, 28.0, 22.0, 34.0, 47.0, 27.0, 36.0, 54.0, 50.0, 41.0, 45.0, 33.0, 39.0, 46.0, 47.0, 40.0, 32.0, 51.0, 41.0, 27.0, 22.0, 31.0, 19.0, 16.0, 16.0, 7.0, 11.0, 11.0, 7.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.6640625, -3.56134033203125, -3.4586181640625, -3.35589599609375, -3.253173828125, -3.15045166015625, -3.0477294921875, -2.94500732421875, -2.84228515625, -2.73956298828125, -2.6368408203125, -2.53411865234375, -2.431396484375, -2.32867431640625, -2.2259521484375, -2.12322998046875, -2.0205078125, -1.91778564453125, -1.8150634765625, -1.71234130859375, -1.609619140625, -1.50689697265625, -1.4041748046875, -1.30145263671875, -1.19873046875, -1.09600830078125, -0.9932861328125, -0.89056396484375, -0.787841796875, -0.68511962890625, -0.5823974609375, -0.47967529296875, -0.376953125, -0.27423095703125, -0.1715087890625, -0.06878662109375, 0.033935546875, 0.13665771484375, 0.2393798828125, 0.34210205078125, 0.44482421875, 0.54754638671875, 0.6502685546875, 0.75299072265625, 0.855712890625, 0.95843505859375, 1.0611572265625, 1.16387939453125, 1.2666015625, 1.36932373046875, 1.4720458984375, 1.57476806640625, 1.677490234375, 1.78021240234375, 1.8829345703125, 1.98565673828125, 2.08837890625, 2.19110107421875, 2.2938232421875, 2.39654541015625, 2.499267578125, 2.60198974609375, 2.7047119140625, 2.80743408203125, 2.91015625]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 8.0, 19.0, 19.0, 31.0, 58.0, 56.0, 110.0, 136.0, 268.0, 402.0, 690.0, 1181.0, 2317.0, 4777.0, 10930.0, 31822.0, 697579.0, 255311.0, 24822.0, 9182.0, 4147.0, 1918.0, 1151.0, 570.0, 403.0, 226.0, 129.0, 78.0, 70.0, 36.0, 26.0, 19.0, 17.0, 15.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9794921875, -0.940155029296875, -0.90081787109375, -0.861480712890625, -0.8221435546875, -0.782806396484375, -0.74346923828125, -0.704132080078125, -0.664794921875, -0.625457763671875, -0.58612060546875, -0.546783447265625, -0.5074462890625, -0.468109130859375, -0.42877197265625, -0.389434814453125, -0.35009765625, -0.310760498046875, -0.27142333984375, -0.232086181640625, -0.1927490234375, -0.153411865234375, -0.11407470703125, -0.074737548828125, -0.035400390625, 0.003936767578125, 0.04327392578125, 0.082611083984375, 0.1219482421875, 0.161285400390625, 0.20062255859375, 0.239959716796875, 0.279296875, 0.318634033203125, 0.35797119140625, 0.397308349609375, 0.4366455078125, 0.475982666015625, 0.51531982421875, 0.554656982421875, 0.593994140625, 0.633331298828125, 0.67266845703125, 0.712005615234375, 0.7513427734375, 0.790679931640625, 0.83001708984375, 0.869354248046875, 0.90869140625, 0.948028564453125, 0.98736572265625, 1.026702880859375, 1.0660400390625, 1.105377197265625, 1.14471435546875, 1.184051513671875, 1.223388671875, 1.262725830078125, 1.30206298828125, 1.341400146484375, 1.3807373046875, 1.420074462890625, 1.45941162109375, 1.498748779296875, 1.5380859375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 9.0, 4.0, 5.0, 3.0, 6.0, 9.0, 10.0, 9.0, 19.0, 15.0, 24.0, 22.0, 36.0, 44.0, 42.0, 33.0, 34.0, 50.0, 42.0, 48.0, 42.0, 48.0, 51.0, 51.0, 38.0, 37.0, 36.0, 26.0, 33.0, 42.0, 22.0, 30.0, 21.0, 11.0, 18.0, 7.0, 3.0, 4.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.927734375, -1.861724853515625, -1.79571533203125, -1.729705810546875, -1.6636962890625, -1.597686767578125, -1.53167724609375, -1.465667724609375, -1.399658203125, -1.333648681640625, -1.26763916015625, -1.201629638671875, -1.1356201171875, -1.069610595703125, -1.00360107421875, -0.937591552734375, -0.87158203125, -0.805572509765625, -0.73956298828125, -0.673553466796875, -0.6075439453125, -0.541534423828125, -0.47552490234375, -0.409515380859375, -0.343505859375, -0.277496337890625, -0.21148681640625, -0.145477294921875, -0.0794677734375, -0.013458251953125, 0.05255126953125, 0.118560791015625, 0.1845703125, 0.250579833984375, 0.31658935546875, 0.382598876953125, 0.4486083984375, 0.514617919921875, 0.58062744140625, 0.646636962890625, 0.712646484375, 0.778656005859375, 0.84466552734375, 0.910675048828125, 0.9766845703125, 1.042694091796875, 1.10870361328125, 1.174713134765625, 1.24072265625, 1.306732177734375, 1.37274169921875, 1.438751220703125, 1.5047607421875, 1.570770263671875, 1.63677978515625, 1.702789306640625, 1.768798828125, 1.834808349609375, 1.90081787109375, 1.966827392578125, 2.0328369140625, 2.098846435546875, 2.16485595703125, 2.230865478515625, 2.296875]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 7.0, 6.0, 6.0, 14.0, 20.0, 21.0, 16.0, 53.0, 69.0, 80.0, 142.0, 202.0, 288.0, 420.0, 650.0, 1043.0, 1638.0, 2750.0, 4457.0, 7778.0, 14057.0, 27967.0, 510242.0, 415809.0, 27284.0, 13734.0, 7828.0, 4559.0, 2669.0, 1657.0, 1017.0, 697.0, 447.0, 292.0, 195.0, 127.0, 94.0, 72.0, 42.0, 31.0, 20.0, 21.0, 7.0, 10.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1943359375, -0.18785476684570312, -0.18137359619140625, -0.17489242553710938, -0.1684112548828125, -0.16193008422851562, -0.15544891357421875, -0.14896774291992188, -0.142486572265625, -0.13600540161132812, -0.12952423095703125, -0.12304306030273438, -0.1165618896484375, -0.11008071899414062, -0.10359954833984375, -0.09711837768554688, -0.09063720703125, -0.08415603637695312, -0.07767486572265625, -0.07119369506835938, -0.0647125244140625, -0.058231353759765625, -0.05175018310546875, -0.045269012451171875, -0.038787841796875, -0.032306671142578125, -0.02582550048828125, -0.019344329833984375, -0.0128631591796875, -0.006381988525390625, 9.918212890625e-05, 0.006580352783203125, 0.0130615234375, 0.019542694091796875, 0.02602386474609375, 0.032505035400390625, 0.0389862060546875, 0.045467376708984375, 0.05194854736328125, 0.058429718017578125, 0.064910888671875, 0.07139205932617188, 0.07787322998046875, 0.08435440063476562, 0.0908355712890625, 0.09731674194335938, 0.10379791259765625, 0.11027908325195312, 0.11676025390625, 0.12324142456054688, 0.12972259521484375, 0.13620376586914062, 0.1426849365234375, 0.14916610717773438, 0.15564727783203125, 0.16212844848632812, 0.168609619140625, 0.17509078979492188, 0.18157196044921875, 0.18805313110351562, 0.1945343017578125, 0.20101547241210938, 0.20749664306640625, 0.21397781372070312, 0.220458984375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 15.0, 14.0, 8.0, 16.0, 23.0, 25.0, 31.0, 41.0, 56.0, 39.0, 46.0, 44.0, 66.0, 70.0, 57.0, 53.0, 57.0, 48.0, 47.0, 46.0, 39.0, 31.0, 21.0, 23.0, 23.0, 8.0, 6.0, 9.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.187490463256836e-05, -2.1115876734256744e-05, -2.035684883594513e-05, -1.9597820937633514e-05, -1.88387930393219e-05, -1.8079765141010284e-05, -1.732073724269867e-05, -1.6561709344387054e-05, -1.580268144607544e-05, -1.5043653547763824e-05, -1.428462564945221e-05, -1.3525597751140594e-05, -1.276656985282898e-05, -1.2007541954517365e-05, -1.124851405620575e-05, -1.0489486157894135e-05, -9.73045825958252e-06, -8.971430361270905e-06, -8.21240246295929e-06, -7.4533745646476746e-06, -6.6943466663360596e-06, -5.935318768024445e-06, -5.17629086971283e-06, -4.417262971401215e-06, -3.6582350730895996e-06, -2.8992071747779846e-06, -2.1401792764663696e-06, -1.3811513781547546e-06, -6.221234798431396e-07, 1.3690441846847534e-07, 8.959323167800903e-07, 1.6549602150917053e-06, 2.4139881134033203e-06, 3.1730160117149353e-06, 3.93204391002655e-06, 4.691071808338165e-06, 5.45009970664978e-06, 6.209127604961395e-06, 6.96815550327301e-06, 7.727183401584625e-06, 8.48621129989624e-06, 9.245239198207855e-06, 1.000426709651947e-05, 1.0763294994831085e-05, 1.15223228931427e-05, 1.2281350791454315e-05, 1.304037868976593e-05, 1.3799406588077545e-05, 1.455843448638916e-05, 1.5317462384700775e-05, 1.607649028301239e-05, 1.6835518181324005e-05, 1.759454607963562e-05, 1.8353573977947235e-05, 1.911260187625885e-05, 1.9871629774570465e-05, 2.063065767288208e-05, 2.1389685571193695e-05, 2.214871346950531e-05, 2.2907741367816925e-05, 2.366676926612854e-05, 2.4425797164440155e-05, 2.518482506275177e-05, 2.5943852961063385e-05, 2.6702880859375e-05]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 12.0, 14.0, 20.0, 31.0, 36.0, 73.0, 102.0, 165.0, 254.0, 372.0, 581.0, 970.0, 1581.0, 2579.0, 4217.0, 6983.0, 12020.0, 20659.0, 36521.0, 64584.0, 111092.0, 174734.0, 208315.0, 163437.0, 101758.0, 58601.0, 33119.0, 18557.0, 10705.0, 6385.0, 3918.0, 2332.0, 1398.0, 906.0, 537.0, 371.0, 234.0, 128.0, 99.0, 62.0, 40.0, 30.0, 8.0, 6.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068115234375, -0.06571769714355469, -0.06332015991210938, -0.06092262268066406, -0.05852508544921875, -0.05612754821777344, -0.053730010986328125, -0.05133247375488281, -0.0489349365234375, -0.04653739929199219, -0.044139862060546875, -0.04174232482910156, -0.03934478759765625, -0.03694725036621094, -0.034549713134765625, -0.03215217590332031, -0.029754638671875, -0.027357101440429688, -0.024959564208984375, -0.022562026977539062, -0.02016448974609375, -0.017766952514648438, -0.015369415283203125, -0.012971878051757812, -0.0105743408203125, -0.008176803588867188, -0.005779266357421875, -0.0033817291259765625, -0.00098419189453125, 0.0014133453369140625, 0.003810882568359375, 0.0062084197998046875, 0.00860595703125, 0.011003494262695312, 0.013401031494140625, 0.015798568725585938, 0.01819610595703125, 0.020593643188476562, 0.022991180419921875, 0.025388717651367188, 0.0277862548828125, 0.030183792114257812, 0.032581329345703125, 0.03497886657714844, 0.03737640380859375, 0.03977394104003906, 0.042171478271484375, 0.04456901550292969, 0.046966552734375, 0.04936408996582031, 0.051761627197265625, 0.05415916442871094, 0.05655670166015625, 0.05895423889160156, 0.061351776123046875, 0.06374931335449219, 0.0661468505859375, 0.06854438781738281, 0.07094192504882812, 0.07333946228027344, 0.07573699951171875, 0.07813453674316406, 0.08053207397460938, 0.08292961120605469, 0.0853271484375]}, "gradients/decoder.bert.encoder.layer.12.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 3.0, 4.0, 12.0, 5.0, 14.0, 8.0, 17.0, 26.0, 29.0, 25.0, 39.0, 41.0, 45.0, 58.0, 40.0, 59.0, 52.0, 55.0, 58.0, 58.0, 56.0, 57.0, 34.0, 49.0, 29.0, 30.0, 19.0, 10.0, 14.0, 12.0, 6.0, 4.0, 6.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0207977294921875, -0.02012491226196289, -0.01945209503173828, -0.018779277801513672, -0.018106460571289062, -0.017433643341064453, -0.016760826110839844, -0.016088008880615234, -0.015415191650390625, -0.014742374420166016, -0.014069557189941406, -0.013396739959716797, -0.012723922729492188, -0.012051105499267578, -0.011378288269042969, -0.01070547103881836, -0.01003265380859375, -0.00935983657836914, -0.008687019348144531, -0.008014202117919922, -0.0073413848876953125, -0.006668567657470703, -0.005995750427246094, -0.005322933197021484, -0.004650115966796875, -0.003977298736572266, -0.0033044815063476562, -0.002631664276123047, -0.0019588470458984375, -0.0012860298156738281, -0.0006132125854492188, 5.9604644775390625e-05, 0.000732421875, 0.0014052391052246094, 0.0020780563354492188, 0.002750873565673828, 0.0034236907958984375, 0.004096508026123047, 0.004769325256347656, 0.005442142486572266, 0.006114959716796875, 0.006787776947021484, 0.007460594177246094, 0.008133411407470703, 0.008806228637695312, 0.009479045867919922, 0.010151863098144531, 0.01082468032836914, 0.01149749755859375, 0.01217031478881836, 0.012843132019042969, 0.013515949249267578, 0.014188766479492188, 0.014861583709716797, 0.015534400939941406, 0.016207218170166016, 0.016880035400390625, 0.017552852630615234, 0.018225669860839844, 0.018898487091064453, 0.019571304321289062, 0.020244121551513672, 0.02091693878173828, 0.02158975601196289, 0.0222625732421875]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 13.0, 14.0, 10.0, 17.0, 18.0, 18.0, 25.0, 42.0, 38.0, 43.0, 54.0, 58.0, 49.0, 82.0, 70.0, 74.0, 41.0, 50.0, 40.0, 32.0, 38.0, 22.0, 19.0, 22.0, 16.0, 22.0, 11.0, 11.0, 4.0, 10.0, 6.0, 6.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9336400032043457, -3.7984774112701416, -3.6633148193359375, -3.5281522274017334, -3.3929896354675293, -3.257827043533325, -3.122664451599121, -2.987501621246338, -2.852339267730713, -2.717176675796509, -2.5820140838623047, -2.4468514919281006, -2.3116888999938965, -2.1765263080596924, -2.0413637161254883, -1.9062010049819946, -1.771038293838501, -1.6358757019042969, -1.5007131099700928, -1.3655505180358887, -1.2303879261016846, -1.0952253341674805, -0.9600626230239868, -0.8249000310897827, -0.6897374391555786, -0.5545748472213745, -0.419412225484848, -0.28424960374832153, -0.14908701181411743, -0.01392441987991333, 0.12123823165893555, 0.25640082359313965, 0.39156341552734375, 0.5267260074615479, 0.661888599395752, 0.7970512509346008, 0.9322138428688049, 1.0673763751983643, 1.202539086341858, 1.337701678276062, 1.4728642702102661, 1.6080268621444702, 1.7431894540786743, 1.878352165222168, 2.013514757156372, 2.148677349090576, 2.2838399410247803, 2.4190025329589844, 2.5541651248931885, 2.6893277168273926, 2.8244903087615967, 2.959652900695801, 3.094815492630005, 3.229978084564209, 3.365140914916992, 3.500303268432617, 3.6354660987854004, 3.7706286907196045, 3.9057912826538086, 4.040954113006592, 4.176116466522217, 4.311279296875, 4.446441650390625, 4.581604480743408, 4.716766834259033]}, "gradients/decoder.bert.encoder.layer.12.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 8.0, 3.0, 5.0, 6.0, 7.0, 8.0, 17.0, 10.0, 19.0, 18.0, 27.0, 29.0, 26.0, 29.0, 36.0, 35.0, 37.0, 39.0, 46.0, 43.0, 43.0, 41.0, 38.0, 46.0, 31.0, 42.0, 32.0, 39.0, 28.0, 29.0, 22.0, 36.0, 23.0, 23.0, 11.0, 6.0, 9.0, 12.0, 7.0, 4.0, 10.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6143991947174072, -2.530123472213745, -2.445847749710083, -2.361572265625, -2.277296543121338, -2.193020820617676, -2.1087450981140137, -2.0244693756103516, -1.940193772315979, -1.855918049812317, -1.7716424465179443, -1.6873667240142822, -1.6030910015106201, -1.5188153982162476, -1.4345396757125854, -1.350264072418213, -1.2659883499145508, -1.1817126274108887, -1.0974370241165161, -1.013161301612854, -0.9288856387138367, -0.8446099758148193, -0.7603342533111572, -0.6760585904121399, -0.5917829275131226, -0.5075072646141052, -0.4232315719127655, -0.3389558792114258, -0.25468021631240845, -0.1704045534133911, -0.086128830909729, -0.00185316801071167, 0.08242225646972656, 0.1666979342699051, 0.2509736120700836, 0.33524930477142334, 0.4195249676704407, 0.503800630569458, 0.5880763530731201, 0.6723520159721375, 0.7566276788711548, 0.8409033417701721, 0.9251790046691895, 1.0094547271728516, 1.0937304496765137, 1.1780060529708862, 1.2622817754745483, 1.346557378768921, 1.430833101272583, 1.5151088237762451, 1.5993844270706177, 1.6836601495742798, 1.7679357528686523, 1.8522114753723145, 1.9364871978759766, 2.0207629203796387, 2.105038642883301, 2.189314365386963, 2.273590087890625, 2.357865810394287, 2.44214129447937, 2.5264170169830322, 2.6106927394866943, 2.6949684619903564, 2.7792439460754395]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 7.0, 14.0, 10.0, 22.0, 23.0, 51.0, 78.0, 96.0, 143.0, 205.0, 356.0, 488.0, 855.0, 1416.0, 2395.0, 4256.0, 7382.0, 12992.0, 23257.0, 41503.0, 72808.0, 118052.0, 167225.0, 185886.0, 156676.0, 105623.0, 63904.0, 36025.0, 20153.0, 11201.0, 6281.0, 3564.0, 2096.0, 1243.0, 799.0, 533.0, 316.0, 209.0, 134.0, 86.0, 55.0, 51.0, 27.0, 17.0, 17.0, 9.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.88671875, -2.79168701171875, -2.6966552734375, -2.60162353515625, -2.506591796875, -2.41156005859375, -2.3165283203125, -2.22149658203125, -2.12646484375, -2.03143310546875, -1.9364013671875, -1.84136962890625, -1.746337890625, -1.65130615234375, -1.5562744140625, -1.46124267578125, -1.3662109375, -1.27117919921875, -1.1761474609375, -1.08111572265625, -0.986083984375, -0.89105224609375, -0.7960205078125, -0.70098876953125, -0.60595703125, -0.51092529296875, -0.4158935546875, -0.32086181640625, -0.225830078125, -0.13079833984375, -0.0357666015625, 0.05926513671875, 0.154296875, 0.24932861328125, 0.3443603515625, 0.43939208984375, 0.534423828125, 0.62945556640625, 0.7244873046875, 0.81951904296875, 0.91455078125, 1.00958251953125, 1.1046142578125, 1.19964599609375, 1.294677734375, 1.38970947265625, 1.4847412109375, 1.57977294921875, 1.6748046875, 1.76983642578125, 1.8648681640625, 1.95989990234375, 2.054931640625, 2.14996337890625, 2.2449951171875, 2.34002685546875, 2.43505859375, 2.53009033203125, 2.6251220703125, 2.72015380859375, 2.815185546875, 2.91021728515625, 3.0052490234375, 3.10028076171875, 3.1953125]}, "gradients/decoder.bert.encoder.layer.12.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 7.0, 8.0, 7.0, 7.0, 9.0, 9.0, 14.0, 17.0, 18.0, 19.0, 20.0, 29.0, 27.0, 26.0, 26.0, 46.0, 33.0, 37.0, 32.0, 40.0, 41.0, 39.0, 54.0, 41.0, 32.0, 50.0, 37.0, 34.0, 32.0, 28.0, 29.0, 19.0, 30.0, 16.0, 11.0, 8.0, 14.0, 11.0, 7.0, 9.0, 6.0, 8.0, 3.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.931640625, -2.841094970703125, -2.75054931640625, -2.660003662109375, -2.5694580078125, -2.478912353515625, -2.38836669921875, -2.297821044921875, -2.207275390625, -2.116729736328125, -2.02618408203125, -1.935638427734375, -1.8450927734375, -1.754547119140625, -1.66400146484375, -1.573455810546875, -1.48291015625, -1.392364501953125, -1.30181884765625, -1.211273193359375, -1.1207275390625, -1.030181884765625, -0.93963623046875, -0.849090576171875, -0.758544921875, -0.667999267578125, -0.57745361328125, -0.486907958984375, -0.3963623046875, -0.305816650390625, -0.21527099609375, -0.124725341796875, -0.0341796875, 0.056365966796875, 0.14691162109375, 0.237457275390625, 0.3280029296875, 0.418548583984375, 0.50909423828125, 0.599639892578125, 0.690185546875, 0.780731201171875, 0.87127685546875, 0.961822509765625, 1.0523681640625, 1.142913818359375, 1.23345947265625, 1.324005126953125, 1.41455078125, 1.505096435546875, 1.59564208984375, 1.686187744140625, 1.7767333984375, 1.867279052734375, 1.95782470703125, 2.048370361328125, 2.138916015625, 2.229461669921875, 2.32000732421875, 2.410552978515625, 2.5010986328125, 2.591644287109375, 2.68218994140625, 2.772735595703125, 2.86328125]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 16.0, 27.0, 33.0, 43.0, 70.0, 90.0, 106.0, 212.0, 315.0, 515.0, 785.0, 1254.0, 2049.0, 3387.0, 5860.0, 10531.0, 19362.0, 34523.0, 62013.0, 105086.0, 157728.0, 189088.0, 170573.0, 119537.0, 71854.0, 41196.0, 22693.0, 12306.0, 6974.0, 4001.0, 2420.0, 1460.0, 869.0, 554.0, 325.0, 251.0, 134.0, 92.0, 67.0, 41.0, 34.0, 27.0, 15.0, 13.0, 9.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.837890625, -2.738800048828125, -2.63970947265625, -2.540618896484375, -2.4415283203125, -2.342437744140625, -2.24334716796875, -2.144256591796875, -2.045166015625, -1.946075439453125, -1.84698486328125, -1.747894287109375, -1.6488037109375, -1.549713134765625, -1.45062255859375, -1.351531982421875, -1.25244140625, -1.153350830078125, -1.05426025390625, -0.955169677734375, -0.8560791015625, -0.756988525390625, -0.65789794921875, -0.558807373046875, -0.459716796875, -0.360626220703125, -0.26153564453125, -0.162445068359375, -0.0633544921875, 0.035736083984375, 0.13482666015625, 0.233917236328125, 0.3330078125, 0.432098388671875, 0.53118896484375, 0.630279541015625, 0.7293701171875, 0.828460693359375, 0.92755126953125, 1.026641845703125, 1.125732421875, 1.224822998046875, 1.32391357421875, 1.423004150390625, 1.5220947265625, 1.621185302734375, 1.72027587890625, 1.819366455078125, 1.91845703125, 2.017547607421875, 2.11663818359375, 2.215728759765625, 2.3148193359375, 2.413909912109375, 2.51300048828125, 2.612091064453125, 2.711181640625, 2.810272216796875, 2.90936279296875, 3.008453369140625, 3.1075439453125, 3.206634521484375, 3.30572509765625, 3.404815673828125, 3.50390625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 4.0, 2.0, 3.0, 9.0, 14.0, 8.0, 14.0, 23.0, 12.0, 28.0, 19.0, 14.0, 29.0, 25.0, 24.0, 34.0, 29.0, 35.0, 45.0, 39.0, 39.0, 44.0, 48.0, 42.0, 36.0, 42.0, 34.0, 33.0, 26.0, 29.0, 22.0, 18.0, 29.0, 25.0, 22.0, 18.0, 15.0, 9.0, 9.0, 7.0, 9.0, 6.0, 4.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.712890625, -1.661163330078125, -1.60943603515625, -1.557708740234375, -1.5059814453125, -1.454254150390625, -1.40252685546875, -1.350799560546875, -1.299072265625, -1.247344970703125, -1.19561767578125, -1.143890380859375, -1.0921630859375, -1.040435791015625, -0.98870849609375, -0.936981201171875, -0.88525390625, -0.833526611328125, -0.78179931640625, -0.730072021484375, -0.6783447265625, -0.626617431640625, -0.57489013671875, -0.523162841796875, -0.471435546875, -0.419708251953125, -0.36798095703125, -0.316253662109375, -0.2645263671875, -0.212799072265625, -0.16107177734375, -0.109344482421875, -0.0576171875, -0.005889892578125, 0.04583740234375, 0.097564697265625, 0.1492919921875, 0.201019287109375, 0.25274658203125, 0.304473876953125, 0.356201171875, 0.407928466796875, 0.45965576171875, 0.511383056640625, 0.5631103515625, 0.614837646484375, 0.66656494140625, 0.718292236328125, 0.77001953125, 0.821746826171875, 0.87347412109375, 0.925201416015625, 0.9769287109375, 1.028656005859375, 1.08038330078125, 1.132110595703125, 1.183837890625, 1.235565185546875, 1.28729248046875, 1.339019775390625, 1.3907470703125, 1.442474365234375, 1.49420166015625, 1.545928955078125, 1.59765625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 9.0, 6.0, 5.0, 19.0, 23.0, 30.0, 42.0, 58.0, 84.0, 138.0, 201.0, 306.0, 476.0, 809.0, 1278.0, 2073.0, 3431.0, 6171.0, 11411.0, 21687.0, 43342.0, 86810.0, 162603.0, 232870.0, 211291.0, 127716.0, 65488.0, 32208.0, 16882.0, 8865.0, 4905.0, 2823.0, 1677.0, 1039.0, 607.0, 408.0, 234.0, 167.0, 129.0, 84.0, 47.0, 36.0, 28.0, 16.0, 11.0, 5.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.944610595703125, -1.88531494140625, -1.826019287109375, -1.7667236328125, -1.707427978515625, -1.64813232421875, -1.588836669921875, -1.529541015625, -1.470245361328125, -1.41094970703125, -1.351654052734375, -1.2923583984375, -1.233062744140625, -1.17376708984375, -1.114471435546875, -1.05517578125, -0.995880126953125, -0.93658447265625, -0.877288818359375, -0.8179931640625, -0.758697509765625, -0.69940185546875, -0.640106201171875, -0.580810546875, -0.521514892578125, -0.46221923828125, -0.402923583984375, -0.3436279296875, -0.284332275390625, -0.22503662109375, -0.165740966796875, -0.1064453125, -0.047149658203125, 0.01214599609375, 0.071441650390625, 0.1307373046875, 0.190032958984375, 0.24932861328125, 0.308624267578125, 0.367919921875, 0.427215576171875, 0.48651123046875, 0.545806884765625, 0.6051025390625, 0.664398193359375, 0.72369384765625, 0.782989501953125, 0.84228515625, 0.901580810546875, 0.96087646484375, 1.020172119140625, 1.0794677734375, 1.138763427734375, 1.19805908203125, 1.257354736328125, 1.316650390625, 1.375946044921875, 1.43524169921875, 1.494537353515625, 1.5538330078125, 1.613128662109375, 1.67242431640625, 1.731719970703125, 1.791015625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 3.0, 17.0, 16.0, 23.0, 26.0, 70.0, 53.0, 72.0, 102.0, 95.0, 103.0, 94.0, 78.0, 60.0, 47.0, 30.0, 28.0, 17.0, 13.0, 12.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021827220916748047, -0.00021053291857242584, -0.00020279362797737122, -0.0001950543373823166, -0.00018731504678726196, -0.00017957575619220734, -0.0001718364655971527, -0.00016409717500209808, -0.00015635788440704346, -0.00014861859381198883, -0.0001408793032169342, -0.00013314001262187958, -0.00012540072202682495, -0.00011766143143177032, -0.0001099221408367157, -0.00010218285024166107, -9.444355964660645e-05, -8.670426905155182e-05, -7.896497845649719e-05, -7.122568786144257e-05, -6.348639726638794e-05, -5.574710667133331e-05, -4.8007816076278687e-05, -4.026852548122406e-05, -3.2529234886169434e-05, -2.4789944291114807e-05, -1.705065369606018e-05, -9.311363101005554e-06, -1.5720725059509277e-06, 6.167218089103699e-06, 1.3906508684158325e-05, 2.164579927921295e-05, 2.9385089874267578e-05, 3.7124380469322205e-05, 4.486367106437683e-05, 5.260296165943146e-05, 6.0342252254486084e-05, 6.808154284954071e-05, 7.582083344459534e-05, 8.356012403964996e-05, 9.129941463470459e-05, 9.903870522975922e-05, 0.00010677799582481384, 0.00011451728641986847, 0.0001222565770149231, 0.00012999586760997772, 0.00013773515820503235, 0.00014547444880008698, 0.0001532137393951416, 0.00016095302999019623, 0.00016869232058525085, 0.00017643161118030548, 0.0001841709017753601, 0.00019191019237041473, 0.00019964948296546936, 0.000207388773560524, 0.0002151280641555786, 0.00022286735475063324, 0.00023060664534568787, 0.0002383459359407425, 0.0002460852265357971, 0.00025382451713085175, 0.00026156380772590637, 0.000269303098320961, 0.0002770423889160156]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 7.0, 8.0, 12.0, 19.0, 35.0, 48.0, 59.0, 78.0, 136.0, 206.0, 292.0, 421.0, 669.0, 966.0, 1477.0, 2327.0, 3485.0, 5617.0, 9059.0, 14739.0, 23991.0, 40081.0, 66547.0, 105844.0, 151662.0, 176482.0, 155662.0, 110555.0, 69736.0, 41990.0, 25278.0, 15387.0, 9124.0, 5896.0, 3594.0, 2368.0, 1544.0, 997.0, 702.0, 505.0, 281.0, 220.0, 137.0, 95.0, 73.0, 51.0, 37.0, 22.0, 14.0, 10.0, 11.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3681640625, -1.3261260986328125, -1.284088134765625, -1.2420501708984375, -1.20001220703125, -1.1579742431640625, -1.115936279296875, -1.0738983154296875, -1.0318603515625, -0.9898223876953125, -0.947784423828125, -0.9057464599609375, -0.86370849609375, -0.8216705322265625, -0.779632568359375, -0.7375946044921875, -0.695556640625, -0.6535186767578125, -0.611480712890625, -0.5694427490234375, -0.52740478515625, -0.4853668212890625, -0.443328857421875, -0.4012908935546875, -0.3592529296875, -0.3172149658203125, -0.275177001953125, -0.2331390380859375, -0.19110107421875, -0.1490631103515625, -0.107025146484375, -0.0649871826171875, -0.02294921875, 0.0190887451171875, 0.061126708984375, 0.1031646728515625, 0.14520263671875, 0.1872406005859375, 0.229278564453125, 0.2713165283203125, 0.3133544921875, 0.3553924560546875, 0.397430419921875, 0.4394683837890625, 0.48150634765625, 0.5235443115234375, 0.565582275390625, 0.6076202392578125, 0.649658203125, 0.6916961669921875, 0.733734130859375, 0.7757720947265625, 0.81781005859375, 0.8598480224609375, 0.901885986328125, 0.9439239501953125, 0.9859619140625, 1.0279998779296875, 1.070037841796875, 1.1120758056640625, 1.15411376953125, 1.1961517333984375, 1.238189697265625, 1.2802276611328125, 1.322265625]}, "gradients/decoder.bert.encoder.layer.12.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 3.0, 4.0, 9.0, 9.0, 8.0, 10.0, 14.0, 17.0, 13.0, 25.0, 22.0, 44.0, 51.0, 37.0, 65.0, 59.0, 54.0, 71.0, 53.0, 70.0, 59.0, 43.0, 39.0, 37.0, 24.0, 34.0, 19.0, 17.0, 15.0, 11.0, 16.0, 12.0, 7.0, 5.0, 7.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4609375, -0.445037841796875, -0.42913818359375, -0.413238525390625, -0.3973388671875, -0.381439208984375, -0.36553955078125, -0.349639892578125, -0.333740234375, -0.317840576171875, -0.30194091796875, -0.286041259765625, -0.2701416015625, -0.254241943359375, -0.23834228515625, -0.222442626953125, -0.20654296875, -0.190643310546875, -0.17474365234375, -0.158843994140625, -0.1429443359375, -0.127044677734375, -0.11114501953125, -0.095245361328125, -0.079345703125, -0.063446044921875, -0.04754638671875, -0.031646728515625, -0.0157470703125, 0.000152587890625, 0.01605224609375, 0.031951904296875, 0.0478515625, 0.063751220703125, 0.07965087890625, 0.095550537109375, 0.1114501953125, 0.127349853515625, 0.14324951171875, 0.159149169921875, 0.175048828125, 0.190948486328125, 0.20684814453125, 0.222747802734375, 0.2386474609375, 0.254547119140625, 0.27044677734375, 0.286346435546875, 0.30224609375, 0.318145751953125, 0.33404541015625, 0.349945068359375, 0.3658447265625, 0.381744384765625, 0.39764404296875, 0.413543701171875, 0.429443359375, 0.445343017578125, 0.46124267578125, 0.477142333984375, 0.4930419921875, 0.508941650390625, 0.52484130859375, 0.540740966796875, 0.556640625]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 0.0, 8.0, 8.0, 10.0, 6.0, 8.0, 13.0, 18.0, 29.0, 27.0, 21.0, 34.0, 40.0, 46.0, 51.0, 58.0, 61.0, 53.0, 65.0, 47.0, 51.0, 56.0, 34.0, 36.0, 33.0, 28.0, 21.0, 14.0, 19.0, 21.0, 17.0, 14.0, 10.0, 6.0, 4.0, 3.0, 2.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5796639919281006, -3.455317974090576, -3.330972194671631, -3.2066264152526855, -3.082280397415161, -2.9579343795776367, -2.8335886001586914, -2.709242820739746, -2.5848968029022217, -2.4605507850646973, -2.336205005645752, -2.2118592262268066, -2.0875132083892822, -1.9631673097610474, -1.8388214111328125, -1.7144755125045776, -1.5901296138763428, -1.465783715248108, -1.341437816619873, -1.2170919179916382, -1.0927460193634033, -0.9684001207351685, -0.8440542221069336, -0.7197083234786987, -0.5953624248504639, -0.471016526222229, -0.34667062759399414, -0.22232472896575928, -0.09797883033752441, 0.02636706829071045, 0.1507129669189453, 0.2750588655471802, 0.39940452575683594, 0.5237504243850708, 0.6480963230133057, 0.7724422216415405, 0.8967881202697754, 1.0211340188980103, 1.1454799175262451, 1.26982581615448, 1.3941717147827148, 1.5185176134109497, 1.6428635120391846, 1.7672094106674194, 1.8915553092956543, 2.0159010887145996, 2.140247106552124, 2.2645931243896484, 2.3889389038085938, 2.513284683227539, 2.6376307010650635, 2.761976718902588, 2.886322498321533, 3.0106682777404785, 3.135014295578003, 3.2593603134155273, 3.3837060928344727, 3.508051872253418, 3.6323978900909424, 3.756743907928467, 3.881089687347412, 4.005435466766357, 4.129781723022461, 4.254127502441406, 4.378473281860352]}, "gradients/decoder.bert.encoder.layer.11.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 0.0, 3.0, 6.0, 6.0, 6.0, 7.0, 10.0, 17.0, 14.0, 17.0, 12.0, 33.0, 26.0, 27.0, 23.0, 28.0, 30.0, 28.0, 38.0, 41.0, 30.0, 38.0, 41.0, 42.0, 49.0, 46.0, 33.0, 32.0, 34.0, 29.0, 35.0, 29.0, 27.0, 29.0, 24.0, 17.0, 21.0, 19.0, 12.0, 7.0, 8.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.772695302963257, -2.6886179447174072, -2.6045405864715576, -2.520463228225708, -2.4363858699798584, -2.352308511734009, -2.2682313919067383, -2.1841540336608887, -2.100076675415039, -2.0159993171691895, -1.9319219589233398, -1.8478446006774902, -1.7637672424316406, -1.679689884185791, -1.595612645149231, -1.5115352869033813, -1.4274578094482422, -1.3433804512023926, -1.259303092956543, -1.1752257347106934, -1.0911483764648438, -1.0070710182189941, -0.9229937791824341, -0.8389164209365845, -0.7548390626907349, -0.6707617044448853, -0.5866843461990356, -0.5026070475578308, -0.4185296893119812, -0.3344523310661316, -0.25037503242492676, -0.16629767417907715, -0.08222031593322754, 0.0018570274114608765, 0.08593437075614929, 0.1700116991996765, 0.2540890574455261, 0.33816641569137573, 0.42224371433258057, 0.5063210725784302, 0.5903984308242798, 0.6744757890701294, 0.758553147315979, 0.8426304459571838, 0.9267078042030334, 1.0107851028442383, 1.094862461090088, 1.1789398193359375, 1.263017177581787, 1.3470945358276367, 1.4311718940734863, 1.515249252319336, 1.5993266105651855, 1.6834039688110352, 1.7674812078475952, 1.8515585660934448, 1.9356359243392944, 2.0197131633758545, 2.103790521621704, 2.1878678798675537, 2.2719452381134033, 2.356022596359253, 2.4400999546051025, 2.524177312850952, 2.6082546710968018]}, "gradients/decoder.bert.encoder.layer.11.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 6.0, 13.0, 17.0, 21.0, 26.0, 43.0, 60.0, 111.0, 138.0, 206.0, 338.0, 494.0, 799.0, 1229.0, 1902.0, 3032.0, 4753.0, 7999.0, 13031.0, 22007.0, 38866.0, 69766.0, 132836.0, 263011.0, 525158.0, 895709.0, 960537.0, 609575.0, 304787.0, 151061.0, 78713.0, 43273.0, 24996.0, 15041.0, 9179.0, 5574.0, 3484.0, 2172.0, 1490.0, 990.0, 613.0, 431.0, 262.0, 180.0, 118.0, 76.0, 49.0, 43.0, 29.0, 7.0, 13.0, 12.0, 6.0, 1.0, 4.0, 3.0], "bins": [-3.72265625, -3.613525390625, -3.50439453125, -3.395263671875, -3.2861328125, -3.177001953125, -3.06787109375, -2.958740234375, -2.849609375, -2.740478515625, -2.63134765625, -2.522216796875, -2.4130859375, -2.303955078125, -2.19482421875, -2.085693359375, -1.9765625, -1.867431640625, -1.75830078125, -1.649169921875, -1.5400390625, -1.430908203125, -1.32177734375, -1.212646484375, -1.103515625, -0.994384765625, -0.88525390625, -0.776123046875, -0.6669921875, -0.557861328125, -0.44873046875, -0.339599609375, -0.23046875, -0.121337890625, -0.01220703125, 0.096923828125, 0.2060546875, 0.315185546875, 0.42431640625, 0.533447265625, 0.642578125, 0.751708984375, 0.86083984375, 0.969970703125, 1.0791015625, 1.188232421875, 1.29736328125, 1.406494140625, 1.515625, 1.624755859375, 1.73388671875, 1.843017578125, 1.9521484375, 2.061279296875, 2.17041015625, 2.279541015625, 2.388671875, 2.497802734375, 2.60693359375, 2.716064453125, 2.8251953125, 2.934326171875, 3.04345703125, 3.152587890625, 3.26171875]}, "gradients/decoder.bert.encoder.layer.11.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 1.0, 3.0, 4.0, 9.0, 5.0, 9.0, 11.0, 10.0, 11.0, 12.0, 21.0, 22.0, 29.0, 19.0, 20.0, 34.0, 27.0, 37.0, 36.0, 47.0, 31.0, 33.0, 40.0, 34.0, 47.0, 34.0, 45.0, 41.0, 26.0, 31.0, 32.0, 33.0, 37.0, 24.0, 28.0, 16.0, 22.0, 15.0, 9.0, 13.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.9384765625, -1.8764801025390625, -1.814483642578125, -1.7524871826171875, -1.69049072265625, -1.6284942626953125, -1.566497802734375, -1.5045013427734375, -1.4425048828125, -1.3805084228515625, -1.318511962890625, -1.2565155029296875, -1.19451904296875, -1.1325225830078125, -1.070526123046875, -1.0085296630859375, -0.946533203125, -0.8845367431640625, -0.822540283203125, -0.7605438232421875, -0.69854736328125, -0.6365509033203125, -0.574554443359375, -0.5125579833984375, -0.4505615234375, -0.3885650634765625, -0.326568603515625, -0.2645721435546875, -0.20257568359375, -0.1405792236328125, -0.078582763671875, -0.0165863037109375, 0.04541015625, 0.1074066162109375, 0.169403076171875, 0.2313995361328125, 0.29339599609375, 0.3553924560546875, 0.417388916015625, 0.4793853759765625, 0.5413818359375, 0.6033782958984375, 0.665374755859375, 0.7273712158203125, 0.78936767578125, 0.8513641357421875, 0.913360595703125, 0.9753570556640625, 1.037353515625, 1.0993499755859375, 1.161346435546875, 1.2233428955078125, 1.28533935546875, 1.3473358154296875, 1.409332275390625, 1.4713287353515625, 1.5333251953125, 1.5953216552734375, 1.657318115234375, 1.7193145751953125, 1.78131103515625, 1.8433074951171875, 1.905303955078125, 1.9673004150390625, 2.029296875]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 5.0, 7.0, 5.0, 7.0, 14.0, 20.0, 23.0, 36.0, 61.0, 70.0, 122.0, 179.0, 234.0, 345.0, 479.0, 770.0, 1258.0, 1799.0, 2800.0, 4225.0, 7085.0, 11143.0, 18753.0, 31769.0, 55263.0, 98765.0, 180792.0, 334167.0, 602512.0, 892245.0, 821963.0, 506113.0, 275508.0, 148540.0, 82486.0, 45859.0, 26553.0, 16116.0, 9600.0, 5842.0, 3632.0, 2430.0, 1505.0, 1019.0, 693.0, 487.0, 295.0, 211.0, 150.0, 108.0, 68.0, 52.0, 34.0, 28.0, 15.0, 13.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-3.5625, -3.446990966796875, -3.33148193359375, -3.215972900390625, -3.1004638671875, -2.984954833984375, -2.86944580078125, -2.753936767578125, -2.638427734375, -2.522918701171875, -2.40740966796875, -2.291900634765625, -2.1763916015625, -2.060882568359375, -1.94537353515625, -1.829864501953125, -1.71435546875, -1.598846435546875, -1.48333740234375, -1.367828369140625, -1.2523193359375, -1.136810302734375, -1.02130126953125, -0.905792236328125, -0.790283203125, -0.674774169921875, -0.55926513671875, -0.443756103515625, -0.3282470703125, -0.212738037109375, -0.09722900390625, 0.018280029296875, 0.1337890625, 0.249298095703125, 0.36480712890625, 0.480316162109375, 0.5958251953125, 0.711334228515625, 0.82684326171875, 0.942352294921875, 1.057861328125, 1.173370361328125, 1.28887939453125, 1.404388427734375, 1.5198974609375, 1.635406494140625, 1.75091552734375, 1.866424560546875, 1.98193359375, 2.097442626953125, 2.21295166015625, 2.328460693359375, 2.4439697265625, 2.559478759765625, 2.67498779296875, 2.790496826171875, 2.906005859375, 3.021514892578125, 3.13702392578125, 3.252532958984375, 3.3680419921875, 3.483551025390625, 3.59906005859375, 3.714569091796875, 3.830078125]}, "gradients/decoder.bert.encoder.layer.11.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 3.0, 8.0, 7.0, 15.0, 16.0, 25.0, 35.0, 31.0, 41.0, 55.0, 61.0, 84.0, 113.0, 113.0, 149.0, 153.0, 186.0, 210.0, 250.0, 243.0, 280.0, 246.0, 279.0, 210.0, 198.0, 189.0, 135.0, 135.0, 125.0, 91.0, 80.0, 53.0, 43.0, 41.0, 31.0, 30.0, 18.0, 23.0, 23.0, 6.0, 9.0, 5.0, 2.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.2822265625, -1.24560546875, -1.208984375, -1.17236328125, -1.1357421875, -1.09912109375, -1.0625, -1.02587890625, -0.9892578125, -0.95263671875, -0.916015625, -0.87939453125, -0.8427734375, -0.80615234375, -0.76953125, -0.73291015625, -0.6962890625, -0.65966796875, -0.623046875, -0.58642578125, -0.5498046875, -0.51318359375, -0.4765625, -0.43994140625, -0.4033203125, -0.36669921875, -0.330078125, -0.29345703125, -0.2568359375, -0.22021484375, -0.18359375, -0.14697265625, -0.1103515625, -0.07373046875, -0.037109375, -0.00048828125, 0.0361328125, 0.07275390625, 0.109375, 0.14599609375, 0.1826171875, 0.21923828125, 0.255859375, 0.29248046875, 0.3291015625, 0.36572265625, 0.40234375, 0.43896484375, 0.4755859375, 0.51220703125, 0.548828125, 0.58544921875, 0.6220703125, 0.65869140625, 0.6953125, 0.73193359375, 0.7685546875, 0.80517578125, 0.841796875, 0.87841796875, 0.9150390625, 0.95166015625, 0.98828125, 1.02490234375, 1.0615234375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 9.0, 15.0, 14.0, 19.0, 25.0, 24.0, 38.0, 40.0, 47.0, 51.0, 54.0, 71.0, 49.0, 61.0, 57.0, 56.0, 47.0, 48.0, 37.0, 30.0, 27.0, 27.0, 21.0, 17.0, 14.0, 9.0, 10.0, 9.0, 8.0, 5.0, 2.0, 10.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.496438026428223, -4.368464469909668, -4.2404913902282715, -4.112517833709717, -3.984544515609741, -3.8565711975097656, -3.72859787940979, -3.6006245613098145, -3.4726510047912598, -3.344677686691284, -3.2167043685913086, -3.088730812072754, -2.9607574939727783, -2.8327841758728027, -2.704810857772827, -2.5768375396728516, -2.448864221572876, -2.3208909034729004, -2.192917585372925, -2.064944267272949, -1.9369707107543945, -1.808997392654419, -1.6810240745544434, -1.5530507564544678, -1.4250773191452026, -1.297104001045227, -1.169130563735962, -1.0411572456359863, -0.913183867931366, -0.7852104902267456, -0.65723717212677, -0.5292637944221497, -0.4012901782989502, -0.27331680059432983, -0.14534345269203186, -0.017370104789733887, 0.11060327291488647, 0.23857665061950684, 0.3665499687194824, 0.4945233464241028, 0.6224967241287231, 0.7504701018333435, 0.8784434795379639, 1.0064167976379395, 1.134390115737915, 1.2623635530471802, 1.3903368711471558, 1.518310308456421, 1.6462836265563965, 1.774256944656372, 1.9022303819656372, 2.0302038192749023, 2.158177137374878, 2.2861504554748535, 2.414123773574829, 2.5420970916748047, 2.6700706481933594, 2.798043966293335, 2.9260172843933105, 3.0539908409118652, 3.181964159011841, 3.3099374771118164, 3.437910795211792, 3.5658841133117676, 3.693857431411743]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 2.0, 3.0, 7.0, 10.0, 10.0, 13.0, 13.0, 11.0, 16.0, 14.0, 13.0, 24.0, 26.0, 24.0, 40.0, 36.0, 33.0, 43.0, 35.0, 44.0, 42.0, 50.0, 42.0, 42.0, 40.0, 39.0, 51.0, 40.0, 37.0, 38.0, 30.0, 20.0, 21.0, 15.0, 12.0, 15.0, 11.0, 10.0, 1.0, 6.0, 3.0, 10.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6131093502044678, -2.5276355743408203, -2.442161798477173, -2.3566880226135254, -2.271214246749878, -2.1857404708862305, -2.100266695022583, -2.0147929191589355, -1.929319143295288, -1.8438453674316406, -1.7583715915679932, -1.6728978157043457, -1.5874240398406982, -1.5019502639770508, -1.4164764881134033, -1.3310027122497559, -1.2455288171768188, -1.1600550413131714, -1.074581265449524, -0.9891074895858765, -0.903633713722229, -0.8181599378585815, -0.7326861023902893, -0.6472123265266418, -0.5617385506629944, -0.4762647747993469, -0.39079099893569946, -0.3053171932697296, -0.21984341740608215, -0.1343696415424347, -0.048895835876464844, 0.03657793998718262, 0.12205171585083008, 0.20752549171447754, 0.292999267578125, 0.37847307324409485, 0.4639468491077423, 0.5494205951690674, 0.6348944306373596, 0.7203682065010071, 0.8058419823646545, 0.891315758228302, 0.9767895340919495, 1.0622633695602417, 1.1477371454238892, 1.2332109212875366, 1.318684697151184, 1.4041584730148315, 1.489632248878479, 1.5751060247421265, 1.660579800605774, 1.7460535764694214, 1.8315273523330688, 1.9170011281967163, 2.0024750232696533, 2.087948799133301, 2.1734225749969482, 2.2588963508605957, 2.344370126724243, 2.4298439025878906, 2.515317678451538, 2.6007914543151855, 2.686265230178833, 2.7717390060424805, 2.857212781906128]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 16.0, 21.0, 31.0, 45.0, 74.0, 96.0, 113.0, 168.0, 306.0, 396.0, 681.0, 1029.0, 1532.0, 2516.0, 4023.0, 6822.0, 11860.0, 21531.0, 40597.0, 79134.0, 152402.0, 242129.0, 218644.0, 124461.0, 63906.0, 33248.0, 17540.0, 9842.0, 5729.0, 3483.0, 2186.0, 1364.0, 867.0, 591.0, 392.0, 249.0, 172.0, 118.0, 64.0, 53.0, 30.0, 31.0, 23.0, 11.0, 9.0, 11.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.367431640625, -0.3558921813964844, -0.34435272216796875, -0.3328132629394531, -0.3212738037109375, -0.3097343444824219, -0.29819488525390625, -0.2866554260253906, -0.275115966796875, -0.2635765075683594, -0.25203704833984375, -0.24049758911132812, -0.2289581298828125, -0.21741867065429688, -0.20587921142578125, -0.19433975219726562, -0.18280029296875, -0.17126083374023438, -0.15972137451171875, -0.14818191528320312, -0.1366424560546875, -0.12510299682617188, -0.11356353759765625, -0.10202407836914062, -0.090484619140625, -0.07894515991210938, -0.06740570068359375, -0.055866241455078125, -0.0443267822265625, -0.032787322998046875, -0.02124786376953125, -0.009708404541015625, 0.0018310546875, 0.013370513916015625, 0.02490997314453125, 0.036449432373046875, 0.0479888916015625, 0.059528350830078125, 0.07106781005859375, 0.08260726928710938, 0.094146728515625, 0.10568618774414062, 0.11722564697265625, 0.12876510620117188, 0.1403045654296875, 0.15184402465820312, 0.16338348388671875, 0.17492294311523438, 0.18646240234375, 0.19800186157226562, 0.20954132080078125, 0.22108078002929688, 0.2326202392578125, 0.24415969848632812, 0.25569915771484375, 0.2672386169433594, 0.278778076171875, 0.2903175354003906, 0.30185699462890625, 0.3133964538574219, 0.3249359130859375, 0.3364753723144531, 0.34801483154296875, 0.3595542907714844, 0.37109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 5.0, 8.0, 7.0, 6.0, 15.0, 16.0, 17.0, 15.0, 25.0, 27.0, 29.0, 35.0, 39.0, 47.0, 50.0, 65.0, 52.0, 42.0, 71.0, 51.0, 56.0, 34.0, 43.0, 46.0, 32.0, 33.0, 18.0, 24.0, 20.0, 18.0, 14.0, 7.0, 3.0, 6.0, 7.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337890625, -3.22503662109375, -3.1121826171875, -2.99932861328125, -2.886474609375, -2.77362060546875, -2.6607666015625, -2.54791259765625, -2.43505859375, -2.32220458984375, -2.2093505859375, -2.09649658203125, -1.983642578125, -1.87078857421875, -1.7579345703125, -1.64508056640625, -1.5322265625, -1.41937255859375, -1.3065185546875, -1.19366455078125, -1.080810546875, -0.96795654296875, -0.8551025390625, -0.74224853515625, -0.62939453125, -0.51654052734375, -0.4036865234375, -0.29083251953125, -0.177978515625, -0.06512451171875, 0.0477294921875, 0.16058349609375, 0.2734375, 0.38629150390625, 0.4991455078125, 0.61199951171875, 0.724853515625, 0.83770751953125, 0.9505615234375, 1.06341552734375, 1.17626953125, 1.28912353515625, 1.4019775390625, 1.51483154296875, 1.627685546875, 1.74053955078125, 1.8533935546875, 1.96624755859375, 2.0791015625, 2.19195556640625, 2.3048095703125, 2.41766357421875, 2.530517578125, 2.64337158203125, 2.7562255859375, 2.86907958984375, 2.98193359375, 3.09478759765625, 3.2076416015625, 3.32049560546875, 3.433349609375, 3.54620361328125, 3.6590576171875, 3.77191162109375, 3.884765625]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 5.0, 7.0, 10.0, 6.0, 16.0, 22.0, 32.0, 43.0, 49.0, 62.0, 86.0, 110.0, 191.0, 288.0, 393.0, 593.0, 897.0, 1366.0, 2463.0, 4203.0, 8344.0, 18001.0, 62307.0, 821098.0, 86651.0, 20708.0, 9069.0, 4653.0, 2621.0, 1514.0, 875.0, 580.0, 372.0, 277.0, 173.0, 140.0, 90.0, 68.0, 40.0, 37.0, 21.0, 20.0, 14.0, 7.0, 10.0, 6.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.875, -0.8454132080078125, -0.815826416015625, -0.7862396240234375, -0.75665283203125, -0.7270660400390625, -0.697479248046875, -0.6678924560546875, -0.6383056640625, -0.6087188720703125, -0.579132080078125, -0.5495452880859375, -0.51995849609375, -0.4903717041015625, -0.460784912109375, -0.4311981201171875, -0.401611328125, -0.3720245361328125, -0.342437744140625, -0.3128509521484375, -0.28326416015625, -0.2536773681640625, -0.224090576171875, -0.1945037841796875, -0.1649169921875, -0.1353302001953125, -0.105743408203125, -0.0761566162109375, -0.04656982421875, -0.0169830322265625, 0.012603759765625, 0.0421905517578125, 0.07177734375, 0.1013641357421875, 0.130950927734375, 0.1605377197265625, 0.19012451171875, 0.2197113037109375, 0.249298095703125, 0.2788848876953125, 0.3084716796875, 0.3380584716796875, 0.367645263671875, 0.3972320556640625, 0.42681884765625, 0.4564056396484375, 0.485992431640625, 0.5155792236328125, 0.545166015625, 0.5747528076171875, 0.604339599609375, 0.6339263916015625, 0.66351318359375, 0.6930999755859375, 0.722686767578125, 0.7522735595703125, 0.7818603515625, 0.8114471435546875, 0.841033935546875, 0.8706207275390625, 0.90020751953125, 0.9297943115234375, 0.959381103515625, 0.9889678955078125, 1.0185546875]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 7.0, 7.0, 7.0, 5.0, 6.0, 6.0, 9.0, 11.0, 25.0, 17.0, 23.0, 20.0, 22.0, 24.0, 32.0, 28.0, 25.0, 28.0, 41.0, 25.0, 43.0, 39.0, 47.0, 30.0, 45.0, 46.0, 43.0, 42.0, 32.0, 28.0, 29.0, 22.0, 24.0, 27.0, 12.0, 18.0, 21.0, 10.0, 19.0, 20.0, 9.0, 6.0, 6.0, 5.0, 9.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.66796875, -1.612030029296875, -1.55609130859375, -1.500152587890625, -1.4442138671875, -1.388275146484375, -1.33233642578125, -1.276397705078125, -1.220458984375, -1.164520263671875, -1.10858154296875, -1.052642822265625, -0.9967041015625, -0.940765380859375, -0.88482666015625, -0.828887939453125, -0.77294921875, -0.717010498046875, -0.66107177734375, -0.605133056640625, -0.5491943359375, -0.493255615234375, -0.43731689453125, -0.381378173828125, -0.325439453125, -0.269500732421875, -0.21356201171875, -0.157623291015625, -0.1016845703125, -0.045745849609375, 0.01019287109375, 0.066131591796875, 0.1220703125, 0.178009033203125, 0.23394775390625, 0.289886474609375, 0.3458251953125, 0.401763916015625, 0.45770263671875, 0.513641357421875, 0.569580078125, 0.625518798828125, 0.68145751953125, 0.737396240234375, 0.7933349609375, 0.849273681640625, 0.90521240234375, 0.961151123046875, 1.01708984375, 1.073028564453125, 1.12896728515625, 1.184906005859375, 1.2408447265625, 1.296783447265625, 1.35272216796875, 1.408660888671875, 1.464599609375, 1.520538330078125, 1.57647705078125, 1.632415771484375, 1.6883544921875, 1.744293212890625, 1.80023193359375, 1.856170654296875, 1.912109375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 10.0, 14.0, 25.0, 25.0, 38.0, 52.0, 79.0, 128.0, 175.0, 278.0, 371.0, 571.0, 845.0, 1380.0, 2124.0, 3315.0, 5229.0, 8823.0, 14982.0, 28882.0, 520861.0, 395118.0, 27700.0, 14742.0, 8471.0, 5116.0, 3170.0, 2091.0, 1330.0, 902.0, 531.0, 352.0, 245.0, 181.0, 118.0, 83.0, 59.0, 44.0, 22.0, 22.0, 11.0, 15.0, 7.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1239013671875, -0.11947250366210938, -0.11504364013671875, -0.11061477661132812, -0.1061859130859375, -0.10175704956054688, -0.09732818603515625, -0.09289932250976562, -0.088470458984375, -0.08404159545898438, -0.07961273193359375, -0.07518386840820312, -0.0707550048828125, -0.06632614135742188, -0.06189727783203125, -0.057468414306640625, -0.05303955078125, -0.048610687255859375, -0.04418182373046875, -0.039752960205078125, -0.0353240966796875, -0.030895233154296875, -0.02646636962890625, -0.022037506103515625, -0.017608642578125, -0.013179779052734375, -0.00875091552734375, -0.004322052001953125, 0.0001068115234375, 0.004535675048828125, 0.00896453857421875, 0.013393402099609375, 0.017822265625, 0.022251129150390625, 0.02667999267578125, 0.031108856201171875, 0.0355377197265625, 0.039966583251953125, 0.04439544677734375, 0.048824310302734375, 0.053253173828125, 0.057682037353515625, 0.06211090087890625, 0.06653976440429688, 0.0709686279296875, 0.07539749145507812, 0.07982635498046875, 0.08425521850585938, 0.08868408203125, 0.09311294555664062, 0.09754180908203125, 0.10197067260742188, 0.1063995361328125, 0.11082839965820312, 0.11525726318359375, 0.11968612670898438, 0.124114990234375, 0.12854385375976562, 0.13297271728515625, 0.13740158081054688, 0.1418304443359375, 0.14625930786132812, 0.15068817138671875, 0.15511703491210938, 0.1595458984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.key.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 8.0, 5.0, 8.0, 14.0, 12.0, 14.0, 15.0, 14.0, 20.0, 19.0, 25.0, 21.0, 41.0, 33.0, 40.0, 36.0, 36.0, 37.0, 39.0, 33.0, 42.0, 46.0, 38.0, 42.0, 47.0, 44.0, 40.0, 29.0, 34.0, 29.0, 10.0, 17.0, 18.0, 17.0, 16.0, 14.0, 9.0, 10.0, 8.0, 8.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3709068298339844e-05, -1.322571188211441e-05, -1.2742355465888977e-05, -1.2258999049663544e-05, -1.177564263343811e-05, -1.1292286217212677e-05, -1.0808929800987244e-05, -1.032557338476181e-05, -9.842216968536377e-06, -9.358860552310944e-06, -8.87550413608551e-06, -8.392147719860077e-06, -7.908791303634644e-06, -7.42543488740921e-06, -6.942078471183777e-06, -6.4587220549583435e-06, -5.97536563873291e-06, -5.492009222507477e-06, -5.0086528062820435e-06, -4.52529639005661e-06, -4.041939973831177e-06, -3.5585835576057434e-06, -3.07522714138031e-06, -2.5918707251548767e-06, -2.1085143089294434e-06, -1.62515789270401e-06, -1.1418014764785767e-06, -6.584450602531433e-07, -1.7508864402770996e-07, 3.082677721977234e-07, 7.916241884231567e-07, 1.27498060464859e-06, 1.7583370208740234e-06, 2.2416934370994568e-06, 2.72504985332489e-06, 3.2084062695503235e-06, 3.691762685775757e-06, 4.17511910200119e-06, 4.6584755182266235e-06, 5.141831934452057e-06, 5.62518835067749e-06, 6.108544766902924e-06, 6.591901183128357e-06, 7.07525759935379e-06, 7.558614015579224e-06, 8.041970431804657e-06, 8.52532684803009e-06, 9.008683264255524e-06, 9.492039680480957e-06, 9.97539609670639e-06, 1.0458752512931824e-05, 1.0942108929157257e-05, 1.142546534538269e-05, 1.1908821761608124e-05, 1.2392178177833557e-05, 1.287553459405899e-05, 1.3358891010284424e-05, 1.3842247426509857e-05, 1.432560384273529e-05, 1.4808960258960724e-05, 1.5292316675186157e-05, 1.577567309141159e-05, 1.6259029507637024e-05, 1.6742385923862457e-05, 1.722574234008789e-05]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 12.0, 8.0, 10.0, 28.0, 28.0, 48.0, 77.0, 109.0, 179.0, 271.0, 466.0, 616.0, 1077.0, 1704.0, 2758.0, 4774.0, 7850.0, 13115.0, 22629.0, 38990.0, 66707.0, 110457.0, 164014.0, 191656.0, 159762.0, 106611.0, 64029.0, 37358.0, 21464.0, 12611.0, 7439.0, 4481.0, 2680.0, 1716.0, 967.0, 648.0, 416.0, 233.0, 211.0, 102.0, 85.0, 46.0, 33.0, 26.0, 17.0, 9.0, 13.0, 6.0, 5.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0582275390625, -0.056433677673339844, -0.05463981628417969, -0.05284595489501953, -0.051052093505859375, -0.04925823211669922, -0.04746437072753906, -0.045670509338378906, -0.04387664794921875, -0.042082786560058594, -0.04028892517089844, -0.03849506378173828, -0.036701202392578125, -0.03490734100341797, -0.03311347961425781, -0.031319618225097656, -0.0295257568359375, -0.027731895446777344, -0.025938034057617188, -0.02414417266845703, -0.022350311279296875, -0.02055644989013672, -0.018762588500976562, -0.016968727111816406, -0.01517486572265625, -0.013381004333496094, -0.011587142944335938, -0.009793281555175781, -0.007999420166015625, -0.006205558776855469, -0.0044116973876953125, -0.0026178359985351562, -0.000823974609375, 0.0009698867797851562, 0.0027637481689453125, 0.004557609558105469, 0.006351470947265625, 0.008145332336425781, 0.009939193725585938, 0.011733055114746094, 0.01352691650390625, 0.015320777893066406, 0.017114639282226562, 0.01890850067138672, 0.020702362060546875, 0.02249622344970703, 0.024290084838867188, 0.026083946228027344, 0.0278778076171875, 0.029671669006347656, 0.03146553039550781, 0.03325939178466797, 0.035053253173828125, 0.03684711456298828, 0.03864097595214844, 0.040434837341308594, 0.04222869873046875, 0.044022560119628906, 0.04581642150878906, 0.04761028289794922, 0.049404144287109375, 0.05119800567626953, 0.05299186706542969, 0.054785728454589844, 0.05657958984375]}, "gradients/decoder.bert.encoder.layer.11.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 7.0, 14.0, 23.0, 21.0, 37.0, 48.0, 54.0, 67.0, 93.0, 82.0, 79.0, 90.0, 72.0, 81.0, 49.0, 40.0, 28.0, 27.0, 19.0, 13.0, 12.0, 6.0, 6.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02734375, -0.026546716690063477, -0.025749683380126953, -0.02495265007019043, -0.024155616760253906, -0.023358583450317383, -0.02256155014038086, -0.021764516830444336, -0.020967483520507812, -0.02017045021057129, -0.019373416900634766, -0.018576383590698242, -0.01777935028076172, -0.016982316970825195, -0.016185283660888672, -0.015388250350952148, -0.014591217041015625, -0.013794183731079102, -0.012997150421142578, -0.012200117111206055, -0.011403083801269531, -0.010606050491333008, -0.009809017181396484, -0.009011983871459961, -0.008214950561523438, -0.007417917251586914, -0.006620883941650391, -0.005823850631713867, -0.005026817321777344, -0.00422978401184082, -0.003432750701904297, -0.0026357173919677734, -0.00183868408203125, -0.0010416507720947266, -0.0002446174621582031, 0.0005524158477783203, 0.0013494491577148438, 0.002146482467651367, 0.0029435157775878906, 0.003740549087524414, 0.0045375823974609375, 0.005334615707397461, 0.006131649017333984, 0.006928682327270508, 0.007725715637207031, 0.008522748947143555, 0.009319782257080078, 0.010116815567016602, 0.010913848876953125, 0.011710882186889648, 0.012507915496826172, 0.013304948806762695, 0.014101982116699219, 0.014899015426635742, 0.015696048736572266, 0.01649308204650879, 0.017290115356445312, 0.018087148666381836, 0.01888418197631836, 0.019681215286254883, 0.020478248596191406, 0.02127528190612793, 0.022072315216064453, 0.022869348526000977, 0.0236663818359375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 6.0, 8.0, 12.0, 16.0, 11.0, 19.0, 19.0, 27.0, 26.0, 46.0, 41.0, 51.0, 53.0, 56.0, 64.0, 63.0, 57.0, 57.0, 48.0, 54.0, 41.0, 34.0, 22.0, 30.0, 24.0, 20.0, 13.0, 11.0, 10.0, 10.0, 9.0, 3.0, 4.0, 9.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.615414142608643, -4.485564231872559, -4.355713844299316, -4.225863933563232, -4.096014022827148, -3.9661636352539062, -3.8363137245178223, -3.706463575363159, -3.576613426208496, -3.446763277053833, -3.316913366317749, -3.187063217163086, -3.057213068008423, -2.9273629188537598, -2.797513008117676, -2.6676628589630127, -2.5378129482269287, -2.4079627990722656, -2.2781128883361816, -2.1482627391815186, -2.0184125900268555, -1.888562560081482, -1.7587125301361084, -1.6288623809814453, -1.4990123510360718, -1.3691623210906982, -1.2393121719360352, -1.1094621419906616, -0.9796120524406433, -0.849761962890625, -0.7199119329452515, -0.5900618433952332, -0.46021151542663574, -0.33036142587661743, -0.2005113661289215, -0.07066130638122559, 0.059188783168792725, 0.18903887271881104, 0.31888890266418457, 0.4487389922142029, 0.5785890817642212, 0.7084391713142395, 0.8382892608642578, 0.9681392908096313, 1.0979893207550049, 1.227839469909668, 1.3576894998550415, 1.487539529800415, 1.6173896789550781, 1.7472397089004517, 1.8770898580551147, 2.0069398880004883, 2.1367900371551514, 2.2666401863098145, 2.3964900970458984, 2.5263402462005615, 2.6561903953552246, 2.7860405445098877, 2.9158904552459717, 3.0457406044006348, 3.175590753555298, 3.305440902709961, 3.435290813446045, 3.565140962600708, 3.694990873336792]}, "gradients/decoder.bert.encoder.layer.11.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 3.0, 6.0, 12.0, 8.0, 16.0, 12.0, 11.0, 18.0, 10.0, 13.0, 27.0, 26.0, 27.0, 34.0, 41.0, 30.0, 44.0, 36.0, 43.0, 46.0, 47.0, 42.0, 45.0, 37.0, 40.0, 48.0, 39.0, 37.0, 40.0, 30.0, 18.0, 23.0, 12.0, 13.0, 14.0, 12.0, 9.0, 1.0, 6.0, 4.0, 9.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.592935085296631, -2.507789134979248, -2.4226431846618652, -2.3374974727630615, -2.2523515224456787, -2.167205572128296, -2.082059621810913, -1.9969137907028198, -1.9117679595947266, -1.8266220092773438, -1.7414761781692505, -1.6563302278518677, -1.5711843967437744, -1.4860384464263916, -1.4008924961090088, -1.3157466650009155, -1.2306007146835327, -1.14545476436615, -1.0603089332580566, -0.9751629829406738, -0.8900171518325806, -0.8048712015151978, -0.7197253108024597, -0.6345794200897217, -0.5494335293769836, -0.4642876386642456, -0.37914174795150757, -0.29399582743644714, -0.2088499367237091, -0.12370404601097107, -0.038558125495910645, 0.04658776521682739, 0.13173365592956543, 0.21687954664230347, 0.3020254373550415, 0.38717135787010193, 0.47231724858283997, 0.5574631690979004, 0.6426090598106384, 0.7277549505233765, 0.8129008412361145, 0.8980467319488525, 0.9831926226615906, 1.0683385133743286, 1.1534844636917114, 1.2386302947998047, 1.3237762451171875, 1.4089221954345703, 1.4940680265426636, 1.5792139768600464, 1.6643598079681396, 1.7495057582855225, 1.8346515893936157, 1.9197975397109985, 2.004943370819092, 2.0900893211364746, 2.1752352714538574, 2.2603812217712402, 2.345527172088623, 2.4306728839874268, 2.5158188343048096, 2.6009647846221924, 2.686110734939575, 2.771256446838379, 2.8564023971557617]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 12.0, 8.0, 20.0, 22.0, 49.0, 52.0, 98.0, 150.0, 213.0, 337.0, 549.0, 877.0, 1357.0, 2396.0, 4162.0, 7593.0, 14313.0, 27009.0, 51777.0, 95480.0, 156596.0, 204335.0, 189142.0, 130639.0, 74832.0, 40063.0, 20976.0, 10979.0, 6037.0, 3355.0, 1978.0, 1206.0, 675.0, 454.0, 296.0, 164.0, 102.0, 92.0, 48.0, 41.0, 17.0, 18.0, 11.0, 6.0, 4.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.384765625, -3.2783203125, -3.171875, -3.0654296875, -2.958984375, -2.8525390625, -2.74609375, -2.6396484375, -2.533203125, -2.4267578125, -2.3203125, -2.2138671875, -2.107421875, -2.0009765625, -1.89453125, -1.7880859375, -1.681640625, -1.5751953125, -1.46875, -1.3623046875, -1.255859375, -1.1494140625, -1.04296875, -0.9365234375, -0.830078125, -0.7236328125, -0.6171875, -0.5107421875, -0.404296875, -0.2978515625, -0.19140625, -0.0849609375, 0.021484375, 0.1279296875, 0.234375, 0.3408203125, 0.447265625, 0.5537109375, 0.66015625, 0.7666015625, 0.873046875, 0.9794921875, 1.0859375, 1.1923828125, 1.298828125, 1.4052734375, 1.51171875, 1.6181640625, 1.724609375, 1.8310546875, 1.9375, 2.0439453125, 2.150390625, 2.2568359375, 2.36328125, 2.4697265625, 2.576171875, 2.6826171875, 2.7890625, 2.8955078125, 3.001953125, 3.1083984375, 3.21484375, 3.3212890625, 3.427734375]}, "gradients/decoder.bert.encoder.layer.11.attention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 8.0, 12.0, 5.0, 13.0, 15.0, 10.0, 21.0, 21.0, 16.0, 26.0, 36.0, 25.0, 30.0, 26.0, 47.0, 33.0, 43.0, 30.0, 46.0, 42.0, 34.0, 43.0, 50.0, 39.0, 53.0, 21.0, 27.0, 30.0, 26.0, 24.0, 17.0, 21.0, 10.0, 13.0, 12.0, 9.0, 8.0, 5.0, 4.0, 6.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.796875, -2.7100830078125, -2.623291015625, -2.5364990234375, -2.44970703125, -2.3629150390625, -2.276123046875, -2.1893310546875, -2.1025390625, -2.0157470703125, -1.928955078125, -1.8421630859375, -1.75537109375, -1.6685791015625, -1.581787109375, -1.4949951171875, -1.408203125, -1.3214111328125, -1.234619140625, -1.1478271484375, -1.06103515625, -0.9742431640625, -0.887451171875, -0.8006591796875, -0.7138671875, -0.6270751953125, -0.540283203125, -0.4534912109375, -0.36669921875, -0.2799072265625, -0.193115234375, -0.1063232421875, -0.01953125, 0.0672607421875, 0.154052734375, 0.2408447265625, 0.32763671875, 0.4144287109375, 0.501220703125, 0.5880126953125, 0.6748046875, 0.7615966796875, 0.848388671875, 0.9351806640625, 1.02197265625, 1.1087646484375, 1.195556640625, 1.2823486328125, 1.369140625, 1.4559326171875, 1.542724609375, 1.6295166015625, 1.71630859375, 1.8031005859375, 1.889892578125, 1.9766845703125, 2.0634765625, 2.1502685546875, 2.237060546875, 2.3238525390625, 2.41064453125, 2.4974365234375, 2.584228515625, 2.6710205078125, 2.7578125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 1.0, 4.0, 8.0, 12.0, 20.0, 28.0, 61.0, 88.0, 179.0, 270.0, 496.0, 954.0, 1703.0, 3367.0, 6769.0, 13599.0, 27218.0, 54835.0, 105702.0, 177670.0, 223102.0, 189862.0, 118262.0, 62079.0, 31096.0, 15294.0, 7641.0, 3918.0, 2015.0, 1045.0, 521.0, 315.0, 169.0, 90.0, 58.0, 32.0, 23.0, 18.0, 11.0, 12.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.60546875, -3.48760986328125, -3.3697509765625, -3.25189208984375, -3.134033203125, -3.01617431640625, -2.8983154296875, -2.78045654296875, -2.66259765625, -2.54473876953125, -2.4268798828125, -2.30902099609375, -2.191162109375, -2.07330322265625, -1.9554443359375, -1.83758544921875, -1.7197265625, -1.60186767578125, -1.4840087890625, -1.36614990234375, -1.248291015625, -1.13043212890625, -1.0125732421875, -0.89471435546875, -0.77685546875, -0.65899658203125, -0.5411376953125, -0.42327880859375, -0.305419921875, -0.18756103515625, -0.0697021484375, 0.04815673828125, 0.166015625, 0.28387451171875, 0.4017333984375, 0.51959228515625, 0.637451171875, 0.75531005859375, 0.8731689453125, 0.99102783203125, 1.10888671875, 1.22674560546875, 1.3446044921875, 1.46246337890625, 1.580322265625, 1.69818115234375, 1.8160400390625, 1.93389892578125, 2.0517578125, 2.16961669921875, 2.2874755859375, 2.40533447265625, 2.523193359375, 2.64105224609375, 2.7589111328125, 2.87677001953125, 2.99462890625, 3.11248779296875, 3.2303466796875, 3.34820556640625, 3.466064453125, 3.58392333984375, 3.7017822265625, 3.81964111328125, 3.9375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 1.0, 6.0, 4.0, 3.0, 4.0, 11.0, 9.0, 14.0, 6.0, 10.0, 14.0, 10.0, 25.0, 20.0, 17.0, 17.0, 34.0, 24.0, 39.0, 32.0, 26.0, 34.0, 39.0, 45.0, 40.0, 26.0, 48.0, 42.0, 31.0, 31.0, 35.0, 36.0, 33.0, 26.0, 25.0, 23.0, 38.0, 19.0, 11.0, 17.0, 20.0, 10.0, 7.0, 8.0, 12.0, 6.0, 3.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-1.6494140625, -1.599700927734375, -1.54998779296875, -1.500274658203125, -1.4505615234375, -1.400848388671875, -1.35113525390625, -1.301422119140625, -1.251708984375, -1.201995849609375, -1.15228271484375, -1.102569580078125, -1.0528564453125, -1.003143310546875, -0.95343017578125, -0.903717041015625, -0.85400390625, -0.804290771484375, -0.75457763671875, -0.704864501953125, -0.6551513671875, -0.605438232421875, -0.55572509765625, -0.506011962890625, -0.456298828125, -0.406585693359375, -0.35687255859375, -0.307159423828125, -0.2574462890625, -0.207733154296875, -0.15802001953125, -0.108306884765625, -0.05859375, -0.008880615234375, 0.04083251953125, 0.090545654296875, 0.1402587890625, 0.189971923828125, 0.23968505859375, 0.289398193359375, 0.339111328125, 0.388824462890625, 0.43853759765625, 0.488250732421875, 0.5379638671875, 0.587677001953125, 0.63739013671875, 0.687103271484375, 0.73681640625, 0.786529541015625, 0.83624267578125, 0.885955810546875, 0.9356689453125, 0.985382080078125, 1.03509521484375, 1.084808349609375, 1.134521484375, 1.184234619140625, 1.23394775390625, 1.283660888671875, 1.3333740234375, 1.383087158203125, 1.43280029296875, 1.482513427734375, 1.5322265625]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 7.0, 9.0, 20.0, 21.0, 26.0, 32.0, 52.0, 56.0, 107.0, 159.0, 198.0, 278.0, 406.0, 774.0, 1257.0, 2260.0, 4837.0, 13036.0, 47725.0, 205549.0, 457208.0, 232842.0, 55723.0, 14656.0, 5211.0, 2447.0, 1304.0, 763.0, 506.0, 348.0, 205.0, 159.0, 117.0, 71.0, 50.0, 37.0, 34.0, 18.0, 9.0, 7.0, 10.0, 7.0, 4.0, 1.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.42578125, -3.31719970703125, -3.2086181640625, -3.10003662109375, -2.991455078125, -2.88287353515625, -2.7742919921875, -2.66571044921875, -2.55712890625, -2.44854736328125, -2.3399658203125, -2.23138427734375, -2.122802734375, -2.01422119140625, -1.9056396484375, -1.79705810546875, -1.6884765625, -1.57989501953125, -1.4713134765625, -1.36273193359375, -1.254150390625, -1.14556884765625, -1.0369873046875, -0.92840576171875, -0.81982421875, -0.71124267578125, -0.6026611328125, -0.49407958984375, -0.385498046875, -0.27691650390625, -0.1683349609375, -0.05975341796875, 0.048828125, 0.15740966796875, 0.2659912109375, 0.37457275390625, 0.483154296875, 0.59173583984375, 0.7003173828125, 0.80889892578125, 0.91748046875, 1.02606201171875, 1.1346435546875, 1.24322509765625, 1.351806640625, 1.46038818359375, 1.5689697265625, 1.67755126953125, 1.7861328125, 1.89471435546875, 2.0032958984375, 2.11187744140625, 2.220458984375, 2.32904052734375, 2.4376220703125, 2.54620361328125, 2.65478515625, 2.76336669921875, 2.8719482421875, 2.98052978515625, 3.089111328125, 3.19769287109375, 3.3062744140625, 3.41485595703125, 3.5234375]}, "gradients/decoder.bert.encoder.layer.11.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 10.0, 3.0, 14.0, 28.0, 41.0, 60.0, 85.0, 89.0, 128.0, 127.0, 95.0, 101.0, 64.0, 55.0, 34.0, 24.0, 9.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023293495178222656, -0.00022500008344650269, -0.0002170652151107788, -0.00020913034677505493, -0.00020119547843933105, -0.00019326061010360718, -0.0001853257417678833, -0.00017739087343215942, -0.00016945600509643555, -0.00016152113676071167, -0.0001535862684249878, -0.00014565140008926392, -0.00013771653175354004, -0.00012978166341781616, -0.00012184679508209229, -0.00011391192674636841, -0.00010597705841064453, -9.804219007492065e-05, -9.010732173919678e-05, -8.21724534034729e-05, -7.423758506774902e-05, -6.630271673202515e-05, -5.836784839630127e-05, -5.043298006057739e-05, -4.2498111724853516e-05, -3.456324338912964e-05, -2.6628375053405762e-05, -1.8693506717681885e-05, -1.0758638381958008e-05, -2.823770046234131e-06, 5.111098289489746e-06, 1.3045966625213623e-05, 2.09808349609375e-05, 2.8915703296661377e-05, 3.6850571632385254e-05, 4.478543996810913e-05, 5.272030830383301e-05, 6.0655176639556885e-05, 6.859004497528076e-05, 7.652491331100464e-05, 8.445978164672852e-05, 9.239464998245239e-05, 0.00010032951831817627, 0.00010826438665390015, 0.00011619925498962402, 0.0001241341233253479, 0.00013206899166107178, 0.00014000385999679565, 0.00014793872833251953, 0.0001558735966682434, 0.00016380846500396729, 0.00017174333333969116, 0.00017967820167541504, 0.00018761307001113892, 0.0001955479383468628, 0.00020348280668258667, 0.00021141767501831055, 0.00021935254335403442, 0.0002272874116897583, 0.00023522228002548218, 0.00024315714836120605, 0.00025109201669692993, 0.0002590268850326538, 0.0002669617533683777, 0.00027489662170410156]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 10.0, 9.0, 12.0, 20.0, 25.0, 21.0, 43.0, 71.0, 122.0, 163.0, 272.0, 414.0, 642.0, 1109.0, 1950.0, 3893.0, 8349.0, 20409.0, 56984.0, 158527.0, 316922.0, 282127.0, 123262.0, 42970.0, 15870.0, 6770.0, 3226.0, 1738.0, 982.0, 563.0, 336.0, 239.0, 161.0, 116.0, 68.0, 60.0, 34.0, 20.0, 13.0, 6.0, 11.0, 6.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.4765625, -2.4034423828125, -2.330322265625, -2.2572021484375, -2.18408203125, -2.1109619140625, -2.037841796875, -1.9647216796875, -1.8916015625, -1.8184814453125, -1.745361328125, -1.6722412109375, -1.59912109375, -1.5260009765625, -1.452880859375, -1.3797607421875, -1.306640625, -1.2335205078125, -1.160400390625, -1.0872802734375, -1.01416015625, -0.9410400390625, -0.867919921875, -0.7947998046875, -0.7216796875, -0.6485595703125, -0.575439453125, -0.5023193359375, -0.42919921875, -0.3560791015625, -0.282958984375, -0.2098388671875, -0.13671875, -0.0635986328125, 0.009521484375, 0.0826416015625, 0.15576171875, 0.2288818359375, 0.302001953125, 0.3751220703125, 0.4482421875, 0.5213623046875, 0.594482421875, 0.6676025390625, 0.74072265625, 0.8138427734375, 0.886962890625, 0.9600830078125, 1.033203125, 1.1063232421875, 1.179443359375, 1.2525634765625, 1.32568359375, 1.3988037109375, 1.471923828125, 1.5450439453125, 1.6181640625, 1.6912841796875, 1.764404296875, 1.8375244140625, 1.91064453125, 1.9837646484375, 2.056884765625, 2.1300048828125, 2.203125]}, "gradients/decoder.bert.encoder.layer.11.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 9.0, 13.0, 17.0, 21.0, 32.0, 24.0, 34.0, 41.0, 60.0, 50.0, 63.0, 58.0, 69.0, 64.0, 50.0, 58.0, 46.0, 34.0, 29.0, 22.0, 37.0, 29.0, 24.0, 11.0, 11.0, 14.0, 9.0, 6.0, 10.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.373046875, -0.3606109619140625, -0.348175048828125, -0.3357391357421875, -0.32330322265625, -0.3108673095703125, -0.298431396484375, -0.2859954833984375, -0.2735595703125, -0.2611236572265625, -0.248687744140625, -0.2362518310546875, -0.22381591796875, -0.2113800048828125, -0.198944091796875, -0.1865081787109375, -0.174072265625, -0.1616363525390625, -0.149200439453125, -0.1367645263671875, -0.12432861328125, -0.1118927001953125, -0.099456787109375, -0.0870208740234375, -0.0745849609375, -0.0621490478515625, -0.049713134765625, -0.0372772216796875, -0.02484130859375, -0.0124053955078125, 3.0517578125e-05, 0.0124664306640625, 0.02490234375, 0.0373382568359375, 0.049774169921875, 0.0622100830078125, 0.07464599609375, 0.0870819091796875, 0.099517822265625, 0.1119537353515625, 0.1243896484375, 0.1368255615234375, 0.149261474609375, 0.1616973876953125, 0.17413330078125, 0.1865692138671875, 0.199005126953125, 0.2114410400390625, 0.223876953125, 0.2363128662109375, 0.248748779296875, 0.2611846923828125, 0.27362060546875, 0.2860565185546875, 0.298492431640625, 0.3109283447265625, 0.3233642578125, 0.3358001708984375, 0.348236083984375, 0.3606719970703125, 0.37310791015625, 0.3855438232421875, 0.397979736328125, 0.4104156494140625, 0.4228515625]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 10.0, 16.0, 21.0, 22.0, 36.0, 37.0, 51.0, 45.0, 52.0, 51.0, 72.0, 75.0, 66.0, 61.0, 55.0, 47.0, 49.0, 31.0, 38.0, 29.0, 17.0, 11.0, 13.0, 14.0, 13.0, 5.0, 3.0, 11.0, 0.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.992527484893799, -4.848790168762207, -4.705052852630615, -4.561315536499023, -4.417578220367432, -4.27384090423584, -4.130103588104248, -3.9863665103912354, -3.8426291942596436, -3.6988918781280518, -3.55515456199646, -3.411417245864868, -3.2676801681518555, -3.1239428520202637, -2.980205535888672, -2.83646821975708, -2.6927309036254883, -2.5489935874938965, -2.4052562713623047, -2.261518955230713, -2.117781639099121, -1.9740444421768188, -1.8303072452545166, -1.6865699291229248, -1.542832612991333, -1.3990952968597412, -1.2553579807281494, -1.1116207838058472, -0.9678834676742554, -0.8241461515426636, -0.6804088950157166, -0.5366716384887695, -0.39293432235717773, -0.24919703602790833, -0.10545974969863892, 0.03827753663063049, 0.1820148229598999, 0.3257521390914917, 0.4694893956184387, 0.6132266521453857, 0.7569639682769775, 0.9007012844085693, 1.0444386005401611, 1.1881757974624634, 1.3319131135940552, 1.475650429725647, 1.6193876266479492, 1.763124942779541, 1.9068622589111328, 2.0505995750427246, 2.1943368911743164, 2.338074207305908, 2.4818115234375, 2.625548839569092, 2.7692859172821045, 2.9130232334136963, 3.056760549545288, 3.20049786567688, 3.3442351818084717, 3.4879724979400635, 3.631709575653076, 3.775446891784668, 3.9191842079162598, 4.062921524047852, 4.206658840179443]}, "gradients/decoder.bert.encoder.layer.10.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 10.0, 3.0, 7.0, 6.0, 10.0, 14.0, 12.0, 12.0, 17.0, 20.0, 22.0, 21.0, 24.0, 24.0, 27.0, 27.0, 30.0, 38.0, 42.0, 42.0, 44.0, 35.0, 34.0, 38.0, 44.0, 35.0, 45.0, 41.0, 33.0, 31.0, 25.0, 30.0, 24.0, 26.0, 22.0, 15.0, 12.0, 15.0, 9.0, 5.0, 5.0, 6.0, 6.0, 8.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0], "bins": [-2.913811206817627, -2.8311164379119873, -2.7484216690063477, -2.665726900100708, -2.5830321311950684, -2.5003373622894287, -2.417642593383789, -2.3349475860595703, -2.2522530555725098, -2.16955828666687, -2.0868635177612305, -2.004168748855591, -1.9214739799499512, -1.8387792110443115, -1.7560843229293823, -1.6733895540237427, -1.5906946659088135, -1.5079998970031738, -1.4253051280975342, -1.3426103591918945, -1.2599155902862549, -1.1772208213806152, -1.094525933265686, -1.0118311643600464, -0.9291363954544067, -0.8464416265487671, -0.7637468576431274, -0.681052029132843, -0.5983572602272034, -0.5156624913215637, -0.4329676926136017, -0.35027289390563965, -0.2675778865814209, -0.18488310277462006, -0.10218831896781921, -0.01949353516101837, 0.06320124864578247, 0.14589601755142212, 0.22859081625938416, 0.3112856149673462, 0.39398038387298584, 0.4766751527786255, 0.5593699216842651, 0.6420647501945496, 0.7247595191001892, 0.8074542880058289, 0.8901491165161133, 0.9728438854217529, 1.0555386543273926, 1.1382334232330322, 1.2209281921386719, 1.3036229610443115, 1.3863177299499512, 1.4690124988555908, 1.55170738697052, 1.6344021558761597, 1.7170969247817993, 1.799791693687439, 1.8824864625930786, 1.9651812314987183, 2.0478761196136475, 2.130570888519287, 2.2132656574249268, 2.2959604263305664, 2.378655195236206]}, "gradients/decoder.bert.encoder.layer.10.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 5.0, 1.0, 2.0, 5.0, 7.0, 5.0, 23.0, 12.0, 34.0, 39.0, 62.0, 80.0, 133.0, 200.0, 305.0, 466.0, 748.0, 1133.0, 1989.0, 3382.0, 5994.0, 10817.0, 20320.0, 40412.0, 84921.0, 195216.0, 496890.0, 1133539.0, 1220581.0, 571054.0, 220362.0, 94121.0, 44198.0, 21728.0, 11151.0, 6090.0, 3384.0, 1907.0, 1144.0, 702.0, 416.0, 249.0, 156.0, 95.0, 70.0, 45.0, 30.0, 19.0, 21.0, 11.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-5.13671875, -4.990234375, -4.84375, -4.697265625, -4.55078125, -4.404296875, -4.2578125, -4.111328125, -3.96484375, -3.818359375, -3.671875, -3.525390625, -3.37890625, -3.232421875, -3.0859375, -2.939453125, -2.79296875, -2.646484375, -2.5, -2.353515625, -2.20703125, -2.060546875, -1.9140625, -1.767578125, -1.62109375, -1.474609375, -1.328125, -1.181640625, -1.03515625, -0.888671875, -0.7421875, -0.595703125, -0.44921875, -0.302734375, -0.15625, -0.009765625, 0.13671875, 0.283203125, 0.4296875, 0.576171875, 0.72265625, 0.869140625, 1.015625, 1.162109375, 1.30859375, 1.455078125, 1.6015625, 1.748046875, 1.89453125, 2.041015625, 2.1875, 2.333984375, 2.48046875, 2.626953125, 2.7734375, 2.919921875, 3.06640625, 3.212890625, 3.359375, 3.505859375, 3.65234375, 3.798828125, 3.9453125, 4.091796875, 4.23828125]}, "gradients/decoder.bert.encoder.layer.10.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 5.0, 10.0, 10.0, 8.0, 18.0, 10.0, 9.0, 15.0, 15.0, 23.0, 17.0, 26.0, 35.0, 45.0, 33.0, 39.0, 33.0, 43.0, 50.0, 46.0, 44.0, 49.0, 47.0, 30.0, 27.0, 32.0, 35.0, 43.0, 25.0, 29.0, 25.0, 29.0, 18.0, 19.0, 8.0, 9.0, 7.0, 6.0, 6.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.30078125, -2.231292724609375, -2.16180419921875, -2.092315673828125, -2.0228271484375, -1.953338623046875, -1.88385009765625, -1.814361572265625, -1.744873046875, -1.675384521484375, -1.60589599609375, -1.536407470703125, -1.4669189453125, -1.397430419921875, -1.32794189453125, -1.258453369140625, -1.18896484375, -1.119476318359375, -1.04998779296875, -0.980499267578125, -0.9110107421875, -0.841522216796875, -0.77203369140625, -0.702545166015625, -0.633056640625, -0.563568115234375, -0.49407958984375, -0.424591064453125, -0.3551025390625, -0.285614013671875, -0.21612548828125, -0.146636962890625, -0.0771484375, -0.007659912109375, 0.06182861328125, 0.131317138671875, 0.2008056640625, 0.270294189453125, 0.33978271484375, 0.409271240234375, 0.478759765625, 0.548248291015625, 0.61773681640625, 0.687225341796875, 0.7567138671875, 0.826202392578125, 0.89569091796875, 0.965179443359375, 1.03466796875, 1.104156494140625, 1.17364501953125, 1.243133544921875, 1.3126220703125, 1.382110595703125, 1.45159912109375, 1.521087646484375, 1.590576171875, 1.660064697265625, 1.72955322265625, 1.799041748046875, 1.8685302734375, 1.938018798828125, 2.00750732421875, 2.076995849609375, 2.146484375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 11.0, 14.0, 15.0, 33.0, 47.0, 83.0, 113.0, 150.0, 203.0, 338.0, 511.0, 797.0, 1266.0, 2037.0, 3327.0, 5225.0, 8822.0, 14665.0, 25899.0, 45744.0, 83516.0, 158130.0, 308328.0, 597766.0, 968742.0, 893252.0, 511557.0, 261149.0, 134853.0, 71926.0, 39815.0, 22429.0, 12958.0, 7747.0, 4658.0, 2962.0, 1818.0, 1185.0, 753.0, 499.0, 341.0, 206.0, 144.0, 90.0, 52.0, 35.0, 30.0, 18.0, 14.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.9501953125, -3.822265625, -3.6943359375, -3.56640625, -3.4384765625, -3.310546875, -3.1826171875, -3.0546875, -2.9267578125, -2.798828125, -2.6708984375, -2.54296875, -2.4150390625, -2.287109375, -2.1591796875, -2.03125, -1.9033203125, -1.775390625, -1.6474609375, -1.51953125, -1.3916015625, -1.263671875, -1.1357421875, -1.0078125, -0.8798828125, -0.751953125, -0.6240234375, -0.49609375, -0.3681640625, -0.240234375, -0.1123046875, 0.015625, 0.1435546875, 0.271484375, 0.3994140625, 0.52734375, 0.6552734375, 0.783203125, 0.9111328125, 1.0390625, 1.1669921875, 1.294921875, 1.4228515625, 1.55078125, 1.6787109375, 1.806640625, 1.9345703125, 2.0625, 2.1904296875, 2.318359375, 2.4462890625, 2.57421875, 2.7021484375, 2.830078125, 2.9580078125, 3.0859375, 3.2138671875, 3.341796875, 3.4697265625, 3.59765625, 3.7255859375, 3.853515625, 3.9814453125, 4.109375]}, "gradients/decoder.bert.encoder.layer.10.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 9.0, 9.0, 15.0, 13.0, 15.0, 26.0, 33.0, 45.0, 49.0, 67.0, 66.0, 102.0, 122.0, 130.0, 170.0, 189.0, 242.0, 295.0, 302.0, 300.0, 267.0, 243.0, 233.0, 210.0, 176.0, 161.0, 119.0, 93.0, 66.0, 75.0, 50.0, 52.0, 35.0, 21.0, 15.0, 22.0, 9.0, 10.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3837890625, -1.3425445556640625, -1.301300048828125, -1.2600555419921875, -1.21881103515625, -1.1775665283203125, -1.136322021484375, -1.0950775146484375, -1.0538330078125, -1.0125885009765625, -0.971343994140625, -0.9300994873046875, -0.88885498046875, -0.8476104736328125, -0.806365966796875, -0.7651214599609375, -0.723876953125, -0.6826324462890625, -0.641387939453125, -0.6001434326171875, -0.55889892578125, -0.5176544189453125, -0.476409912109375, -0.4351654052734375, -0.3939208984375, -0.3526763916015625, -0.311431884765625, -0.2701873779296875, -0.22894287109375, -0.1876983642578125, -0.146453857421875, -0.1052093505859375, -0.06396484375, -0.0227203369140625, 0.018524169921875, 0.0597686767578125, 0.10101318359375, 0.1422576904296875, 0.183502197265625, 0.2247467041015625, 0.2659912109375, 0.3072357177734375, 0.348480224609375, 0.3897247314453125, 0.43096923828125, 0.4722137451171875, 0.513458251953125, 0.5547027587890625, 0.595947265625, 0.6371917724609375, 0.678436279296875, 0.7196807861328125, 0.76092529296875, 0.8021697998046875, 0.843414306640625, 0.8846588134765625, 0.9259033203125, 0.9671478271484375, 1.008392333984375, 1.0496368408203125, 1.09088134765625, 1.1321258544921875, 1.173370361328125, 1.2146148681640625, 1.255859375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 2.0, 6.0, 12.0, 12.0, 13.0, 35.0, 25.0, 36.0, 47.0, 69.0, 58.0, 73.0, 60.0, 85.0, 68.0, 51.0, 63.0, 50.0, 36.0, 30.0, 29.0, 23.0, 20.0, 13.0, 14.0, 11.0, 8.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.848748683929443, -5.6829633712768555, -5.517178058624268, -5.35139274597168, -5.185607433319092, -5.019822120666504, -4.854036808013916, -4.688251495361328, -4.522466659545898, -4.3566813468933105, -4.190896034240723, -4.025110721588135, -3.859325408935547, -3.693540096282959, -3.52775502204895, -3.3619697093963623, -3.1961841583251953, -3.0303988456726074, -2.8646135330200195, -2.6988282203674316, -2.5330429077148438, -2.367257595062256, -2.201472520828247, -2.035687208175659, -1.8699018955230713, -1.7041165828704834, -1.5383312702178955, -1.3725460767745972, -1.2067607641220093, -1.0409754514694214, -0.8751901984214783, -0.7094049453735352, -0.5436191558837891, -0.37783387303352356, -0.21204859018325806, -0.046263307332992554, 0.11952197551727295, 0.28530728816986084, 0.45109254121780396, 0.6168777942657471, 0.782663106918335, 0.9484484195709229, 1.1142337322235107, 1.280018925666809, 1.445804238319397, 1.6115895509719849, 1.7773747444152832, 1.943160057067871, 2.108945369720459, 2.274730682373047, 2.4405159950256348, 2.6063013076782227, 2.7720866203308105, 2.9378719329833984, 3.1036570072174072, 3.269442319869995, 3.435227632522583, 3.601012945175171, 3.766798257827759, 3.9325835704803467, 4.0983686447143555, 4.264153957366943, 4.429939270019531, 4.595724582672119, 4.761509895324707]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 6.0, 8.0, 12.0, 16.0, 10.0, 6.0, 26.0, 20.0, 16.0, 24.0, 32.0, 36.0, 34.0, 34.0, 46.0, 39.0, 42.0, 47.0, 37.0, 39.0, 50.0, 39.0, 33.0, 43.0, 33.0, 40.0, 28.0, 27.0, 24.0, 28.0, 25.0, 16.0, 11.0, 13.0, 11.0, 11.0, 5.0, 2.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.831474542617798, -2.7447054386138916, -2.6579365730285645, -2.571167469024658, -2.484398365020752, -2.3976292610168457, -2.3108603954315186, -2.2240912914276123, -2.137322425842285, -2.050553321838379, -1.9637843370437622, -1.8770153522491455, -1.7902462482452393, -1.7034772634506226, -1.6167082786560059, -1.5299391746520996, -1.4431700706481934, -1.3564010858535767, -1.2696319818496704, -1.1828629970550537, -1.0960938930511475, -1.0093249082565308, -0.9225559234619141, -0.8357868790626526, -0.7490178346633911, -0.6622487902641296, -0.5754797458648682, -0.48871076107025146, -0.40194171667099, -0.3151726722717285, -0.22840368747711182, -0.14163464307785034, -0.05486559867858887, 0.031903430819511414, 0.1186724603176117, 0.20544147491455078, 0.29221051931381226, 0.37897956371307373, 0.46574854850769043, 0.5525175929069519, 0.6392866373062134, 0.7260556817054749, 0.8128247261047363, 0.899593710899353, 0.9863627552986145, 1.073131799697876, 1.1599007844924927, 1.2466697692871094, 1.3334388732910156, 1.4202078580856323, 1.5069769620895386, 1.5937459468841553, 1.6805150508880615, 1.7672840356826782, 1.854053020477295, 1.9408221244812012, 2.0275912284851074, 2.1143603324890137, 2.201129198074341, 2.287898302078247, 2.3746674060821533, 2.4614362716674805, 2.5482053756713867, 2.634974479675293, 2.72174334526062]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 7.0, 12.0, 14.0, 19.0, 31.0, 50.0, 79.0, 122.0, 182.0, 270.0, 428.0, 714.0, 1053.0, 1669.0, 2665.0, 4493.0, 7487.0, 12709.0, 22244.0, 40753.0, 76440.0, 141034.0, 223254.0, 216572.0, 133689.0, 71984.0, 38784.0, 21223.0, 12218.0, 7186.0, 4271.0, 2489.0, 1582.0, 1039.0, 659.0, 391.0, 267.0, 157.0, 103.0, 79.0, 51.0, 21.0, 22.0, 16.0, 6.0, 11.0, 5.0, 1.0, 3.0, 3.0, 2.0], "bins": [-0.428466796875, -0.4165496826171875, -0.404632568359375, -0.3927154541015625, -0.38079833984375, -0.3688812255859375, -0.356964111328125, -0.3450469970703125, -0.3331298828125, -0.3212127685546875, -0.309295654296875, -0.2973785400390625, -0.28546142578125, -0.2735443115234375, -0.261627197265625, -0.2497100830078125, -0.23779296875, -0.2258758544921875, -0.213958740234375, -0.2020416259765625, -0.19012451171875, -0.1782073974609375, -0.166290283203125, -0.1543731689453125, -0.1424560546875, -0.1305389404296875, -0.118621826171875, -0.1067047119140625, -0.09478759765625, -0.0828704833984375, -0.070953369140625, -0.0590362548828125, -0.047119140625, -0.0352020263671875, -0.023284912109375, -0.0113677978515625, 0.00054931640625, 0.0124664306640625, 0.024383544921875, 0.0363006591796875, 0.0482177734375, 0.0601348876953125, 0.072052001953125, 0.0839691162109375, 0.09588623046875, 0.1078033447265625, 0.119720458984375, 0.1316375732421875, 0.1435546875, 0.1554718017578125, 0.167388916015625, 0.1793060302734375, 0.19122314453125, 0.2031402587890625, 0.215057373046875, 0.2269744873046875, 0.2388916015625, 0.2508087158203125, 0.262725830078125, 0.2746429443359375, 0.28656005859375, 0.2984771728515625, 0.310394287109375, 0.3223114013671875, 0.334228515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 7.0, 12.0, 13.0, 19.0, 14.0, 18.0, 22.0, 32.0, 32.0, 35.0, 40.0, 49.0, 42.0, 53.0, 54.0, 48.0, 58.0, 46.0, 47.0, 36.0, 45.0, 39.0, 35.0, 39.0, 31.0, 29.0, 21.0, 17.0, 12.0, 13.0, 14.0, 5.0, 3.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.11328125, -3.002471923828125, -2.89166259765625, -2.780853271484375, -2.6700439453125, -2.559234619140625, -2.44842529296875, -2.337615966796875, -2.226806640625, -2.115997314453125, -2.00518798828125, -1.894378662109375, -1.7835693359375, -1.672760009765625, -1.56195068359375, -1.451141357421875, -1.34033203125, -1.229522705078125, -1.11871337890625, -1.007904052734375, -0.8970947265625, -0.786285400390625, -0.67547607421875, -0.564666748046875, -0.453857421875, -0.343048095703125, -0.23223876953125, -0.121429443359375, -0.0106201171875, 0.100189208984375, 0.21099853515625, 0.321807861328125, 0.4326171875, 0.543426513671875, 0.65423583984375, 0.765045166015625, 0.8758544921875, 0.986663818359375, 1.09747314453125, 1.208282470703125, 1.319091796875, 1.429901123046875, 1.54071044921875, 1.651519775390625, 1.7623291015625, 1.873138427734375, 1.98394775390625, 2.094757080078125, 2.20556640625, 2.316375732421875, 2.42718505859375, 2.537994384765625, 2.6488037109375, 2.759613037109375, 2.87042236328125, 2.981231689453125, 3.092041015625, 3.202850341796875, 3.31365966796875, 3.424468994140625, 3.5352783203125, 3.646087646484375, 3.75689697265625, 3.867706298828125, 3.978515625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 4.0, 10.0, 28.0, 27.0, 41.0, 54.0, 81.0, 108.0, 190.0, 267.0, 412.0, 738.0, 1230.0, 2166.0, 4242.0, 9431.0, 23597.0, 180019.0, 766428.0, 35348.0, 12237.0, 5434.0, 2809.0, 1433.0, 823.0, 490.0, 318.0, 191.0, 123.0, 71.0, 51.0, 44.0, 32.0, 26.0, 13.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 4.0, 4.0], "bins": [-1.4501953125, -1.4111785888671875, -1.372161865234375, -1.3331451416015625, -1.29412841796875, -1.2551116943359375, -1.216094970703125, -1.1770782470703125, -1.1380615234375, -1.0990447998046875, -1.060028076171875, -1.0210113525390625, -0.98199462890625, -0.9429779052734375, -0.903961181640625, -0.8649444580078125, -0.825927734375, -0.7869110107421875, -0.747894287109375, -0.7088775634765625, -0.66986083984375, -0.6308441162109375, -0.591827392578125, -0.5528106689453125, -0.5137939453125, -0.4747772216796875, -0.435760498046875, -0.3967437744140625, -0.35772705078125, -0.3187103271484375, -0.279693603515625, -0.2406768798828125, -0.20166015625, -0.1626434326171875, -0.123626708984375, -0.0846099853515625, -0.04559326171875, -0.0065765380859375, 0.032440185546875, 0.0714569091796875, 0.1104736328125, 0.1494903564453125, 0.188507080078125, 0.2275238037109375, 0.26654052734375, 0.3055572509765625, 0.344573974609375, 0.3835906982421875, 0.422607421875, 0.4616241455078125, 0.500640869140625, 0.5396575927734375, 0.57867431640625, 0.6176910400390625, 0.656707763671875, 0.6957244873046875, 0.7347412109375, 0.7737579345703125, 0.812774658203125, 0.8517913818359375, 0.89080810546875, 0.9298248291015625, 0.968841552734375, 1.0078582763671875, 1.046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 13.0, 8.0, 10.0, 21.0, 19.0, 12.0, 23.0, 29.0, 28.0, 27.0, 34.0, 34.0, 37.0, 32.0, 43.0, 41.0, 52.0, 45.0, 50.0, 43.0, 42.0, 31.0, 36.0, 28.0, 33.0, 28.0, 29.0, 24.0, 20.0, 14.0, 19.0, 13.0, 13.0, 17.0, 9.0, 11.0, 1.0, 11.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8662109375, -1.8038787841796875, -1.741546630859375, -1.6792144775390625, -1.61688232421875, -1.5545501708984375, -1.492218017578125, -1.4298858642578125, -1.3675537109375, -1.3052215576171875, -1.242889404296875, -1.1805572509765625, -1.11822509765625, -1.0558929443359375, -0.993560791015625, -0.9312286376953125, -0.868896484375, -0.8065643310546875, -0.744232177734375, -0.6819000244140625, -0.61956787109375, -0.5572357177734375, -0.494903564453125, -0.4325714111328125, -0.3702392578125, -0.3079071044921875, -0.245574951171875, -0.1832427978515625, -0.12091064453125, -0.0585784912109375, 0.003753662109375, 0.0660858154296875, 0.12841796875, 0.1907501220703125, 0.253082275390625, 0.3154144287109375, 0.37774658203125, 0.4400787353515625, 0.502410888671875, 0.5647430419921875, 0.6270751953125, 0.6894073486328125, 0.751739501953125, 0.8140716552734375, 0.87640380859375, 0.9387359619140625, 1.001068115234375, 1.0634002685546875, 1.125732421875, 1.1880645751953125, 1.250396728515625, 1.3127288818359375, 1.37506103515625, 1.4373931884765625, 1.499725341796875, 1.5620574951171875, 1.6243896484375, 1.6867218017578125, 1.749053955078125, 1.8113861083984375, 1.87371826171875, 1.9360504150390625, 1.998382568359375, 2.0607147216796875, 2.123046875]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 11.0, 6.0, 12.0, 8.0, 19.0, 25.0, 31.0, 52.0, 67.0, 78.0, 126.0, 210.0, 285.0, 482.0, 809.0, 1361.0, 2438.0, 4408.0, 9121.0, 20849.0, 81348.0, 867326.0, 32499.0, 12970.0, 6330.0, 3268.0, 1781.0, 962.0, 568.0, 372.0, 241.0, 143.0, 93.0, 73.0, 53.0, 43.0, 19.0, 22.0, 14.0, 8.0, 8.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2481689453125, -0.24047088623046875, -0.2327728271484375, -0.22507476806640625, -0.217376708984375, -0.20967864990234375, -0.2019805908203125, -0.19428253173828125, -0.18658447265625, -0.17888641357421875, -0.1711883544921875, -0.16349029541015625, -0.155792236328125, -0.14809417724609375, -0.1403961181640625, -0.13269805908203125, -0.125, -0.11730194091796875, -0.1096038818359375, -0.10190582275390625, -0.094207763671875, -0.08650970458984375, -0.0788116455078125, -0.07111358642578125, -0.06341552734375, -0.05571746826171875, -0.0480194091796875, -0.04032135009765625, -0.032623291015625, -0.02492523193359375, -0.0172271728515625, -0.00952911376953125, -0.0018310546875, 0.00586700439453125, 0.0135650634765625, 0.02126312255859375, 0.028961181640625, 0.03665924072265625, 0.0443572998046875, 0.05205535888671875, 0.05975341796875, 0.06745147705078125, 0.0751495361328125, 0.08284759521484375, 0.090545654296875, 0.09824371337890625, 0.1059417724609375, 0.11363983154296875, 0.121337890625, 0.12903594970703125, 0.1367340087890625, 0.14443206787109375, 0.152130126953125, 0.15982818603515625, 0.1675262451171875, 0.17522430419921875, 0.18292236328125, 0.19062042236328125, 0.1983184814453125, 0.20601654052734375, 0.213714599609375, 0.22141265869140625, 0.2291107177734375, 0.23680877685546875, 0.2445068359375]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 6.0, 6.0, 14.0, 15.0, 16.0, 17.0, 21.0, 30.0, 34.0, 32.0, 37.0, 53.0, 58.0, 46.0, 56.0, 60.0, 49.0, 71.0, 53.0, 49.0, 32.0, 36.0, 31.0, 23.0, 31.0, 21.0, 21.0, 19.0, 9.0, 6.0, 10.0, 4.0, 8.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3424625396728516e-05, -2.272985875606537e-05, -2.203509211540222e-05, -2.1340325474739075e-05, -2.0645558834075928e-05, -1.995079219341278e-05, -1.9256025552749634e-05, -1.8561258912086487e-05, -1.786649227142334e-05, -1.7171725630760193e-05, -1.6476958990097046e-05, -1.57821923494339e-05, -1.5087425708770752e-05, -1.4392659068107605e-05, -1.3697892427444458e-05, -1.3003125786781311e-05, -1.2308359146118164e-05, -1.1613592505455017e-05, -1.091882586479187e-05, -1.0224059224128723e-05, -9.529292583465576e-06, -8.83452594280243e-06, -8.139759302139282e-06, -7.444992661476135e-06, -6.750226020812988e-06, -6.055459380149841e-06, -5.360692739486694e-06, -4.665926098823547e-06, -3.9711594581604e-06, -3.2763928174972534e-06, -2.5816261768341064e-06, -1.8868595361709595e-06, -1.1920928955078125e-06, -4.973262548446655e-07, 1.9744038581848145e-07, 8.922070264816284e-07, 1.5869736671447754e-06, 2.2817403078079224e-06, 2.9765069484710693e-06, 3.6712735891342163e-06, 4.366040229797363e-06, 5.06080687046051e-06, 5.755573511123657e-06, 6.450340151786804e-06, 7.145106792449951e-06, 7.839873433113098e-06, 8.534640073776245e-06, 9.229406714439392e-06, 9.924173355102539e-06, 1.0618939995765686e-05, 1.1313706636428833e-05, 1.200847327709198e-05, 1.2703239917755127e-05, 1.3398006558418274e-05, 1.4092773199081421e-05, 1.4787539839744568e-05, 1.5482306480407715e-05, 1.6177073121070862e-05, 1.687183976173401e-05, 1.7566606402397156e-05, 1.8261373043060303e-05, 1.895613968372345e-05, 1.9650906324386597e-05, 2.0345672965049744e-05, 2.104043960571289e-05]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 12.0, 19.0, 21.0, 37.0, 40.0, 42.0, 88.0, 100.0, 166.0, 220.0, 310.0, 450.0, 605.0, 898.0, 1344.0, 2061.0, 3187.0, 5163.0, 8423.0, 14741.0, 26667.0, 48780.0, 90379.0, 157148.0, 220346.0, 195072.0, 120715.0, 66278.0, 35924.0, 19706.0, 11089.0, 6553.0, 4179.0, 2548.0, 1654.0, 1135.0, 712.0, 500.0, 384.0, 253.0, 188.0, 125.0, 105.0, 40.0, 55.0, 27.0, 20.0, 13.0, 11.0, 8.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.07470703125, -0.07242584228515625, -0.0701446533203125, -0.06786346435546875, -0.065582275390625, -0.06330108642578125, -0.0610198974609375, -0.05873870849609375, -0.05645751953125, -0.05417633056640625, -0.0518951416015625, -0.04961395263671875, -0.047332763671875, -0.04505157470703125, -0.0427703857421875, -0.04048919677734375, -0.0382080078125, -0.03592681884765625, -0.0336456298828125, -0.03136444091796875, -0.029083251953125, -0.02680206298828125, -0.0245208740234375, -0.02223968505859375, -0.01995849609375, -0.01767730712890625, -0.0153961181640625, -0.01311492919921875, -0.010833740234375, -0.00855255126953125, -0.0062713623046875, -0.00399017333984375, -0.001708984375, 0.00057220458984375, 0.0028533935546875, 0.00513458251953125, 0.007415771484375, 0.00969696044921875, 0.0119781494140625, 0.01425933837890625, 0.01654052734375, 0.01882171630859375, 0.0211029052734375, 0.02338409423828125, 0.025665283203125, 0.02794647216796875, 0.0302276611328125, 0.03250885009765625, 0.0347900390625, 0.03707122802734375, 0.0393524169921875, 0.04163360595703125, 0.043914794921875, 0.04619598388671875, 0.0484771728515625, 0.05075836181640625, 0.05303955078125, 0.05532073974609375, 0.0576019287109375, 0.05988311767578125, 0.062164306640625, 0.06444549560546875, 0.0667266845703125, 0.06900787353515625, 0.0712890625]}, "gradients/decoder.bert.encoder.layer.10.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 2.0, 5.0, 11.0, 11.0, 9.0, 8.0, 12.0, 17.0, 29.0, 32.0, 42.0, 40.0, 50.0, 65.0, 73.0, 68.0, 77.0, 64.0, 63.0, 60.0, 44.0, 47.0, 33.0, 26.0, 23.0, 18.0, 14.0, 11.0, 8.0, 9.0, 7.0, 3.0, 1.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0217742919921875, -0.021143674850463867, -0.020513057708740234, -0.0198824405670166, -0.01925182342529297, -0.018621206283569336, -0.017990589141845703, -0.01735997200012207, -0.016729354858398438, -0.016098737716674805, -0.015468120574951172, -0.014837503433227539, -0.014206886291503906, -0.013576269149780273, -0.01294565200805664, -0.012315034866333008, -0.011684417724609375, -0.011053800582885742, -0.01042318344116211, -0.009792566299438477, -0.009161949157714844, -0.008531332015991211, -0.007900714874267578, -0.007270097732543945, -0.0066394805908203125, -0.00600886344909668, -0.005378246307373047, -0.004747629165649414, -0.004117012023925781, -0.0034863948822021484, -0.0028557777404785156, -0.002225160598754883, -0.00159454345703125, -0.0009639263153076172, -0.0003333091735839844, 0.00029730796813964844, 0.0009279251098632812, 0.001558542251586914, 0.002189159393310547, 0.0028197765350341797, 0.0034503936767578125, 0.004081010818481445, 0.004711627960205078, 0.005342245101928711, 0.005972862243652344, 0.0066034793853759766, 0.007234096527099609, 0.007864713668823242, 0.008495330810546875, 0.009125947952270508, 0.00975656509399414, 0.010387182235717773, 0.011017799377441406, 0.011648416519165039, 0.012279033660888672, 0.012909650802612305, 0.013540267944335938, 0.01417088508605957, 0.014801502227783203, 0.015432119369506836, 0.01606273651123047, 0.0166933536529541, 0.017323970794677734, 0.017954587936401367, 0.018585205078125]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 9.0, 10.0, 3.0, 6.0, 10.0, 17.0, 13.0, 32.0, 23.0, 40.0, 49.0, 68.0, 57.0, 69.0, 67.0, 83.0, 65.0, 59.0, 59.0, 48.0, 37.0, 28.0, 32.0, 20.0, 19.0, 16.0, 12.0, 11.0, 7.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.861233711242676, -5.695018291473389, -5.528802871704102, -5.362587928771973, -5.1963725090026855, -5.030157089233398, -4.863941669464111, -4.697726249694824, -4.531511306762695, -4.365295886993408, -4.199080467224121, -4.032865524291992, -3.866650104522705, -3.700434684753418, -3.534219264984131, -3.3680038452148438, -3.2017884254455566, -3.0355730056762695, -2.8693578243255615, -2.7031424045562744, -2.5369272232055664, -2.3707118034362793, -2.204496383666992, -2.038280963897705, -1.872065782546997, -1.7058504819869995, -1.539635181427002, -1.3734197616577148, -1.2072044610977173, -1.0409891605377197, -0.8747738003730774, -0.7085584402084351, -0.5423436164855957, -0.37612828612327576, -0.2099129557609558, -0.043697625398635864, 0.12251770496368408, 0.28873300552368164, 0.454948365688324, 0.6211637258529663, 0.7873790264129639, 0.9535943269729614, 1.119809627532959, 1.286025047302246, 1.4522403478622437, 1.6184556484222412, 1.7846710681915283, 1.9508863687515259, 2.1171016693115234, 2.2833170890808105, 2.4495322704315186, 2.6157476902008057, 2.7819628715515137, 2.948178291320801, 3.114393711090088, 3.280609130859375, 3.446824312210083, 3.61303973197937, 3.779254913330078, 3.9454703330993652, 4.111685752868652, 4.277900695800781, 4.444116115570068, 4.6103315353393555, 4.776546955108643]}, "gradients/decoder.bert.encoder.layer.10.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 4.0, 10.0, 11.0, 15.0, 10.0, 6.0, 27.0, 22.0, 15.0, 24.0, 32.0, 35.0, 38.0, 38.0, 39.0, 43.0, 41.0, 47.0, 37.0, 40.0, 49.0, 39.0, 31.0, 45.0, 34.0, 38.0, 28.0, 26.0, 28.0, 26.0, 21.0, 16.0, 13.0, 11.0, 11.0, 10.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.807745933532715, -2.7214558124542236, -2.6351656913757324, -2.548875570297241, -2.46258544921875, -2.376295328140259, -2.2900052070617676, -2.2037150859832764, -2.117424964904785, -2.031134843826294, -1.9448447227478027, -1.8585546016693115, -1.7722644805908203, -1.685974359512329, -1.599684238433838, -1.5133941173553467, -1.4271039962768555, -1.3408138751983643, -1.254523754119873, -1.1682336330413818, -1.0819435119628906, -0.9956533908843994, -0.9093632698059082, -0.823073148727417, -0.7367830276489258, -0.6504929065704346, -0.5642027854919434, -0.47791266441345215, -0.39162254333496094, -0.3053324222564697, -0.21904230117797852, -0.1327521800994873, -0.04646182060241699, 0.03982830047607422, 0.12611842155456543, 0.21240854263305664, 0.29869866371154785, 0.38498878479003906, 0.4712789058685303, 0.5575690269470215, 0.6438591480255127, 0.7301492691040039, 0.8164393901824951, 0.9027295112609863, 0.9890196323394775, 1.0753097534179688, 1.16159987449646, 1.2478899955749512, 1.3341801166534424, 1.4204702377319336, 1.5067603588104248, 1.593050479888916, 1.6793406009674072, 1.7656307220458984, 1.8519208431243896, 1.9382109642028809, 2.024501085281372, 2.1107912063598633, 2.1970813274383545, 2.2833714485168457, 2.369661569595337, 2.455951690673828, 2.5422418117523193, 2.6285319328308105, 2.7148220539093018]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 4.0, 7.0, 15.0, 26.0, 37.0, 41.0, 81.0, 134.0, 155.0, 269.0, 422.0, 681.0, 1089.0, 1798.0, 3045.0, 5246.0, 9280.0, 17090.0, 31339.0, 57234.0, 100977.0, 159705.0, 200052.0, 178969.0, 122085.0, 70944.0, 39223.0, 20958.0, 11620.0, 6543.0, 3742.0, 2193.0, 1362.0, 748.0, 509.0, 320.0, 179.0, 162.0, 93.0, 65.0, 33.0, 30.0, 12.0, 20.0, 8.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.501953125, -3.394805908203125, -3.28765869140625, -3.180511474609375, -3.0733642578125, -2.966217041015625, -2.85906982421875, -2.751922607421875, -2.644775390625, -2.537628173828125, -2.43048095703125, -2.323333740234375, -2.2161865234375, -2.109039306640625, -2.00189208984375, -1.894744873046875, -1.78759765625, -1.680450439453125, -1.57330322265625, -1.466156005859375, -1.3590087890625, -1.251861572265625, -1.14471435546875, -1.037567138671875, -0.930419921875, -0.823272705078125, -0.71612548828125, -0.608978271484375, -0.5018310546875, -0.394683837890625, -0.28753662109375, -0.180389404296875, -0.0732421875, 0.033905029296875, 0.14105224609375, 0.248199462890625, 0.3553466796875, 0.462493896484375, 0.56964111328125, 0.676788330078125, 0.783935546875, 0.891082763671875, 0.99822998046875, 1.105377197265625, 1.2125244140625, 1.319671630859375, 1.42681884765625, 1.533966064453125, 1.64111328125, 1.748260498046875, 1.85540771484375, 1.962554931640625, 2.0697021484375, 2.176849365234375, 2.28399658203125, 2.391143798828125, 2.498291015625, 2.605438232421875, 2.71258544921875, 2.819732666015625, 2.9268798828125, 3.034027099609375, 3.14117431640625, 3.248321533203125, 3.35546875]}, "gradients/decoder.bert.encoder.layer.10.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 18.0, 18.0, 17.0, 14.0, 20.0, 17.0, 24.0, 27.0, 29.0, 32.0, 37.0, 33.0, 42.0, 52.0, 33.0, 46.0, 50.0, 40.0, 37.0, 52.0, 34.0, 33.0, 33.0, 29.0, 24.0, 29.0, 28.0, 17.0, 12.0, 15.0, 16.0, 5.0, 7.0, 9.0, 6.0, 7.0, 7.0, 6.0, 3.0, 1.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.01171875, -2.920196533203125, -2.82867431640625, -2.737152099609375, -2.6456298828125, -2.554107666015625, -2.46258544921875, -2.371063232421875, -2.279541015625, -2.188018798828125, -2.09649658203125, -2.004974365234375, -1.9134521484375, -1.821929931640625, -1.73040771484375, -1.638885498046875, -1.54736328125, -1.455841064453125, -1.36431884765625, -1.272796630859375, -1.1812744140625, -1.089752197265625, -0.99822998046875, -0.906707763671875, -0.815185546875, -0.723663330078125, -0.63214111328125, -0.540618896484375, -0.4490966796875, -0.357574462890625, -0.26605224609375, -0.174530029296875, -0.0830078125, 0.008514404296875, 0.10003662109375, 0.191558837890625, 0.2830810546875, 0.374603271484375, 0.46612548828125, 0.557647705078125, 0.649169921875, 0.740692138671875, 0.83221435546875, 0.923736572265625, 1.0152587890625, 1.106781005859375, 1.19830322265625, 1.289825439453125, 1.38134765625, 1.472869873046875, 1.56439208984375, 1.655914306640625, 1.7474365234375, 1.838958740234375, 1.93048095703125, 2.022003173828125, 2.113525390625, 2.205047607421875, 2.29656982421875, 2.388092041015625, 2.4796142578125, 2.571136474609375, 2.66265869140625, 2.754180908203125, 2.845703125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 16.0, 15.0, 20.0, 21.0, 36.0, 48.0, 90.0, 105.0, 151.0, 239.0, 364.0, 607.0, 992.0, 1602.0, 2466.0, 4070.0, 7050.0, 11742.0, 20363.0, 34710.0, 59817.0, 97494.0, 142686.0, 175172.0, 165757.0, 124868.0, 80807.0, 48685.0, 28051.0, 16381.0, 9515.0, 5693.0, 3299.0, 2104.0, 1261.0, 789.0, 489.0, 313.0, 208.0, 152.0, 97.0, 79.0, 55.0, 24.0, 12.0, 15.0, 13.0, 10.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.16015625, -3.063812255859375, -2.96746826171875, -2.871124267578125, -2.7747802734375, -2.678436279296875, -2.58209228515625, -2.485748291015625, -2.389404296875, -2.293060302734375, -2.19671630859375, -2.100372314453125, -2.0040283203125, -1.907684326171875, -1.81134033203125, -1.714996337890625, -1.61865234375, -1.522308349609375, -1.42596435546875, -1.329620361328125, -1.2332763671875, -1.136932373046875, -1.04058837890625, -0.944244384765625, -0.847900390625, -0.751556396484375, -0.65521240234375, -0.558868408203125, -0.4625244140625, -0.366180419921875, -0.26983642578125, -0.173492431640625, -0.0771484375, 0.019195556640625, 0.11553955078125, 0.211883544921875, 0.3082275390625, 0.404571533203125, 0.50091552734375, 0.597259521484375, 0.693603515625, 0.789947509765625, 0.88629150390625, 0.982635498046875, 1.0789794921875, 1.175323486328125, 1.27166748046875, 1.368011474609375, 1.46435546875, 1.560699462890625, 1.65704345703125, 1.753387451171875, 1.8497314453125, 1.946075439453125, 2.04241943359375, 2.138763427734375, 2.235107421875, 2.331451416015625, 2.42779541015625, 2.524139404296875, 2.6204833984375, 2.716827392578125, 2.81317138671875, 2.909515380859375, 3.005859375]}, "gradients/decoder.bert.encoder.layer.10.attention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 7.0, 16.0, 18.0, 18.0, 19.0, 11.0, 19.0, 20.0, 22.0, 25.0, 23.0, 23.0, 39.0, 30.0, 37.0, 38.0, 42.0, 23.0, 41.0, 33.0, 43.0, 37.0, 38.0, 39.0, 28.0, 36.0, 22.0, 17.0, 28.0, 21.0, 23.0, 24.0, 22.0, 16.0, 15.0, 14.0, 11.0, 7.0, 7.0, 9.0, 4.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5634765625, -1.5135345458984375, -1.463592529296875, -1.4136505126953125, -1.36370849609375, -1.3137664794921875, -1.263824462890625, -1.2138824462890625, -1.1639404296875, -1.1139984130859375, -1.064056396484375, -1.0141143798828125, -0.96417236328125, -0.9142303466796875, -0.864288330078125, -0.8143463134765625, -0.764404296875, -0.7144622802734375, -0.664520263671875, -0.6145782470703125, -0.56463623046875, -0.5146942138671875, -0.464752197265625, -0.4148101806640625, -0.3648681640625, -0.3149261474609375, -0.264984130859375, -0.2150421142578125, -0.16510009765625, -0.1151580810546875, -0.065216064453125, -0.0152740478515625, 0.03466796875, 0.0846099853515625, 0.134552001953125, 0.1844940185546875, 0.23443603515625, 0.2843780517578125, 0.334320068359375, 0.3842620849609375, 0.4342041015625, 0.4841461181640625, 0.534088134765625, 0.5840301513671875, 0.63397216796875, 0.6839141845703125, 0.733856201171875, 0.7837982177734375, 0.833740234375, 0.8836822509765625, 0.933624267578125, 0.9835662841796875, 1.03350830078125, 1.0834503173828125, 1.133392333984375, 1.1833343505859375, 1.2332763671875, 1.2832183837890625, 1.333160400390625, 1.3831024169921875, 1.43304443359375, 1.4829864501953125, 1.532928466796875, 1.5828704833984375, 1.6328125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 21.0, 18.0, 24.0, 34.0, 50.0, 63.0, 112.0, 127.0, 202.0, 324.0, 477.0, 689.0, 1073.0, 1811.0, 3093.0, 5941.0, 11697.0, 25276.0, 56182.0, 124925.0, 234206.0, 267020.0, 167398.0, 78680.0, 35001.0, 15979.0, 7941.0, 4110.0, 2265.0, 1362.0, 798.0, 511.0, 369.0, 215.0, 155.0, 106.0, 79.0, 51.0, 37.0, 30.0, 25.0, 14.0, 17.0, 6.0, 5.0, 3.0, 5.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.0390625, -1.9715576171875, -1.904052734375, -1.8365478515625, -1.76904296875, -1.7015380859375, -1.634033203125, -1.5665283203125, -1.4990234375, -1.4315185546875, -1.364013671875, -1.2965087890625, -1.22900390625, -1.1614990234375, -1.093994140625, -1.0264892578125, -0.958984375, -0.8914794921875, -0.823974609375, -0.7564697265625, -0.68896484375, -0.6214599609375, -0.553955078125, -0.4864501953125, -0.4189453125, -0.3514404296875, -0.283935546875, -0.2164306640625, -0.14892578125, -0.0814208984375, -0.013916015625, 0.0535888671875, 0.12109375, 0.1885986328125, 0.256103515625, 0.3236083984375, 0.39111328125, 0.4586181640625, 0.526123046875, 0.5936279296875, 0.6611328125, 0.7286376953125, 0.796142578125, 0.8636474609375, 0.93115234375, 0.9986572265625, 1.066162109375, 1.1336669921875, 1.201171875, 1.2686767578125, 1.336181640625, 1.4036865234375, 1.47119140625, 1.5386962890625, 1.606201171875, 1.6737060546875, 1.7412109375, 1.8087158203125, 1.876220703125, 1.9437255859375, 2.01123046875, 2.0787353515625, 2.146240234375, 2.2137451171875, 2.28125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 11.0, 14.0, 14.0, 30.0, 46.0, 52.0, 108.0, 100.0, 114.0, 108.0, 97.0, 82.0, 62.0, 45.0, 28.0, 28.0, 20.0, 12.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00024318695068359375, -0.0002345442771911621, -0.00022590160369873047, -0.00021725893020629883, -0.0002086162567138672, -0.00019997358322143555, -0.0001913309097290039, -0.00018268823623657227, -0.00017404556274414062, -0.00016540288925170898, -0.00015676021575927734, -0.0001481175422668457, -0.00013947486877441406, -0.00013083219528198242, -0.00012218952178955078, -0.00011354684829711914, -0.0001049041748046875, -9.626150131225586e-05, -8.761882781982422e-05, -7.897615432739258e-05, -7.033348083496094e-05, -6.16908073425293e-05, -5.3048133850097656e-05, -4.4405460357666016e-05, -3.5762786865234375e-05, -2.7120113372802734e-05, -1.8477439880371094e-05, -9.834766387939453e-06, -1.1920928955078125e-06, 7.450580596923828e-06, 1.609325408935547e-05, 2.473592758178711e-05, 3.337860107421875e-05, 4.202127456665039e-05, 5.066394805908203e-05, 5.930662155151367e-05, 6.794929504394531e-05, 7.659196853637695e-05, 8.52346420288086e-05, 9.387731552124023e-05, 0.00010251998901367188, 0.00011116266250610352, 0.00011980533599853516, 0.0001284480094909668, 0.00013709068298339844, 0.00014573335647583008, 0.00015437602996826172, 0.00016301870346069336, 0.000171661376953125, 0.00018030405044555664, 0.00018894672393798828, 0.00019758939743041992, 0.00020623207092285156, 0.0002148747444152832, 0.00022351741790771484, 0.00023216009140014648, 0.00024080276489257812, 0.00024944543838500977, 0.0002580881118774414, 0.00026673078536987305, 0.0002753734588623047, 0.00028401613235473633, 0.00029265880584716797, 0.0003013014793395996, 0.00030994415283203125]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 3.0, 9.0, 8.0, 8.0, 18.0, 14.0, 26.0, 28.0, 45.0, 59.0, 73.0, 128.0, 179.0, 214.0, 318.0, 482.0, 706.0, 1073.0, 1895.0, 3305.0, 5993.0, 11601.0, 23539.0, 48466.0, 100193.0, 185684.0, 249018.0, 198971.0, 108603.0, 54002.0, 25549.0, 12781.0, 6491.0, 3562.0, 1971.0, 1223.0, 728.0, 498.0, 309.0, 202.0, 145.0, 113.0, 80.0, 71.0, 47.0, 35.0, 30.0, 28.0, 13.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73046875, -1.67193603515625, -1.6134033203125, -1.55487060546875, -1.496337890625, -1.43780517578125, -1.3792724609375, -1.32073974609375, -1.26220703125, -1.20367431640625, -1.1451416015625, -1.08660888671875, -1.028076171875, -0.96954345703125, -0.9110107421875, -0.85247802734375, -0.7939453125, -0.73541259765625, -0.6768798828125, -0.61834716796875, -0.559814453125, -0.50128173828125, -0.4427490234375, -0.38421630859375, -0.32568359375, -0.26715087890625, -0.2086181640625, -0.15008544921875, -0.091552734375, -0.03302001953125, 0.0255126953125, 0.08404541015625, 0.142578125, 0.20111083984375, 0.2596435546875, 0.31817626953125, 0.376708984375, 0.43524169921875, 0.4937744140625, 0.55230712890625, 0.61083984375, 0.66937255859375, 0.7279052734375, 0.78643798828125, 0.844970703125, 0.90350341796875, 0.9620361328125, 1.02056884765625, 1.0791015625, 1.13763427734375, 1.1961669921875, 1.25469970703125, 1.313232421875, 1.37176513671875, 1.4302978515625, 1.48883056640625, 1.54736328125, 1.60589599609375, 1.6644287109375, 1.72296142578125, 1.781494140625, 1.84002685546875, 1.8985595703125, 1.95709228515625, 2.015625]}, "gradients/decoder.bert.encoder.layer.10.attention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 9.0, 5.0, 5.0, 12.0, 11.0, 11.0, 23.0, 28.0, 28.0, 30.0, 41.0, 54.0, 47.0, 42.0, 56.0, 47.0, 47.0, 65.0, 57.0, 48.0, 36.0, 42.0, 37.0, 24.0, 39.0, 32.0, 23.0, 18.0, 14.0, 8.0, 7.0, 4.0, 6.0, 9.0, 6.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.4013671875, -0.3897247314453125, -0.378082275390625, -0.3664398193359375, -0.35479736328125, -0.3431549072265625, -0.331512451171875, -0.3198699951171875, -0.3082275390625, -0.2965850830078125, -0.284942626953125, -0.2733001708984375, -0.26165771484375, -0.2500152587890625, -0.238372802734375, -0.2267303466796875, -0.215087890625, -0.2034454345703125, -0.191802978515625, -0.1801605224609375, -0.16851806640625, -0.1568756103515625, -0.145233154296875, -0.1335906982421875, -0.1219482421875, -0.1103057861328125, -0.098663330078125, -0.0870208740234375, -0.07537841796875, -0.0637359619140625, -0.052093505859375, -0.0404510498046875, -0.02880859375, -0.0171661376953125, -0.005523681640625, 0.0061187744140625, 0.01776123046875, 0.0294036865234375, 0.041046142578125, 0.0526885986328125, 0.0643310546875, 0.0759735107421875, 0.087615966796875, 0.0992584228515625, 0.11090087890625, 0.1225433349609375, 0.134185791015625, 0.1458282470703125, 0.157470703125, 0.1691131591796875, 0.180755615234375, 0.1923980712890625, 0.20404052734375, 0.2156829833984375, 0.227325439453125, 0.2389678955078125, 0.2506103515625, 0.2622528076171875, 0.273895263671875, 0.2855377197265625, 0.29718017578125, 0.3088226318359375, 0.320465087890625, 0.3321075439453125, 0.34375]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 4.0, 15.0, 13.0, 13.0, 15.0, 21.0, 33.0, 36.0, 41.0, 48.0, 75.0, 65.0, 58.0, 72.0, 88.0, 59.0, 48.0, 44.0, 55.0, 32.0, 32.0, 26.0, 16.0, 19.0, 15.0, 12.0, 9.0, 3.0, 7.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.999162197113037, -5.831065654754639, -5.662968635559082, -5.494872093200684, -5.326775550842285, -5.1586785316467285, -4.99058198928833, -4.822484970092773, -4.654388427734375, -4.486291885375977, -4.31819486618042, -4.1500983238220215, -3.982001543045044, -3.8139047622680664, -3.645808219909668, -3.4777114391326904, -3.309614896774292, -3.1415181159973145, -2.973421573638916, -2.8053247928619385, -2.637228012084961, -2.4691314697265625, -2.301034688949585, -2.1329379081726074, -1.9648412466049194, -1.7967445850372314, -1.628647804260254, -1.460551142692566, -1.292454481124878, -1.1243577003479004, -0.9562610387802124, -0.7881642580032349, -0.6200675964355469, -0.4519708752632141, -0.28387418389320374, -0.11577749252319336, 0.052319228649139404, 0.22041594982147217, 0.38851261138916016, 0.5566093921661377, 0.7247060537338257, 0.8928027749061584, 1.0608994960784912, 1.2289961576461792, 1.3970928192138672, 1.5651895999908447, 1.7332862615585327, 1.9013830423355103, 2.0694797039031982, 2.237576484680176, 2.405673027038574, 2.5737698078155518, 2.7418665885925293, 2.9099631309509277, 3.0780599117279053, 3.246156692504883, 3.4142532348632812, 3.582350015640259, 3.7504465579986572, 3.9185433387756348, 4.086639881134033, 4.25473690032959, 4.422833442687988, 4.590929985046387, 4.759027004241943]}, "gradients/decoder.bert.encoder.layer.9.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 5.0, 4.0, 11.0, 9.0, 16.0, 18.0, 9.0, 16.0, 30.0, 24.0, 24.0, 31.0, 35.0, 30.0, 30.0, 38.0, 38.0, 56.0, 43.0, 45.0, 46.0, 42.0, 29.0, 30.0, 34.0, 35.0, 34.0, 29.0, 30.0, 33.0, 20.0, 25.0, 15.0, 11.0, 12.0, 9.0, 10.0, 4.0, 10.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8219175338745117, -2.7345430850982666, -2.6471686363220215, -2.5597941875457764, -2.4724197387695312, -2.385045289993286, -2.297670841217041, -2.210296392440796, -2.122921943664551, -2.0355474948883057, -1.9481730461120605, -1.8607985973358154, -1.7734241485595703, -1.6860496997833252, -1.59867525100708, -1.511300802230835, -1.4239263534545898, -1.3365519046783447, -1.2491774559020996, -1.1618030071258545, -1.0744285583496094, -0.9870541095733643, -0.8996796607971191, -0.812305212020874, -0.7249307632446289, -0.6375563144683838, -0.5501818656921387, -0.46280741691589355, -0.37543296813964844, -0.2880585193634033, -0.2006840705871582, -0.11330962181091309, -0.02593541145324707, 0.06143903732299805, 0.14881348609924316, 0.23618793487548828, 0.3235623836517334, 0.4109368324279785, 0.49831128120422363, 0.5856857299804688, 0.6730601787567139, 0.760434627532959, 0.8478090763092041, 0.9351835250854492, 1.0225579738616943, 1.1099324226379395, 1.1973068714141846, 1.2846813201904297, 1.3720557689666748, 1.45943021774292, 1.546804666519165, 1.6341791152954102, 1.7215535640716553, 1.8089280128479004, 1.8963024616241455, 1.9836769104003906, 2.0710513591766357, 2.158425807952881, 2.245800256729126, 2.333174705505371, 2.420549154281616, 2.5079236030578613, 2.5952980518341064, 2.6826725006103516, 2.7700469493865967]}, "gradients/decoder.bert.encoder.layer.9.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 13.0, 16.0, 20.0, 17.0, 27.0, 39.0, 77.0, 94.0, 173.0, 250.0, 392.0, 731.0, 1190.0, 1877.0, 3316.0, 5852.0, 10470.0, 19480.0, 37004.0, 76234.0, 172125.0, 430029.0, 1022466.0, 1279485.0, 665221.0, 256497.0, 107413.0, 49786.0, 24690.0, 13027.0, 6999.0, 3847.0, 2222.0, 1275.0, 738.0, 482.0, 235.0, 157.0, 98.0, 73.0, 47.0, 38.0, 20.0, 12.0, 8.0, 13.0, 5.0, 2.0, 0.0, 0.0, 1.0, 5.0], "bins": [-5.24609375, -5.09716796875, -4.9482421875, -4.79931640625, -4.650390625, -4.50146484375, -4.3525390625, -4.20361328125, -4.0546875, -3.90576171875, -3.7568359375, -3.60791015625, -3.458984375, -3.31005859375, -3.1611328125, -3.01220703125, -2.86328125, -2.71435546875, -2.5654296875, -2.41650390625, -2.267578125, -2.11865234375, -1.9697265625, -1.82080078125, -1.671875, -1.52294921875, -1.3740234375, -1.22509765625, -1.076171875, -0.92724609375, -0.7783203125, -0.62939453125, -0.48046875, -0.33154296875, -0.1826171875, -0.03369140625, 0.115234375, 0.26416015625, 0.4130859375, 0.56201171875, 0.7109375, 0.85986328125, 1.0087890625, 1.15771484375, 1.306640625, 1.45556640625, 1.6044921875, 1.75341796875, 1.90234375, 2.05126953125, 2.2001953125, 2.34912109375, 2.498046875, 2.64697265625, 2.7958984375, 2.94482421875, 3.09375, 3.24267578125, 3.3916015625, 3.54052734375, 3.689453125, 3.83837890625, 3.9873046875, 4.13623046875, 4.28515625]}, "gradients/decoder.bert.encoder.layer.9.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 8.0, 4.0, 3.0, 7.0, 7.0, 16.0, 16.0, 11.0, 18.0, 19.0, 24.0, 29.0, 36.0, 25.0, 27.0, 34.0, 43.0, 54.0, 47.0, 42.0, 49.0, 48.0, 43.0, 41.0, 33.0, 35.0, 40.0, 32.0, 33.0, 27.0, 26.0, 18.0, 18.0, 22.0, 15.0, 11.0, 12.0, 6.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.396484375, -2.32330322265625, -2.2501220703125, -2.17694091796875, -2.103759765625, -2.03057861328125, -1.9573974609375, -1.88421630859375, -1.81103515625, -1.73785400390625, -1.6646728515625, -1.59149169921875, -1.518310546875, -1.44512939453125, -1.3719482421875, -1.29876708984375, -1.2255859375, -1.15240478515625, -1.0792236328125, -1.00604248046875, -0.932861328125, -0.85968017578125, -0.7864990234375, -0.71331787109375, -0.64013671875, -0.56695556640625, -0.4937744140625, -0.42059326171875, -0.347412109375, -0.27423095703125, -0.2010498046875, -0.12786865234375, -0.0546875, 0.01849365234375, 0.0916748046875, 0.16485595703125, 0.238037109375, 0.31121826171875, 0.3843994140625, 0.45758056640625, 0.53076171875, 0.60394287109375, 0.6771240234375, 0.75030517578125, 0.823486328125, 0.89666748046875, 0.9698486328125, 1.04302978515625, 1.1162109375, 1.18939208984375, 1.2625732421875, 1.33575439453125, 1.408935546875, 1.48211669921875, 1.5552978515625, 1.62847900390625, 1.70166015625, 1.77484130859375, 1.8480224609375, 1.92120361328125, 1.994384765625, 2.06756591796875, 2.1407470703125, 2.21392822265625, 2.287109375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 13.0, 11.0, 26.0, 72.0, 81.0, 143.0, 220.0, 427.0, 731.0, 1440.0, 2567.0, 4874.0, 9441.0, 18633.0, 38537.0, 83064.0, 188194.0, 447615.0, 1025924.0, 1256031.0, 635381.0, 263905.0, 114014.0, 51901.0, 24866.0, 12295.0, 6323.0, 3405.0, 1850.0, 938.0, 582.0, 330.0, 169.0, 115.0, 66.0, 37.0, 24.0, 14.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.37286376953125, -5.1949462890625, -5.01702880859375, -4.839111328125, -4.66119384765625, -4.4832763671875, -4.30535888671875, -4.12744140625, -3.94952392578125, -3.7716064453125, -3.59368896484375, -3.415771484375, -3.23785400390625, -3.0599365234375, -2.88201904296875, -2.7041015625, -2.52618408203125, -2.3482666015625, -2.17034912109375, -1.992431640625, -1.81451416015625, -1.6365966796875, -1.45867919921875, -1.28076171875, -1.10284423828125, -0.9249267578125, -0.74700927734375, -0.569091796875, -0.39117431640625, -0.2132568359375, -0.03533935546875, 0.142578125, 0.32049560546875, 0.4984130859375, 0.67633056640625, 0.854248046875, 1.03216552734375, 1.2100830078125, 1.38800048828125, 1.56591796875, 1.74383544921875, 1.9217529296875, 2.09967041015625, 2.277587890625, 2.45550537109375, 2.6334228515625, 2.81134033203125, 2.9892578125, 3.16717529296875, 3.3450927734375, 3.52301025390625, 3.700927734375, 3.87884521484375, 4.0567626953125, 4.23468017578125, 4.41259765625, 4.59051513671875, 4.7684326171875, 4.94635009765625, 5.124267578125, 5.30218505859375, 5.4801025390625, 5.65802001953125, 5.8359375]}, "gradients/decoder.bert.encoder.layer.9.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 8.0, 8.0, 15.0, 17.0, 24.0, 21.0, 26.0, 41.0, 48.0, 87.0, 88.0, 110.0, 143.0, 177.0, 205.0, 248.0, 308.0, 295.0, 324.0, 325.0, 297.0, 226.0, 210.0, 178.0, 152.0, 104.0, 78.0, 69.0, 51.0, 44.0, 30.0, 30.0, 21.0, 12.0, 14.0, 18.0, 7.0, 6.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4149322509765625, -1.369903564453125, -1.3248748779296875, -1.27984619140625, -1.2348175048828125, -1.189788818359375, -1.1447601318359375, -1.0997314453125, -1.0547027587890625, -1.009674072265625, -0.9646453857421875, -0.91961669921875, -0.8745880126953125, -0.829559326171875, -0.7845306396484375, -0.739501953125, -0.6944732666015625, -0.649444580078125, -0.6044158935546875, -0.55938720703125, -0.5143585205078125, -0.469329833984375, -0.4243011474609375, -0.3792724609375, -0.3342437744140625, -0.289215087890625, -0.2441864013671875, -0.19915771484375, -0.1541290283203125, -0.109100341796875, -0.0640716552734375, -0.01904296875, 0.0259857177734375, 0.071014404296875, 0.1160430908203125, 0.16107177734375, 0.2061004638671875, 0.251129150390625, 0.2961578369140625, 0.3411865234375, 0.3862152099609375, 0.431243896484375, 0.4762725830078125, 0.52130126953125, 0.5663299560546875, 0.611358642578125, 0.6563873291015625, 0.701416015625, 0.7464447021484375, 0.791473388671875, 0.8365020751953125, 0.88153076171875, 0.9265594482421875, 0.971588134765625, 1.0166168212890625, 1.0616455078125, 1.1066741943359375, 1.151702880859375, 1.1967315673828125, 1.24176025390625, 1.2867889404296875, 1.331817626953125, 1.3768463134765625, 1.421875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 4.0, 2.0, 5.0, 6.0, 13.0, 12.0, 11.0, 14.0, 18.0, 24.0, 37.0, 41.0, 47.0, 55.0, 72.0, 60.0, 64.0, 67.0, 61.0, 76.0, 55.0, 49.0, 42.0, 28.0, 27.0, 25.0, 14.0, 14.0, 13.0, 8.0, 6.0, 9.0, 6.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.115167617797852, -5.950706958770752, -5.7862467765808105, -5.621786117553711, -5.4573259353637695, -5.29286527633667, -5.1284050941467285, -4.963944435119629, -4.7994842529296875, -4.635023593902588, -4.4705634117126465, -4.306102752685547, -4.1416425704956055, -3.977181911468506, -3.8127214908599854, -3.648261070251465, -3.4838004112243652, -3.3193399906158447, -3.154879570007324, -2.9904191493988037, -2.825958728790283, -2.6614980697631836, -2.497037649154663, -2.3325772285461426, -2.168116807937622, -2.0036563873291016, -1.839195966720581, -1.674735426902771, -1.5102750062942505, -1.34581458568573, -1.18135404586792, -1.0168936252593994, -0.8524336814880371, -0.6879732608795166, -0.5235127806663513, -0.3590523302555084, -0.19459187984466553, -0.03013145923614502, 0.13432902097702026, 0.29878950119018555, 0.46324992179870605, 0.6277103424072266, 0.7921708226203918, 0.9566313028335571, 1.1210917234420776, 1.2855521440505981, 1.4500126838684082, 1.6144731044769287, 1.7789335250854492, 1.9433939456939697, 2.1078543663024902, 2.2723147869110107, 2.4367752075195312, 2.601235866546631, 2.7656962871551514, 2.930156707763672, 3.0946171283721924, 3.259077548980713, 3.4235379695892334, 3.587998390197754, 3.7524590492248535, 3.916919231414795, 4.0813798904418945, 4.245840072631836, 4.4103007316589355]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 8.0, 8.0, 4.0, 10.0, 18.0, 10.0, 16.0, 14.0, 25.0, 20.0, 32.0, 27.0, 32.0, 33.0, 44.0, 42.0, 38.0, 58.0, 25.0, 44.0, 43.0, 38.0, 40.0, 34.0, 42.0, 39.0, 25.0, 30.0, 22.0, 32.0, 21.0, 22.0, 18.0, 17.0, 15.0, 11.0, 8.0, 12.0, 3.0, 4.0, 4.0, 7.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.7552988529205322, -2.6693832874298096, -2.583467960357666, -2.4975523948669434, -2.4116368293762207, -2.325721502304077, -2.2398059368133545, -2.153890609741211, -2.0679750442504883, -1.9820595979690552, -1.896144151687622, -1.8102285861968994, -1.7243131399154663, -1.6383976936340332, -1.5524821281433105, -1.4665666818618774, -1.3806512355804443, -1.2947357892990112, -1.2088203430175781, -1.1229047775268555, -1.0369893312454224, -0.9510738849639893, -0.8651583790779114, -0.7792428731918335, -0.6933274269104004, -0.6074119806289673, -0.5214964747428894, -0.4355809986591339, -0.3496655225753784, -0.2637500464916229, -0.17783457040786743, -0.09191906452178955, -0.006003618240356445, 0.07991185784339905, 0.16582733392715454, 0.25174281001091003, 0.3376582860946655, 0.423573762178421, 0.5094892382621765, 0.5954047441482544, 0.6813201904296875, 0.7672356367111206, 0.8531511425971985, 0.9390666484832764, 1.0249820947647095, 1.1108975410461426, 1.1968131065368652, 1.2827285528182983, 1.3686439990997314, 1.4545594453811646, 1.5404748916625977, 1.6263904571533203, 1.7123059034347534, 1.7982213497161865, 1.8841369152069092, 1.9700523614883423, 2.0559678077697754, 2.141883373260498, 2.2277987003326416, 2.3137142658233643, 2.399629592895508, 2.4855451583862305, 2.571460723876953, 2.657376289367676, 2.7432916164398193]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 15.0, 24.0, 25.0, 25.0, 51.0, 67.0, 122.0, 136.0, 235.0, 364.0, 576.0, 882.0, 1361.0, 2190.0, 3480.0, 6284.0, 10998.0, 19590.0, 36293.0, 67930.0, 128564.0, 214372.0, 230811.0, 148472.0, 80579.0, 42139.0, 22663.0, 12327.0, 7054.0, 4033.0, 2482.0, 1542.0, 985.0, 609.0, 413.0, 274.0, 189.0, 109.0, 87.0, 64.0, 38.0, 25.0, 20.0, 14.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.385498046875, -0.3731117248535156, -0.36072540283203125, -0.3483390808105469, -0.3359527587890625, -0.3235664367675781, -0.31118011474609375, -0.2987937927246094, -0.286407470703125, -0.2740211486816406, -0.26163482666015625, -0.24924850463867188, -0.2368621826171875, -0.22447586059570312, -0.21208953857421875, -0.19970321655273438, -0.18731689453125, -0.17493057250976562, -0.16254425048828125, -0.15015792846679688, -0.1377716064453125, -0.12538528442382812, -0.11299896240234375, -0.10061264038085938, -0.088226318359375, -0.07583999633789062, -0.06345367431640625, -0.051067352294921875, -0.0386810302734375, -0.026294708251953125, -0.01390838623046875, -0.001522064208984375, 0.0108642578125, 0.023250579833984375, 0.03563690185546875, 0.048023223876953125, 0.0604095458984375, 0.07279586791992188, 0.08518218994140625, 0.09756851196289062, 0.109954833984375, 0.12234115600585938, 0.13472747802734375, 0.14711380004882812, 0.1595001220703125, 0.17188644409179688, 0.18427276611328125, 0.19665908813476562, 0.20904541015625, 0.22143173217773438, 0.23381805419921875, 0.24620437622070312, 0.2585906982421875, 0.2709770202636719, 0.28336334228515625, 0.2957496643066406, 0.308135986328125, 0.3205223083496094, 0.33290863037109375, 0.3452949523925781, 0.3576812744140625, 0.3700675964355469, 0.38245391845703125, 0.3948402404785156, 0.4072265625]}, "gradients/decoder.bert.encoder.layer.9.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 7.0, 5.0, 3.0, 11.0, 10.0, 16.0, 23.0, 19.0, 20.0, 25.0, 23.0, 41.0, 35.0, 44.0, 40.0, 39.0, 47.0, 30.0, 48.0, 45.0, 52.0, 37.0, 43.0, 43.0, 32.0, 38.0, 38.0, 28.0, 24.0, 12.0, 24.0, 18.0, 16.0, 19.0, 9.0, 7.0, 12.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.404296875, -3.302093505859375, -3.19989013671875, -3.097686767578125, -2.9954833984375, -2.893280029296875, -2.79107666015625, -2.688873291015625, -2.586669921875, -2.484466552734375, -2.38226318359375, -2.280059814453125, -2.1778564453125, -2.075653076171875, -1.97344970703125, -1.871246337890625, -1.76904296875, -1.666839599609375, -1.56463623046875, -1.462432861328125, -1.3602294921875, -1.258026123046875, -1.15582275390625, -1.053619384765625, -0.951416015625, -0.849212646484375, -0.74700927734375, -0.644805908203125, -0.5426025390625, -0.440399169921875, -0.33819580078125, -0.235992431640625, -0.1337890625, -0.031585693359375, 0.07061767578125, 0.172821044921875, 0.2750244140625, 0.377227783203125, 0.47943115234375, 0.581634521484375, 0.683837890625, 0.786041259765625, 0.88824462890625, 0.990447998046875, 1.0926513671875, 1.194854736328125, 1.29705810546875, 1.399261474609375, 1.50146484375, 1.603668212890625, 1.70587158203125, 1.808074951171875, 1.9102783203125, 2.012481689453125, 2.11468505859375, 2.216888427734375, 2.319091796875, 2.421295166015625, 2.52349853515625, 2.625701904296875, 2.7279052734375, 2.830108642578125, 2.93231201171875, 3.034515380859375, 3.13671875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 11.0, 7.0, 6.0, 10.0, 18.0, 30.0, 35.0, 33.0, 53.0, 86.0, 105.0, 153.0, 224.0, 270.0, 468.0, 767.0, 1194.0, 2007.0, 3628.0, 6792.0, 14501.0, 38870.0, 728524.0, 199926.0, 26828.0, 11178.0, 5350.0, 2858.0, 1699.0, 1018.0, 601.0, 434.0, 267.0, 172.0, 124.0, 73.0, 63.0, 45.0, 29.0, 23.0, 27.0, 16.0, 8.0, 5.0, 8.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.1845703125, -1.1505661010742188, -1.1165618896484375, -1.0825576782226562, -1.048553466796875, -1.0145492553710938, -0.9805450439453125, -0.9465408325195312, -0.91253662109375, -0.8785324096679688, -0.8445281982421875, -0.8105239868164062, -0.776519775390625, -0.7425155639648438, -0.7085113525390625, -0.6745071411132812, -0.6405029296875, -0.6064987182617188, -0.5724945068359375, -0.5384902954101562, -0.504486083984375, -0.47048187255859375, -0.4364776611328125, -0.40247344970703125, -0.36846923828125, -0.33446502685546875, -0.3004608154296875, -0.26645660400390625, -0.232452392578125, -0.19844818115234375, -0.1644439697265625, -0.13043975830078125, -0.096435546875, -0.06243133544921875, -0.0284271240234375, 0.00557708740234375, 0.039581298828125, 0.07358551025390625, 0.1075897216796875, 0.14159393310546875, 0.17559814453125, 0.20960235595703125, 0.2436065673828125, 0.27761077880859375, 0.311614990234375, 0.34561920166015625, 0.3796234130859375, 0.41362762451171875, 0.4476318359375, 0.48163604736328125, 0.5156402587890625, 0.5496444702148438, 0.583648681640625, 0.6176528930664062, 0.6516571044921875, 0.6856613159179688, 0.71966552734375, 0.7536697387695312, 0.7876739501953125, 0.8216781616210938, 0.855682373046875, 0.8896865844726562, 0.9236907958984375, 0.9576950073242188, 0.99169921875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 6.0, 6.0, 6.0, 3.0, 8.0, 11.0, 14.0, 11.0, 18.0, 20.0, 21.0, 27.0, 22.0, 30.0, 31.0, 25.0, 35.0, 19.0, 38.0, 37.0, 37.0, 47.0, 39.0, 37.0, 33.0, 45.0, 36.0, 32.0, 32.0, 38.0, 27.0, 34.0, 40.0, 20.0, 14.0, 14.0, 17.0, 17.0, 12.0, 7.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.017578125, -1.958251953125, -1.89892578125, -1.839599609375, -1.7802734375, -1.720947265625, -1.66162109375, -1.602294921875, -1.54296875, -1.483642578125, -1.42431640625, -1.364990234375, -1.3056640625, -1.246337890625, -1.18701171875, -1.127685546875, -1.068359375, -1.009033203125, -0.94970703125, -0.890380859375, -0.8310546875, -0.771728515625, -0.71240234375, -0.653076171875, -0.59375, -0.534423828125, -0.47509765625, -0.415771484375, -0.3564453125, -0.297119140625, -0.23779296875, -0.178466796875, -0.119140625, -0.059814453125, -0.00048828125, 0.058837890625, 0.1181640625, 0.177490234375, 0.23681640625, 0.296142578125, 0.35546875, 0.414794921875, 0.47412109375, 0.533447265625, 0.5927734375, 0.652099609375, 0.71142578125, 0.770751953125, 0.830078125, 0.889404296875, 0.94873046875, 1.008056640625, 1.0673828125, 1.126708984375, 1.18603515625, 1.245361328125, 1.3046875, 1.364013671875, 1.42333984375, 1.482666015625, 1.5419921875, 1.601318359375, 1.66064453125, 1.719970703125, 1.779296875]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 14.0, 24.0, 7.0, 33.0, 31.0, 48.0, 63.0, 116.0, 171.0, 244.0, 375.0, 571.0, 935.0, 1667.0, 2980.0, 5600.0, 11065.0, 25333.0, 353166.0, 594630.0, 26702.0, 11657.0, 5597.0, 3028.0, 1676.0, 1001.0, 618.0, 391.0, 247.0, 159.0, 122.0, 78.0, 72.0, 36.0, 27.0, 17.0, 9.0, 11.0, 5.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.265869140625, -0.25782012939453125, -0.2497711181640625, -0.24172210693359375, -0.233673095703125, -0.22562408447265625, -0.2175750732421875, -0.20952606201171875, -0.20147705078125, -0.19342803955078125, -0.1853790283203125, -0.17733001708984375, -0.169281005859375, -0.16123199462890625, -0.1531829833984375, -0.14513397216796875, -0.1370849609375, -0.12903594970703125, -0.1209869384765625, -0.11293792724609375, -0.104888916015625, -0.09683990478515625, -0.0887908935546875, -0.08074188232421875, -0.07269287109375, -0.06464385986328125, -0.0565948486328125, -0.04854583740234375, -0.040496826171875, -0.03244781494140625, -0.0243988037109375, -0.01634979248046875, -0.00830078125, -0.00025177001953125, 0.0077972412109375, 0.01584625244140625, 0.023895263671875, 0.03194427490234375, 0.0399932861328125, 0.04804229736328125, 0.05609130859375, 0.06414031982421875, 0.0721893310546875, 0.08023834228515625, 0.088287353515625, 0.09633636474609375, 0.1043853759765625, 0.11243438720703125, 0.1204833984375, 0.12853240966796875, 0.1365814208984375, 0.14463043212890625, 0.152679443359375, 0.16072845458984375, 0.1687774658203125, 0.17682647705078125, 0.18487548828125, 0.19292449951171875, 0.2009735107421875, 0.20902252197265625, 0.217071533203125, 0.22512054443359375, 0.2331695556640625, 0.24121856689453125, 0.249267578125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 8.0, 4.0, 7.0, 8.0, 18.0, 13.0, 19.0, 29.0, 29.0, 29.0, 38.0, 40.0, 42.0, 46.0, 52.0, 58.0, 44.0, 34.0, 53.0, 40.0, 32.0, 39.0, 46.0, 47.0, 27.0, 32.0, 21.0, 27.0, 21.0, 27.0, 16.0, 10.0, 12.0, 5.0, 8.0, 3.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.9848346710205078e-05, -1.9300729036331177e-05, -1.8753111362457275e-05, -1.8205493688583374e-05, -1.7657876014709473e-05, -1.711025834083557e-05, -1.656264066696167e-05, -1.601502299308777e-05, -1.5467405319213867e-05, -1.4919787645339966e-05, -1.4372169971466064e-05, -1.3824552297592163e-05, -1.3276934623718262e-05, -1.272931694984436e-05, -1.2181699275970459e-05, -1.1634081602096558e-05, -1.1086463928222656e-05, -1.0538846254348755e-05, -9.991228580474854e-06, -9.443610906600952e-06, -8.89599323272705e-06, -8.34837555885315e-06, -7.800757884979248e-06, -7.253140211105347e-06, -6.705522537231445e-06, -6.157904863357544e-06, -5.610287189483643e-06, -5.062669515609741e-06, -4.51505184173584e-06, -3.9674341678619385e-06, -3.419816493988037e-06, -2.8721988201141357e-06, -2.3245811462402344e-06, -1.776963472366333e-06, -1.2293457984924316e-06, -6.817281246185303e-07, -1.341104507446289e-07, 4.1350722312927246e-07, 9.611248970031738e-07, 1.5087425708770752e-06, 2.0563602447509766e-06, 2.603977918624878e-06, 3.1515955924987793e-06, 3.6992132663726807e-06, 4.246830940246582e-06, 4.794448614120483e-06, 5.342066287994385e-06, 5.889683961868286e-06, 6.4373016357421875e-06, 6.984919309616089e-06, 7.53253698348999e-06, 8.080154657363892e-06, 8.627772331237793e-06, 9.175390005111694e-06, 9.723007678985596e-06, 1.0270625352859497e-05, 1.0818243026733398e-05, 1.13658607006073e-05, 1.1913478374481201e-05, 1.2461096048355103e-05, 1.3008713722229004e-05, 1.3556331396102905e-05, 1.4103949069976807e-05, 1.4651566743850708e-05, 1.519918441772461e-05]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.weight": {"_type": "histogram", "values": [3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 7.0, 4.0, 10.0, 10.0, 13.0, 20.0, 24.0, 48.0, 83.0, 77.0, 134.0, 207.0, 301.0, 491.0, 742.0, 1115.0, 1689.0, 2610.0, 4023.0, 6348.0, 10363.0, 16698.0, 28108.0, 48318.0, 81944.0, 135184.0, 187707.0, 186925.0, 133315.0, 81549.0, 47692.0, 27743.0, 17124.0, 10208.0, 6317.0, 3889.0, 2634.0, 1582.0, 1123.0, 692.0, 474.0, 327.0, 215.0, 150.0, 123.0, 67.0, 44.0, 26.0, 14.0, 17.0, 11.0, 5.0, 8.0, 6.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.07720947265625, -0.07486915588378906, -0.07252883911132812, -0.07018852233886719, -0.06784820556640625, -0.06550788879394531, -0.06316757202148438, -0.06082725524902344, -0.0584869384765625, -0.05614662170410156, -0.053806304931640625, -0.05146598815917969, -0.04912567138671875, -0.04678535461425781, -0.044445037841796875, -0.04210472106933594, -0.039764404296875, -0.03742408752441406, -0.035083770751953125, -0.03274345397949219, -0.03040313720703125, -0.028062820434570312, -0.025722503662109375, -0.023382186889648438, -0.0210418701171875, -0.018701553344726562, -0.016361236572265625, -0.014020919799804688, -0.01168060302734375, -0.009340286254882812, -0.006999969482421875, -0.0046596527099609375, -0.0023193359375, 2.09808349609375e-05, 0.002361297607421875, 0.0047016143798828125, 0.00704193115234375, 0.009382247924804688, 0.011722564697265625, 0.014062881469726562, 0.0164031982421875, 0.018743515014648438, 0.021083831787109375, 0.023424148559570312, 0.02576446533203125, 0.028104782104492188, 0.030445098876953125, 0.03278541564941406, 0.035125732421875, 0.03746604919433594, 0.039806365966796875, 0.04214668273925781, 0.04448699951171875, 0.04682731628417969, 0.049167633056640625, 0.05150794982910156, 0.0538482666015625, 0.05618858337402344, 0.058528900146484375, 0.06086921691894531, 0.06320953369140625, 0.06554985046386719, 0.06789016723632812, 0.07023048400878906, 0.07257080078125]}, "gradients/decoder.bert.encoder.layer.9.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 5.0, 5.0, 11.0, 13.0, 14.0, 16.0, 19.0, 27.0, 37.0, 35.0, 48.0, 56.0, 44.0, 69.0, 68.0, 66.0, 56.0, 72.0, 48.0, 54.0, 43.0, 32.0, 36.0, 27.0, 19.0, 13.0, 16.0, 8.0, 7.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0203094482421875, -0.01946711540222168, -0.01862478256225586, -0.01778244972229004, -0.01694011688232422, -0.0160977840423584, -0.015255451202392578, -0.014413118362426758, -0.013570785522460938, -0.012728452682495117, -0.011886119842529297, -0.011043787002563477, -0.010201454162597656, -0.009359121322631836, -0.008516788482666016, -0.007674455642700195, -0.006832122802734375, -0.005989789962768555, -0.005147457122802734, -0.004305124282836914, -0.0034627914428710938, -0.0026204586029052734, -0.0017781257629394531, -0.0009357929229736328, -9.34600830078125e-05, 0.0007488727569580078, 0.0015912055969238281, 0.0024335384368896484, 0.0032758712768554688, 0.004118204116821289, 0.004960536956787109, 0.00580286979675293, 0.00664520263671875, 0.00748753547668457, 0.00832986831665039, 0.009172201156616211, 0.010014533996582031, 0.010856866836547852, 0.011699199676513672, 0.012541532516479492, 0.013383865356445312, 0.014226198196411133, 0.015068531036376953, 0.015910863876342773, 0.016753196716308594, 0.017595529556274414, 0.018437862396240234, 0.019280195236206055, 0.020122528076171875, 0.020964860916137695, 0.021807193756103516, 0.022649526596069336, 0.023491859436035156, 0.024334192276000977, 0.025176525115966797, 0.026018857955932617, 0.026861190795898438, 0.027703523635864258, 0.028545856475830078, 0.0293881893157959, 0.03023052215576172, 0.03107285499572754, 0.03191518783569336, 0.03275752067565918, 0.033599853515625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 1.0, 5.0, 11.0, 11.0, 12.0, 8.0, 15.0, 22.0, 28.0, 33.0, 56.0, 39.0, 61.0, 69.0, 66.0, 63.0, 68.0, 65.0, 77.0, 54.0, 38.0, 41.0, 22.0, 27.0, 25.0, 14.0, 15.0, 11.0, 5.0, 10.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.1463704109191895, -5.979775905609131, -5.813181400299072, -5.646586894989014, -5.479991912841797, -5.313397407531738, -5.14680290222168, -4.980208396911621, -4.8136138916015625, -4.647019386291504, -4.480424880981445, -4.313830375671387, -4.147235870361328, -3.9806411266326904, -3.8140463829040527, -3.647451877593994, -3.4808573722839355, -3.314262866973877, -3.1476683616638184, -2.9810736179351807, -2.814479112625122, -2.6478846073150635, -2.481289863586426, -2.314695358276367, -2.1481008529663086, -1.98150634765625, -1.8149117231369019, -1.6483170986175537, -1.4817225933074951, -1.3151280879974365, -1.1485334634780884, -0.9819388389587402, -0.8153438568115234, -0.6487492918968201, -0.4821547269821167, -0.31556016206741333, -0.14896559715270996, 0.017628967761993408, 0.18422353267669678, 0.3508181571960449, 0.5174126625061035, 0.6840072274208069, 0.8506017923355103, 1.0171964168548584, 1.183790922164917, 1.3503854274749756, 1.5169800519943237, 1.6835746765136719, 1.8501691818237305, 2.016763687133789, 2.1833581924438477, 2.3499529361724854, 2.516547441482544, 2.6831419467926025, 2.8497366905212402, 3.016331195831299, 3.1829257011413574, 3.349520206451416, 3.5161147117614746, 3.6827094554901123, 3.849303960800171, 4.015898704528809, 4.182493209838867, 4.349087715148926, 4.515682220458984]}, "gradients/decoder.bert.encoder.layer.9.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 6.0, 6.0, 9.0, 5.0, 9.0, 18.0, 8.0, 17.0, 13.0, 24.0, 20.0, 32.0, 28.0, 33.0, 31.0, 41.0, 43.0, 40.0, 51.0, 34.0, 46.0, 38.0, 42.0, 37.0, 35.0, 39.0, 45.0, 24.0, 30.0, 22.0, 32.0, 18.0, 26.0, 16.0, 18.0, 14.0, 11.0, 8.0, 14.0, 3.0, 4.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.7307229042053223, -2.6451244354248047, -2.559526205062866, -2.4739277362823486, -2.38832950592041, -2.3027310371398926, -2.217132568359375, -2.1315343379974365, -2.045936107635498, -1.96033775806427, -1.874739408493042, -1.7891409397125244, -1.703542709350586, -1.6179442405700684, -1.5323458909988403, -1.4467475414276123, -1.3611490726470947, -1.2755507230758667, -1.1899523735046387, -1.104353904724121, -1.0187556743621826, -0.9331572651863098, -0.847558856010437, -0.761960506439209, -0.676362156867981, -0.5907638072967529, -0.5051654577255249, -0.4195670485496521, -0.3339686989784241, -0.24837034940719604, -0.16277194023132324, -0.07717359066009521, 0.008424520492553711, 0.09402288496494293, 0.17962124943733215, 0.26521962881088257, 0.3508179783821106, 0.4364163279533386, 0.5220147371292114, 0.6076130867004395, 0.6932114362716675, 0.7788097858428955, 0.8644081354141235, 0.9500065445899963, 1.0356049537658691, 1.1212031841278076, 1.2068016529083252, 1.2924000024795532, 1.3779983520507812, 1.4635967016220093, 1.5491950511932373, 1.6347935199737549, 1.7203917503356934, 1.805990219116211, 1.891588568687439, 1.977186918258667, 2.0627851486206055, 2.148383617401123, 2.2339818477630615, 2.319580316543579, 2.4051785469055176, 2.490777015686035, 2.5763754844665527, 2.661973714828491, 2.747572183609009]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 7.0, 7.0, 19.0, 19.0, 34.0, 44.0, 71.0, 104.0, 194.0, 271.0, 435.0, 726.0, 1282.0, 2249.0, 4417.0, 8200.0, 16104.0, 31684.0, 62185.0, 114471.0, 181745.0, 217199.0, 177109.0, 109108.0, 58651.0, 29738.0, 15167.0, 7912.0, 4044.0, 2314.0, 1181.0, 726.0, 403.0, 249.0, 160.0, 103.0, 72.0, 50.0, 39.0, 19.0, 15.0, 8.0, 9.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.0390625, -3.921844482421875, -3.80462646484375, -3.687408447265625, -3.5701904296875, -3.452972412109375, -3.33575439453125, -3.218536376953125, -3.101318359375, -2.984100341796875, -2.86688232421875, -2.749664306640625, -2.6324462890625, -2.515228271484375, -2.39801025390625, -2.280792236328125, -2.16357421875, -2.046356201171875, -1.92913818359375, -1.811920166015625, -1.6947021484375, -1.577484130859375, -1.46026611328125, -1.343048095703125, -1.225830078125, -1.108612060546875, -0.99139404296875, -0.874176025390625, -0.7569580078125, -0.639739990234375, -0.52252197265625, -0.405303955078125, -0.2880859375, -0.170867919921875, -0.05364990234375, 0.063568115234375, 0.1807861328125, 0.298004150390625, 0.41522216796875, 0.532440185546875, 0.649658203125, 0.766876220703125, 0.88409423828125, 1.001312255859375, 1.1185302734375, 1.235748291015625, 1.35296630859375, 1.470184326171875, 1.58740234375, 1.704620361328125, 1.82183837890625, 1.939056396484375, 2.0562744140625, 2.173492431640625, 2.29071044921875, 2.407928466796875, 2.525146484375, 2.642364501953125, 2.75958251953125, 2.876800537109375, 2.9940185546875, 3.111236572265625, 3.22845458984375, 3.345672607421875, 3.462890625]}, "gradients/decoder.bert.encoder.layer.9.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 4.0, 13.0, 11.0, 17.0, 11.0, 20.0, 30.0, 21.0, 35.0, 33.0, 43.0, 50.0, 36.0, 53.0, 43.0, 60.0, 57.0, 51.0, 37.0, 41.0, 37.0, 46.0, 37.0, 30.0, 28.0, 19.0, 21.0, 11.0, 24.0, 19.0, 13.0, 15.0, 8.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.681640625, -3.570770263671875, -3.45989990234375, -3.349029541015625, -3.2381591796875, -3.127288818359375, -3.01641845703125, -2.905548095703125, -2.794677734375, -2.683807373046875, -2.57293701171875, -2.462066650390625, -2.3511962890625, -2.240325927734375, -2.12945556640625, -2.018585205078125, -1.90771484375, -1.796844482421875, -1.68597412109375, -1.575103759765625, -1.4642333984375, -1.353363037109375, -1.24249267578125, -1.131622314453125, -1.020751953125, -0.909881591796875, -0.79901123046875, -0.688140869140625, -0.5772705078125, -0.466400146484375, -0.35552978515625, -0.244659423828125, -0.1337890625, -0.022918701171875, 0.08795166015625, 0.198822021484375, 0.3096923828125, 0.420562744140625, 0.53143310546875, 0.642303466796875, 0.753173828125, 0.864044189453125, 0.97491455078125, 1.085784912109375, 1.1966552734375, 1.307525634765625, 1.41839599609375, 1.529266357421875, 1.64013671875, 1.751007080078125, 1.86187744140625, 1.972747802734375, 2.0836181640625, 2.194488525390625, 2.30535888671875, 2.416229248046875, 2.527099609375, 2.637969970703125, 2.74884033203125, 2.859710693359375, 2.9705810546875, 3.081451416015625, 3.19232177734375, 3.303192138671875, 3.4140625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 6.0, 12.0, 16.0, 29.0, 38.0, 76.0, 104.0, 159.0, 250.0, 421.0, 712.0, 1137.0, 2021.0, 3218.0, 5919.0, 10013.0, 17492.0, 30475.0, 51204.0, 84044.0, 126125.0, 163229.0, 170057.0, 139323.0, 96736.0, 60314.0, 36081.0, 20816.0, 12020.0, 6773.0, 3811.0, 2276.0, 1414.0, 885.0, 544.0, 280.0, 189.0, 123.0, 66.0, 47.0, 41.0, 19.0, 20.0, 8.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1953125, -3.095947265625, -2.99658203125, -2.897216796875, -2.7978515625, -2.698486328125, -2.59912109375, -2.499755859375, -2.400390625, -2.301025390625, -2.20166015625, -2.102294921875, -2.0029296875, -1.903564453125, -1.80419921875, -1.704833984375, -1.60546875, -1.506103515625, -1.40673828125, -1.307373046875, -1.2080078125, -1.108642578125, -1.00927734375, -0.909912109375, -0.810546875, -0.711181640625, -0.61181640625, -0.512451171875, -0.4130859375, -0.313720703125, -0.21435546875, -0.114990234375, -0.015625, 0.083740234375, 0.18310546875, 0.282470703125, 0.3818359375, 0.481201171875, 0.58056640625, 0.679931640625, 0.779296875, 0.878662109375, 0.97802734375, 1.077392578125, 1.1767578125, 1.276123046875, 1.37548828125, 1.474853515625, 1.57421875, 1.673583984375, 1.77294921875, 1.872314453125, 1.9716796875, 2.071044921875, 2.17041015625, 2.269775390625, 2.369140625, 2.468505859375, 2.56787109375, 2.667236328125, 2.7666015625, 2.865966796875, 2.96533203125, 3.064697265625, 3.1640625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 8.0, 4.0, 9.0, 11.0, 13.0, 19.0, 14.0, 24.0, 20.0, 33.0, 20.0, 37.0, 40.0, 34.0, 42.0, 48.0, 30.0, 34.0, 41.0, 49.0, 39.0, 38.0, 45.0, 39.0, 41.0, 31.0, 36.0, 36.0, 27.0, 18.0, 20.0, 18.0, 20.0, 11.0, 9.0, 7.0, 5.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7509765625, -1.6909942626953125, -1.631011962890625, -1.5710296630859375, -1.51104736328125, -1.4510650634765625, -1.391082763671875, -1.3311004638671875, -1.2711181640625, -1.2111358642578125, -1.151153564453125, -1.0911712646484375, -1.03118896484375, -0.9712066650390625, -0.911224365234375, -0.8512420654296875, -0.791259765625, -0.7312774658203125, -0.671295166015625, -0.6113128662109375, -0.55133056640625, -0.4913482666015625, -0.431365966796875, -0.3713836669921875, -0.3114013671875, -0.2514190673828125, -0.191436767578125, -0.1314544677734375, -0.07147216796875, -0.0114898681640625, 0.048492431640625, 0.1084747314453125, 0.16845703125, 0.2284393310546875, 0.288421630859375, 0.3484039306640625, 0.40838623046875, 0.4683685302734375, 0.528350830078125, 0.5883331298828125, 0.6483154296875, 0.7082977294921875, 0.768280029296875, 0.8282623291015625, 0.88824462890625, 0.9482269287109375, 1.008209228515625, 1.0681915283203125, 1.128173828125, 1.1881561279296875, 1.248138427734375, 1.3081207275390625, 1.36810302734375, 1.4280853271484375, 1.488067626953125, 1.5480499267578125, 1.6080322265625, 1.6680145263671875, 1.727996826171875, 1.7879791259765625, 1.84796142578125, 1.9079437255859375, 1.967926025390625, 2.0279083251953125, 2.087890625]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 5.0, 3.0, 6.0, 10.0, 11.0, 12.0, 15.0, 27.0, 30.0, 55.0, 78.0, 116.0, 123.0, 208.0, 302.0, 424.0, 621.0, 893.0, 1353.0, 2096.0, 3348.0, 5138.0, 8420.0, 13876.0, 23362.0, 40053.0, 67391.0, 107171.0, 153446.0, 177414.0, 156672.0, 110757.0, 70055.0, 42026.0, 24500.0, 14306.0, 8897.0, 5276.0, 3501.0, 2092.0, 1427.0, 974.0, 647.0, 389.0, 325.0, 205.0, 155.0, 89.0, 81.0, 55.0, 37.0, 24.0, 24.0, 12.0, 14.0, 4.0, 8.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.4140625, -1.37060546875, -1.3271484375, -1.28369140625, -1.240234375, -1.19677734375, -1.1533203125, -1.10986328125, -1.06640625, -1.02294921875, -0.9794921875, -0.93603515625, -0.892578125, -0.84912109375, -0.8056640625, -0.76220703125, -0.71875, -0.67529296875, -0.6318359375, -0.58837890625, -0.544921875, -0.50146484375, -0.4580078125, -0.41455078125, -0.37109375, -0.32763671875, -0.2841796875, -0.24072265625, -0.197265625, -0.15380859375, -0.1103515625, -0.06689453125, -0.0234375, 0.02001953125, 0.0634765625, 0.10693359375, 0.150390625, 0.19384765625, 0.2373046875, 0.28076171875, 0.32421875, 0.36767578125, 0.4111328125, 0.45458984375, 0.498046875, 0.54150390625, 0.5849609375, 0.62841796875, 0.671875, 0.71533203125, 0.7587890625, 0.80224609375, 0.845703125, 0.88916015625, 0.9326171875, 0.97607421875, 1.01953125, 1.06298828125, 1.1064453125, 1.14990234375, 1.193359375, 1.23681640625, 1.2802734375, 1.32373046875, 1.3671875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 21.0, 10.0, 27.0, 32.0, 53.0, 61.0, 86.0, 110.0, 94.0, 94.0, 91.0, 66.0, 71.0, 43.0, 28.0, 28.0, 28.0, 8.0, 10.0, 8.0, 0.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021326541900634766, -0.00020658224821090698, -0.0001998990774154663, -0.00019321590662002563, -0.00018653273582458496, -0.0001798495650291443, -0.0001731663942337036, -0.00016648322343826294, -0.00015980005264282227, -0.0001531168818473816, -0.00014643371105194092, -0.00013975054025650024, -0.00013306736946105957, -0.0001263841986656189, -0.00011970102787017822, -0.00011301785707473755, -0.00010633468627929688, -9.96515154838562e-05, -9.296834468841553e-05, -8.628517389297485e-05, -7.960200309753418e-05, -7.29188323020935e-05, -6.623566150665283e-05, -5.955249071121216e-05, -5.2869319915771484e-05, -4.618614912033081e-05, -3.950297832489014e-05, -3.281980752944946e-05, -2.613663673400879e-05, -1.9453465938568115e-05, -1.2770295143127441e-05, -6.087124347686768e-06, 5.960464477539062e-07, 7.27921724319458e-06, 1.3962388038635254e-05, 2.0645558834075928e-05, 2.73287296295166e-05, 3.4011900424957275e-05, 4.069507122039795e-05, 4.737824201583862e-05, 5.40614128112793e-05, 6.074458360671997e-05, 6.742775440216064e-05, 7.411092519760132e-05, 8.079409599304199e-05, 8.747726678848267e-05, 9.416043758392334e-05, 0.00010084360837936401, 0.00010752677917480469, 0.00011420994997024536, 0.00012089312076568604, 0.0001275762915611267, 0.00013425946235656738, 0.00014094263315200806, 0.00014762580394744873, 0.0001543089747428894, 0.00016099214553833008, 0.00016767531633377075, 0.00017435848712921143, 0.0001810416579246521, 0.00018772482872009277, 0.00019440799951553345, 0.00020109117031097412, 0.0002077743411064148, 0.00021445751190185547]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 9.0, 8.0, 22.0, 24.0, 29.0, 45.0, 64.0, 103.0, 158.0, 188.0, 296.0, 412.0, 617.0, 972.0, 1381.0, 2081.0, 3310.0, 5331.0, 8801.0, 14298.0, 24063.0, 39653.0, 64733.0, 100756.0, 140575.0, 163931.0, 154229.0, 117938.0, 78416.0, 48909.0, 29901.0, 18027.0, 10692.0, 6720.0, 4166.0, 2661.0, 1727.0, 1032.0, 700.0, 504.0, 312.0, 228.0, 145.0, 109.0, 74.0, 55.0, 42.0, 33.0, 23.0, 17.0, 12.0, 9.0, 5.0, 5.0, 2.0, 0.0, 1.0], "bins": [-1.2744140625, -1.2354583740234375, -1.196502685546875, -1.1575469970703125, -1.11859130859375, -1.0796356201171875, -1.040679931640625, -1.0017242431640625, -0.9627685546875, -0.9238128662109375, -0.884857177734375, -0.8459014892578125, -0.80694580078125, -0.7679901123046875, -0.729034423828125, -0.6900787353515625, -0.651123046875, -0.6121673583984375, -0.573211669921875, -0.5342559814453125, -0.49530029296875, -0.4563446044921875, -0.417388916015625, -0.3784332275390625, -0.3394775390625, -0.3005218505859375, -0.261566162109375, -0.2226104736328125, -0.18365478515625, -0.1446990966796875, -0.105743408203125, -0.0667877197265625, -0.02783203125, 0.0111236572265625, 0.050079345703125, 0.0890350341796875, 0.12799072265625, 0.1669464111328125, 0.205902099609375, 0.2448577880859375, 0.2838134765625, 0.3227691650390625, 0.361724853515625, 0.4006805419921875, 0.43963623046875, 0.4785919189453125, 0.517547607421875, 0.5565032958984375, 0.595458984375, 0.6344146728515625, 0.673370361328125, 0.7123260498046875, 0.75128173828125, 0.7902374267578125, 0.829193115234375, 0.8681488037109375, 0.9071044921875, 0.9460601806640625, 0.985015869140625, 1.0239715576171875, 1.06292724609375, 1.1018829345703125, 1.140838623046875, 1.1797943115234375, 1.21875]}, "gradients/decoder.bert.encoder.layer.9.attention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 6.0, 7.0, 5.0, 2.0, 10.0, 10.0, 12.0, 21.0, 21.0, 21.0, 25.0, 35.0, 39.0, 40.0, 51.0, 46.0, 51.0, 48.0, 63.0, 67.0, 58.0, 51.0, 44.0, 53.0, 42.0, 31.0, 25.0, 18.0, 22.0, 16.0, 13.0, 9.0, 4.0, 13.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.325439453125, -0.31262969970703125, -0.2998199462890625, -0.28701019287109375, -0.274200439453125, -0.26139068603515625, -0.2485809326171875, -0.23577117919921875, -0.22296142578125, -0.21015167236328125, -0.1973419189453125, -0.18453216552734375, -0.171722412109375, -0.15891265869140625, -0.1461029052734375, -0.13329315185546875, -0.1204833984375, -0.10767364501953125, -0.0948638916015625, -0.08205413818359375, -0.069244384765625, -0.05643463134765625, -0.0436248779296875, -0.03081512451171875, -0.01800537109375, -0.00519561767578125, 0.0076141357421875, 0.02042388916015625, 0.033233642578125, 0.04604339599609375, 0.0588531494140625, 0.07166290283203125, 0.08447265625, 0.09728240966796875, 0.1100921630859375, 0.12290191650390625, 0.135711669921875, 0.14852142333984375, 0.1613311767578125, 0.17414093017578125, 0.18695068359375, 0.19976043701171875, 0.2125701904296875, 0.22537994384765625, 0.238189697265625, 0.25099945068359375, 0.2638092041015625, 0.27661895751953125, 0.2894287109375, 0.30223846435546875, 0.3150482177734375, 0.32785797119140625, 0.340667724609375, 0.35347747802734375, 0.3662872314453125, 0.37909698486328125, 0.39190673828125, 0.40471649169921875, 0.4175262451171875, 0.43033599853515625, 0.443145751953125, 0.45595550537109375, 0.4687652587890625, 0.48157501220703125, 0.494384765625]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 7.0, 3.0, 5.0, 9.0, 9.0, 11.0, 14.0, 15.0, 33.0, 26.0, 39.0, 53.0, 43.0, 56.0, 61.0, 55.0, 59.0, 64.0, 74.0, 50.0, 45.0, 36.0, 32.0, 36.0, 38.0, 18.0, 15.0, 25.0, 11.0, 15.0, 7.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-5.586828708648682, -5.435853481292725, -5.284878253936768, -5.133902549743652, -4.982927322387695, -4.831952095031738, -4.680976867675781, -4.530001640319824, -4.379026412963867, -4.22805118560791, -4.077075958251953, -3.926100492477417, -3.775125026702881, -3.624149799346924, -3.473174571990967, -3.3221993446350098, -3.1712236404418945, -3.0202484130859375, -2.8692729473114014, -2.7182977199554443, -2.567322254180908, -2.416347026824951, -2.265371799468994, -2.114396572113037, -1.963421106338501, -1.8124457597732544, -1.6614704132080078, -1.5104951858520508, -1.3595198392868042, -1.2085444927215576, -1.0575692653656006, -0.906593918800354, -0.7556185722351074, -0.6046432256698608, -0.45366793870925903, -0.30269262194633484, -0.15171730518341064, -0.0007419586181640625, 0.15023332834243774, 0.30120861530303955, 0.45218396186828613, 0.6031593084335327, 0.7541345953941345, 0.9051098823547363, 1.056085228919983, 1.2070605754852295, 1.3580358028411865, 1.509011149406433, 1.6599864959716797, 1.8109618425369263, 1.9619371891021729, 2.11291241645813, 2.263887882232666, 2.414863109588623, 2.56583833694458, 2.716813564300537, 2.8677890300750732, 3.0187642574310303, 3.1697397232055664, 3.3207149505615234, 3.4716901779174805, 3.6226656436920166, 3.7736408710479736, 3.9246163368225098, 4.075591564178467]}, "gradients/decoder.bert.encoder.layer.8.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 8.0, 10.0, 15.0, 12.0, 13.0, 17.0, 19.0, 22.0, 32.0, 34.0, 35.0, 35.0, 52.0, 35.0, 34.0, 45.0, 43.0, 45.0, 36.0, 43.0, 41.0, 30.0, 30.0, 33.0, 39.0, 29.0, 33.0, 22.0, 22.0, 23.0, 26.0, 18.0, 14.0, 6.0, 11.0, 6.0, 10.0, 6.0, 2.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.960685968399048, -2.8687639236450195, -2.776841878890991, -2.684919834136963, -2.5929975509643555, -2.501075506210327, -2.409153461456299, -2.3172314167022705, -2.225309371948242, -2.133387327194214, -2.0414652824401855, -1.9495431184768677, -1.8576210737228394, -1.765699028968811, -1.6737768650054932, -1.5818548202514648, -1.4899327754974365, -1.3980107307434082, -1.3060886859893799, -1.214166522026062, -1.1222444772720337, -1.0303224325180054, -0.9384003281593323, -0.8464782238006592, -0.7545561790466309, -0.6626341342926025, -0.5707120299339294, -0.47878995537757874, -0.386867880821228, -0.2949458062648773, -0.2030237317085266, -0.11110162734985352, -0.019179821014404297, 0.07274225354194641, 0.16466432809829712, 0.2565864026546478, 0.34850847721099854, 0.44043055176734924, 0.5323526263237, 0.624274730682373, 0.7161967754364014, 0.8081188201904297, 0.9000409245491028, 0.9919630289077759, 1.0838850736618042, 1.1758071184158325, 1.2677292823791504, 1.3596513271331787, 1.451573371887207, 1.5434954166412354, 1.6354174613952637, 1.7273396253585815, 1.8192616701126099, 1.9111837148666382, 2.003105878829956, 2.0950279235839844, 2.1869499683380127, 2.278872013092041, 2.3707940578460693, 2.4627161026000977, 2.554638385772705, 2.6465604305267334, 2.7384824752807617, 2.83040452003479, 2.9223265647888184]}, "gradients/decoder.bert.encoder.layer.8.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 10.0, 6.0, 9.0, 14.0, 22.0, 38.0, 44.0, 69.0, 97.0, 142.0, 208.0, 306.0, 490.0, 741.0, 1203.0, 1893.0, 3125.0, 5119.0, 8279.0, 14171.0, 23935.0, 42807.0, 78571.0, 152940.0, 323707.0, 696550.0, 1088655.0, 887205.0, 440143.0, 199750.0, 98811.0, 52476.0, 29462.0, 16860.0, 10058.0, 6035.0, 3876.0, 2351.0, 1452.0, 946.0, 609.0, 385.0, 251.0, 160.0, 114.0, 73.0, 49.0, 22.0, 15.0, 15.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.4296875, -4.2982177734375, -4.166748046875, -4.0352783203125, -3.90380859375, -3.7723388671875, -3.640869140625, -3.5093994140625, -3.3779296875, -3.2464599609375, -3.114990234375, -2.9835205078125, -2.85205078125, -2.7205810546875, -2.589111328125, -2.4576416015625, -2.326171875, -2.1947021484375, -2.063232421875, -1.9317626953125, -1.80029296875, -1.6688232421875, -1.537353515625, -1.4058837890625, -1.2744140625, -1.1429443359375, -1.011474609375, -0.8800048828125, -0.74853515625, -0.6170654296875, -0.485595703125, -0.3541259765625, -0.22265625, -0.0911865234375, 0.040283203125, 0.1717529296875, 0.30322265625, 0.4346923828125, 0.566162109375, 0.6976318359375, 0.8291015625, 0.9605712890625, 1.092041015625, 1.2235107421875, 1.35498046875, 1.4864501953125, 1.617919921875, 1.7493896484375, 1.880859375, 2.0123291015625, 2.143798828125, 2.2752685546875, 2.40673828125, 2.5382080078125, 2.669677734375, 2.8011474609375, 2.9326171875, 3.0640869140625, 3.195556640625, 3.3270263671875, 3.45849609375, 3.5899658203125, 3.721435546875, 3.8529052734375, 3.984375]}, "gradients/decoder.bert.encoder.layer.8.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 8.0, 9.0, 9.0, 14.0, 12.0, 15.0, 23.0, 15.0, 28.0, 25.0, 48.0, 27.0, 32.0, 36.0, 47.0, 38.0, 52.0, 43.0, 42.0, 40.0, 51.0, 32.0, 38.0, 44.0, 31.0, 26.0, 37.0, 27.0, 27.0, 27.0, 12.0, 17.0, 22.0, 10.0, 7.0, 6.0, 9.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.185333251953125, -2.10894775390625, -2.032562255859375, -1.9561767578125, -1.879791259765625, -1.80340576171875, -1.727020263671875, -1.650634765625, -1.574249267578125, -1.49786376953125, -1.421478271484375, -1.3450927734375, -1.268707275390625, -1.19232177734375, -1.115936279296875, -1.03955078125, -0.963165283203125, -0.88677978515625, -0.810394287109375, -0.7340087890625, -0.657623291015625, -0.58123779296875, -0.504852294921875, -0.428466796875, -0.352081298828125, -0.27569580078125, -0.199310302734375, -0.1229248046875, -0.046539306640625, 0.02984619140625, 0.106231689453125, 0.1826171875, 0.259002685546875, 0.33538818359375, 0.411773681640625, 0.4881591796875, 0.564544677734375, 0.64093017578125, 0.717315673828125, 0.793701171875, 0.870086669921875, 0.94647216796875, 1.022857666015625, 1.0992431640625, 1.175628662109375, 1.25201416015625, 1.328399658203125, 1.40478515625, 1.481170654296875, 1.55755615234375, 1.633941650390625, 1.7103271484375, 1.786712646484375, 1.86309814453125, 1.939483642578125, 2.015869140625, 2.092254638671875, 2.16864013671875, 2.245025634765625, 2.3214111328125, 2.397796630859375, 2.47418212890625, 2.550567626953125, 2.626953125]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 4.0, 3.0, 10.0, 25.0, 34.0, 36.0, 63.0, 93.0, 155.0, 237.0, 371.0, 576.0, 795.0, 1299.0, 2028.0, 3164.0, 4988.0, 7911.0, 12729.0, 20817.0, 35333.0, 60147.0, 104826.0, 187538.0, 339999.0, 606556.0, 892892.0, 802159.0, 485024.0, 269005.0, 147852.0, 83786.0, 48648.0, 28753.0, 17371.0, 10812.0, 6585.0, 4104.0, 2647.0, 1739.0, 1148.0, 688.0, 501.0, 277.0, 190.0, 151.0, 70.0, 44.0, 39.0, 26.0, 16.0, 9.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.908203125, -3.777069091796875, -3.64593505859375, -3.514801025390625, -3.3836669921875, -3.252532958984375, -3.12139892578125, -2.990264892578125, -2.859130859375, -2.727996826171875, -2.59686279296875, -2.465728759765625, -2.3345947265625, -2.203460693359375, -2.07232666015625, -1.941192626953125, -1.81005859375, -1.678924560546875, -1.54779052734375, -1.416656494140625, -1.2855224609375, -1.154388427734375, -1.02325439453125, -0.892120361328125, -0.760986328125, -0.629852294921875, -0.49871826171875, -0.367584228515625, -0.2364501953125, -0.105316162109375, 0.02581787109375, 0.156951904296875, 0.2880859375, 0.419219970703125, 0.55035400390625, 0.681488037109375, 0.8126220703125, 0.943756103515625, 1.07489013671875, 1.206024169921875, 1.337158203125, 1.468292236328125, 1.59942626953125, 1.730560302734375, 1.8616943359375, 1.992828369140625, 2.12396240234375, 2.255096435546875, 2.38623046875, 2.517364501953125, 2.64849853515625, 2.779632568359375, 2.9107666015625, 3.041900634765625, 3.17303466796875, 3.304168701171875, 3.435302734375, 3.566436767578125, 3.69757080078125, 3.828704833984375, 3.9598388671875, 4.090972900390625, 4.22210693359375, 4.353240966796875, 4.484375]}, "gradients/decoder.bert.encoder.layer.8.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 12.0, 10.0, 11.0, 17.0, 34.0, 32.0, 39.0, 59.0, 64.0, 72.0, 119.0, 146.0, 170.0, 202.0, 216.0, 224.0, 261.0, 296.0, 314.0, 276.0, 238.0, 211.0, 191.0, 169.0, 118.0, 114.0, 96.0, 81.0, 62.0, 40.0, 43.0, 32.0, 24.0, 17.0, 12.0, 17.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3173828125, -1.2734222412109375, -1.229461669921875, -1.1855010986328125, -1.14154052734375, -1.0975799560546875, -1.053619384765625, -1.0096588134765625, -0.9656982421875, -0.9217376708984375, -0.877777099609375, -0.8338165283203125, -0.78985595703125, -0.7458953857421875, -0.701934814453125, -0.6579742431640625, -0.614013671875, -0.5700531005859375, -0.526092529296875, -0.4821319580078125, -0.43817138671875, -0.3942108154296875, -0.350250244140625, -0.3062896728515625, -0.2623291015625, -0.2183685302734375, -0.174407958984375, -0.1304473876953125, -0.08648681640625, -0.0425262451171875, 0.001434326171875, 0.0453948974609375, 0.08935546875, 0.1333160400390625, 0.177276611328125, 0.2212371826171875, 0.26519775390625, 0.3091583251953125, 0.353118896484375, 0.3970794677734375, 0.4410400390625, 0.4850006103515625, 0.528961181640625, 0.5729217529296875, 0.61688232421875, 0.6608428955078125, 0.704803466796875, 0.7487640380859375, 0.792724609375, 0.8366851806640625, 0.880645751953125, 0.9246063232421875, 0.96856689453125, 1.0125274658203125, 1.056488037109375, 1.1004486083984375, 1.1444091796875, 1.1883697509765625, 1.232330322265625, 1.2762908935546875, 1.32025146484375, 1.3642120361328125, 1.408172607421875, 1.4521331787109375, 1.49609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 2.0, 8.0, 6.0, 13.0, 11.0, 8.0, 16.0, 20.0, 29.0, 43.0, 31.0, 57.0, 60.0, 65.0, 62.0, 61.0, 74.0, 58.0, 61.0, 54.0, 36.0, 40.0, 42.0, 25.0, 26.0, 14.0, 22.0, 14.0, 5.0, 4.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.3671746253967285, -6.194919109344482, -6.0226640701293945, -5.850408554077148, -5.678153038024902, -5.505897521972656, -5.333642482757568, -5.161386966705322, -4.989131927490234, -4.816876411437988, -4.6446213722229, -4.472365856170654, -4.300110340118408, -4.12785530090332, -3.955599784851074, -3.783344268798828, -3.611088752746582, -3.438833475112915, -3.266577959060669, -3.094322681427002, -2.922067165374756, -2.749811887741089, -2.577556610107422, -2.405301094055176, -2.233045816421509, -2.060790538787842, -1.8885350227355957, -1.7162797451019287, -1.5440243482589722, -1.3717689514160156, -1.1995136737823486, -1.027258276939392, -0.8550024032592773, -0.6827470064163208, -0.510491669178009, -0.33823633193969727, -0.16598093509674072, 0.00627446174621582, 0.1785297393798828, 0.35078513622283936, 0.5230405330657959, 0.6952959299087524, 0.8675512671470642, 1.039806604385376, 1.2120620012283325, 1.384317398071289, 1.556572675704956, 1.7288280725479126, 1.9010834693908691, 2.073338747024536, 2.2455942630767822, 2.417849540710449, 2.5901050567626953, 2.7623603343963623, 2.9346156120300293, 3.1068711280822754, 3.2791264057159424, 3.4513816833496094, 3.6236371994018555, 3.7958924770355225, 3.9681477546691895, 4.1404032707214355, 4.312658309936523, 4.4849138259887695, 4.657169342041016]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 10.0, 8.0, 6.0, 7.0, 21.0, 16.0, 17.0, 29.0, 30.0, 31.0, 30.0, 36.0, 45.0, 38.0, 42.0, 50.0, 38.0, 40.0, 44.0, 41.0, 39.0, 49.0, 40.0, 40.0, 36.0, 31.0, 28.0, 26.0, 24.0, 21.0, 15.0, 8.0, 15.0, 13.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0973005294799805, -3.001399278640747, -2.9054980278015137, -2.8095967769622803, -2.713695526123047, -2.6177942752838135, -2.52189302444458, -2.4259917736053467, -2.3300905227661133, -2.23418927192688, -2.1382880210876465, -2.042386770248413, -1.9464855194091797, -1.8505842685699463, -1.754683017730713, -1.6587817668914795, -1.562880516052246, -1.4669792652130127, -1.3710780143737793, -1.275176763534546, -1.1792755126953125, -1.083374261856079, -0.9874730110168457, -0.8915717601776123, -0.7956705093383789, -0.6997692584991455, -0.6038680076599121, -0.5079667568206787, -0.4120655059814453, -0.3161642551422119, -0.22026300430297852, -0.12436175346374512, -0.028460264205932617, 0.06744098663330078, 0.16334223747253418, 0.2592434883117676, 0.355144739151001, 0.4510459899902344, 0.5469472408294678, 0.6428484916687012, 0.7387497425079346, 0.834650993347168, 0.9305522441864014, 1.0264534950256348, 1.1223547458648682, 1.2182559967041016, 1.314157247543335, 1.4100584983825684, 1.5059597492218018, 1.6018610000610352, 1.6977622509002686, 1.793663501739502, 1.8895647525787354, 1.9854660034179688, 2.081367254257202, 2.1772685050964355, 2.273169755935669, 2.3690710067749023, 2.4649722576141357, 2.560873508453369, 2.6567747592926025, 2.752676010131836, 2.8485772609710693, 2.9444785118103027, 3.040379762649536]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 3.0, 5.0, 0.0, 6.0, 12.0, 10.0, 28.0, 19.0, 44.0, 51.0, 58.0, 101.0, 166.0, 248.0, 319.0, 513.0, 681.0, 1042.0, 1502.0, 2376.0, 3736.0, 6187.0, 10142.0, 17913.0, 31341.0, 58191.0, 108712.0, 189956.0, 234196.0, 169738.0, 93703.0, 50399.0, 27576.0, 15303.0, 8989.0, 5470.0, 3387.0, 2103.0, 1471.0, 860.0, 648.0, 427.0, 264.0, 178.0, 147.0, 113.0, 62.0, 45.0, 43.0, 16.0, 22.0, 14.0, 9.0, 1.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.383056640625, -0.3712272644042969, -0.35939788818359375, -0.3475685119628906, -0.3357391357421875, -0.3239097595214844, -0.31208038330078125, -0.3002510070800781, -0.288421630859375, -0.2765922546386719, -0.26476287841796875, -0.2529335021972656, -0.2411041259765625, -0.22927474975585938, -0.21744537353515625, -0.20561599731445312, -0.19378662109375, -0.18195724487304688, -0.17012786865234375, -0.15829849243164062, -0.1464691162109375, -0.13463973999023438, -0.12281036376953125, -0.11098098754882812, -0.099151611328125, -0.08732223510742188, -0.07549285888671875, -0.06366348266601562, -0.0518341064453125, -0.040004730224609375, -0.02817535400390625, -0.016345977783203125, -0.0045166015625, 0.007312774658203125, 0.01914215087890625, 0.030971527099609375, 0.0428009033203125, 0.054630279541015625, 0.06645965576171875, 0.07828903198242188, 0.090118408203125, 0.10194778442382812, 0.11377716064453125, 0.12560653686523438, 0.1374359130859375, 0.14926528930664062, 0.16109466552734375, 0.17292404174804688, 0.18475341796875, 0.19658279418945312, 0.20841217041015625, 0.22024154663085938, 0.2320709228515625, 0.24390029907226562, 0.25572967529296875, 0.2675590515136719, 0.279388427734375, 0.2912178039550781, 0.30304718017578125, 0.3148765563964844, 0.3267059326171875, 0.3385353088378906, 0.35036468505859375, 0.3621940612792969, 0.3740234375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 7.0, 7.0, 5.0, 5.0, 13.0, 17.0, 24.0, 24.0, 30.0, 31.0, 29.0, 34.0, 36.0, 37.0, 48.0, 46.0, 52.0, 52.0, 54.0, 47.0, 47.0, 47.0, 38.0, 42.0, 41.0, 25.0, 29.0, 19.0, 20.0, 20.0, 9.0, 11.0, 14.0, 12.0, 9.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.78125, -3.666168212890625, -3.55108642578125, -3.436004638671875, -3.3209228515625, -3.205841064453125, -3.09075927734375, -2.975677490234375, -2.860595703125, -2.745513916015625, -2.63043212890625, -2.515350341796875, -2.4002685546875, -2.285186767578125, -2.17010498046875, -2.055023193359375, -1.93994140625, -1.824859619140625, -1.70977783203125, -1.594696044921875, -1.4796142578125, -1.364532470703125, -1.24945068359375, -1.134368896484375, -1.019287109375, -0.904205322265625, -0.78912353515625, -0.674041748046875, -0.5589599609375, -0.443878173828125, -0.32879638671875, -0.213714599609375, -0.0986328125, 0.016448974609375, 0.13153076171875, 0.246612548828125, 0.3616943359375, 0.476776123046875, 0.59185791015625, 0.706939697265625, 0.822021484375, 0.937103271484375, 1.05218505859375, 1.167266845703125, 1.2823486328125, 1.397430419921875, 1.51251220703125, 1.627593994140625, 1.74267578125, 1.857757568359375, 1.97283935546875, 2.087921142578125, 2.2030029296875, 2.318084716796875, 2.43316650390625, 2.548248291015625, 2.663330078125, 2.778411865234375, 2.89349365234375, 3.008575439453125, 3.1236572265625, 3.238739013671875, 3.35382080078125, 3.468902587890625, 3.583984375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 5.0, 5.0, 11.0, 15.0, 17.0, 24.0, 31.0, 41.0, 53.0, 85.0, 117.0, 180.0, 258.0, 384.0, 581.0, 934.0, 1598.0, 2730.0, 5122.0, 10645.0, 25685.0, 164433.0, 762077.0, 42401.0, 15297.0, 6955.0, 3488.0, 2029.0, 1155.0, 723.0, 462.0, 318.0, 189.0, 138.0, 98.0, 73.0, 47.0, 31.0, 29.0, 18.0, 24.0, 12.0, 7.0, 9.0, 6.0, 4.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.041015625, -1.006561279296875, -0.97210693359375, -0.937652587890625, -0.9031982421875, -0.868743896484375, -0.83428955078125, -0.799835205078125, -0.765380859375, -0.730926513671875, -0.69647216796875, -0.662017822265625, -0.6275634765625, -0.593109130859375, -0.55865478515625, -0.524200439453125, -0.48974609375, -0.455291748046875, -0.42083740234375, -0.386383056640625, -0.3519287109375, -0.317474365234375, -0.28302001953125, -0.248565673828125, -0.214111328125, -0.179656982421875, -0.14520263671875, -0.110748291015625, -0.0762939453125, -0.041839599609375, -0.00738525390625, 0.027069091796875, 0.0615234375, 0.095977783203125, 0.13043212890625, 0.164886474609375, 0.1993408203125, 0.233795166015625, 0.26824951171875, 0.302703857421875, 0.337158203125, 0.371612548828125, 0.40606689453125, 0.440521240234375, 0.4749755859375, 0.509429931640625, 0.54388427734375, 0.578338623046875, 0.61279296875, 0.647247314453125, 0.68170166015625, 0.716156005859375, 0.7506103515625, 0.785064697265625, 0.81951904296875, 0.853973388671875, 0.888427734375, 0.922882080078125, 0.95733642578125, 0.991790771484375, 1.0262451171875, 1.060699462890625, 1.09515380859375, 1.129608154296875, 1.1640625]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 2.0, 6.0, 8.0, 2.0, 8.0, 9.0, 10.0, 12.0, 24.0, 19.0, 22.0, 31.0, 41.0, 23.0, 27.0, 38.0, 30.0, 27.0, 45.0, 33.0, 32.0, 36.0, 41.0, 50.0, 44.0, 48.0, 39.0, 33.0, 33.0, 33.0, 22.0, 32.0, 22.0, 29.0, 9.0, 15.0, 6.0, 13.0, 7.0, 7.0, 6.0, 3.0, 4.0, 7.0, 6.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9130859375, -1.8503875732421875, -1.787689208984375, -1.7249908447265625, -1.66229248046875, -1.5995941162109375, -1.536895751953125, -1.4741973876953125, -1.4114990234375, -1.3488006591796875, -1.286102294921875, -1.2234039306640625, -1.16070556640625, -1.0980072021484375, -1.035308837890625, -0.9726104736328125, -0.909912109375, -0.8472137451171875, -0.784515380859375, -0.7218170166015625, -0.65911865234375, -0.5964202880859375, -0.533721923828125, -0.4710235595703125, -0.4083251953125, -0.3456268310546875, -0.282928466796875, -0.2202301025390625, -0.15753173828125, -0.0948333740234375, -0.032135009765625, 0.0305633544921875, 0.09326171875, 0.1559600830078125, 0.218658447265625, 0.2813568115234375, 0.34405517578125, 0.4067535400390625, 0.469451904296875, 0.5321502685546875, 0.5948486328125, 0.6575469970703125, 0.720245361328125, 0.7829437255859375, 0.84564208984375, 0.9083404541015625, 0.971038818359375, 1.0337371826171875, 1.096435546875, 1.1591339111328125, 1.221832275390625, 1.2845306396484375, 1.34722900390625, 1.4099273681640625, 1.472625732421875, 1.5353240966796875, 1.5980224609375, 1.6607208251953125, 1.723419189453125, 1.7861175537109375, 1.84881591796875, 1.9115142822265625, 1.974212646484375, 2.0369110107421875, 2.099609375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 10.0, 16.0, 20.0, 29.0, 38.0, 58.0, 84.0, 146.0, 215.0, 366.0, 482.0, 841.0, 1423.0, 2371.0, 4365.0, 8279.0, 16225.0, 38475.0, 876541.0, 57108.0, 19937.0, 9621.0, 4968.0, 2777.0, 1611.0, 912.0, 557.0, 330.0, 253.0, 161.0, 87.0, 75.0, 40.0, 33.0, 32.0, 16.0, 13.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199951171875, -0.19271469116210938, -0.18547821044921875, -0.17824172973632812, -0.1710052490234375, -0.16376876831054688, -0.15653228759765625, -0.14929580688476562, -0.142059326171875, -0.13482284545898438, -0.12758636474609375, -0.12034988403320312, -0.1131134033203125, -0.10587692260742188, -0.09864044189453125, -0.09140396118164062, -0.08416748046875, -0.07693099975585938, -0.06969451904296875, -0.062458038330078125, -0.0552215576171875, -0.047985076904296875, -0.04074859619140625, -0.033512115478515625, -0.026275634765625, -0.019039154052734375, -0.01180267333984375, -0.004566192626953125, 0.0026702880859375, 0.009906768798828125, 0.01714324951171875, 0.024379730224609375, 0.0316162109375, 0.038852691650390625, 0.04608917236328125, 0.053325653076171875, 0.0605621337890625, 0.06779861450195312, 0.07503509521484375, 0.08227157592773438, 0.089508056640625, 0.09674453735351562, 0.10398101806640625, 0.11121749877929688, 0.1184539794921875, 0.12569046020507812, 0.13292694091796875, 0.14016342163085938, 0.14739990234375, 0.15463638305664062, 0.16187286376953125, 0.16910934448242188, 0.1763458251953125, 0.18358230590820312, 0.19081878662109375, 0.19805526733398438, 0.205291748046875, 0.21252822875976562, 0.21976470947265625, 0.22700119018554688, 0.2342376708984375, 0.24147415161132812, 0.24871063232421875, 0.2559471130371094, 0.26318359375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 12.0, 9.0, 10.0, 19.0, 13.0, 19.0, 36.0, 34.0, 38.0, 35.0, 40.0, 31.0, 45.0, 46.0, 51.0, 49.0, 56.0, 59.0, 37.0, 55.0, 39.0, 43.0, 34.0, 27.0, 29.0, 33.0, 12.0, 20.0, 7.0, 14.0, 10.0, 11.0, 4.0, 6.0, 10.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8835067749023438e-05, -1.8231570720672607e-05, -1.7628073692321777e-05, -1.7024576663970947e-05, -1.6421079635620117e-05, -1.5817582607269287e-05, -1.5214085578918457e-05, -1.4610588550567627e-05, -1.4007091522216797e-05, -1.3403594493865967e-05, -1.2800097465515137e-05, -1.2196600437164307e-05, -1.1593103408813477e-05, -1.0989606380462646e-05, -1.0386109352111816e-05, -9.782612323760986e-06, -9.179115295410156e-06, -8.575618267059326e-06, -7.972121238708496e-06, -7.368624210357666e-06, -6.765127182006836e-06, -6.161630153656006e-06, -5.558133125305176e-06, -4.954636096954346e-06, -4.351139068603516e-06, -3.7476420402526855e-06, -3.1441450119018555e-06, -2.5406479835510254e-06, -1.9371509552001953e-06, -1.3336539268493652e-06, -7.301568984985352e-07, -1.2665987014770508e-07, 4.76837158203125e-07, 1.080334186553955e-06, 1.6838312149047852e-06, 2.2873282432556152e-06, 2.8908252716064453e-06, 3.4943222999572754e-06, 4.0978193283081055e-06, 4.7013163566589355e-06, 5.304813385009766e-06, 5.908310413360596e-06, 6.511807441711426e-06, 7.115304470062256e-06, 7.718801498413086e-06, 8.322298526763916e-06, 8.925795555114746e-06, 9.529292583465576e-06, 1.0132789611816406e-05, 1.0736286640167236e-05, 1.1339783668518066e-05, 1.1943280696868896e-05, 1.2546777725219727e-05, 1.3150274753570557e-05, 1.3753771781921387e-05, 1.4357268810272217e-05, 1.4960765838623047e-05, 1.5564262866973877e-05, 1.6167759895324707e-05, 1.6771256923675537e-05, 1.7374753952026367e-05, 1.7978250980377197e-05, 1.8581748008728027e-05, 1.9185245037078857e-05, 1.9788742065429688e-05]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 12.0, 16.0, 30.0, 20.0, 46.0, 81.0, 91.0, 160.0, 222.0, 346.0, 503.0, 819.0, 1128.0, 1753.0, 2684.0, 4151.0, 6730.0, 10759.0, 18055.0, 30129.0, 51155.0, 86398.0, 139216.0, 190676.0, 182795.0, 126339.0, 78200.0, 46224.0, 26911.0, 16057.0, 9469.0, 6184.0, 3876.0, 2484.0, 1553.0, 1111.0, 722.0, 469.0, 319.0, 222.0, 119.0, 110.0, 77.0, 41.0, 32.0, 18.0, 14.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.07171630859375, -0.06953620910644531, -0.06735610961914062, -0.06517601013183594, -0.06299591064453125, -0.06081581115722656, -0.058635711669921875, -0.05645561218261719, -0.0542755126953125, -0.05209541320800781, -0.049915313720703125, -0.04773521423339844, -0.04555511474609375, -0.04337501525878906, -0.041194915771484375, -0.03901481628417969, -0.036834716796875, -0.03465461730957031, -0.032474517822265625, -0.030294418334960938, -0.02811431884765625, -0.025934219360351562, -0.023754119873046875, -0.021574020385742188, -0.0193939208984375, -0.017213821411132812, -0.015033721923828125, -0.012853622436523438, -0.01067352294921875, -0.008493423461914062, -0.006313323974609375, -0.0041332244873046875, -0.001953125, 0.0002269744873046875, 0.002407073974609375, 0.0045871734619140625, 0.00676727294921875, 0.008947372436523438, 0.011127471923828125, 0.013307571411132812, 0.0154876708984375, 0.017667770385742188, 0.019847869873046875, 0.022027969360351562, 0.02420806884765625, 0.026388168334960938, 0.028568267822265625, 0.030748367309570312, 0.032928466796875, 0.03510856628417969, 0.037288665771484375, 0.03946876525878906, 0.04164886474609375, 0.04382896423339844, 0.046009063720703125, 0.04818916320800781, 0.0503692626953125, 0.05254936218261719, 0.054729461669921875, 0.05690956115722656, 0.05908966064453125, 0.06126976013183594, 0.06344985961914062, 0.06562995910644531, 0.06781005859375]}, "gradients/decoder.bert.encoder.layer.8.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 1.0, 9.0, 2.0, 6.0, 10.0, 11.0, 14.0, 13.0, 17.0, 30.0, 25.0, 25.0, 41.0, 56.0, 51.0, 52.0, 62.0, 75.0, 67.0, 68.0, 62.0, 48.0, 40.0, 36.0, 30.0, 29.0, 19.0, 21.0, 21.0, 9.0, 12.0, 12.0, 5.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017608642578125, -0.016898632049560547, -0.016188621520996094, -0.01547861099243164, -0.014768600463867188, -0.014058589935302734, -0.013348579406738281, -0.012638568878173828, -0.011928558349609375, -0.011218547821044922, -0.010508537292480469, -0.009798526763916016, -0.009088516235351562, -0.00837850570678711, -0.007668495178222656, -0.006958484649658203, -0.00624847412109375, -0.005538463592529297, -0.004828453063964844, -0.004118442535400391, -0.0034084320068359375, -0.0026984214782714844, -0.0019884109497070312, -0.0012784004211425781, -0.000568389892578125, 0.00014162063598632812, 0.0008516311645507812, 0.0015616416931152344, 0.0022716522216796875, 0.0029816627502441406, 0.0036916732788085938, 0.004401683807373047, 0.0051116943359375, 0.005821704864501953, 0.006531715393066406, 0.007241725921630859, 0.007951736450195312, 0.008661746978759766, 0.009371757507324219, 0.010081768035888672, 0.010791778564453125, 0.011501789093017578, 0.012211799621582031, 0.012921810150146484, 0.013631820678710938, 0.01434183120727539, 0.015051841735839844, 0.015761852264404297, 0.01647186279296875, 0.017181873321533203, 0.017891883850097656, 0.01860189437866211, 0.019311904907226562, 0.020021915435791016, 0.02073192596435547, 0.021441936492919922, 0.022151947021484375, 0.022861957550048828, 0.02357196807861328, 0.024281978607177734, 0.024991989135742188, 0.02570199966430664, 0.026412010192871094, 0.027122020721435547, 0.02783203125]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 12.0, 11.0, 8.0, 16.0, 15.0, 33.0, 41.0, 33.0, 53.0, 58.0, 67.0, 60.0, 58.0, 74.0, 65.0, 63.0, 47.0, 39.0, 35.0, 44.0, 29.0, 30.0, 13.0, 16.0, 19.0, 8.0, 2.0, 8.0, 6.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.321294784545898, -6.150835990905762, -5.980377197265625, -5.809918403625488, -5.639459609985352, -5.469001293182373, -5.298542499542236, -5.1280837059021, -4.957624912261963, -4.787166118621826, -4.6167073249816895, -4.446248531341553, -4.275790214538574, -4.1053314208984375, -3.934872627258301, -3.764413833618164, -3.5939550399780273, -3.4234962463378906, -3.253037452697754, -3.0825788974761963, -2.9121201038360596, -2.741661310195923, -2.5712027549743652, -2.4007439613342285, -2.230285167694092, -2.059826374053955, -1.889367699623108, -1.7189090251922607, -1.548450231552124, -1.3779914379119873, -1.2075327634811401, -1.037074089050293, -0.8666157722473145, -0.6961570382118225, -0.5256983041763306, -0.3552395701408386, -0.18478083610534668, -0.014322102069854736, 0.1561366319656372, 0.3265953063964844, 0.4970541000366211, 0.667512834072113, 0.837971568107605, 1.0084302425384521, 1.1788890361785889, 1.3493478298187256, 1.5198065042495728, 1.69026517868042, 1.8607239723205566, 2.0311827659606934, 2.20164155960083, 2.3721001148223877, 2.5425589084625244, 2.713017702102661, 2.8834762573242188, 3.0539350509643555, 3.224393844604492, 3.394852638244629, 3.5653114318847656, 3.7357699871063232, 3.90622878074646, 4.076687335968018, 4.247146129608154, 4.417604923248291, 4.588063716888428]}, "gradients/decoder.bert.encoder.layer.8.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 11.0, 8.0, 5.0, 8.0, 20.0, 16.0, 17.0, 28.0, 29.0, 32.0, 34.0, 32.0, 48.0, 32.0, 44.0, 52.0, 39.0, 40.0, 41.0, 42.0, 40.0, 47.0, 41.0, 38.0, 39.0, 30.0, 28.0, 29.0, 23.0, 21.0, 14.0, 8.0, 15.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.0558407306671143, -2.9604074954986572, -2.8649744987487793, -2.7695412635803223, -2.6741080284118652, -2.578674793243408, -2.483241558074951, -2.3878085613250732, -2.292375326156616, -2.196942090988159, -2.1015090942382812, -2.006075859069824, -1.9106426239013672, -1.8152093887329102, -1.7197762727737427, -1.6243431568145752, -1.5289099216461182, -1.4334766864776611, -1.3380435705184937, -1.2426104545593262, -1.1471772193908691, -1.051743984222412, -0.9563108682632446, -0.8608776926994324, -0.7654445171356201, -0.6700113415718079, -0.5745781660079956, -0.47914499044418335, -0.3837118148803711, -0.28827863931655884, -0.19284546375274658, -0.09741228818893433, -0.0019788742065429688, 0.09345430135726929, 0.18888747692108154, 0.2843206524848938, 0.37975382804870605, 0.4751870036125183, 0.5706201791763306, 0.6660533547401428, 0.7614865303039551, 0.8569197058677673, 0.9523528814315796, 1.047785997390747, 1.143219232559204, 1.2386524677276611, 1.3340855836868286, 1.429518699645996, 1.5249519348144531, 1.6203851699829102, 1.7158182859420776, 1.8112514019012451, 1.9066846370697021, 2.002117872238159, 2.097550868988037, 2.192984104156494, 2.288417339324951, 2.383850574493408, 2.4792838096618652, 2.574716806411743, 2.6701500415802, 2.7655832767486572, 2.861016273498535, 2.956449508666992, 3.051882743835449]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 8.0, 13.0, 16.0, 20.0, 37.0, 48.0, 72.0, 86.0, 154.0, 178.0, 289.0, 527.0, 835.0, 1339.0, 2328.0, 4207.0, 7653.0, 14730.0, 28558.0, 56046.0, 104543.0, 173992.0, 219182.0, 186689.0, 116109.0, 62589.0, 31951.0, 16491.0, 8690.0, 4640.0, 2527.0, 1509.0, 871.0, 560.0, 337.0, 231.0, 143.0, 106.0, 60.0, 52.0, 35.0, 23.0, 26.0, 17.0, 9.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.90625, -3.77423095703125, -3.6422119140625, -3.51019287109375, -3.378173828125, -3.24615478515625, -3.1141357421875, -2.98211669921875, -2.85009765625, -2.71807861328125, -2.5860595703125, -2.45404052734375, -2.322021484375, -2.19000244140625, -2.0579833984375, -1.92596435546875, -1.7939453125, -1.66192626953125, -1.5299072265625, -1.39788818359375, -1.265869140625, -1.13385009765625, -1.0018310546875, -0.86981201171875, -0.73779296875, -0.60577392578125, -0.4737548828125, -0.34173583984375, -0.209716796875, -0.07769775390625, 0.0543212890625, 0.18634033203125, 0.318359375, 0.45037841796875, 0.5823974609375, 0.71441650390625, 0.846435546875, 0.97845458984375, 1.1104736328125, 1.24249267578125, 1.37451171875, 1.50653076171875, 1.6385498046875, 1.77056884765625, 1.902587890625, 2.03460693359375, 2.1666259765625, 2.29864501953125, 2.4306640625, 2.56268310546875, 2.6947021484375, 2.82672119140625, 2.958740234375, 3.09075927734375, 3.2227783203125, 3.35479736328125, 3.48681640625, 3.61883544921875, 3.7508544921875, 3.88287353515625, 4.014892578125, 4.14691162109375, 4.2789306640625, 4.41094970703125, 4.54296875]}, "gradients/decoder.bert.encoder.layer.8.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 1.0, 4.0, 13.0, 13.0, 7.0, 6.0, 18.0, 15.0, 17.0, 34.0, 32.0, 28.0, 35.0, 44.0, 59.0, 55.0, 49.0, 50.0, 47.0, 44.0, 49.0, 34.0, 37.0, 52.0, 36.0, 36.0, 40.0, 33.0, 23.0, 27.0, 14.0, 11.0, 14.0, 6.0, 4.0, 5.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.702850341796875, -3.58538818359375, -3.467926025390625, -3.3504638671875, -3.233001708984375, -3.11553955078125, -2.998077392578125, -2.880615234375, -2.763153076171875, -2.64569091796875, -2.528228759765625, -2.4107666015625, -2.293304443359375, -2.17584228515625, -2.058380126953125, -1.94091796875, -1.823455810546875, -1.70599365234375, -1.588531494140625, -1.4710693359375, -1.353607177734375, -1.23614501953125, -1.118682861328125, -1.001220703125, -0.883758544921875, -0.76629638671875, -0.648834228515625, -0.5313720703125, -0.413909912109375, -0.29644775390625, -0.178985595703125, -0.0615234375, 0.055938720703125, 0.17340087890625, 0.290863037109375, 0.4083251953125, 0.525787353515625, 0.64324951171875, 0.760711669921875, 0.878173828125, 0.995635986328125, 1.11309814453125, 1.230560302734375, 1.3480224609375, 1.465484619140625, 1.58294677734375, 1.700408935546875, 1.81787109375, 1.935333251953125, 2.05279541015625, 2.170257568359375, 2.2877197265625, 2.405181884765625, 2.52264404296875, 2.640106201171875, 2.757568359375, 2.875030517578125, 2.99249267578125, 3.109954833984375, 3.2274169921875, 3.344879150390625, 3.46234130859375, 3.579803466796875, 3.697265625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 14.0, 25.0, 23.0, 34.0, 76.0, 101.0, 162.0, 250.0, 361.0, 585.0, 939.0, 1433.0, 2433.0, 3960.0, 6556.0, 10943.0, 18044.0, 29653.0, 48056.0, 75590.0, 110488.0, 144316.0, 157455.0, 140941.0, 106863.0, 71906.0, 45539.0, 28269.0, 16991.0, 10344.0, 6186.0, 3871.0, 2290.0, 1451.0, 871.0, 564.0, 336.0, 210.0, 134.0, 107.0, 72.0, 42.0, 22.0, 14.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.84906005859375, -2.7489013671875, -2.64874267578125, -2.548583984375, -2.44842529296875, -2.3482666015625, -2.24810791015625, -2.14794921875, -2.04779052734375, -1.9476318359375, -1.84747314453125, -1.747314453125, -1.64715576171875, -1.5469970703125, -1.44683837890625, -1.3466796875, -1.24652099609375, -1.1463623046875, -1.04620361328125, -0.946044921875, -0.84588623046875, -0.7457275390625, -0.64556884765625, -0.54541015625, -0.44525146484375, -0.3450927734375, -0.24493408203125, -0.144775390625, -0.04461669921875, 0.0555419921875, 0.15570068359375, 0.255859375, 0.35601806640625, 0.4561767578125, 0.55633544921875, 0.656494140625, 0.75665283203125, 0.8568115234375, 0.95697021484375, 1.05712890625, 1.15728759765625, 1.2574462890625, 1.35760498046875, 1.457763671875, 1.55792236328125, 1.6580810546875, 1.75823974609375, 1.8583984375, 1.95855712890625, 2.0587158203125, 2.15887451171875, 2.259033203125, 2.35919189453125, 2.4593505859375, 2.55950927734375, 2.65966796875, 2.75982666015625, 2.8599853515625, 2.96014404296875, 3.060302734375, 3.16046142578125, 3.2606201171875, 3.36077880859375, 3.4609375]}, "gradients/decoder.bert.encoder.layer.8.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 8.0, 12.0, 9.0, 14.0, 6.0, 21.0, 24.0, 23.0, 24.0, 28.0, 35.0, 32.0, 37.0, 23.0, 39.0, 38.0, 46.0, 35.0, 28.0, 44.0, 42.0, 37.0, 42.0, 35.0, 33.0, 28.0, 32.0, 29.0, 24.0, 21.0, 28.0, 22.0, 18.0, 12.0, 14.0, 9.0, 15.0, 7.0, 5.0, 5.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.982421875, -1.9237823486328125, -1.865142822265625, -1.8065032958984375, -1.74786376953125, -1.6892242431640625, -1.630584716796875, -1.5719451904296875, -1.5133056640625, -1.4546661376953125, -1.396026611328125, -1.3373870849609375, -1.27874755859375, -1.2201080322265625, -1.161468505859375, -1.1028289794921875, -1.044189453125, -0.9855499267578125, -0.926910400390625, -0.8682708740234375, -0.80963134765625, -0.7509918212890625, -0.692352294921875, -0.6337127685546875, -0.5750732421875, -0.5164337158203125, -0.457794189453125, -0.3991546630859375, -0.34051513671875, -0.2818756103515625, -0.223236083984375, -0.1645965576171875, -0.10595703125, -0.0473175048828125, 0.011322021484375, 0.0699615478515625, 0.12860107421875, 0.1872406005859375, 0.245880126953125, 0.3045196533203125, 0.3631591796875, 0.4217987060546875, 0.480438232421875, 0.5390777587890625, 0.59771728515625, 0.6563568115234375, 0.714996337890625, 0.7736358642578125, 0.832275390625, 0.8909149169921875, 0.949554443359375, 1.0081939697265625, 1.06683349609375, 1.1254730224609375, 1.184112548828125, 1.2427520751953125, 1.3013916015625, 1.3600311279296875, 1.418670654296875, 1.4773101806640625, 1.53594970703125, 1.5945892333984375, 1.653228759765625, 1.7118682861328125, 1.7705078125]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 2.0, 13.0, 17.0, 37.0, 48.0, 71.0, 82.0, 150.0, 212.0, 344.0, 514.0, 786.0, 1230.0, 1936.0, 3103.0, 5057.0, 8283.0, 13801.0, 23330.0, 38852.0, 65703.0, 106052.0, 153532.0, 180513.0, 159449.0, 111562.0, 69333.0, 42114.0, 24414.0, 14730.0, 8815.0, 5416.0, 3258.0, 2064.0, 1306.0, 828.0, 551.0, 345.0, 233.0, 170.0, 83.0, 68.0, 46.0, 35.0, 24.0, 16.0, 9.0, 4.0, 8.0, 2.0, 4.0], "bins": [-1.87890625, -1.8275146484375, -1.776123046875, -1.7247314453125, -1.67333984375, -1.6219482421875, -1.570556640625, -1.5191650390625, -1.4677734375, -1.4163818359375, -1.364990234375, -1.3135986328125, -1.26220703125, -1.2108154296875, -1.159423828125, -1.1080322265625, -1.056640625, -1.0052490234375, -0.953857421875, -0.9024658203125, -0.85107421875, -0.7996826171875, -0.748291015625, -0.6968994140625, -0.6455078125, -0.5941162109375, -0.542724609375, -0.4913330078125, -0.43994140625, -0.3885498046875, -0.337158203125, -0.2857666015625, -0.234375, -0.1829833984375, -0.131591796875, -0.0802001953125, -0.02880859375, 0.0225830078125, 0.073974609375, 0.1253662109375, 0.1767578125, 0.2281494140625, 0.279541015625, 0.3309326171875, 0.38232421875, 0.4337158203125, 0.485107421875, 0.5364990234375, 0.587890625, 0.6392822265625, 0.690673828125, 0.7420654296875, 0.79345703125, 0.8448486328125, 0.896240234375, 0.9476318359375, 0.9990234375, 1.0504150390625, 1.101806640625, 1.1531982421875, 1.20458984375, 1.2559814453125, 1.307373046875, 1.3587646484375, 1.41015625]}, "gradients/decoder.bert.encoder.layer.8.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 13.0, 13.0, 23.0, 21.0, 25.0, 49.0, 53.0, 66.0, 81.0, 77.0, 94.0, 91.0, 68.0, 71.0, 58.0, 51.0, 33.0, 23.0, 22.0, 14.0, 6.0, 11.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.00028824806213378906, -0.0002803876996040344, -0.0002725273370742798, -0.00026466697454452515, -0.0002568066120147705, -0.00024894624948501587, -0.00024108588695526123, -0.0002332255244255066, -0.00022536516189575195, -0.00021750479936599731, -0.00020964443683624268, -0.00020178407430648804, -0.0001939237117767334, -0.00018606334924697876, -0.00017820298671722412, -0.00017034262418746948, -0.00016248226165771484, -0.0001546218991279602, -0.00014676153659820557, -0.00013890117406845093, -0.0001310408115386963, -0.00012318044900894165, -0.00011532008647918701, -0.00010745972394943237, -9.959936141967773e-05, -9.17389988899231e-05, -8.387863636016846e-05, -7.601827383041382e-05, -6.815791130065918e-05, -6.029754877090454e-05, -5.24371862411499e-05, -4.4576823711395264e-05, -3.6716461181640625e-05, -2.8856098651885986e-05, -2.0995736122131348e-05, -1.3135373592376709e-05, -5.27501106262207e-06, 2.5853514671325684e-06, 1.0445713996887207e-05, 1.8306076526641846e-05, 2.6166439056396484e-05, 3.402680158615112e-05, 4.188716411590576e-05, 4.97475266456604e-05, 5.760788917541504e-05, 6.546825170516968e-05, 7.332861423492432e-05, 8.118897676467896e-05, 8.90493392944336e-05, 9.690970182418823e-05, 0.00010477006435394287, 0.00011263042688369751, 0.00012049078941345215, 0.0001283511519432068, 0.00013621151447296143, 0.00014407187700271606, 0.0001519322395324707, 0.00015979260206222534, 0.00016765296459197998, 0.00017551332712173462, 0.00018337368965148926, 0.0001912340521812439, 0.00019909441471099854, 0.00020695477724075317, 0.0002148151397705078]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 9.0, 12.0, 10.0, 25.0, 26.0, 50.0, 72.0, 92.0, 158.0, 245.0, 344.0, 517.0, 856.0, 1313.0, 2100.0, 3571.0, 6000.0, 10058.0, 17150.0, 29353.0, 49617.0, 80332.0, 121792.0, 159255.0, 168453.0, 141575.0, 99604.0, 63163.0, 37815.0, 22357.0, 12908.0, 7695.0, 4513.0, 2849.0, 1781.0, 1039.0, 623.0, 409.0, 260.0, 170.0, 129.0, 87.0, 69.0, 36.0, 23.0, 12.0, 17.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.494140625, -1.4477996826171875, -1.401458740234375, -1.3551177978515625, -1.30877685546875, -1.2624359130859375, -1.216094970703125, -1.1697540283203125, -1.1234130859375, -1.0770721435546875, -1.030731201171875, -0.9843902587890625, -0.93804931640625, -0.8917083740234375, -0.845367431640625, -0.7990264892578125, -0.752685546875, -0.7063446044921875, -0.660003662109375, -0.6136627197265625, -0.56732177734375, -0.5209808349609375, -0.474639892578125, -0.4282989501953125, -0.3819580078125, -0.3356170654296875, -0.289276123046875, -0.2429351806640625, -0.19659423828125, -0.1502532958984375, -0.103912353515625, -0.0575714111328125, -0.01123046875, 0.0351104736328125, 0.081451416015625, 0.1277923583984375, 0.17413330078125, 0.2204742431640625, 0.266815185546875, 0.3131561279296875, 0.3594970703125, 0.4058380126953125, 0.452178955078125, 0.4985198974609375, 0.54486083984375, 0.5912017822265625, 0.637542724609375, 0.6838836669921875, 0.730224609375, 0.7765655517578125, 0.822906494140625, 0.8692474365234375, 0.91558837890625, 0.9619293212890625, 1.008270263671875, 1.0546112060546875, 1.1009521484375, 1.1472930908203125, 1.193634033203125, 1.2399749755859375, 1.28631591796875, 1.3326568603515625, 1.378997802734375, 1.4253387451171875, 1.4716796875]}, "gradients/decoder.bert.encoder.layer.8.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 10.0, 4.0, 8.0, 14.0, 16.0, 16.0, 12.0, 23.0, 23.0, 29.0, 33.0, 40.0, 37.0, 45.0, 36.0, 56.0, 60.0, 54.0, 46.0, 35.0, 38.0, 50.0, 40.0, 33.0, 24.0, 43.0, 22.0, 20.0, 22.0, 12.0, 18.0, 16.0, 16.0, 4.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.41796875, -0.40587615966796875, -0.3937835693359375, -0.38169097900390625, -0.369598388671875, -0.35750579833984375, -0.3454132080078125, -0.33332061767578125, -0.32122802734375, -0.30913543701171875, -0.2970428466796875, -0.28495025634765625, -0.272857666015625, -0.26076507568359375, -0.2486724853515625, -0.23657989501953125, -0.2244873046875, -0.21239471435546875, -0.2003021240234375, -0.18820953369140625, -0.176116943359375, -0.16402435302734375, -0.1519317626953125, -0.13983917236328125, -0.12774658203125, -0.11565399169921875, -0.1035614013671875, -0.09146881103515625, -0.079376220703125, -0.06728363037109375, -0.0551910400390625, -0.04309844970703125, -0.031005859375, -0.01891326904296875, -0.0068206787109375, 0.00527191162109375, 0.017364501953125, 0.02945709228515625, 0.0415496826171875, 0.05364227294921875, 0.06573486328125, 0.07782745361328125, 0.0899200439453125, 0.10201263427734375, 0.114105224609375, 0.12619781494140625, 0.1382904052734375, 0.15038299560546875, 0.1624755859375, 0.17456817626953125, 0.1866607666015625, 0.19875335693359375, 0.210845947265625, 0.22293853759765625, 0.2350311279296875, 0.24712371826171875, 0.25921630859375, 0.27130889892578125, 0.2834014892578125, 0.29549407958984375, 0.307586669921875, 0.31967926025390625, 0.3317718505859375, 0.34386444091796875, 0.35595703125]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 4.0, 11.0, 15.0, 18.0, 11.0, 30.0, 24.0, 35.0, 47.0, 44.0, 41.0, 48.0, 60.0, 67.0, 61.0, 60.0, 55.0, 52.0, 45.0, 38.0, 39.0, 28.0, 32.0, 20.0, 21.0, 17.0, 9.0, 8.0, 10.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-5.835660457611084, -5.679697513580322, -5.523734092712402, -5.367771148681641, -5.211808204650879, -5.055845260620117, -4.899881839752197, -4.7439188957214355, -4.587955951690674, -4.431993007659912, -4.276029586791992, -4.1200666427612305, -3.9641036987304688, -3.808140516281128, -3.652177333831787, -3.4962143898010254, -3.3402512073516846, -3.1842880249023438, -3.028325080871582, -2.872361898422241, -2.7163989543914795, -2.5604357719421387, -2.404472827911377, -2.248509645462036, -2.0925464630126953, -1.936583399772644, -1.7806203365325928, -1.624657154083252, -1.4686942100524902, -1.3127310276031494, -1.1567679643630981, -1.0008049011230469, -0.8448419570922852, -0.6888788938522339, -0.5329158306121826, -0.3769527077674866, -0.2209896445274353, -0.06502658128738403, 0.09093654155731201, 0.24689960479736328, 0.40286266803741455, 0.5588257312774658, 0.7147887945175171, 0.8707519173622131, 1.0267150402069092, 1.182677984237671, 1.3386411666870117, 1.494604229927063, 1.6505672931671143, 1.8065303564071655, 1.9624934196472168, 2.1184566020965576, 2.2744195461273193, 2.43038272857666, 2.586345672607422, 2.7423088550567627, 2.8982720375061035, 3.0542352199554443, 3.210198163986206, 3.366161346435547, 3.5221242904663086, 3.6780874729156494, 3.8340506553649902, 3.990013599395752, 4.145976543426514]}, "gradients/decoder.bert.encoder.layer.7.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 13.0, 7.0, 17.0, 11.0, 24.0, 21.0, 22.0, 36.0, 24.0, 29.0, 50.0, 37.0, 34.0, 49.0, 38.0, 39.0, 40.0, 50.0, 49.0, 49.0, 40.0, 33.0, 42.0, 41.0, 29.0, 30.0, 32.0, 15.0, 15.0, 17.0, 16.0, 12.0, 5.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.170156955718994, -3.067443609237671, -2.9647302627563477, -2.8620171546936035, -2.7593038082122803, -2.656590461730957, -2.553877353668213, -2.4511640071868896, -2.3484506607055664, -2.245737314224243, -2.14302396774292, -2.040310859680176, -1.9375975131988525, -1.8348841667175293, -1.7321709394454956, -1.629457712173462, -1.5267443656921387, -1.4240310192108154, -1.3213177919387817, -1.218604564666748, -1.1158912181854248, -1.0131778717041016, -0.9104646444320679, -0.8077513575553894, -0.7050380706787109, -0.6023247838020325, -0.499611496925354, -0.39689821004867554, -0.29418492317199707, -0.1914716362953186, -0.08875834941864014, 0.01395493745803833, 0.1166682243347168, 0.21938151121139526, 0.32209479808807373, 0.4248080849647522, 0.5275213718414307, 0.6302346587181091, 0.7329479455947876, 0.8356612324714661, 0.9383745193481445, 1.0410878658294678, 1.1438010931015015, 1.2465143203735352, 1.3492276668548584, 1.4519410133361816, 1.5546542406082153, 1.657367467880249, 1.7600808143615723, 1.8627941608428955, 1.9655073881149292, 2.068220615386963, 2.170933961868286, 2.2736473083496094, 2.3763604164123535, 2.4790737628936768, 2.581787109375, 2.6845004558563232, 2.7872138023376465, 2.8899269104003906, 2.992640256881714, 3.095353603363037, 3.1980667114257812, 3.3007800579071045, 3.4034934043884277]}, "gradients/decoder.bert.encoder.layer.7.output.dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 16.0, 16.0, 43.0, 44.0, 86.0, 111.0, 202.0, 286.0, 484.0, 756.0, 1274.0, 2215.0, 3810.0, 6365.0, 11388.0, 21134.0, 39471.0, 78288.0, 164794.0, 378402.0, 875783.0, 1241154.0, 755101.0, 318865.0, 142245.0, 70221.0, 36453.0, 19397.0, 10816.0, 6202.0, 3603.0, 2109.0, 1197.0, 746.0, 477.0, 229.0, 180.0, 100.0, 66.0, 58.0, 26.0, 17.0, 12.0, 2.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-5.765625, -5.602783203125, -5.43994140625, -5.277099609375, -5.1142578125, -4.951416015625, -4.78857421875, -4.625732421875, -4.462890625, -4.300048828125, -4.13720703125, -3.974365234375, -3.8115234375, -3.648681640625, -3.48583984375, -3.322998046875, -3.16015625, -2.997314453125, -2.83447265625, -2.671630859375, -2.5087890625, -2.345947265625, -2.18310546875, -2.020263671875, -1.857421875, -1.694580078125, -1.53173828125, -1.368896484375, -1.2060546875, -1.043212890625, -0.88037109375, -0.717529296875, -0.5546875, -0.391845703125, -0.22900390625, -0.066162109375, 0.0966796875, 0.259521484375, 0.42236328125, 0.585205078125, 0.748046875, 0.910888671875, 1.07373046875, 1.236572265625, 1.3994140625, 1.562255859375, 1.72509765625, 1.887939453125, 2.05078125, 2.213623046875, 2.37646484375, 2.539306640625, 2.7021484375, 2.864990234375, 3.02783203125, 3.190673828125, 3.353515625, 3.516357421875, 3.67919921875, 3.842041015625, 4.0048828125, 4.167724609375, 4.33056640625, 4.493408203125, 4.65625]}, "gradients/decoder.bert.encoder.layer.7.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 8.0, 8.0, 11.0, 16.0, 13.0, 23.0, 19.0, 21.0, 43.0, 42.0, 39.0, 45.0, 37.0, 31.0, 38.0, 37.0, 38.0, 49.0, 46.0, 32.0, 37.0, 45.0, 32.0, 38.0, 30.0, 25.0, 38.0, 28.0, 15.0, 17.0, 16.0, 11.0, 15.0, 14.0, 6.0, 4.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.353515625, -2.2755126953125, -2.197509765625, -2.1195068359375, -2.04150390625, -1.9635009765625, -1.885498046875, -1.8074951171875, -1.7294921875, -1.6514892578125, -1.573486328125, -1.4954833984375, -1.41748046875, -1.3394775390625, -1.261474609375, -1.1834716796875, -1.10546875, -1.0274658203125, -0.949462890625, -0.8714599609375, -0.79345703125, -0.7154541015625, -0.637451171875, -0.5594482421875, -0.4814453125, -0.4034423828125, -0.325439453125, -0.2474365234375, -0.16943359375, -0.0914306640625, -0.013427734375, 0.0645751953125, 0.142578125, 0.2205810546875, 0.298583984375, 0.3765869140625, 0.45458984375, 0.5325927734375, 0.610595703125, 0.6885986328125, 0.7666015625, 0.8446044921875, 0.922607421875, 1.0006103515625, 1.07861328125, 1.1566162109375, 1.234619140625, 1.3126220703125, 1.390625, 1.4686279296875, 1.546630859375, 1.6246337890625, 1.70263671875, 1.7806396484375, 1.858642578125, 1.9366455078125, 2.0146484375, 2.0926513671875, 2.170654296875, 2.2486572265625, 2.32666015625, 2.4046630859375, 2.482666015625, 2.5606689453125, 2.638671875]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 9.0, 11.0, 19.0, 24.0, 27.0, 61.0, 79.0, 141.0, 181.0, 297.0, 431.0, 762.0, 1120.0, 1889.0, 3063.0, 5076.0, 8818.0, 15040.0, 26468.0, 47707.0, 88342.0, 168847.0, 331070.0, 645560.0, 1021185.0, 858423.0, 463513.0, 235836.0, 122099.0, 64387.0, 35416.0, 19837.0, 11300.0, 6691.0, 3947.0, 2438.0, 1568.0, 896.0, 584.0, 389.0, 236.0, 178.0, 90.0, 76.0, 44.0, 38.0, 17.0, 16.0, 11.0, 10.0, 7.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-5.375, -5.21087646484375, -5.0467529296875, -4.88262939453125, -4.718505859375, -4.55438232421875, -4.3902587890625, -4.22613525390625, -4.06201171875, -3.89788818359375, -3.7337646484375, -3.56964111328125, -3.405517578125, -3.24139404296875, -3.0772705078125, -2.91314697265625, -2.7490234375, -2.58489990234375, -2.4207763671875, -2.25665283203125, -2.092529296875, -1.92840576171875, -1.7642822265625, -1.60015869140625, -1.43603515625, -1.27191162109375, -1.1077880859375, -0.94366455078125, -0.779541015625, -0.61541748046875, -0.4512939453125, -0.28717041015625, -0.123046875, 0.04107666015625, 0.2052001953125, 0.36932373046875, 0.533447265625, 0.69757080078125, 0.8616943359375, 1.02581787109375, 1.18994140625, 1.35406494140625, 1.5181884765625, 1.68231201171875, 1.846435546875, 2.01055908203125, 2.1746826171875, 2.33880615234375, 2.5029296875, 2.66705322265625, 2.8311767578125, 2.99530029296875, 3.159423828125, 3.32354736328125, 3.4876708984375, 3.65179443359375, 3.81591796875, 3.98004150390625, 4.1441650390625, 4.30828857421875, 4.472412109375, 4.63653564453125, 4.8006591796875, 4.96478271484375, 5.12890625]}, "gradients/decoder.bert.encoder.layer.7.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 4.0, 6.0, 9.0, 7.0, 11.0, 12.0, 11.0, 14.0, 25.0, 35.0, 44.0, 46.0, 61.0, 73.0, 96.0, 118.0, 129.0, 160.0, 175.0, 181.0, 206.0, 219.0, 256.0, 248.0, 267.0, 224.0, 211.0, 183.0, 162.0, 124.0, 129.0, 100.0, 86.0, 75.0, 83.0, 54.0, 46.0, 29.0, 28.0, 28.0, 27.0, 8.0, 21.0, 11.0, 8.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.345703125, -1.3045654296875, -1.263427734375, -1.2222900390625, -1.18115234375, -1.1400146484375, -1.098876953125, -1.0577392578125, -1.0166015625, -0.9754638671875, -0.934326171875, -0.8931884765625, -0.85205078125, -0.8109130859375, -0.769775390625, -0.7286376953125, -0.6875, -0.6463623046875, -0.605224609375, -0.5640869140625, -0.52294921875, -0.4818115234375, -0.440673828125, -0.3995361328125, -0.3583984375, -0.3172607421875, -0.276123046875, -0.2349853515625, -0.19384765625, -0.1527099609375, -0.111572265625, -0.0704345703125, -0.029296875, 0.0118408203125, 0.052978515625, 0.0941162109375, 0.13525390625, 0.1763916015625, 0.217529296875, 0.2586669921875, 0.2998046875, 0.3409423828125, 0.382080078125, 0.4232177734375, 0.46435546875, 0.5054931640625, 0.546630859375, 0.5877685546875, 0.62890625, 0.6700439453125, 0.711181640625, 0.7523193359375, 0.79345703125, 0.8345947265625, 0.875732421875, 0.9168701171875, 0.9580078125, 0.9991455078125, 1.040283203125, 1.0814208984375, 1.12255859375, 1.1636962890625, 1.204833984375, 1.2459716796875, 1.287109375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 5.0, 5.0, 9.0, 10.0, 10.0, 12.0, 14.0, 23.0, 25.0, 36.0, 36.0, 59.0, 61.0, 66.0, 52.0, 50.0, 71.0, 61.0, 48.0, 59.0, 49.0, 38.0, 34.0, 31.0, 25.0, 26.0, 20.0, 14.0, 7.0, 11.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.294163227081299, -6.114944934844971, -5.935727119445801, -5.756508827209473, -5.5772905349731445, -5.398072242736816, -5.218853950500488, -5.039636135101318, -4.86041784286499, -4.681199550628662, -4.501981735229492, -4.322763442993164, -4.143545150756836, -3.964326858520508, -3.785108804702759, -3.6058907508850098, -3.4266724586486816, -3.2474541664123535, -3.0682361125946045, -2.8890180587768555, -2.7097997665405273, -2.530581474304199, -2.35136342048645, -2.172145366668701, -1.992927074432373, -1.8137089014053345, -1.634490728378296, -1.4552725553512573, -1.2760543823242188, -1.0968362092971802, -0.9176180362701416, -0.738399863243103, -0.5591816902160645, -0.3799635171890259, -0.2007453441619873, -0.02152717113494873, 0.15769100189208984, 0.3369091749191284, 0.516127347946167, 0.6953455209732056, 0.8745636940002441, 1.0537818670272827, 1.2330000400543213, 1.4122182130813599, 1.5914363861083984, 1.770654559135437, 1.9498727321624756, 2.1290907859802246, 2.3083090782165527, 2.487527370452881, 2.66674542427063, 2.845963478088379, 3.025181770324707, 3.204400062561035, 3.383618116378784, 3.562836170196533, 3.7420544624328613, 3.9212727546691895, 4.100490570068359, 4.2797088623046875, 4.458927154541016, 4.638145446777344, 4.817363739013672, 4.996581554412842, 5.17579984664917]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 9.0, 9.0, 19.0, 19.0, 16.0, 22.0, 32.0, 31.0, 29.0, 31.0, 38.0, 33.0, 47.0, 50.0, 51.0, 43.0, 51.0, 56.0, 40.0, 52.0, 42.0, 34.0, 32.0, 28.0, 32.0, 28.0, 23.0, 14.0, 18.0, 14.0, 15.0, 10.0, 6.0, 8.0, 2.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8257391452789307, -2.721311092376709, -2.6168832778930664, -2.5124552249908447, -2.408027410507202, -2.3035993576049805, -2.199171543121338, -2.094743490219116, -1.990315556526184, -1.885887622833252, -1.7814596891403198, -1.6770317554473877, -1.572603702545166, -1.4681758880615234, -1.3637478351593018, -1.2593199014663696, -1.1548919677734375, -1.0504640340805054, -0.9460361003875732, -0.8416081070899963, -0.7371801733970642, -0.6327522397041321, -0.5283242464065552, -0.42389631271362305, -0.3194683790206909, -0.2150404304265976, -0.11061248183250427, -0.006184518337249756, 0.09824341535568237, 0.2026713490486145, 0.3070993423461914, 0.41152727603912354, 0.5159552097320557, 0.6203831434249878, 0.7248110771179199, 0.8292390704154968, 0.933667004108429, 1.0380949974060059, 1.142522931098938, 1.2469508647918701, 1.3513787984848022, 1.4558067321777344, 1.5602346658706665, 1.6646625995635986, 1.7690906524658203, 1.873518466949463, 1.9779465198516846, 2.0823745727539062, 2.186802387237549, 2.2912304401397705, 2.395658254623413, 2.5000863075256348, 2.6045141220092773, 2.708942174911499, 2.8133702278137207, 2.9177980422973633, 3.022225856781006, 3.1266539096832275, 3.23108172416687, 3.335509777069092, 3.4399375915527344, 3.544365644454956, 3.6487936973571777, 3.7532215118408203, 3.857649564743042]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 7.0, 15.0, 11.0, 29.0, 19.0, 41.0, 73.0, 95.0, 167.0, 203.0, 349.0, 560.0, 956.0, 1402.0, 2401.0, 3986.0, 7075.0, 12682.0, 23314.0, 43146.0, 82809.0, 153315.0, 228697.0, 210711.0, 128128.0, 68089.0, 36107.0, 19007.0, 10236.0, 6021.0, 3391.0, 2122.0, 1231.0, 746.0, 488.0, 297.0, 205.0, 127.0, 81.0, 53.0, 59.0, 27.0, 21.0, 15.0, 11.0, 4.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0], "bins": [-0.44970703125, -0.4364204406738281, -0.42313385009765625, -0.4098472595214844, -0.3965606689453125, -0.3832740783691406, -0.36998748779296875, -0.3567008972167969, -0.343414306640625, -0.3301277160644531, -0.31684112548828125, -0.3035545349121094, -0.2902679443359375, -0.2769813537597656, -0.26369476318359375, -0.2504081726074219, -0.23712158203125, -0.22383499145507812, -0.21054840087890625, -0.19726181030273438, -0.1839752197265625, -0.17068862915039062, -0.15740203857421875, -0.14411544799804688, -0.130828857421875, -0.11754226684570312, -0.10425567626953125, -0.09096908569335938, -0.0776824951171875, -0.06439590454101562, -0.05110931396484375, -0.037822723388671875, -0.0245361328125, -0.011249542236328125, 0.00203704833984375, 0.015323638916015625, 0.0286102294921875, 0.041896820068359375, 0.05518341064453125, 0.06847000122070312, 0.081756591796875, 0.09504318237304688, 0.10832977294921875, 0.12161636352539062, 0.1349029541015625, 0.14818954467773438, 0.16147613525390625, 0.17476272583007812, 0.18804931640625, 0.20133590698242188, 0.21462249755859375, 0.22790908813476562, 0.2411956787109375, 0.2544822692871094, 0.26776885986328125, 0.2810554504394531, 0.294342041015625, 0.3076286315917969, 0.32091522216796875, 0.3342018127441406, 0.3474884033203125, 0.3607749938964844, 0.37406158447265625, 0.3873481750488281, 0.400634765625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 9.0, 20.0, 14.0, 15.0, 20.0, 26.0, 23.0, 34.0, 32.0, 39.0, 39.0, 48.0, 50.0, 48.0, 57.0, 37.0, 47.0, 52.0, 47.0, 37.0, 37.0, 33.0, 39.0, 23.0, 28.0, 26.0, 17.0, 15.0, 10.0, 21.0, 11.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.31640625, -3.19927978515625, -3.0821533203125, -2.96502685546875, -2.847900390625, -2.73077392578125, -2.6136474609375, -2.49652099609375, -2.37939453125, -2.26226806640625, -2.1451416015625, -2.02801513671875, -1.910888671875, -1.79376220703125, -1.6766357421875, -1.55950927734375, -1.4423828125, -1.32525634765625, -1.2081298828125, -1.09100341796875, -0.973876953125, -0.85675048828125, -0.7396240234375, -0.62249755859375, -0.50537109375, -0.38824462890625, -0.2711181640625, -0.15399169921875, -0.036865234375, 0.08026123046875, 0.1973876953125, 0.31451416015625, 0.431640625, 0.54876708984375, 0.6658935546875, 0.78302001953125, 0.900146484375, 1.01727294921875, 1.1343994140625, 1.25152587890625, 1.36865234375, 1.48577880859375, 1.6029052734375, 1.72003173828125, 1.837158203125, 1.95428466796875, 2.0714111328125, 2.18853759765625, 2.3056640625, 2.42279052734375, 2.5399169921875, 2.65704345703125, 2.774169921875, 2.89129638671875, 3.0084228515625, 3.12554931640625, 3.24267578125, 3.35980224609375, 3.4769287109375, 3.59405517578125, 3.711181640625, 3.82830810546875, 3.9454345703125, 4.06256103515625, 4.1796875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 10.0, 6.0, 19.0, 17.0, 25.0, 35.0, 40.0, 52.0, 96.0, 136.0, 179.0, 275.0, 431.0, 609.0, 1067.0, 1705.0, 2979.0, 5700.0, 11524.0, 26487.0, 182752.0, 740534.0, 41758.0, 15393.0, 7187.0, 3820.0, 2191.0, 1231.0, 747.0, 465.0, 337.0, 203.0, 169.0, 107.0, 72.0, 49.0, 43.0, 24.0, 23.0, 11.0, 4.0, 10.0, 12.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0251617431640625, -0.988800048828125, -0.9524383544921875, -0.91607666015625, -0.8797149658203125, -0.843353271484375, -0.8069915771484375, -0.7706298828125, -0.7342681884765625, -0.697906494140625, -0.6615447998046875, -0.62518310546875, -0.5888214111328125, -0.552459716796875, -0.5160980224609375, -0.479736328125, -0.4433746337890625, -0.407012939453125, -0.3706512451171875, -0.33428955078125, -0.2979278564453125, -0.261566162109375, -0.2252044677734375, -0.1888427734375, -0.1524810791015625, -0.116119384765625, -0.0797576904296875, -0.04339599609375, -0.0070343017578125, 0.029327392578125, 0.0656890869140625, 0.10205078125, 0.1384124755859375, 0.174774169921875, 0.2111358642578125, 0.24749755859375, 0.2838592529296875, 0.320220947265625, 0.3565826416015625, 0.3929443359375, 0.4293060302734375, 0.465667724609375, 0.5020294189453125, 0.53839111328125, 0.5747528076171875, 0.611114501953125, 0.6474761962890625, 0.683837890625, 0.7201995849609375, 0.756561279296875, 0.7929229736328125, 0.82928466796875, 0.8656463623046875, 0.902008056640625, 0.9383697509765625, 0.9747314453125, 1.0110931396484375, 1.047454833984375, 1.0838165283203125, 1.12017822265625, 1.1565399169921875, 1.192901611328125, 1.2292633056640625, 1.265625]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 6.0, 4.0, 7.0, 9.0, 13.0, 16.0, 23.0, 26.0, 17.0, 21.0, 23.0, 24.0, 31.0, 31.0, 43.0, 36.0, 33.0, 43.0, 34.0, 36.0, 40.0, 45.0, 31.0, 29.0, 34.0, 36.0, 21.0, 22.0, 33.0, 21.0, 25.0, 27.0, 21.0, 29.0, 14.0, 22.0, 11.0, 10.0, 10.0, 9.0, 6.0, 4.0, 2.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.884765625, -1.824188232421875, -1.76361083984375, -1.703033447265625, -1.6424560546875, -1.581878662109375, -1.52130126953125, -1.460723876953125, -1.400146484375, -1.339569091796875, -1.27899169921875, -1.218414306640625, -1.1578369140625, -1.097259521484375, -1.03668212890625, -0.976104736328125, -0.91552734375, -0.854949951171875, -0.79437255859375, -0.733795166015625, -0.6732177734375, -0.612640380859375, -0.55206298828125, -0.491485595703125, -0.430908203125, -0.370330810546875, -0.30975341796875, -0.249176025390625, -0.1885986328125, -0.128021240234375, -0.06744384765625, -0.006866455078125, 0.0537109375, 0.114288330078125, 0.17486572265625, 0.235443115234375, 0.2960205078125, 0.356597900390625, 0.41717529296875, 0.477752685546875, 0.538330078125, 0.598907470703125, 0.65948486328125, 0.720062255859375, 0.7806396484375, 0.841217041015625, 0.90179443359375, 0.962371826171875, 1.02294921875, 1.083526611328125, 1.14410400390625, 1.204681396484375, 1.2652587890625, 1.325836181640625, 1.38641357421875, 1.446990966796875, 1.507568359375, 1.568145751953125, 1.62872314453125, 1.689300537109375, 1.7498779296875, 1.810455322265625, 1.87103271484375, 1.931610107421875, 1.9921875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 11.0, 20.0, 21.0, 22.0, 33.0, 62.0, 96.0, 130.0, 201.0, 329.0, 599.0, 1273.0, 2577.0, 5747.0, 14199.0, 43392.0, 910998.0, 43654.0, 14214.0, 5740.0, 2471.0, 1180.0, 623.0, 298.0, 220.0, 131.0, 69.0, 71.0, 41.0, 32.0, 15.0, 13.0, 12.0, 13.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.355224609375, -0.3435783386230469, -0.33193206787109375, -0.3202857971191406, -0.3086395263671875, -0.2969932556152344, -0.28534698486328125, -0.2737007141113281, -0.262054443359375, -0.2504081726074219, -0.23876190185546875, -0.22711563110351562, -0.2154693603515625, -0.20382308959960938, -0.19217681884765625, -0.18053054809570312, -0.16888427734375, -0.15723800659179688, -0.14559173583984375, -0.13394546508789062, -0.1222991943359375, -0.11065292358398438, -0.09900665283203125, -0.08736038208007812, -0.075714111328125, -0.06406784057617188, -0.05242156982421875, -0.040775299072265625, -0.0291290283203125, -0.017482757568359375, -0.00583648681640625, 0.005809783935546875, 0.0174560546875, 0.029102325439453125, 0.04074859619140625, 0.052394866943359375, 0.0640411376953125, 0.07568740844726562, 0.08733367919921875, 0.09897994995117188, 0.110626220703125, 0.12227249145507812, 0.13391876220703125, 0.14556503295898438, 0.1572113037109375, 0.16885757446289062, 0.18050384521484375, 0.19215011596679688, 0.20379638671875, 0.21544265747070312, 0.22708892822265625, 0.23873519897460938, 0.2503814697265625, 0.2620277404785156, 0.27367401123046875, 0.2853202819824219, 0.296966552734375, 0.3086128234863281, 0.32025909423828125, 0.3319053649902344, 0.3435516357421875, 0.3551979064941406, 0.36684417724609375, 0.3784904479980469, 0.39013671875]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 7.0, 6.0, 4.0, 7.0, 10.0, 7.0, 12.0, 22.0, 21.0, 23.0, 10.0, 31.0, 42.0, 42.0, 42.0, 51.0, 53.0, 47.0, 47.0, 40.0, 44.0, 49.0, 50.0, 41.0, 49.0, 36.0, 28.0, 28.0, 27.0, 25.0, 21.0, 21.0, 10.0, 9.0, 7.0, 8.0, 5.0, 4.0, 5.0, 0.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.919269561767578e-05, -1.848861575126648e-05, -1.7784535884857178e-05, -1.7080456018447876e-05, -1.6376376152038574e-05, -1.5672296285629272e-05, -1.496821641921997e-05, -1.4264136552810669e-05, -1.3560056686401367e-05, -1.2855976819992065e-05, -1.2151896953582764e-05, -1.1447817087173462e-05, -1.074373722076416e-05, -1.0039657354354858e-05, -9.335577487945557e-06, -8.631497621536255e-06, -7.927417755126953e-06, -7.223337888717651e-06, -6.51925802230835e-06, -5.815178155899048e-06, -5.111098289489746e-06, -4.407018423080444e-06, -3.7029385566711426e-06, -2.998858690261841e-06, -2.294778823852539e-06, -1.5906989574432373e-06, -8.866190910339355e-07, -1.825392246246338e-07, 5.21540641784668e-07, 1.2256205081939697e-06, 1.9297003746032715e-06, 2.6337802410125732e-06, 3.337860107421875e-06, 4.041939973831177e-06, 4.7460198402404785e-06, 5.45009970664978e-06, 6.154179573059082e-06, 6.858259439468384e-06, 7.5623393058776855e-06, 8.266419172286987e-06, 8.970499038696289e-06, 9.67457890510559e-06, 1.0378658771514893e-05, 1.1082738637924194e-05, 1.1786818504333496e-05, 1.2490898370742798e-05, 1.31949782371521e-05, 1.3899058103561401e-05, 1.4603137969970703e-05, 1.5307217836380005e-05, 1.6011297702789307e-05, 1.671537756919861e-05, 1.741945743560791e-05, 1.8123537302017212e-05, 1.8827617168426514e-05, 1.9531697034835815e-05, 2.0235776901245117e-05, 2.093985676765442e-05, 2.164393663406372e-05, 2.2348016500473022e-05, 2.3052096366882324e-05, 2.3756176233291626e-05, 2.4460256099700928e-05, 2.516433596611023e-05, 2.586841583251953e-05]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 4.0, 12.0, 11.0, 27.0, 48.0, 61.0, 69.0, 114.0, 172.0, 244.0, 390.0, 620.0, 944.0, 1456.0, 2407.0, 4113.0, 7465.0, 14539.0, 30390.0, 63271.0, 131567.0, 234075.0, 251944.0, 154522.0, 75717.0, 36287.0, 17279.0, 8816.0, 4819.0, 2615.0, 1566.0, 1015.0, 667.0, 418.0, 274.0, 182.0, 134.0, 85.0, 56.0, 40.0, 33.0, 24.0, 21.0, 7.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10455322265625, -0.10108184814453125, -0.0976104736328125, -0.09413909912109375, -0.090667724609375, -0.08719635009765625, -0.0837249755859375, -0.08025360107421875, -0.0767822265625, -0.07331085205078125, -0.0698394775390625, -0.06636810302734375, -0.062896728515625, -0.05942535400390625, -0.0559539794921875, -0.05248260498046875, -0.04901123046875, -0.04553985595703125, -0.0420684814453125, -0.03859710693359375, -0.035125732421875, -0.03165435791015625, -0.0281829833984375, -0.02471160888671875, -0.021240234375, -0.01776885986328125, -0.0142974853515625, -0.01082611083984375, -0.007354736328125, -0.00388336181640625, -0.0004119873046875, 0.00305938720703125, 0.00653076171875, 0.01000213623046875, 0.0134735107421875, 0.01694488525390625, 0.020416259765625, 0.02388763427734375, 0.0273590087890625, 0.03083038330078125, 0.0343017578125, 0.03777313232421875, 0.0412445068359375, 0.04471588134765625, 0.048187255859375, 0.05165863037109375, 0.0551300048828125, 0.05860137939453125, 0.06207275390625, 0.06554412841796875, 0.0690155029296875, 0.07248687744140625, 0.075958251953125, 0.07942962646484375, 0.0829010009765625, 0.08637237548828125, 0.08984375, 0.09331512451171875, 0.0967864990234375, 0.10025787353515625, 0.103729248046875, 0.10720062255859375, 0.1106719970703125, 0.11414337158203125, 0.11761474609375]}, "gradients/decoder.bert.encoder.layer.7.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 10.0, 9.0, 11.0, 10.0, 18.0, 24.0, 28.0, 23.0, 31.0, 43.0, 53.0, 70.0, 54.0, 72.0, 70.0, 76.0, 55.0, 50.0, 47.0, 36.0, 37.0, 31.0, 30.0, 19.0, 6.0, 16.0, 14.0, 11.0, 6.0, 4.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.023162841796875, -0.022449970245361328, -0.021737098693847656, -0.021024227142333984, -0.020311355590820312, -0.01959848403930664, -0.01888561248779297, -0.018172740936279297, -0.017459869384765625, -0.016746997833251953, -0.01603412628173828, -0.01532125473022461, -0.014608383178710938, -0.013895511627197266, -0.013182640075683594, -0.012469768524169922, -0.01175689697265625, -0.011044025421142578, -0.010331153869628906, -0.009618282318115234, -0.008905410766601562, -0.00819253921508789, -0.007479667663574219, -0.006766796112060547, -0.006053924560546875, -0.005341053009033203, -0.004628181457519531, -0.003915309906005859, -0.0032024383544921875, -0.0024895668029785156, -0.0017766952514648438, -0.0010638236999511719, -0.0003509521484375, 0.0003619194030761719, 0.0010747909545898438, 0.0017876625061035156, 0.0025005340576171875, 0.0032134056091308594, 0.003926277160644531, 0.004639148712158203, 0.005352020263671875, 0.006064891815185547, 0.006777763366699219, 0.007490634918212891, 0.008203506469726562, 0.008916378021240234, 0.009629249572753906, 0.010342121124267578, 0.01105499267578125, 0.011767864227294922, 0.012480735778808594, 0.013193607330322266, 0.013906478881835938, 0.01461935043334961, 0.015332221984863281, 0.016045093536376953, 0.016757965087890625, 0.017470836639404297, 0.01818370819091797, 0.01889657974243164, 0.019609451293945312, 0.020322322845458984, 0.021035194396972656, 0.021748065948486328, 0.0224609375]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 7.0, 8.0, 9.0, 11.0, 12.0, 17.0, 22.0, 26.0, 38.0, 44.0, 54.0, 59.0, 62.0, 55.0, 58.0, 64.0, 62.0, 47.0, 60.0, 43.0, 42.0, 34.0, 29.0, 24.0, 26.0, 18.0, 13.0, 6.0, 14.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.235409736633301, -6.057042121887207, -5.878674507141113, -5.7003068923950195, -5.521938800811768, -5.343571186065674, -5.16520357131958, -4.986835956573486, -4.808467864990234, -4.630100250244141, -4.451732635498047, -4.273365020751953, -4.094996929168701, -3.9166293144226074, -3.7382616996765137, -3.55989408493042, -3.381526470184326, -3.2031588554382324, -3.0247910022735596, -2.846423387527466, -2.668055534362793, -2.489687919616699, -2.3113203048706055, -2.1329526901245117, -1.9545848369598389, -1.7762171030044556, -1.5978493690490723, -1.4194817543029785, -1.2411140203475952, -1.062746286392212, -0.8843786716461182, -0.7060109376907349, -0.5276436805725098, -0.34927597641944885, -0.17090827226638794, 0.007459402084350586, 0.1858271360397339, 0.3641948699951172, 0.5425624847412109, 0.7209302186965942, 0.8992979526519775, 1.0776656866073608, 1.2560334205627441, 1.434401035308838, 1.6127687692642212, 1.7911365032196045, 1.9695041179656982, 2.147871971130371, 2.326239585876465, 2.5046072006225586, 2.6829750537872314, 2.861342668533325, 3.039710521697998, 3.218078136444092, 3.3964457511901855, 3.5748133659362793, 3.753181219100952, 3.931548833847046, 4.109916687011719, 4.2882843017578125, 4.466651916503906, 4.64501953125, 4.823387145996094, 5.001755237579346, 5.1801228523254395]}, "gradients/decoder.bert.encoder.layer.7.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 3.0, 2.0, 6.0, 9.0, 9.0, 18.0, 19.0, 16.0, 24.0, 31.0, 34.0, 26.0, 31.0, 38.0, 33.0, 49.0, 51.0, 48.0, 44.0, 52.0, 52.0, 43.0, 51.0, 45.0, 32.0, 31.0, 28.0, 35.0, 27.0, 20.0, 14.0, 18.0, 16.0, 14.0, 9.0, 5.0, 9.0, 2.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8157401084899902, -2.711730480194092, -2.6077210903167725, -2.503711462020874, -2.3997018337249756, -2.2956924438476562, -2.191682815551758, -2.0876731872558594, -1.983663558959961, -1.879654049873352, -1.7756444215774536, -1.6716349124908447, -1.5676252841949463, -1.4636157751083374, -1.3596062660217285, -1.25559663772583, -1.1515871286392212, -1.0475776195526123, -0.9435679912567139, -0.839558482170105, -0.7355488538742065, -0.6315393447875977, -0.527529776096344, -0.42352020740509033, -0.31951063871383667, -0.215501070022583, -0.11149151623249054, -0.007481962442398071, 0.09652760624885559, 0.20053714513778687, 0.3045467138290405, 0.4085562825202942, 0.5125658512115479, 0.6165754199028015, 0.7205849885940552, 0.8245944976806641, 0.9286041259765625, 1.0326136350631714, 1.1366231441497803, 1.2406327724456787, 1.3446424007415771, 1.448651909828186, 1.5526615381240845, 1.6566710472106934, 1.7606806755065918, 1.8646901845932007, 1.9686996936798096, 2.072709321975708, 2.1767187118530273, 2.280728340148926, 2.384737730026245, 2.4887473583221436, 2.592756986618042, 2.6967663764953613, 2.8007760047912598, 2.904785633087158, 3.0087952613830566, 3.112804889678955, 3.2168142795562744, 3.320823907852173, 3.4248335361480713, 3.5288429260253906, 3.632852554321289, 3.7368621826171875, 3.840871810913086]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 9.0, 12.0, 20.0, 24.0, 40.0, 53.0, 90.0, 125.0, 227.0, 332.0, 529.0, 873.0, 1415.0, 2474.0, 4032.0, 6827.0, 12076.0, 20930.0, 36091.0, 61282.0, 97814.0, 142192.0, 173167.0, 164146.0, 124003.0, 81323.0, 49345.0, 29206.0, 16275.0, 9745.0, 5517.0, 3275.0, 1987.0, 1169.0, 726.0, 455.0, 291.0, 172.0, 111.0, 64.0, 46.0, 23.0, 23.0, 14.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.91015625, -3.790924072265625, -3.67169189453125, -3.552459716796875, -3.4332275390625, -3.313995361328125, -3.19476318359375, -3.075531005859375, -2.956298828125, -2.837066650390625, -2.71783447265625, -2.598602294921875, -2.4793701171875, -2.360137939453125, -2.24090576171875, -2.121673583984375, -2.00244140625, -1.883209228515625, -1.76397705078125, -1.644744873046875, -1.5255126953125, -1.406280517578125, -1.28704833984375, -1.167816162109375, -1.048583984375, -0.929351806640625, -0.81011962890625, -0.690887451171875, -0.5716552734375, -0.452423095703125, -0.33319091796875, -0.213958740234375, -0.0947265625, 0.024505615234375, 0.14373779296875, 0.262969970703125, 0.3822021484375, 0.501434326171875, 0.62066650390625, 0.739898681640625, 0.859130859375, 0.978363037109375, 1.09759521484375, 1.216827392578125, 1.3360595703125, 1.455291748046875, 1.57452392578125, 1.693756103515625, 1.81298828125, 1.932220458984375, 2.05145263671875, 2.170684814453125, 2.2899169921875, 2.409149169921875, 2.52838134765625, 2.647613525390625, 2.766845703125, 2.886077880859375, 3.00531005859375, 3.124542236328125, 3.2437744140625, 3.363006591796875, 3.48223876953125, 3.601470947265625, 3.720703125]}, "gradients/decoder.bert.encoder.layer.7.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 10.0, 9.0, 3.0, 8.0, 11.0, 14.0, 18.0, 18.0, 26.0, 29.0, 30.0, 21.0, 38.0, 52.0, 40.0, 43.0, 55.0, 54.0, 55.0, 34.0, 51.0, 47.0, 43.0, 45.0, 31.0, 20.0, 28.0, 26.0, 31.0, 24.0, 12.0, 24.0, 14.0, 14.0, 8.0, 2.0, 4.0, 3.0, 6.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.86016845703125, -2.7437744140625, -2.62738037109375, -2.510986328125, -2.39459228515625, -2.2781982421875, -2.16180419921875, -2.04541015625, -1.92901611328125, -1.8126220703125, -1.69622802734375, -1.579833984375, -1.46343994140625, -1.3470458984375, -1.23065185546875, -1.1142578125, -0.99786376953125, -0.8814697265625, -0.76507568359375, -0.648681640625, -0.53228759765625, -0.4158935546875, -0.29949951171875, -0.18310546875, -0.06671142578125, 0.0496826171875, 0.16607666015625, 0.282470703125, 0.39886474609375, 0.5152587890625, 0.63165283203125, 0.748046875, 0.86444091796875, 0.9808349609375, 1.09722900390625, 1.213623046875, 1.33001708984375, 1.4464111328125, 1.56280517578125, 1.67919921875, 1.79559326171875, 1.9119873046875, 2.02838134765625, 2.144775390625, 2.26116943359375, 2.3775634765625, 2.49395751953125, 2.6103515625, 2.72674560546875, 2.8431396484375, 2.95953369140625, 3.075927734375, 3.19232177734375, 3.3087158203125, 3.42510986328125, 3.54150390625, 3.65789794921875, 3.7742919921875, 3.89068603515625, 4.007080078125, 4.12347412109375, 4.2398681640625, 4.35626220703125, 4.47265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 12.0, 20.0, 26.0, 28.0, 43.0, 65.0, 85.0, 154.0, 245.0, 349.0, 523.0, 774.0, 1231.0, 1861.0, 2889.0, 4620.0, 7302.0, 11528.0, 18090.0, 28905.0, 44232.0, 65097.0, 92252.0, 119702.0, 136225.0, 134579.0, 114807.0, 87747.0, 61337.0, 40765.0, 26589.0, 17063.0, 10668.0, 6680.0, 4378.0, 2692.0, 1714.0, 1159.0, 716.0, 467.0, 294.0, 223.0, 137.0, 88.0, 58.0, 43.0, 33.0, 17.0, 11.0, 10.0, 6.0, 5.0, 4.0, 4.0, 3.0], "bins": [-3.322265625, -3.22430419921875, -3.1263427734375, -3.02838134765625, -2.930419921875, -2.83245849609375, -2.7344970703125, -2.63653564453125, -2.53857421875, -2.44061279296875, -2.3426513671875, -2.24468994140625, -2.146728515625, -2.04876708984375, -1.9508056640625, -1.85284423828125, -1.7548828125, -1.65692138671875, -1.5589599609375, -1.46099853515625, -1.363037109375, -1.26507568359375, -1.1671142578125, -1.06915283203125, -0.97119140625, -0.87322998046875, -0.7752685546875, -0.67730712890625, -0.579345703125, -0.48138427734375, -0.3834228515625, -0.28546142578125, -0.1875, -0.08953857421875, 0.0084228515625, 0.10638427734375, 0.204345703125, 0.30230712890625, 0.4002685546875, 0.49822998046875, 0.59619140625, 0.69415283203125, 0.7921142578125, 0.89007568359375, 0.988037109375, 1.08599853515625, 1.1839599609375, 1.28192138671875, 1.3798828125, 1.47784423828125, 1.5758056640625, 1.67376708984375, 1.771728515625, 1.86968994140625, 1.9676513671875, 2.06561279296875, 2.16357421875, 2.26153564453125, 2.3594970703125, 2.45745849609375, 2.555419921875, 2.65338134765625, 2.7513427734375, 2.84930419921875, 2.947265625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 10.0, 9.0, 9.0, 10.0, 10.0, 20.0, 11.0, 26.0, 25.0, 25.0, 23.0, 24.0, 40.0, 33.0, 37.0, 40.0, 54.0, 41.0, 52.0, 37.0, 45.0, 40.0, 45.0, 44.0, 34.0, 28.0, 37.0, 25.0, 25.0, 26.0, 23.0, 15.0, 19.0, 17.0, 10.0, 7.0, 9.0, 4.0, 3.0, 1.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.072265625, -2.00927734375, -1.9462890625, -1.88330078125, -1.8203125, -1.75732421875, -1.6943359375, -1.63134765625, -1.568359375, -1.50537109375, -1.4423828125, -1.37939453125, -1.31640625, -1.25341796875, -1.1904296875, -1.12744140625, -1.064453125, -1.00146484375, -0.9384765625, -0.87548828125, -0.8125, -0.74951171875, -0.6865234375, -0.62353515625, -0.560546875, -0.49755859375, -0.4345703125, -0.37158203125, -0.30859375, -0.24560546875, -0.1826171875, -0.11962890625, -0.056640625, 0.00634765625, 0.0693359375, 0.13232421875, 0.1953125, 0.25830078125, 0.3212890625, 0.38427734375, 0.447265625, 0.51025390625, 0.5732421875, 0.63623046875, 0.69921875, 0.76220703125, 0.8251953125, 0.88818359375, 0.951171875, 1.01416015625, 1.0771484375, 1.14013671875, 1.203125, 1.26611328125, 1.3291015625, 1.39208984375, 1.455078125, 1.51806640625, 1.5810546875, 1.64404296875, 1.70703125, 1.77001953125, 1.8330078125, 1.89599609375, 1.958984375]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 8.0, 4.0, 7.0, 12.0, 11.0, 10.0, 14.0, 32.0, 34.0, 45.0, 81.0, 124.0, 157.0, 217.0, 401.0, 606.0, 988.0, 1742.0, 3163.0, 5625.0, 10762.0, 21424.0, 44809.0, 96186.0, 184453.0, 255022.0, 205278.0, 111501.0, 53145.0, 25262.0, 12495.0, 6380.0, 3491.0, 1999.0, 1111.0, 709.0, 422.0, 250.0, 185.0, 121.0, 75.0, 60.0, 43.0, 29.0, 25.0, 15.0, 6.0, 8.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.046875, -2.94732666015625, -2.8477783203125, -2.74822998046875, -2.648681640625, -2.54913330078125, -2.4495849609375, -2.35003662109375, -2.25048828125, -2.15093994140625, -2.0513916015625, -1.95184326171875, -1.852294921875, -1.75274658203125, -1.6531982421875, -1.55364990234375, -1.4541015625, -1.35455322265625, -1.2550048828125, -1.15545654296875, -1.055908203125, -0.95635986328125, -0.8568115234375, -0.75726318359375, -0.65771484375, -0.55816650390625, -0.4586181640625, -0.35906982421875, -0.259521484375, -0.15997314453125, -0.0604248046875, 0.03912353515625, 0.138671875, 0.23822021484375, 0.3377685546875, 0.43731689453125, 0.536865234375, 0.63641357421875, 0.7359619140625, 0.83551025390625, 0.93505859375, 1.03460693359375, 1.1341552734375, 1.23370361328125, 1.333251953125, 1.43280029296875, 1.5323486328125, 1.63189697265625, 1.7314453125, 1.83099365234375, 1.9305419921875, 2.03009033203125, 2.129638671875, 2.22918701171875, 2.3287353515625, 2.42828369140625, 2.52783203125, 2.62738037109375, 2.7269287109375, 2.82647705078125, 2.926025390625, 3.02557373046875, 3.1251220703125, 3.22467041015625, 3.32421875]}, "gradients/decoder.bert.encoder.layer.7.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 7.0, 2.0, 9.0, 5.0, 12.0, 11.0, 9.0, 29.0, 22.0, 29.0, 25.0, 44.0, 55.0, 46.0, 62.0, 68.0, 64.0, 61.0, 50.0, 56.0, 65.0, 50.0, 28.0, 29.0, 26.0, 35.0, 25.0, 17.0, 15.0, 11.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00030684471130371094, -0.00029884278774261475, -0.00029084086418151855, -0.00028283894062042236, -0.00027483701705932617, -0.00026683509349823, -0.0002588331699371338, -0.0002508312463760376, -0.0002428293228149414, -0.00023482739925384521, -0.00022682547569274902, -0.00021882355213165283, -0.00021082162857055664, -0.00020281970500946045, -0.00019481778144836426, -0.00018681585788726807, -0.00017881393432617188, -0.00017081201076507568, -0.0001628100872039795, -0.0001548081636428833, -0.0001468062400817871, -0.00013880431652069092, -0.00013080239295959473, -0.00012280046939849854, -0.00011479854583740234, -0.00010679662227630615, -9.879469871520996e-05, -9.079277515411377e-05, -8.279085159301758e-05, -7.478892803192139e-05, -6.67870044708252e-05, -5.8785080909729004e-05, -5.078315734863281e-05, -4.278123378753662e-05, -3.477931022644043e-05, -2.6777386665344238e-05, -1.8775463104248047e-05, -1.0773539543151855e-05, -2.771615982055664e-06, 5.230307579040527e-06, 1.3232231140136719e-05, 2.123415470123291e-05, 2.92360782623291e-05, 3.723800182342529e-05, 4.5239925384521484e-05, 5.3241848945617676e-05, 6.124377250671387e-05, 6.924569606781006e-05, 7.724761962890625e-05, 8.524954319000244e-05, 9.325146675109863e-05, 0.00010125339031219482, 0.00010925531387329102, 0.00011725723743438721, 0.0001252591609954834, 0.0001332610845565796, 0.00014126300811767578, 0.00014926493167877197, 0.00015726685523986816, 0.00016526877880096436, 0.00017327070236206055, 0.00018127262592315674, 0.00018927454948425293, 0.00019727647304534912, 0.0002052783966064453]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 7.0, 4.0, 9.0, 8.0, 20.0, 37.0, 40.0, 73.0, 105.0, 137.0, 196.0, 286.0, 400.0, 670.0, 910.0, 1323.0, 2050.0, 3372.0, 5287.0, 8774.0, 14711.0, 24881.0, 42966.0, 72442.0, 116576.0, 162893.0, 179438.0, 152219.0, 103734.0, 63055.0, 36560.0, 21576.0, 12761.0, 7594.0, 4787.0, 2942.0, 1956.0, 1276.0, 834.0, 535.0, 378.0, 227.0, 159.0, 107.0, 85.0, 52.0, 37.0, 28.0, 14.0, 8.0, 8.0, 6.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.021484375, -1.95703125, -1.892578125, -1.828125, -1.763671875, -1.69921875, -1.634765625, -1.5703125, -1.505859375, -1.44140625, -1.376953125, -1.3125, -1.248046875, -1.18359375, -1.119140625, -1.0546875, -0.990234375, -0.92578125, -0.861328125, -0.796875, -0.732421875, -0.66796875, -0.603515625, -0.5390625, -0.474609375, -0.41015625, -0.345703125, -0.28125, -0.216796875, -0.15234375, -0.087890625, -0.0234375, 0.041015625, 0.10546875, 0.169921875, 0.234375, 0.298828125, 0.36328125, 0.427734375, 0.4921875, 0.556640625, 0.62109375, 0.685546875, 0.75, 0.814453125, 0.87890625, 0.943359375, 1.0078125, 1.072265625, 1.13671875, 1.201171875, 1.265625, 1.330078125, 1.39453125, 1.458984375, 1.5234375, 1.587890625, 1.65234375, 1.716796875, 1.78125, 1.845703125, 1.91015625, 1.974609375, 2.0390625, 2.103515625]}, "gradients/decoder.bert.encoder.layer.7.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 12.0, 8.0, 8.0, 14.0, 11.0, 21.0, 15.0, 27.0, 30.0, 37.0, 44.0, 43.0, 50.0, 55.0, 64.0, 46.0, 46.0, 67.0, 53.0, 49.0, 47.0, 34.0, 28.0, 24.0, 26.0, 16.0, 30.0, 18.0, 11.0, 8.0, 15.0, 7.0, 2.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498046875, -0.48014068603515625, -0.4622344970703125, -0.44432830810546875, -0.426422119140625, -0.40851593017578125, -0.3906097412109375, -0.37270355224609375, -0.35479736328125, -0.33689117431640625, -0.3189849853515625, -0.30107879638671875, -0.283172607421875, -0.26526641845703125, -0.2473602294921875, -0.22945404052734375, -0.2115478515625, -0.19364166259765625, -0.1757354736328125, -0.15782928466796875, -0.139923095703125, -0.12201690673828125, -0.1041107177734375, -0.08620452880859375, -0.06829833984375, -0.05039215087890625, -0.0324859619140625, -0.01457977294921875, 0.003326416015625, 0.02123260498046875, 0.0391387939453125, 0.05704498291015625, 0.074951171875, 0.09285736083984375, 0.1107635498046875, 0.12866973876953125, 0.146575927734375, 0.16448211669921875, 0.1823883056640625, 0.20029449462890625, 0.21820068359375, 0.23610687255859375, 0.2540130615234375, 0.27191925048828125, 0.289825439453125, 0.30773162841796875, 0.3256378173828125, 0.34354400634765625, 0.3614501953125, 0.37935638427734375, 0.3972625732421875, 0.41516876220703125, 0.433074951171875, 0.45098114013671875, 0.4688873291015625, 0.48679351806640625, 0.50469970703125, 0.5226058959960938, 0.5405120849609375, 0.5584182739257812, 0.576324462890625, 0.5942306518554688, 0.6121368408203125, 0.6300430297851562, 0.64794921875]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 6.0, 4.0, 10.0, 3.0, 8.0, 9.0, 20.0, 28.0, 24.0, 27.0, 48.0, 41.0, 55.0, 79.0, 61.0, 67.0, 68.0, 63.0, 54.0, 54.0, 52.0, 45.0, 29.0, 30.0, 33.0, 20.0, 13.0, 11.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.87745475769043, -6.682534217834473, -6.487614154815674, -6.292694091796875, -6.097773551940918, -5.902853012084961, -5.707932949066162, -5.513012886047363, -5.318092346191406, -5.123171806335449, -4.92825174331665, -4.733331680297852, -4.5384111404418945, -4.3434906005859375, -4.148570537567139, -3.9536502361297607, -3.758729934692383, -3.563809633255005, -3.368889331817627, -3.173969030380249, -2.979048728942871, -2.784128427505493, -2.5892081260681152, -2.3942878246307373, -2.1993675231933594, -2.0044472217559814, -1.8095269203186035, -1.6146066188812256, -1.4196863174438477, -1.2247660160064697, -1.0298457145690918, -0.8349254131317139, -0.6400055885314941, -0.4450852870941162, -0.2501649856567383, -0.05524468421936035, 0.13967561721801758, 0.3345959186553955, 0.5295162200927734, 0.7244365215301514, 0.9193568229675293, 1.1142771244049072, 1.3091974258422852, 1.504117727279663, 1.699038028717041, 1.893958330154419, 2.088878631591797, 2.283798933029175, 2.4787192344665527, 2.6736395359039307, 2.8685598373413086, 3.0634801387786865, 3.2584004402160645, 3.4533207416534424, 3.6482410430908203, 3.8431613445281982, 4.038081645965576, 4.233001708984375, 4.427922248840332, 4.622842788696289, 4.817762851715088, 5.012682914733887, 5.207603454589844, 5.402523994445801, 5.5974440574646]}, "gradients/decoder.bert.encoder.layer.6.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 0.0, 4.0, 4.0, 1.0, 5.0, 8.0, 8.0, 7.0, 8.0, 14.0, 18.0, 20.0, 23.0, 22.0, 26.0, 30.0, 39.0, 40.0, 34.0, 46.0, 46.0, 40.0, 53.0, 39.0, 41.0, 51.0, 38.0, 49.0, 48.0, 37.0, 22.0, 33.0, 32.0, 17.0, 22.0, 18.0, 11.0, 7.0, 11.0, 16.0, 7.0, 4.0, 5.0, 5.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7863235473632812, -2.684755325317383, -2.5831868648529053, -2.481618642807007, -2.3800504207611084, -2.278481960296631, -2.1769137382507324, -2.075345516204834, -1.973777174949646, -1.872208833694458, -1.7706406116485596, -1.6690722703933716, -1.5675039291381836, -1.4659357070922852, -1.3643673658370972, -1.2627990245819092, -1.1612308025360107, -1.0596624612808228, -0.9580942392349243, -0.8565258979797363, -0.7549576163291931, -0.6533893346786499, -0.5518209934234619, -0.4502527117729187, -0.3486844301223755, -0.24711613357067108, -0.14554783701896667, -0.043979525566101074, 0.05758875608444214, 0.15915703773498535, 0.26072537899017334, 0.36229366064071655, 0.46386218070983887, 0.5654304623603821, 0.6669987440109253, 0.7685670852661133, 0.8701353669166565, 0.9717036485671997, 1.0732719898223877, 1.1748402118682861, 1.2764085531234741, 1.377976894378662, 1.4795451164245605, 1.5811134576797485, 1.6826817989349365, 1.784250020980835, 1.885818362236023, 1.987386703491211, 2.0889549255371094, 2.190523147583008, 2.2920916080474854, 2.393659830093384, 2.4952280521392822, 2.5967965126037598, 2.698364734649658, 2.7999329566955566, 2.901501178741455, 3.0030694007873535, 3.104637861251831, 3.2062060832977295, 3.307774305343628, 3.4093427658081055, 3.510910987854004, 3.6124792098999023, 3.71404767036438]}, "gradients/decoder.bert.encoder.layer.6.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 11.0, 19.0, 40.0, 50.0, 80.0, 95.0, 177.0, 304.0, 451.0, 689.0, 1173.0, 1966.0, 3338.0, 5759.0, 10773.0, 19930.0, 38882.0, 80806.0, 180652.0, 443372.0, 1048086.0, 1265552.0, 629651.0, 248653.0, 107323.0, 50746.0, 25285.0, 13305.0, 7206.0, 3990.0, 2330.0, 1407.0, 833.0, 519.0, 312.0, 166.0, 127.0, 78.0, 52.0, 28.0, 19.0, 18.0, 10.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.65625, -6.4615478515625, -6.266845703125, -6.0721435546875, -5.87744140625, -5.6827392578125, -5.488037109375, -5.2933349609375, -5.0986328125, -4.9039306640625, -4.709228515625, -4.5145263671875, -4.31982421875, -4.1251220703125, -3.930419921875, -3.7357177734375, -3.541015625, -3.3463134765625, -3.151611328125, -2.9569091796875, -2.76220703125, -2.5675048828125, -2.372802734375, -2.1781005859375, -1.9833984375, -1.7886962890625, -1.593994140625, -1.3992919921875, -1.20458984375, -1.0098876953125, -0.815185546875, -0.6204833984375, -0.42578125, -0.2310791015625, -0.036376953125, 0.1583251953125, 0.35302734375, 0.5477294921875, 0.742431640625, 0.9371337890625, 1.1318359375, 1.3265380859375, 1.521240234375, 1.7159423828125, 1.91064453125, 2.1053466796875, 2.300048828125, 2.4947509765625, 2.689453125, 2.8841552734375, 3.078857421875, 3.2735595703125, 3.46826171875, 3.6629638671875, 3.857666015625, 4.0523681640625, 4.2470703125, 4.4417724609375, 4.636474609375, 4.8311767578125, 5.02587890625, 5.2205810546875, 5.415283203125, 5.6099853515625, 5.8046875]}, "gradients/decoder.bert.encoder.layer.6.output.dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 8.0, 7.0, 9.0, 11.0, 19.0, 10.0, 17.0, 18.0, 18.0, 23.0, 29.0, 29.0, 32.0, 36.0, 36.0, 30.0, 44.0, 35.0, 41.0, 48.0, 49.0, 39.0, 48.0, 39.0, 29.0, 43.0, 31.0, 22.0, 29.0, 24.0, 22.0, 20.0, 15.0, 12.0, 16.0, 5.0, 5.0, 14.0, 5.0, 2.0, 1.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.498046875, -2.420623779296875, -2.34320068359375, -2.265777587890625, -2.1883544921875, -2.110931396484375, -2.03350830078125, -1.956085205078125, -1.878662109375, -1.801239013671875, -1.72381591796875, -1.646392822265625, -1.5689697265625, -1.491546630859375, -1.41412353515625, -1.336700439453125, -1.25927734375, -1.181854248046875, -1.10443115234375, -1.027008056640625, -0.9495849609375, -0.872161865234375, -0.79473876953125, -0.717315673828125, -0.639892578125, -0.562469482421875, -0.48504638671875, -0.407623291015625, -0.3302001953125, -0.252777099609375, -0.17535400390625, -0.097930908203125, -0.0205078125, 0.056915283203125, 0.13433837890625, 0.211761474609375, 0.2891845703125, 0.366607666015625, 0.44403076171875, 0.521453857421875, 0.598876953125, 0.676300048828125, 0.75372314453125, 0.831146240234375, 0.9085693359375, 0.985992431640625, 1.06341552734375, 1.140838623046875, 1.21826171875, 1.295684814453125, 1.37310791015625, 1.450531005859375, 1.5279541015625, 1.605377197265625, 1.68280029296875, 1.760223388671875, 1.837646484375, 1.915069580078125, 1.99249267578125, 2.069915771484375, 2.1473388671875, 2.224761962890625, 2.30218505859375, 2.379608154296875, 2.45703125]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 16.0, 25.0, 33.0, 72.0, 99.0, 150.0, 227.0, 428.0, 812.0, 1431.0, 2934.0, 6001.0, 12799.0, 28523.0, 68899.0, 176384.0, 474941.0, 1196802.0, 1323308.0, 554368.0, 205584.0, 79689.0, 32864.0, 14430.0, 6668.0, 3138.0, 1616.0, 885.0, 440.0, 276.0, 150.0, 106.0, 62.0, 39.0, 31.0, 12.0, 12.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.109375, -8.833984375, -8.55859375, -8.283203125, -8.0078125, -7.732421875, -7.45703125, -7.181640625, -6.90625, -6.630859375, -6.35546875, -6.080078125, -5.8046875, -5.529296875, -5.25390625, -4.978515625, -4.703125, -4.427734375, -4.15234375, -3.876953125, -3.6015625, -3.326171875, -3.05078125, -2.775390625, -2.5, -2.224609375, -1.94921875, -1.673828125, -1.3984375, -1.123046875, -0.84765625, -0.572265625, -0.296875, -0.021484375, 0.25390625, 0.529296875, 0.8046875, 1.080078125, 1.35546875, 1.630859375, 1.90625, 2.181640625, 2.45703125, 2.732421875, 3.0078125, 3.283203125, 3.55859375, 3.833984375, 4.109375, 4.384765625, 4.66015625, 4.935546875, 5.2109375, 5.486328125, 5.76171875, 6.037109375, 6.3125, 6.587890625, 6.86328125, 7.138671875, 7.4140625, 7.689453125, 7.96484375, 8.240234375, 8.515625]}, "gradients/decoder.bert.encoder.layer.6.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 1.0, 4.0, 5.0, 13.0, 14.0, 23.0, 38.0, 51.0, 61.0, 83.0, 127.0, 164.0, 177.0, 221.0, 285.0, 318.0, 394.0, 319.0, 345.0, 302.0, 259.0, 198.0, 159.0, 118.0, 105.0, 75.0, 74.0, 49.0, 32.0, 20.0, 8.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7333984375, -1.6670379638671875, -1.600677490234375, -1.5343170166015625, -1.46795654296875, -1.4015960693359375, -1.335235595703125, -1.2688751220703125, -1.2025146484375, -1.1361541748046875, -1.069793701171875, -1.0034332275390625, -0.93707275390625, -0.8707122802734375, -0.804351806640625, -0.7379913330078125, -0.671630859375, -0.6052703857421875, -0.538909912109375, -0.4725494384765625, -0.40618896484375, -0.3398284912109375, -0.273468017578125, -0.2071075439453125, -0.1407470703125, -0.0743865966796875, -0.008026123046875, 0.0583343505859375, 0.12469482421875, 0.1910552978515625, 0.257415771484375, 0.3237762451171875, 0.39013671875, 0.4564971923828125, 0.522857666015625, 0.5892181396484375, 0.65557861328125, 0.7219390869140625, 0.788299560546875, 0.8546600341796875, 0.9210205078125, 0.9873809814453125, 1.053741455078125, 1.1201019287109375, 1.18646240234375, 1.2528228759765625, 1.319183349609375, 1.3855438232421875, 1.451904296875, 1.5182647705078125, 1.584625244140625, 1.6509857177734375, 1.71734619140625, 1.7837066650390625, 1.850067138671875, 1.9164276123046875, 1.9827880859375, 2.0491485595703125, 2.115509033203125, 2.1818695068359375, 2.24822998046875, 2.3145904541015625, 2.380950927734375, 2.4473114013671875, 2.513671875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 5.0, 2.0, 4.0, 8.0, 9.0, 13.0, 7.0, 16.0, 29.0, 33.0, 45.0, 49.0, 61.0, 73.0, 85.0, 83.0, 70.0, 67.0, 61.0, 71.0, 53.0, 44.0, 25.0, 23.0, 15.0, 22.0, 9.0, 6.0, 3.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.248263359069824, -7.997119426727295, -7.745975971221924, -7.4948320388793945, -7.243688106536865, -6.992544174194336, -6.741400718688965, -6.4902567863464355, -6.239112854003906, -5.987968921661377, -5.736825466156006, -5.485681533813477, -5.234537601470947, -4.983393669128418, -4.732250213623047, -4.481106281280518, -4.2299628257751465, -3.9788191318511963, -3.727675199508667, -3.476531505584717, -3.2253875732421875, -2.9742438793182373, -2.723100185394287, -2.471956253051758, -2.2208125591278076, -1.9696687459945679, -1.7185249328613281, -1.467381238937378, -1.2162374258041382, -0.9650936126708984, -0.7139499187469482, -0.4628061056137085, -0.21166181564331055, 0.03948196768760681, 0.29062575101852417, 0.5417695045471191, 0.7929133176803589, 1.0440571308135986, 1.2952008247375488, 1.5463446378707886, 1.7974884510040283, 2.0486321449279785, 2.299776077270508, 2.550919771194458, 2.802063465118408, 3.0532073974609375, 3.3043510913848877, 3.555494785308838, 3.806638717651367, 4.0577826499938965, 4.308926105499268, 4.560070037841797, 4.811213970184326, 5.0623579025268555, 5.313501358032227, 5.564645290374756, 5.815789222717285, 6.0669331550598145, 6.3180766105651855, 6.569220542907715, 6.820364475250244, 7.071508407592773, 7.3226518630981445, 7.573795795440674, 7.824939250946045]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 5.0, 5.0, 2.0, 5.0, 8.0, 15.0, 15.0, 24.0, 12.0, 22.0, 20.0, 25.0, 29.0, 27.0, 28.0, 38.0, 28.0, 41.0, 38.0, 37.0, 47.0, 43.0, 39.0, 46.0, 41.0, 42.0, 25.0, 47.0, 32.0, 35.0, 25.0, 20.0, 22.0, 24.0, 20.0, 6.0, 13.0, 10.0, 7.0, 9.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.2820608615875244, -3.1809041500091553, -3.079747438430786, -2.978590965270996, -2.877434253692627, -2.776277542114258, -2.6751208305358887, -2.5739641189575195, -2.4728074073791504, -2.3716506958007812, -2.270493984222412, -2.169337272644043, -2.068180799484253, -1.9670240879058838, -1.8658673763275146, -1.7647106647491455, -1.6635541915893555, -1.5623974800109863, -1.4612408876419067, -1.3600841760635376, -1.258927583694458, -1.1577708721160889, -1.0566141605377197, -0.9554575085639954, -0.854300856590271, -0.7531442046165466, -0.6519875526428223, -0.5508308410644531, -0.44967418909072876, -0.3485175371170044, -0.24736082553863525, -0.1462041735649109, -0.04504728317260742, 0.05610938370227814, 0.1572660505771637, 0.25842273235321045, 0.3595793843269348, 0.4607360363006592, 0.5618927478790283, 0.6630493998527527, 0.764206051826477, 0.8653627038002014, 0.9665193557739258, 1.067676067352295, 1.168832778930664, 1.2699893712997437, 1.3711460828781128, 1.4723026752471924, 1.5734593868255615, 1.6746160984039307, 1.7757726907730103, 1.8769294023513794, 1.978085994720459, 2.079242706298828, 2.1803994178771973, 2.2815561294555664, 2.3827128410339355, 2.4838695526123047, 2.585026264190674, 2.686182975769043, 2.787339448928833, 2.888496160507202, 2.9896528720855713, 3.0908095836639404, 3.1919660568237305]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 10.0, 18.0, 26.0, 27.0, 59.0, 60.0, 101.0, 114.0, 196.0, 313.0, 509.0, 817.0, 1165.0, 1964.0, 3270.0, 5236.0, 9006.0, 14918.0, 26220.0, 45632.0, 80808.0, 138262.0, 204980.0, 200141.0, 133296.0, 76715.0, 43756.0, 24497.0, 14343.0, 8424.0, 5240.0, 3171.0, 1925.0, 1179.0, 742.0, 473.0, 329.0, 198.0, 134.0, 99.0, 54.0, 44.0, 22.0, 23.0, 10.0, 8.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.57177734375, -0.5544281005859375, -0.537078857421875, -0.5197296142578125, -0.50238037109375, -0.4850311279296875, -0.467681884765625, -0.4503326416015625, -0.4329833984375, -0.4156341552734375, -0.398284912109375, -0.3809356689453125, -0.36358642578125, -0.3462371826171875, -0.328887939453125, -0.3115386962890625, -0.294189453125, -0.2768402099609375, -0.259490966796875, -0.2421417236328125, -0.22479248046875, -0.2074432373046875, -0.190093994140625, -0.1727447509765625, -0.1553955078125, -0.1380462646484375, -0.120697021484375, -0.1033477783203125, -0.08599853515625, -0.0686492919921875, -0.051300048828125, -0.0339508056640625, -0.0166015625, 0.0007476806640625, 0.018096923828125, 0.0354461669921875, 0.05279541015625, 0.0701446533203125, 0.087493896484375, 0.1048431396484375, 0.1221923828125, 0.1395416259765625, 0.156890869140625, 0.1742401123046875, 0.19158935546875, 0.2089385986328125, 0.226287841796875, 0.2436370849609375, 0.260986328125, 0.2783355712890625, 0.295684814453125, 0.3130340576171875, 0.33038330078125, 0.3477325439453125, 0.365081787109375, 0.3824310302734375, 0.3997802734375, 0.4171295166015625, 0.434478759765625, 0.4518280029296875, 0.46917724609375, 0.4865264892578125, 0.503875732421875, 0.5212249755859375, 0.53857421875]}, "gradients/decoder.bert.encoder.layer.6.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 0.0, 6.0, 6.0, 6.0, 7.0, 6.0, 11.0, 19.0, 20.0, 21.0, 17.0, 26.0, 30.0, 21.0, 33.0, 32.0, 42.0, 42.0, 36.0, 49.0, 36.0, 54.0, 39.0, 35.0, 55.0, 32.0, 40.0, 40.0, 33.0, 28.0, 35.0, 18.0, 26.0, 25.0, 17.0, 10.0, 7.0, 8.0, 12.0, 5.0, 5.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.927734375, -3.80401611328125, -3.6802978515625, -3.55657958984375, -3.432861328125, -3.30914306640625, -3.1854248046875, -3.06170654296875, -2.93798828125, -2.81427001953125, -2.6905517578125, -2.56683349609375, -2.443115234375, -2.31939697265625, -2.1956787109375, -2.07196044921875, -1.9482421875, -1.82452392578125, -1.7008056640625, -1.57708740234375, -1.453369140625, -1.32965087890625, -1.2059326171875, -1.08221435546875, -0.95849609375, -0.83477783203125, -0.7110595703125, -0.58734130859375, -0.463623046875, -0.33990478515625, -0.2161865234375, -0.09246826171875, 0.03125, 0.15496826171875, 0.2786865234375, 0.40240478515625, 0.526123046875, 0.64984130859375, 0.7735595703125, 0.89727783203125, 1.02099609375, 1.14471435546875, 1.2684326171875, 1.39215087890625, 1.515869140625, 1.63958740234375, 1.7633056640625, 1.88702392578125, 2.0107421875, 2.13446044921875, 2.2581787109375, 2.38189697265625, 2.505615234375, 2.62933349609375, 2.7530517578125, 2.87677001953125, 3.00048828125, 3.12420654296875, 3.2479248046875, 3.37164306640625, 3.495361328125, 3.61907958984375, 3.7427978515625, 3.86651611328125, 3.990234375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 14.0, 17.0, 18.0, 24.0, 47.0, 70.0, 85.0, 136.0, 185.0, 365.0, 466.0, 825.0, 1350.0, 2400.0, 4730.0, 9987.0, 24910.0, 261490.0, 688507.0, 29650.0, 11258.0, 5381.0, 2715.0, 1478.0, 932.0, 533.0, 375.0, 206.0, 133.0, 80.0, 54.0, 38.0, 34.0, 23.0, 11.0, 11.0, 5.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.07025146484375, -2.0057373046875, -1.94122314453125, -1.876708984375, -1.81219482421875, -1.7476806640625, -1.68316650390625, -1.61865234375, -1.55413818359375, -1.4896240234375, -1.42510986328125, -1.360595703125, -1.29608154296875, -1.2315673828125, -1.16705322265625, -1.1025390625, -1.03802490234375, -0.9735107421875, -0.90899658203125, -0.844482421875, -0.77996826171875, -0.7154541015625, -0.65093994140625, -0.58642578125, -0.52191162109375, -0.4573974609375, -0.39288330078125, -0.328369140625, -0.26385498046875, -0.1993408203125, -0.13482666015625, -0.0703125, -0.00579833984375, 0.0587158203125, 0.12322998046875, 0.187744140625, 0.25225830078125, 0.3167724609375, 0.38128662109375, 0.44580078125, 0.51031494140625, 0.5748291015625, 0.63934326171875, 0.703857421875, 0.76837158203125, 0.8328857421875, 0.89739990234375, 0.9619140625, 1.02642822265625, 1.0909423828125, 1.15545654296875, 1.219970703125, 1.28448486328125, 1.3489990234375, 1.41351318359375, 1.47802734375, 1.54254150390625, 1.6070556640625, 1.67156982421875, 1.736083984375, 1.80059814453125, 1.8651123046875, 1.92962646484375, 1.994140625]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 7.0, 1.0, 5.0, 8.0, 7.0, 14.0, 15.0, 24.0, 17.0, 20.0, 18.0, 31.0, 33.0, 30.0, 29.0, 46.0, 30.0, 43.0, 43.0, 38.0, 38.0, 51.0, 36.0, 44.0, 34.0, 43.0, 36.0, 27.0, 29.0, 31.0, 28.0, 24.0, 21.0, 15.0, 24.0, 23.0, 6.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.384765625, -2.29986572265625, -2.2149658203125, -2.13006591796875, -2.045166015625, -1.96026611328125, -1.8753662109375, -1.79046630859375, -1.70556640625, -1.62066650390625, -1.5357666015625, -1.45086669921875, -1.365966796875, -1.28106689453125, -1.1961669921875, -1.11126708984375, -1.0263671875, -0.94146728515625, -0.8565673828125, -0.77166748046875, -0.686767578125, -0.60186767578125, -0.5169677734375, -0.43206787109375, -0.34716796875, -0.26226806640625, -0.1773681640625, -0.09246826171875, -0.007568359375, 0.07733154296875, 0.1622314453125, 0.24713134765625, 0.33203125, 0.41693115234375, 0.5018310546875, 0.58673095703125, 0.671630859375, 0.75653076171875, 0.8414306640625, 0.92633056640625, 1.01123046875, 1.09613037109375, 1.1810302734375, 1.26593017578125, 1.350830078125, 1.43572998046875, 1.5206298828125, 1.60552978515625, 1.6904296875, 1.77532958984375, 1.8602294921875, 1.94512939453125, 2.030029296875, 2.11492919921875, 2.1998291015625, 2.28472900390625, 2.36962890625, 2.45452880859375, 2.5394287109375, 2.62432861328125, 2.709228515625, 2.79412841796875, 2.8790283203125, 2.96392822265625, 3.048828125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 7.0, 7.0, 9.0, 12.0, 19.0, 25.0, 36.0, 56.0, 100.0, 165.0, 286.0, 555.0, 1031.0, 2299.0, 5529.0, 21362.0, 955108.0, 47272.0, 8579.0, 3148.0, 1372.0, 663.0, 384.0, 200.0, 121.0, 80.0, 45.0, 32.0, 26.0, 6.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1837615966796875, -1.143890380859375, -1.1040191650390625, -1.06414794921875, -1.0242767333984375, -0.984405517578125, -0.9445343017578125, -0.9046630859375, -0.8647918701171875, -0.824920654296875, -0.7850494384765625, -0.74517822265625, -0.7053070068359375, -0.665435791015625, -0.6255645751953125, -0.585693359375, -0.5458221435546875, -0.505950927734375, -0.4660797119140625, -0.42620849609375, -0.3863372802734375, -0.346466064453125, -0.3065948486328125, -0.2667236328125, -0.2268524169921875, -0.186981201171875, -0.1471099853515625, -0.10723876953125, -0.0673675537109375, -0.027496337890625, 0.0123748779296875, 0.05224609375, 0.0921173095703125, 0.131988525390625, 0.1718597412109375, 0.21173095703125, 0.2516021728515625, 0.291473388671875, 0.3313446044921875, 0.3712158203125, 0.4110870361328125, 0.450958251953125, 0.4908294677734375, 0.53070068359375, 0.5705718994140625, 0.610443115234375, 0.6503143310546875, 0.690185546875, 0.7300567626953125, 0.769927978515625, 0.8097991943359375, 0.84967041015625, 0.8895416259765625, 0.929412841796875, 0.9692840576171875, 1.0091552734375, 1.0490264892578125, 1.088897705078125, 1.1287689208984375, 1.16864013671875, 1.2085113525390625, 1.248382568359375, 1.2882537841796875, 1.328125]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 8.0, 5.0, 15.0, 7.0, 27.0, 25.0, 37.0, 39.0, 48.0, 87.0, 105.0, 80.0, 102.0, 83.0, 84.0, 53.0, 42.0, 28.0, 24.0, 12.0, 13.0, 3.0, 6.0, 7.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.310773849487305e-05, -5.1544979214668274e-05, -4.99822199344635e-05, -4.841946065425873e-05, -4.6856701374053955e-05, -4.529394209384918e-05, -4.373118281364441e-05, -4.2168423533439636e-05, -4.060566425323486e-05, -3.904290497303009e-05, -3.748014569282532e-05, -3.5917386412620544e-05, -3.435462713241577e-05, -3.2791867852211e-05, -3.1229108572006226e-05, -2.9666349291801453e-05, -2.810359001159668e-05, -2.6540830731391907e-05, -2.4978071451187134e-05, -2.341531217098236e-05, -2.1852552890777588e-05, -2.0289793610572815e-05, -1.8727034330368042e-05, -1.716427505016327e-05, -1.5601515769958496e-05, -1.4038756489753723e-05, -1.247599720954895e-05, -1.0913237929344177e-05, -9.350478649139404e-06, -7.787719368934631e-06, -6.224960088729858e-06, -4.6622008085250854e-06, -3.0994415283203125e-06, -1.5366822481155396e-06, 2.60770320892334e-08, 1.5888363122940063e-06, 3.1515955924987793e-06, 4.714354872703552e-06, 6.277114152908325e-06, 7.839873433113098e-06, 9.402632713317871e-06, 1.0965391993522644e-05, 1.2528151273727417e-05, 1.409091055393219e-05, 1.5653669834136963e-05, 1.7216429114341736e-05, 1.877918839454651e-05, 2.0341947674751282e-05, 2.1904706954956055e-05, 2.3467466235160828e-05, 2.50302255153656e-05, 2.6592984795570374e-05, 2.8155744075775146e-05, 2.971850335597992e-05, 3.128126263618469e-05, 3.2844021916389465e-05, 3.440678119659424e-05, 3.596954047679901e-05, 3.7532299757003784e-05, 3.909505903720856e-05, 4.065781831741333e-05, 4.22205775976181e-05, 4.3783336877822876e-05, 4.534609615802765e-05, 4.690885543823242e-05]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 6.0, 5.0, 22.0, 9.0, 16.0, 25.0, 24.0, 69.0, 107.0, 181.0, 322.0, 660.0, 1488.0, 3548.0, 8403.0, 23075.0, 85470.0, 627280.0, 233607.0, 41141.0, 13444.0, 5321.0, 2246.0, 1002.0, 495.0, 242.0, 130.0, 70.0, 46.0, 38.0, 19.0, 11.0, 13.0, 3.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7175750732421875, -0.693450927734375, -0.6693267822265625, -0.64520263671875, -0.6210784912109375, -0.596954345703125, -0.5728302001953125, -0.5487060546875, -0.5245819091796875, -0.500457763671875, -0.4763336181640625, -0.45220947265625, -0.4280853271484375, -0.403961181640625, -0.3798370361328125, -0.355712890625, -0.3315887451171875, -0.307464599609375, -0.2833404541015625, -0.25921630859375, -0.2350921630859375, -0.210968017578125, -0.1868438720703125, -0.1627197265625, -0.1385955810546875, -0.114471435546875, -0.0903472900390625, -0.06622314453125, -0.0420989990234375, -0.017974853515625, 0.0061492919921875, 0.0302734375, 0.0543975830078125, 0.078521728515625, 0.1026458740234375, 0.12677001953125, 0.1508941650390625, 0.175018310546875, 0.1991424560546875, 0.2232666015625, 0.2473907470703125, 0.271514892578125, 0.2956390380859375, 0.31976318359375, 0.3438873291015625, 0.368011474609375, 0.3921356201171875, 0.416259765625, 0.4403839111328125, 0.464508056640625, 0.4886322021484375, 0.51275634765625, 0.5368804931640625, 0.561004638671875, 0.5851287841796875, 0.6092529296875, 0.6333770751953125, 0.657501220703125, 0.6816253662109375, 0.70574951171875, 0.7298736572265625, 0.753997802734375, 0.7781219482421875, 0.80224609375]}, "gradients/decoder.bert.encoder.layer.6.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 8.0, 6.0, 6.0, 7.0, 7.0, 19.0, 23.0, 34.0, 42.0, 76.0, 105.0, 176.0, 164.0, 107.0, 62.0, 40.0, 17.0, 23.0, 21.0, 12.0, 8.0, 7.0, 11.0, 7.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07769775390625, -0.07398700714111328, -0.07027626037597656, -0.06656551361083984, -0.06285476684570312, -0.059144020080566406, -0.05543327331542969, -0.05172252655029297, -0.04801177978515625, -0.04430103302001953, -0.04059028625488281, -0.036879539489746094, -0.033168792724609375, -0.029458045959472656, -0.025747299194335938, -0.02203655242919922, -0.0183258056640625, -0.014615058898925781, -0.010904312133789062, -0.007193565368652344, -0.003482818603515625, 0.00022792816162109375, 0.0039386749267578125, 0.007649421691894531, 0.01136016845703125, 0.015070915222167969, 0.018781661987304688, 0.022492408752441406, 0.026203155517578125, 0.029913902282714844, 0.03362464904785156, 0.03733539581298828, 0.041046142578125, 0.04475688934326172, 0.04846763610839844, 0.052178382873535156, 0.055889129638671875, 0.059599876403808594, 0.06331062316894531, 0.06702136993408203, 0.07073211669921875, 0.07444286346435547, 0.07815361022949219, 0.0818643569946289, 0.08557510375976562, 0.08928585052490234, 0.09299659729003906, 0.09670734405517578, 0.1004180908203125, 0.10412883758544922, 0.10783958435058594, 0.11155033111572266, 0.11526107788085938, 0.1189718246459961, 0.12268257141113281, 0.12639331817626953, 0.13010406494140625, 0.13381481170654297, 0.1375255584716797, 0.1412363052368164, 0.14494705200195312, 0.14865779876708984, 0.15236854553222656, 0.15607929229736328, 0.1597900390625]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 7.0, 9.0, 10.0, 12.0, 13.0, 16.0, 38.0, 31.0, 50.0, 52.0, 58.0, 86.0, 76.0, 73.0, 78.0, 68.0, 59.0, 69.0, 47.0, 41.0, 21.0, 21.0, 16.0, 17.0, 10.0, 4.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.105216026306152, -7.8560895919799805, -7.60696268081665, -7.3578362464904785, -7.108709812164307, -6.859582901000977, -6.610456466674805, -6.361330032348633, -6.112203598022461, -5.863077163696289, -5.613950252532959, -5.364823818206787, -5.115697383880615, -4.866570472717285, -4.617444038391113, -4.368317604064941, -4.1191911697387695, -3.8700644969940186, -3.6209380626678467, -3.3718113899230957, -3.122684955596924, -2.873558282852173, -2.624431610107422, -2.37530517578125, -2.12617826461792, -1.8770517110824585, -1.627925157546997, -1.378798484802246, -1.1296720504760742, -0.8805453777313232, -0.6314188241958618, -0.3822922706604004, -0.13316583633422852, 0.1159607321023941, 0.3650873005390167, 0.6142138838768005, 0.863340437412262, 1.1124670505523682, 1.3615936040878296, 1.610720157623291, 1.8598467111587524, 2.108973264694214, 2.358099937438965, 2.6072263717651367, 2.8563530445098877, 3.1054797172546387, 3.3546061515808105, 3.6037325859069824, 3.8528592586517334, 4.101985931396484, 4.351112365722656, 4.600238800048828, 4.849365711212158, 5.09849214553833, 5.347618579864502, 5.596745491027832, 5.845871925354004, 6.094998359680176, 6.344125270843506, 6.593251705169678, 6.84237813949585, 7.09150505065918, 7.340631484985352, 7.589757919311523, 7.838884353637695]}, "gradients/decoder.bert.encoder.layer.6.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 0.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 15.0, 17.0, 22.0, 16.0, 16.0, 26.0, 27.0, 27.0, 32.0, 35.0, 33.0, 34.0, 39.0, 39.0, 44.0, 41.0, 41.0, 47.0, 42.0, 43.0, 28.0, 40.0, 39.0, 37.0, 21.0, 23.0, 20.0, 26.0, 17.0, 15.0, 14.0, 8.0, 6.0, 7.0, 10.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.305217981338501, -3.2046446800231934, -3.1040713787078857, -3.003498077392578, -2.9029247760772705, -2.802351474761963, -2.7017784118652344, -2.6012048721313477, -2.500631809234619, -2.4000585079193115, -2.299485206604004, -2.1989119052886963, -2.0983386039733887, -1.997765302658081, -1.897192120552063, -1.7966188192367554, -1.6960453987121582, -1.5954720973968506, -1.494898796081543, -1.3943254947662354, -1.2937521934509277, -1.1931788921356201, -1.092605710029602, -0.9920324087142944, -0.8914591073989868, -0.7908858060836792, -0.6903125047683716, -0.5897392630577087, -0.4891659617424011, -0.3885926604270935, -0.28801941871643066, -0.18744611740112305, -0.08687257766723633, 0.013700708746910095, 0.11427399516105652, 0.21484726667404175, 0.31542056798934937, 0.415993869304657, 0.5165671110153198, 0.6171404123306274, 0.7177137136459351, 0.8182870149612427, 0.9188603162765503, 1.0194334983825684, 1.120006799697876, 1.2205801010131836, 1.3211534023284912, 1.4217267036437988, 1.5223000049591064, 1.622873306274414, 1.7234466075897217, 1.8240199089050293, 1.924593210220337, 2.0251665115356445, 2.125739574432373, 2.2263131141662598, 2.3268861770629883, 2.427459478378296, 2.5280327796936035, 2.628606081008911, 2.7291793823242188, 2.8297526836395264, 2.930325984954834, 3.0308990478515625, 3.131472587585449]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 3.0, 7.0, 16.0, 11.0, 17.0, 27.0, 37.0, 49.0, 56.0, 92.0, 132.0, 229.0, 274.0, 476.0, 605.0, 938.0, 1464.0, 2226.0, 3529.0, 5716.0, 9156.0, 15202.0, 25115.0, 42293.0, 68367.0, 106208.0, 147140.0, 168990.0, 151587.0, 111618.0, 72786.0, 44754.0, 26745.0, 15905.0, 9821.0, 5957.0, 3861.0, 2372.0, 1532.0, 1068.0, 677.0, 460.0, 314.0, 222.0, 146.0, 114.0, 84.0, 48.0, 35.0, 20.0, 16.0, 9.0, 11.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-4.4921875, -4.349853515625, -4.20751953125, -4.065185546875, -3.9228515625, -3.780517578125, -3.63818359375, -3.495849609375, -3.353515625, -3.211181640625, -3.06884765625, -2.926513671875, -2.7841796875, -2.641845703125, -2.49951171875, -2.357177734375, -2.21484375, -2.072509765625, -1.93017578125, -1.787841796875, -1.6455078125, -1.503173828125, -1.36083984375, -1.218505859375, -1.076171875, -0.933837890625, -0.79150390625, -0.649169921875, -0.5068359375, -0.364501953125, -0.22216796875, -0.079833984375, 0.0625, 0.204833984375, 0.34716796875, 0.489501953125, 0.6318359375, 0.774169921875, 0.91650390625, 1.058837890625, 1.201171875, 1.343505859375, 1.48583984375, 1.628173828125, 1.7705078125, 1.912841796875, 2.05517578125, 2.197509765625, 2.33984375, 2.482177734375, 2.62451171875, 2.766845703125, 2.9091796875, 3.051513671875, 3.19384765625, 3.336181640625, 3.478515625, 3.620849609375, 3.76318359375, 3.905517578125, 4.0478515625, 4.190185546875, 4.33251953125, 4.474853515625, 4.6171875]}, "gradients/decoder.bert.encoder.layer.6.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 6.0, 5.0, 11.0, 14.0, 9.0, 15.0, 19.0, 18.0, 19.0, 20.0, 29.0, 36.0, 24.0, 29.0, 27.0, 32.0, 27.0, 39.0, 31.0, 43.0, 41.0, 45.0, 54.0, 40.0, 50.0, 38.0, 28.0, 29.0, 23.0, 28.0, 27.0, 18.0, 19.0, 8.0, 13.0, 16.0, 11.0, 8.0, 7.0, 9.0, 8.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0], "bins": [-3.501953125, -3.39642333984375, -3.2908935546875, -3.18536376953125, -3.079833984375, -2.97430419921875, -2.8687744140625, -2.76324462890625, -2.65771484375, -2.55218505859375, -2.4466552734375, -2.34112548828125, -2.235595703125, -2.13006591796875, -2.0245361328125, -1.91900634765625, -1.8134765625, -1.70794677734375, -1.6024169921875, -1.49688720703125, -1.391357421875, -1.28582763671875, -1.1802978515625, -1.07476806640625, -0.96923828125, -0.86370849609375, -0.7581787109375, -0.65264892578125, -0.547119140625, -0.44158935546875, -0.3360595703125, -0.23052978515625, -0.125, -0.01947021484375, 0.0860595703125, 0.19158935546875, 0.297119140625, 0.40264892578125, 0.5081787109375, 0.61370849609375, 0.71923828125, 0.82476806640625, 0.9302978515625, 1.03582763671875, 1.141357421875, 1.24688720703125, 1.3524169921875, 1.45794677734375, 1.5634765625, 1.66900634765625, 1.7745361328125, 1.88006591796875, 1.985595703125, 2.09112548828125, 2.1966552734375, 2.30218505859375, 2.40771484375, 2.51324462890625, 2.6187744140625, 2.72430419921875, 2.829833984375, 2.93536376953125, 3.0408935546875, 3.14642333984375, 3.251953125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 8.0, 6.0, 14.0, 12.0, 25.0, 32.0, 48.0, 81.0, 151.0, 209.0, 330.0, 594.0, 1126.0, 1953.0, 4001.0, 8456.0, 18459.0, 41836.0, 94849.0, 187946.0, 264318.0, 214442.0, 114779.0, 51821.0, 22810.0, 10072.0, 4797.0, 2410.0, 1243.0, 683.0, 425.0, 230.0, 140.0, 92.0, 50.0, 39.0, 23.0, 17.0, 8.0, 11.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.421875, -7.19439697265625, -6.9669189453125, -6.73944091796875, -6.511962890625, -6.28448486328125, -6.0570068359375, -5.82952880859375, -5.60205078125, -5.37457275390625, -5.1470947265625, -4.91961669921875, -4.692138671875, -4.46466064453125, -4.2371826171875, -4.00970458984375, -3.7822265625, -3.55474853515625, -3.3272705078125, -3.09979248046875, -2.872314453125, -2.64483642578125, -2.4173583984375, -2.18988037109375, -1.96240234375, -1.73492431640625, -1.5074462890625, -1.27996826171875, -1.052490234375, -0.82501220703125, -0.5975341796875, -0.37005615234375, -0.142578125, 0.08489990234375, 0.3123779296875, 0.53985595703125, 0.767333984375, 0.99481201171875, 1.2222900390625, 1.44976806640625, 1.67724609375, 1.90472412109375, 2.1322021484375, 2.35968017578125, 2.587158203125, 2.81463623046875, 3.0421142578125, 3.26959228515625, 3.4970703125, 3.72454833984375, 3.9520263671875, 4.17950439453125, 4.406982421875, 4.63446044921875, 4.8619384765625, 5.08941650390625, 5.31689453125, 5.54437255859375, 5.7718505859375, 5.99932861328125, 6.226806640625, 6.45428466796875, 6.6817626953125, 6.90924072265625, 7.13671875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 13.0, 7.0, 16.0, 19.0, 18.0, 14.0, 21.0, 17.0, 21.0, 48.0, 36.0, 40.0, 28.0, 40.0, 38.0, 53.0, 42.0, 48.0, 33.0, 39.0, 41.0, 35.0, 31.0, 32.0, 25.0, 33.0, 28.0, 21.0, 23.0, 26.0, 20.0, 10.0, 12.0, 11.0, 8.0, 5.0, 11.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.921875, -1.85528564453125, -1.7886962890625, -1.72210693359375, -1.655517578125, -1.58892822265625, -1.5223388671875, -1.45574951171875, -1.38916015625, -1.32257080078125, -1.2559814453125, -1.18939208984375, -1.122802734375, -1.05621337890625, -0.9896240234375, -0.92303466796875, -0.8564453125, -0.78985595703125, -0.7232666015625, -0.65667724609375, -0.590087890625, -0.52349853515625, -0.4569091796875, -0.39031982421875, -0.32373046875, -0.25714111328125, -0.1905517578125, -0.12396240234375, -0.057373046875, 0.00921630859375, 0.0758056640625, 0.14239501953125, 0.208984375, 0.27557373046875, 0.3421630859375, 0.40875244140625, 0.475341796875, 0.54193115234375, 0.6085205078125, 0.67510986328125, 0.74169921875, 0.80828857421875, 0.8748779296875, 0.94146728515625, 1.008056640625, 1.07464599609375, 1.1412353515625, 1.20782470703125, 1.2744140625, 1.34100341796875, 1.4075927734375, 1.47418212890625, 1.540771484375, 1.60736083984375, 1.6739501953125, 1.74053955078125, 1.80712890625, 1.87371826171875, 1.9403076171875, 2.00689697265625, 2.073486328125, 2.14007568359375, 2.2066650390625, 2.27325439453125, 2.33984375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 13.0, 8.0, 11.0, 9.0, 15.0, 26.0, 26.0, 41.0, 69.0, 70.0, 99.0, 141.0, 168.0, 260.0, 332.0, 497.0, 613.0, 985.0, 1625.0, 2539.0, 4540.0, 8783.0, 18724.0, 44677.0, 119183.0, 286370.0, 317309.0, 143425.0, 52867.0, 21650.0, 10164.0, 5049.0, 2819.0, 1731.0, 1139.0, 692.0, 532.0, 348.0, 268.0, 192.0, 126.0, 93.0, 79.0, 62.0, 37.0, 46.0, 25.0, 25.0, 15.0, 13.0, 13.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.734375, -5.56109619140625, -5.3878173828125, -5.21453857421875, -5.041259765625, -4.86798095703125, -4.6947021484375, -4.52142333984375, -4.34814453125, -4.17486572265625, -4.0015869140625, -3.82830810546875, -3.655029296875, -3.48175048828125, -3.3084716796875, -3.13519287109375, -2.9619140625, -2.78863525390625, -2.6153564453125, -2.44207763671875, -2.268798828125, -2.09552001953125, -1.9222412109375, -1.74896240234375, -1.57568359375, -1.40240478515625, -1.2291259765625, -1.05584716796875, -0.882568359375, -0.70928955078125, -0.5360107421875, -0.36273193359375, -0.189453125, -0.01617431640625, 0.1571044921875, 0.33038330078125, 0.503662109375, 0.67694091796875, 0.8502197265625, 1.02349853515625, 1.19677734375, 1.37005615234375, 1.5433349609375, 1.71661376953125, 1.889892578125, 2.06317138671875, 2.2364501953125, 2.40972900390625, 2.5830078125, 2.75628662109375, 2.9295654296875, 3.10284423828125, 3.276123046875, 3.44940185546875, 3.6226806640625, 3.79595947265625, 3.96923828125, 4.14251708984375, 4.3157958984375, 4.48907470703125, 4.662353515625, 4.83563232421875, 5.0089111328125, 5.18218994140625, 5.35546875]}, "gradients/decoder.bert.encoder.layer.6.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 20.0, 9.0, 25.0, 31.0, 54.0, 85.0, 110.0, 138.0, 154.0, 110.0, 71.0, 59.0, 37.0, 23.0, 14.0, 14.0, 5.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006833076477050781, -0.0006625279784202576, -0.000641748309135437, -0.0006209686398506165, -0.0006001889705657959, -0.0005794093012809753, -0.0005586296319961548, -0.0005378499627113342, -0.0005170702934265137, -0.0004962906241416931, -0.00047551095485687256, -0.000454731285572052, -0.00043395161628723145, -0.0004131719470024109, -0.00039239227771759033, -0.0003716126084327698, -0.0003508329391479492, -0.00033005326986312866, -0.0003092736005783081, -0.00028849393129348755, -0.000267714262008667, -0.00024693459272384644, -0.00022615492343902588, -0.00020537525415420532, -0.00018459558486938477, -0.0001638159155845642, -0.00014303624629974365, -0.0001222565770149231, -0.00010147690773010254, -8.069723844528198e-05, -5.9917569160461426e-05, -3.913789987564087e-05, -1.8358230590820312e-05, 2.421438694000244e-06, 2.32011079788208e-05, 4.398077726364136e-05, 6.476044654846191e-05, 8.554011583328247e-05, 0.00010631978511810303, 0.00012709945440292358, 0.00014787912368774414, 0.0001686587929725647, 0.00018943846225738525, 0.0002102181315422058, 0.00023099780082702637, 0.0002517774701118469, 0.0002725571393966675, 0.00029333680868148804, 0.0003141164779663086, 0.00033489614725112915, 0.0003556758165359497, 0.00037645548582077026, 0.0003972351551055908, 0.0004180148243904114, 0.00043879449367523193, 0.0004595741629600525, 0.00048035383224487305, 0.0005011335015296936, 0.0005219131708145142, 0.0005426928400993347, 0.0005634725093841553, 0.0005842521786689758, 0.0006050318479537964, 0.0006258115172386169, 0.0006465911865234375]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 10.0, 9.0, 10.0, 20.0, 27.0, 47.0, 63.0, 110.0, 169.0, 221.0, 344.0, 467.0, 781.0, 1120.0, 1814.0, 2909.0, 4899.0, 9390.0, 20101.0, 46905.0, 115079.0, 240959.0, 291260.0, 175709.0, 74743.0, 30369.0, 13818.0, 6906.0, 3791.0, 2257.0, 1418.0, 972.0, 642.0, 395.0, 249.0, 170.0, 121.0, 86.0, 60.0, 45.0, 27.0, 17.0, 14.0, 16.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.2620849609375, -4.125732421875, -3.9893798828125, -3.85302734375, -3.7166748046875, -3.580322265625, -3.4439697265625, -3.3076171875, -3.1712646484375, -3.034912109375, -2.8985595703125, -2.76220703125, -2.6258544921875, -2.489501953125, -2.3531494140625, -2.216796875, -2.0804443359375, -1.944091796875, -1.8077392578125, -1.67138671875, -1.5350341796875, -1.398681640625, -1.2623291015625, -1.1259765625, -0.9896240234375, -0.853271484375, -0.7169189453125, -0.58056640625, -0.4442138671875, -0.307861328125, -0.1715087890625, -0.03515625, 0.1011962890625, 0.237548828125, 0.3739013671875, 0.51025390625, 0.6466064453125, 0.782958984375, 0.9193115234375, 1.0556640625, 1.1920166015625, 1.328369140625, 1.4647216796875, 1.60107421875, 1.7374267578125, 1.873779296875, 2.0101318359375, 2.146484375, 2.2828369140625, 2.419189453125, 2.5555419921875, 2.69189453125, 2.8282470703125, 2.964599609375, 3.1009521484375, 3.2373046875, 3.3736572265625, 3.510009765625, 3.6463623046875, 3.78271484375, 3.9190673828125, 4.055419921875, 4.1917724609375, 4.328125]}, "gradients/decoder.bert.encoder.layer.6.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 14.0, 15.0, 46.0, 47.0, 85.0, 87.0, 128.0, 143.0, 120.0, 102.0, 79.0, 37.0, 31.0, 16.0, 18.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.90625, -1.84930419921875, -1.7923583984375, -1.73541259765625, -1.678466796875, -1.62152099609375, -1.5645751953125, -1.50762939453125, -1.45068359375, -1.39373779296875, -1.3367919921875, -1.27984619140625, -1.222900390625, -1.16595458984375, -1.1090087890625, -1.05206298828125, -0.9951171875, -0.93817138671875, -0.8812255859375, -0.82427978515625, -0.767333984375, -0.71038818359375, -0.6534423828125, -0.59649658203125, -0.53955078125, -0.48260498046875, -0.4256591796875, -0.36871337890625, -0.311767578125, -0.25482177734375, -0.1978759765625, -0.14093017578125, -0.083984375, -0.02703857421875, 0.0299072265625, 0.08685302734375, 0.143798828125, 0.20074462890625, 0.2576904296875, 0.31463623046875, 0.37158203125, 0.42852783203125, 0.4854736328125, 0.54241943359375, 0.599365234375, 0.65631103515625, 0.7132568359375, 0.77020263671875, 0.8271484375, 0.88409423828125, 0.9410400390625, 0.99798583984375, 1.054931640625, 1.11187744140625, 1.1688232421875, 1.22576904296875, 1.28271484375, 1.33966064453125, 1.3966064453125, 1.45355224609375, 1.510498046875, 1.56744384765625, 1.6243896484375, 1.68133544921875, 1.73828125]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 14.0, 19.0, 23.0, 31.0, 38.0, 47.0, 61.0, 73.0, 99.0, 90.0, 75.0, 89.0, 64.0, 51.0, 47.0, 45.0, 34.0, 28.0, 16.0, 9.0, 11.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.25886344909668, -7.984199047088623, -7.709534645080566, -7.43487024307251, -7.160205841064453, -6.8855414390563965, -6.61087703704834, -6.336212158203125, -6.061548233032227, -5.78688383102417, -5.512219429016113, -5.237555027008057, -4.962890625, -4.688226222991943, -4.413561820983887, -4.138896942138672, -3.8642325401306152, -3.5895681381225586, -3.314903736114502, -3.0402393341064453, -2.7655749320983887, -2.490910530090332, -2.2162458896636963, -1.9415814876556396, -1.666917085647583, -1.3922526836395264, -1.1175882816314697, -0.8429237604141235, -0.5682593584060669, -0.29359495639801025, -0.018930435180664062, 0.2557339668273926, 0.5303983688354492, 0.8050627708435059, 1.0797271728515625, 1.3543916940689087, 1.6290560960769653, 1.903720498085022, 2.178385019302368, 2.453049421310425, 2.7277138233184814, 3.002378225326538, 3.2770426273345947, 3.5517072677612305, 3.826371669769287, 4.101036071777344, 4.3757004737854, 4.650364875793457, 4.925029277801514, 5.19969367980957, 5.474358081817627, 5.749022483825684, 6.02368688583374, 6.298351287841797, 6.573016166687012, 6.84768009185791, 7.122344970703125, 7.397009372711182, 7.671673774719238, 7.946338176727295, 8.221002578735352, 8.495667457580566, 8.770331382751465, 9.04499626159668, 9.319660186767578]}, "gradients/decoder.bert.encoder.layer.5.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 8.0, 5.0, 10.0, 11.0, 9.0, 12.0, 10.0, 25.0, 15.0, 11.0, 18.0, 23.0, 21.0, 34.0, 37.0, 41.0, 31.0, 37.0, 34.0, 48.0, 36.0, 39.0, 33.0, 39.0, 40.0, 42.0, 31.0, 31.0, 23.0, 31.0, 27.0, 22.0, 18.0, 28.0, 14.0, 15.0, 18.0, 10.0, 10.0, 8.0, 15.0, 7.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-3.2262632846832275, -3.127998113632202, -3.0297329425811768, -2.9314680099487305, -2.833202838897705, -2.7349376678466797, -2.6366724967956543, -2.538407325744629, -2.4401421546936035, -2.341876983642578, -2.2436118125915527, -2.1453466415405273, -2.047081708908081, -1.9488165378570557, -1.8505513668060303, -1.7522861957550049, -1.6540212631225586, -1.5557560920715332, -1.4574910402297974, -1.359225869178772, -1.2609608173370361, -1.1626956462860107, -1.0644304752349854, -0.9661653637886047, -0.8679002523422241, -0.7696351408958435, -0.6713700294494629, -0.5731048583984375, -0.4748397469520569, -0.37657463550567627, -0.2783094644546509, -0.18004435300827026, -0.08177924156188965, 0.01648588478565216, 0.11475101113319397, 0.21301615238189697, 0.3112812638282776, 0.4095463752746582, 0.5078115463256836, 0.6060766577720642, 0.7043417692184448, 0.8026068806648254, 0.900871992111206, 0.9991371631622314, 1.0974023342132568, 1.1956673860549927, 1.293932557106018, 1.392197608947754, 1.4904627799987793, 1.5887279510498047, 1.6869930028915405, 1.785258173942566, 1.8835232257843018, 1.9817883968353271, 2.0800535678863525, 2.178318738937378, 2.276583671569824, 2.3748488426208496, 2.473114013671875, 2.5713791847229004, 2.6696441173553467, 2.767909288406372, 2.8661744594573975, 2.964439630508423, 3.0627048015594482]}, "gradients/decoder.bert.encoder.layer.5.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 5.0, 13.0, 16.0, 16.0, 25.0, 36.0, 47.0, 59.0, 107.0, 145.0, 247.0, 312.0, 554.0, 794.0, 1213.0, 2057.0, 3362.0, 5814.0, 10099.0, 17516.0, 33247.0, 64025.0, 131685.0, 292347.0, 679873.0, 1176654.0, 954166.0, 441214.0, 191189.0, 88546.0, 44364.0, 23435.0, 13165.0, 7239.0, 4164.0, 2525.0, 1531.0, 910.0, 602.0, 340.0, 237.0, 126.0, 98.0, 53.0, 34.0, 21.0, 15.0, 20.0, 10.0, 2.0, 2.0, 4.0, 2.0, 3.0], "bins": [-7.33203125, -7.12689208984375, -6.9217529296875, -6.71661376953125, -6.511474609375, -6.30633544921875, -6.1011962890625, -5.89605712890625, -5.69091796875, -5.48577880859375, -5.2806396484375, -5.07550048828125, -4.870361328125, -4.66522216796875, -4.4600830078125, -4.25494384765625, -4.0498046875, -3.84466552734375, -3.6395263671875, -3.43438720703125, -3.229248046875, -3.02410888671875, -2.8189697265625, -2.61383056640625, -2.40869140625, -2.20355224609375, -1.9984130859375, -1.79327392578125, -1.588134765625, -1.38299560546875, -1.1778564453125, -0.97271728515625, -0.767578125, -0.56243896484375, -0.3572998046875, -0.15216064453125, 0.052978515625, 0.25811767578125, 0.4632568359375, 0.66839599609375, 0.87353515625, 1.07867431640625, 1.2838134765625, 1.48895263671875, 1.694091796875, 1.89923095703125, 2.1043701171875, 2.30950927734375, 2.5146484375, 2.71978759765625, 2.9249267578125, 3.13006591796875, 3.335205078125, 3.54034423828125, 3.7454833984375, 3.95062255859375, 4.15576171875, 4.36090087890625, 4.5660400390625, 4.77117919921875, 4.976318359375, 5.18145751953125, 5.3865966796875, 5.59173583984375, 5.796875]}, "gradients/decoder.bert.encoder.layer.5.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 9.0, 12.0, 10.0, 6.0, 11.0, 19.0, 17.0, 18.0, 18.0, 28.0, 34.0, 35.0, 28.0, 47.0, 36.0, 44.0, 39.0, 38.0, 46.0, 45.0, 41.0, 40.0, 44.0, 38.0, 38.0, 33.0, 33.0, 23.0, 24.0, 21.0, 13.0, 17.0, 17.0, 13.0, 14.0, 11.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0], "bins": [-3.37890625, -3.284576416015625, -3.19024658203125, -3.095916748046875, -3.0015869140625, -2.907257080078125, -2.81292724609375, -2.718597412109375, -2.624267578125, -2.529937744140625, -2.43560791015625, -2.341278076171875, -2.2469482421875, -2.152618408203125, -2.05828857421875, -1.963958740234375, -1.86962890625, -1.775299072265625, -1.68096923828125, -1.586639404296875, -1.4923095703125, -1.397979736328125, -1.30364990234375, -1.209320068359375, -1.114990234375, -1.020660400390625, -0.92633056640625, -0.832000732421875, -0.7376708984375, -0.643341064453125, -0.54901123046875, -0.454681396484375, -0.3603515625, -0.266021728515625, -0.17169189453125, -0.077362060546875, 0.0169677734375, 0.111297607421875, 0.20562744140625, 0.299957275390625, 0.394287109375, 0.488616943359375, 0.58294677734375, 0.677276611328125, 0.7716064453125, 0.865936279296875, 0.96026611328125, 1.054595947265625, 1.14892578125, 1.243255615234375, 1.33758544921875, 1.431915283203125, 1.5262451171875, 1.620574951171875, 1.71490478515625, 1.809234619140625, 1.903564453125, 1.997894287109375, 2.09222412109375, 2.186553955078125, 2.2808837890625, 2.375213623046875, 2.46954345703125, 2.563873291015625, 2.658203125]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 9.0, 10.0, 16.0, 18.0, 27.0, 53.0, 61.0, 121.0, 165.0, 234.0, 379.0, 574.0, 871.0, 1430.0, 2467.0, 4080.0, 7048.0, 12610.0, 23141.0, 44878.0, 89764.0, 187086.0, 400990.0, 825705.0, 1146397.0, 751888.0, 356572.0, 167262.0, 80713.0, 40437.0, 21336.0, 11641.0, 6467.0, 3779.0, 2219.0, 1423.0, 897.0, 532.0, 341.0, 210.0, 150.0, 99.0, 57.0, 44.0, 20.0, 17.0, 16.0, 9.0, 10.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.87890625, -7.63592529296875, -7.3929443359375, -7.14996337890625, -6.906982421875, -6.66400146484375, -6.4210205078125, -6.17803955078125, -5.93505859375, -5.69207763671875, -5.4490966796875, -5.20611572265625, -4.963134765625, -4.72015380859375, -4.4771728515625, -4.23419189453125, -3.9912109375, -3.74822998046875, -3.5052490234375, -3.26226806640625, -3.019287109375, -2.77630615234375, -2.5333251953125, -2.29034423828125, -2.04736328125, -1.80438232421875, -1.5614013671875, -1.31842041015625, -1.075439453125, -0.83245849609375, -0.5894775390625, -0.34649658203125, -0.103515625, 0.13946533203125, 0.3824462890625, 0.62542724609375, 0.868408203125, 1.11138916015625, 1.3543701171875, 1.59735107421875, 1.84033203125, 2.08331298828125, 2.3262939453125, 2.56927490234375, 2.812255859375, 3.05523681640625, 3.2982177734375, 3.54119873046875, 3.7841796875, 4.02716064453125, 4.2701416015625, 4.51312255859375, 4.756103515625, 4.99908447265625, 5.2420654296875, 5.48504638671875, 5.72802734375, 5.97100830078125, 6.2139892578125, 6.45697021484375, 6.699951171875, 6.94293212890625, 7.1859130859375, 7.42889404296875, 7.671875]}, "gradients/decoder.bert.encoder.layer.5.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 4.0, 4.0, 13.0, 5.0, 15.0, 22.0, 12.0, 26.0, 42.0, 35.0, 58.0, 69.0, 85.0, 124.0, 136.0, 225.0, 226.0, 238.0, 298.0, 284.0, 281.0, 289.0, 281.0, 253.0, 207.0, 161.0, 147.0, 125.0, 101.0, 88.0, 51.0, 36.0, 33.0, 26.0, 17.0, 13.0, 14.0, 8.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.375, -2.3098297119140625, -2.244659423828125, -2.1794891357421875, -2.11431884765625, -2.0491485595703125, -1.983978271484375, -1.9188079833984375, -1.8536376953125, -1.7884674072265625, -1.723297119140625, -1.6581268310546875, -1.59295654296875, -1.5277862548828125, -1.462615966796875, -1.3974456787109375, -1.332275390625, -1.2671051025390625, -1.201934814453125, -1.1367645263671875, -1.07159423828125, -1.0064239501953125, -0.941253662109375, -0.8760833740234375, -0.8109130859375, -0.7457427978515625, -0.680572509765625, -0.6154022216796875, -0.55023193359375, -0.4850616455078125, -0.419891357421875, -0.3547210693359375, -0.28955078125, -0.2243804931640625, -0.159210205078125, -0.0940399169921875, -0.02886962890625, 0.0363006591796875, 0.101470947265625, 0.1666412353515625, 0.2318115234375, 0.2969818115234375, 0.362152099609375, 0.4273223876953125, 0.49249267578125, 0.5576629638671875, 0.622833251953125, 0.6880035400390625, 0.753173828125, 0.8183441162109375, 0.883514404296875, 0.9486846923828125, 1.01385498046875, 1.0790252685546875, 1.144195556640625, 1.2093658447265625, 1.2745361328125, 1.3397064208984375, 1.404876708984375, 1.4700469970703125, 1.53521728515625, 1.6003875732421875, 1.665557861328125, 1.7307281494140625, 1.7958984375]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 15.0, 10.0, 11.0, 21.0, 21.0, 40.0, 43.0, 51.0, 54.0, 72.0, 72.0, 81.0, 73.0, 82.0, 77.0, 61.0, 60.0, 40.0, 40.0, 24.0, 10.0, 9.0, 10.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.115337371826172, -9.808186531066895, -9.501035690307617, -9.19388484954834, -8.886734008789062, -8.579583168029785, -8.272432327270508, -7.965281963348389, -7.658131122589111, -7.350980281829834, -7.043829441070557, -6.736678600311279, -6.42952823638916, -6.122377395629883, -5.8152265548706055, -5.508075714111328, -5.200924873352051, -4.893774032592773, -4.586623191833496, -4.279472351074219, -3.9723217487335205, -3.665170907974243, -3.358020305633545, -3.0508694648742676, -2.7437186241149902, -2.436567783355713, -2.1294169425964355, -1.8222663402557373, -1.51511549949646, -1.2079646587371826, -0.9008139371871948, -0.593663215637207, -0.2865133285522461, 0.020637452602386475, 0.32778823375701904, 0.6349390149116516, 0.9420897960662842, 1.2492406368255615, 1.5563913583755493, 1.863542079925537, 2.1706929206848145, 2.477843761444092, 2.784994602203369, 3.0921452045440674, 3.3992960453033447, 3.706446886062622, 4.01359748840332, 4.320748329162598, 4.627899169921875, 4.935050010681152, 5.24220085144043, 5.549351692199707, 5.856502532958984, 6.163653373718262, 6.470803737640381, 6.777954578399658, 7.0851054191589355, 7.392256259918213, 7.69940710067749, 8.00655746459961, 8.313708305358887, 8.620859146118164, 8.928009986877441, 9.235160827636719, 9.542311668395996]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 3.0, 7.0, 5.0, 4.0, 11.0, 26.0, 19.0, 18.0, 14.0, 13.0, 36.0, 34.0, 36.0, 29.0, 32.0, 34.0, 35.0, 32.0, 42.0, 43.0, 24.0, 36.0, 50.0, 46.0, 35.0, 38.0, 26.0, 30.0, 26.0, 32.0, 26.0, 19.0, 21.0, 19.0, 16.0, 10.0, 9.0, 7.0, 11.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.426629066467285, -3.315779209136963, -3.2049291133880615, -3.09407901763916, -2.983229160308838, -2.8723793029785156, -2.7615292072296143, -2.650679111480713, -2.5398292541503906, -2.4289793968200684, -2.318129301071167, -2.2072792053222656, -2.0964293479919434, -1.9855793714523315, -1.8747293949127197, -1.763879418373108, -1.653029441833496, -1.5421794652938843, -1.4313294887542725, -1.3204795122146606, -1.2096295356750488, -1.098779559135437, -0.9879295825958252, -0.8770796060562134, -0.7662296295166016, -0.6553796529769897, -0.5445296764373779, -0.4336796998977661, -0.3228297233581543, -0.21197974681854248, -0.10112977027893066, 0.009720206260681152, 0.12057018280029297, 0.23142015933990479, 0.3422701358795166, 0.4531201124191284, 0.5639700889587402, 0.674820065498352, 0.7856700420379639, 0.8965200185775757, 1.0073699951171875, 1.1182199716567993, 1.2290699481964111, 1.339919924736023, 1.4507699012756348, 1.5616198778152466, 1.6724698543548584, 1.7833198308944702, 1.894169807434082, 2.0050196647644043, 2.1158697605133057, 2.226719856262207, 2.3375697135925293, 2.4484195709228516, 2.559269666671753, 2.6701197624206543, 2.7809696197509766, 2.891819477081299, 3.0026695728302, 3.1135196685791016, 3.224369525909424, 3.335219383239746, 3.4460694789886475, 3.556919574737549, 3.667769432067871]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 9.0, 8.0, 14.0, 16.0, 18.0, 32.0, 41.0, 71.0, 91.0, 136.0, 198.0, 294.0, 443.0, 736.0, 1210.0, 1979.0, 3407.0, 6287.0, 11134.0, 21249.0, 41730.0, 83827.0, 164038.0, 258373.0, 214263.0, 117138.0, 58207.0, 29122.0, 15020.0, 8018.0, 4530.0, 2634.0, 1575.0, 943.0, 603.0, 373.0, 263.0, 167.0, 130.0, 70.0, 45.0, 30.0, 14.0, 20.0, 16.0, 12.0, 11.0, 6.0, 9.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.767578125, -0.7426071166992188, -0.7176361083984375, -0.6926651000976562, -0.667694091796875, -0.6427230834960938, -0.6177520751953125, -0.5927810668945312, -0.56781005859375, -0.5428390502929688, -0.5178680419921875, -0.49289703369140625, -0.467926025390625, -0.44295501708984375, -0.4179840087890625, -0.39301300048828125, -0.3680419921875, -0.34307098388671875, -0.3180999755859375, -0.29312896728515625, -0.268157958984375, -0.24318695068359375, -0.2182159423828125, -0.19324493408203125, -0.16827392578125, -0.14330291748046875, -0.1183319091796875, -0.09336090087890625, -0.068389892578125, -0.04341888427734375, -0.0184478759765625, 0.00652313232421875, 0.031494140625, 0.05646514892578125, 0.0814361572265625, 0.10640716552734375, 0.131378173828125, 0.15634918212890625, 0.1813201904296875, 0.20629119873046875, 0.23126220703125, 0.25623321533203125, 0.2812042236328125, 0.30617523193359375, 0.331146240234375, 0.35611724853515625, 0.3810882568359375, 0.40605926513671875, 0.4310302734375, 0.45600128173828125, 0.4809722900390625, 0.5059432983398438, 0.530914306640625, 0.5558853149414062, 0.5808563232421875, 0.6058273315429688, 0.63079833984375, 0.6557693481445312, 0.6807403564453125, 0.7057113647460938, 0.730682373046875, 0.7556533813476562, 0.7806243896484375, 0.8055953979492188, 0.83056640625]}, "gradients/decoder.bert.encoder.layer.5.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 1.0, 2.0, 8.0, 5.0, 7.0, 5.0, 9.0, 8.0, 5.0, 15.0, 19.0, 21.0, 23.0, 23.0, 28.0, 29.0, 31.0, 41.0, 35.0, 31.0, 38.0, 42.0, 36.0, 48.0, 41.0, 49.0, 38.0, 47.0, 33.0, 31.0, 37.0, 35.0, 34.0, 26.0, 25.0, 14.0, 19.0, 14.0, 13.0, 7.0, 11.0, 6.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.14031982421875, -3.9993896484375, -3.85845947265625, -3.717529296875, -3.57659912109375, -3.4356689453125, -3.29473876953125, -3.15380859375, -3.01287841796875, -2.8719482421875, -2.73101806640625, -2.590087890625, -2.44915771484375, -2.3082275390625, -2.16729736328125, -2.0263671875, -1.88543701171875, -1.7445068359375, -1.60357666015625, -1.462646484375, -1.32171630859375, -1.1807861328125, -1.03985595703125, -0.89892578125, -0.75799560546875, -0.6170654296875, -0.47613525390625, -0.335205078125, -0.19427490234375, -0.0533447265625, 0.08758544921875, 0.228515625, 0.36944580078125, 0.5103759765625, 0.65130615234375, 0.792236328125, 0.93316650390625, 1.0740966796875, 1.21502685546875, 1.35595703125, 1.49688720703125, 1.6378173828125, 1.77874755859375, 1.919677734375, 2.06060791015625, 2.2015380859375, 2.34246826171875, 2.4833984375, 2.62432861328125, 2.7652587890625, 2.90618896484375, 3.047119140625, 3.18804931640625, 3.3289794921875, 3.46990966796875, 3.61083984375, 3.75177001953125, 3.8927001953125, 4.03363037109375, 4.174560546875, 4.31549072265625, 4.4564208984375, 4.59735107421875, 4.73828125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 6.0, 9.0, 13.0, 16.0, 25.0, 43.0, 44.0, 69.0, 112.0, 129.0, 238.0, 449.0, 676.0, 1269.0, 2475.0, 5431.0, 13705.0, 52133.0, 897394.0, 50158.0, 13562.0, 5152.0, 2446.0, 1218.0, 669.0, 402.0, 214.0, 156.0, 94.0, 58.0, 48.0, 38.0, 19.0, 17.0, 17.0, 15.0, 6.0, 7.0, 8.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.791015625, -2.705108642578125, -2.61920166015625, -2.533294677734375, -2.4473876953125, -2.361480712890625, -2.27557373046875, -2.189666748046875, -2.103759765625, -2.017852783203125, -1.93194580078125, -1.846038818359375, -1.7601318359375, -1.674224853515625, -1.58831787109375, -1.502410888671875, -1.41650390625, -1.330596923828125, -1.24468994140625, -1.158782958984375, -1.0728759765625, -0.986968994140625, -0.90106201171875, -0.815155029296875, -0.729248046875, -0.643341064453125, -0.55743408203125, -0.471527099609375, -0.3856201171875, -0.299713134765625, -0.21380615234375, -0.127899169921875, -0.0419921875, 0.043914794921875, 0.12982177734375, 0.215728759765625, 0.3016357421875, 0.387542724609375, 0.47344970703125, 0.559356689453125, 0.645263671875, 0.731170654296875, 0.81707763671875, 0.902984619140625, 0.9888916015625, 1.074798583984375, 1.16070556640625, 1.246612548828125, 1.33251953125, 1.418426513671875, 1.50433349609375, 1.590240478515625, 1.6761474609375, 1.762054443359375, 1.84796142578125, 1.933868408203125, 2.019775390625, 2.105682373046875, 2.19158935546875, 2.277496337890625, 2.3634033203125, 2.449310302734375, 2.53521728515625, 2.621124267578125, 2.70703125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 11.0, 13.0, 11.0, 25.0, 22.0, 25.0, 32.0, 28.0, 44.0, 45.0, 53.0, 53.0, 55.0, 46.0, 69.0, 59.0, 62.0, 42.0, 49.0, 41.0, 35.0, 42.0, 31.0, 28.0, 16.0, 21.0, 10.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.763671875, -3.638580322265625, -3.51348876953125, -3.388397216796875, -3.2633056640625, -3.138214111328125, -3.01312255859375, -2.888031005859375, -2.762939453125, -2.637847900390625, -2.51275634765625, -2.387664794921875, -2.2625732421875, -2.137481689453125, -2.01239013671875, -1.887298583984375, -1.76220703125, -1.637115478515625, -1.51202392578125, -1.386932373046875, -1.2618408203125, -1.136749267578125, -1.01165771484375, -0.886566162109375, -0.761474609375, -0.636383056640625, -0.51129150390625, -0.386199951171875, -0.2611083984375, -0.136016845703125, -0.01092529296875, 0.114166259765625, 0.2392578125, 0.364349365234375, 0.48944091796875, 0.614532470703125, 0.7396240234375, 0.864715576171875, 0.98980712890625, 1.114898681640625, 1.239990234375, 1.365081787109375, 1.49017333984375, 1.615264892578125, 1.7403564453125, 1.865447998046875, 1.99053955078125, 2.115631103515625, 2.24072265625, 2.365814208984375, 2.49090576171875, 2.615997314453125, 2.7410888671875, 2.866180419921875, 2.99127197265625, 3.116363525390625, 3.241455078125, 3.366546630859375, 3.49163818359375, 3.616729736328125, 3.7418212890625, 3.866912841796875, 3.99200439453125, 4.117095947265625, 4.2421875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 3.0, 15.0, 15.0, 13.0, 23.0, 32.0, 50.0, 56.0, 108.0, 159.0, 247.0, 408.0, 744.0, 2176.0, 19853.0, 1011205.0, 10197.0, 1571.0, 644.0, 388.0, 182.0, 146.0, 80.0, 70.0, 37.0, 34.0, 22.0, 23.0, 13.0, 6.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.095703125, -3.00823974609375, -2.9207763671875, -2.83331298828125, -2.745849609375, -2.65838623046875, -2.5709228515625, -2.48345947265625, -2.39599609375, -2.30853271484375, -2.2210693359375, -2.13360595703125, -2.046142578125, -1.95867919921875, -1.8712158203125, -1.78375244140625, -1.6962890625, -1.60882568359375, -1.5213623046875, -1.43389892578125, -1.346435546875, -1.25897216796875, -1.1715087890625, -1.08404541015625, -0.99658203125, -0.90911865234375, -0.8216552734375, -0.73419189453125, -0.646728515625, -0.55926513671875, -0.4718017578125, -0.38433837890625, -0.296875, -0.20941162109375, -0.1219482421875, -0.03448486328125, 0.052978515625, 0.14044189453125, 0.2279052734375, 0.31536865234375, 0.40283203125, 0.49029541015625, 0.5777587890625, 0.66522216796875, 0.752685546875, 0.84014892578125, 0.9276123046875, 1.01507568359375, 1.1025390625, 1.19000244140625, 1.2774658203125, 1.36492919921875, 1.452392578125, 1.53985595703125, 1.6273193359375, 1.71478271484375, 1.80224609375, 1.88970947265625, 1.9771728515625, 2.06463623046875, 2.152099609375, 2.23956298828125, 2.3270263671875, 2.41448974609375, 2.501953125]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 17.0, 39.0, 76.0, 125.0, 176.0, 175.0, 138.0, 115.0, 67.0, 19.0, 14.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.392333984375e-05, -8.132774382829666e-05, -7.873214781284332e-05, -7.613655179738998e-05, -7.354095578193665e-05, -7.094535976648331e-05, -6.834976375102997e-05, -6.575416773557663e-05, -6.315857172012329e-05, -6.056297570466995e-05, -5.7967379689216614e-05, -5.5371783673763275e-05, -5.2776187658309937e-05, -5.01805916428566e-05, -4.758499562740326e-05, -4.498939961194992e-05, -4.239380359649658e-05, -3.9798207581043243e-05, -3.7202611565589905e-05, -3.4607015550136566e-05, -3.201141953468323e-05, -2.941582351922989e-05, -2.682022750377655e-05, -2.422463148832321e-05, -2.1629035472869873e-05, -1.9033439457416534e-05, -1.6437843441963196e-05, -1.3842247426509857e-05, -1.1246651411056519e-05, -8.65105539560318e-06, -6.055459380149841e-06, -3.4598633646965027e-06, -8.642673492431641e-07, 1.7313286662101746e-06, 4.326924681663513e-06, 6.922520697116852e-06, 9.51811671257019e-06, 1.2113712728023529e-05, 1.4709308743476868e-05, 1.7304904758930206e-05, 1.9900500774383545e-05, 2.2496096789836884e-05, 2.5091692805290222e-05, 2.768728882074356e-05, 3.02828848361969e-05, 3.287848085165024e-05, 3.547407686710358e-05, 3.8069672882556915e-05, 4.0665268898010254e-05, 4.326086491346359e-05, 4.585646092891693e-05, 4.845205694437027e-05, 5.104765295982361e-05, 5.364324897527695e-05, 5.6238844990730286e-05, 5.8834441006183624e-05, 6.143003702163696e-05, 6.40256330370903e-05, 6.662122905254364e-05, 6.921682506799698e-05, 7.181242108345032e-05, 7.440801709890366e-05, 7.7003613114357e-05, 7.959920912981033e-05, 8.219480514526367e-05]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 14.0, 20.0, 26.0, 38.0, 68.0, 73.0, 109.0, 187.0, 264.0, 363.0, 581.0, 943.0, 1483.0, 2454.0, 3903.0, 7155.0, 30454.0, 570994.0, 390410.0, 22574.0, 6585.0, 3690.0, 2240.0, 1390.0, 858.0, 558.0, 361.0, 243.0, 151.0, 92.0, 74.0, 70.0, 26.0, 26.0, 20.0, 15.0, 11.0, 2.0, 7.0, 2.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83642578125, -0.8053665161132812, -0.7743072509765625, -0.7432479858398438, -0.712188720703125, -0.6811294555664062, -0.6500701904296875, -0.6190109252929688, -0.58795166015625, -0.5568923950195312, -0.5258331298828125, -0.49477386474609375, -0.463714599609375, -0.43265533447265625, -0.4015960693359375, -0.37053680419921875, -0.3394775390625, -0.30841827392578125, -0.2773590087890625, -0.24629974365234375, -0.215240478515625, -0.18418121337890625, -0.1531219482421875, -0.12206268310546875, -0.09100341796875, -0.05994415283203125, -0.0288848876953125, 0.00217437744140625, 0.033233642578125, 0.06429290771484375, 0.0953521728515625, 0.12641143798828125, 0.157470703125, 0.18852996826171875, 0.2195892333984375, 0.25064849853515625, 0.281707763671875, 0.31276702880859375, 0.3438262939453125, 0.37488555908203125, 0.40594482421875, 0.43700408935546875, 0.4680633544921875, 0.49912261962890625, 0.530181884765625, 0.5612411499023438, 0.5923004150390625, 0.6233596801757812, 0.6544189453125, 0.6854782104492188, 0.7165374755859375, 0.7475967407226562, 0.778656005859375, 0.8097152709960938, 0.8407745361328125, 0.8718338012695312, 0.90289306640625, 0.9339523315429688, 0.9650115966796875, 0.9960708618164062, 1.027130126953125, 1.0581893920898438, 1.0892486572265625, 1.1203079223632812, 1.1513671875]}, "gradients/decoder.bert.encoder.layer.5.crossattention.self.query.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 10.0, 28.0, 46.0, 59.0, 137.0, 220.0, 205.0, 126.0, 56.0, 31.0, 20.0, 10.0, 7.0, 5.0, 4.0, 5.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1239013671875, -0.11959648132324219, -0.11529159545898438, -0.11098670959472656, -0.10668182373046875, -0.10237693786621094, -0.09807205200195312, -0.09376716613769531, -0.0894622802734375, -0.08515739440917969, -0.08085250854492188, -0.07654762268066406, -0.07224273681640625, -0.06793785095214844, -0.06363296508789062, -0.05932807922363281, -0.055023193359375, -0.05071830749511719, -0.046413421630859375, -0.04210853576660156, -0.03780364990234375, -0.03349876403808594, -0.029193878173828125, -0.024888992309570312, -0.0205841064453125, -0.016279220581054688, -0.011974334716796875, -0.0076694488525390625, -0.00336456298828125, 0.0009403228759765625, 0.005245208740234375, 0.009550094604492188, 0.01385498046875, 0.018159866333007812, 0.022464752197265625, 0.026769638061523438, 0.03107452392578125, 0.03537940979003906, 0.039684295654296875, 0.04398918151855469, 0.0482940673828125, 0.05259895324707031, 0.056903839111328125, 0.06120872497558594, 0.06551361083984375, 0.06981849670410156, 0.07412338256835938, 0.07842826843261719, 0.082733154296875, 0.08703804016113281, 0.09134292602539062, 0.09564781188964844, 0.09995269775390625, 0.10425758361816406, 0.10856246948242188, 0.11286735534667969, 0.1171722412109375, 0.12147712707519531, 0.12578201293945312, 0.13008689880371094, 0.13439178466796875, 0.13869667053222656, 0.14300155639648438, 0.1473064422607422, 0.151611328125]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 10.0, 12.0, 12.0, 17.0, 22.0, 23.0, 56.0, 42.0, 59.0, 54.0, 77.0, 82.0, 70.0, 92.0, 66.0, 56.0, 67.0, 49.0, 41.0, 27.0, 19.0, 8.0, 11.0, 6.0, 11.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75455093383789, -9.4525728225708, -9.150594711303711, -8.848617553710938, -8.546639442443848, -8.244661331176758, -7.942683219909668, -7.640705108642578, -7.3387274742126465, -7.036749362945557, -6.734771728515625, -6.432793617248535, -6.130815505981445, -5.828837871551514, -5.526859760284424, -5.224882125854492, -4.922904014587402, -4.6209259033203125, -4.318948268890381, -4.016970157623291, -3.7149922847747803, -3.4130144119262695, -3.1110363006591797, -2.809058427810669, -2.507080554962158, -2.2051026821136475, -1.9031246900558472, -1.6011466979980469, -1.2991688251495361, -0.9971909523010254, -0.6952129602432251, -0.3932349681854248, -0.09125709533691406, 0.21072083711624146, 0.512698769569397, 0.8146767020225525, 1.116654634475708, 1.4186325073242188, 1.720610499382019, 2.0225884914398193, 2.32456636428833, 2.626544237136841, 2.9285221099853516, 3.2305002212524414, 3.532478094100952, 3.834455966949463, 4.136434078216553, 4.438411712646484, 4.740389823913574, 5.042367935180664, 5.344345569610596, 5.6463236808776855, 5.948301315307617, 6.250279426574707, 6.552257537841797, 6.854235649108887, 7.156213283538818, 7.458191394805908, 7.76016902923584, 8.06214714050293, 8.36412525177002, 8.66610336303711, 8.968080520629883, 9.270058631896973, 9.572036743164062]}, "gradients/decoder.bert.encoder.layer.5.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 5.0, 8.0, 5.0, 5.0, 6.0, 8.0, 19.0, 23.0, 18.0, 16.0, 18.0, 21.0, 36.0, 38.0, 25.0, 39.0, 31.0, 31.0, 40.0, 34.0, 43.0, 30.0, 34.0, 39.0, 52.0, 40.0, 32.0, 37.0, 24.0, 28.0, 29.0, 28.0, 25.0, 20.0, 17.0, 14.0, 17.0, 8.0, 7.0, 11.0, 7.0, 8.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.446017265319824, -3.3359527587890625, -3.225888252258301, -3.115823745727539, -3.0057590007781982, -2.8956944942474365, -2.785629987716675, -2.675565481185913, -2.5655007362365723, -2.4554362297058105, -2.345371723175049, -2.235307216644287, -2.1252424716949463, -2.0151779651641846, -1.9051134586334229, -1.7950489521026611, -1.6849844455718994, -1.5749199390411377, -1.4648553133010864, -1.3547908067703247, -1.2447261810302734, -1.1346616744995117, -1.02459716796875, -0.9145326018333435, -0.804468035697937, -0.6944034695625305, -0.584338903427124, -0.4742743968963623, -0.3642098307609558, -0.2541452646255493, -0.1440807580947876, -0.034016191959381104, 0.07604837417602539, 0.1861129254102707, 0.296177476644516, 0.4062420129776001, 0.5163065791130066, 0.6263711452484131, 0.7364356517791748, 0.8465002179145813, 0.9565647840499878, 1.0666292905807495, 1.1766939163208008, 1.2867584228515625, 1.3968229293823242, 1.5068875551223755, 1.6169520616531372, 1.7270166873931885, 1.8370811939239502, 1.947145700454712, 2.0572102069854736, 2.1672749519348145, 2.277339458465576, 2.387403964996338, 2.4974684715270996, 2.6075329780578613, 2.717597484588623, 2.8276619911193848, 2.9377264976501465, 3.047791004180908, 3.157855749130249, 3.2679202556610107, 3.3779847621917725, 3.488049268722534, 3.598114013671875]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 22.0, 32.0, 37.0, 54.0, 60.0, 119.0, 187.0, 249.0, 400.0, 555.0, 818.0, 1322.0, 1912.0, 2958.0, 4451.0, 6910.0, 10695.0, 16877.0, 25965.0, 40191.0, 61249.0, 88925.0, 120059.0, 142063.0, 141763.0, 119038.0, 88131.0, 60305.0, 39904.0, 26167.0, 16648.0, 10709.0, 6814.0, 4439.0, 2849.0, 1887.0, 1222.0, 897.0, 523.0, 388.0, 245.0, 167.0, 125.0, 84.0, 39.0, 32.0, 30.0, 16.0, 9.0, 7.0, 4.0, 4.0, 2.0, 2.0], "bins": [-4.40625, -4.276611328125, -4.14697265625, -4.017333984375, -3.8876953125, -3.758056640625, -3.62841796875, -3.498779296875, -3.369140625, -3.239501953125, -3.10986328125, -2.980224609375, -2.8505859375, -2.720947265625, -2.59130859375, -2.461669921875, -2.33203125, -2.202392578125, -2.07275390625, -1.943115234375, -1.8134765625, -1.683837890625, -1.55419921875, -1.424560546875, -1.294921875, -1.165283203125, -1.03564453125, -0.906005859375, -0.7763671875, -0.646728515625, -0.51708984375, -0.387451171875, -0.2578125, -0.128173828125, 0.00146484375, 0.131103515625, 0.2607421875, 0.390380859375, 0.52001953125, 0.649658203125, 0.779296875, 0.908935546875, 1.03857421875, 1.168212890625, 1.2978515625, 1.427490234375, 1.55712890625, 1.686767578125, 1.81640625, 1.946044921875, 2.07568359375, 2.205322265625, 2.3349609375, 2.464599609375, 2.59423828125, 2.723876953125, 2.853515625, 2.983154296875, 3.11279296875, 3.242431640625, 3.3720703125, 3.501708984375, 3.63134765625, 3.760986328125, 3.890625]}, "gradients/decoder.bert.encoder.layer.5.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 13.0, 1.0, 6.0, 11.0, 5.0, 12.0, 12.0, 14.0, 21.0, 22.0, 24.0, 24.0, 26.0, 34.0, 36.0, 32.0, 36.0, 35.0, 43.0, 62.0, 38.0, 39.0, 37.0, 48.0, 52.0, 33.0, 49.0, 38.0, 26.0, 23.0, 25.0, 21.0, 19.0, 15.0, 13.0, 11.0, 10.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.6484375, -4.510986328125, -4.37353515625, -4.236083984375, -4.0986328125, -3.961181640625, -3.82373046875, -3.686279296875, -3.548828125, -3.411376953125, -3.27392578125, -3.136474609375, -2.9990234375, -2.861572265625, -2.72412109375, -2.586669921875, -2.44921875, -2.311767578125, -2.17431640625, -2.036865234375, -1.8994140625, -1.761962890625, -1.62451171875, -1.487060546875, -1.349609375, -1.212158203125, -1.07470703125, -0.937255859375, -0.7998046875, -0.662353515625, -0.52490234375, -0.387451171875, -0.25, -0.112548828125, 0.02490234375, 0.162353515625, 0.2998046875, 0.437255859375, 0.57470703125, 0.712158203125, 0.849609375, 0.987060546875, 1.12451171875, 1.261962890625, 1.3994140625, 1.536865234375, 1.67431640625, 1.811767578125, 1.94921875, 2.086669921875, 2.22412109375, 2.361572265625, 2.4990234375, 2.636474609375, 2.77392578125, 2.911376953125, 3.048828125, 3.186279296875, 3.32373046875, 3.461181640625, 3.5986328125, 3.736083984375, 3.87353515625, 4.010986328125, 4.1484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 9.0, 13.0, 22.0, 29.0, 45.0, 68.0, 102.0, 173.0, 279.0, 424.0, 616.0, 993.0, 1589.0, 2614.0, 4251.0, 7126.0, 11392.0, 18983.0, 31565.0, 50035.0, 77443.0, 112062.0, 143136.0, 154231.0, 138012.0, 104939.0, 70884.0, 45713.0, 27609.0, 17314.0, 10427.0, 6368.0, 3800.0, 2285.0, 1470.0, 915.0, 563.0, 368.0, 221.0, 156.0, 104.0, 72.0, 37.0, 30.0, 24.0, 14.0, 10.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.83203125, -4.682861328125, -4.53369140625, -4.384521484375, -4.2353515625, -4.086181640625, -3.93701171875, -3.787841796875, -3.638671875, -3.489501953125, -3.34033203125, -3.191162109375, -3.0419921875, -2.892822265625, -2.74365234375, -2.594482421875, -2.4453125, -2.296142578125, -2.14697265625, -1.997802734375, -1.8486328125, -1.699462890625, -1.55029296875, -1.401123046875, -1.251953125, -1.102783203125, -0.95361328125, -0.804443359375, -0.6552734375, -0.506103515625, -0.35693359375, -0.207763671875, -0.05859375, 0.090576171875, 0.23974609375, 0.388916015625, 0.5380859375, 0.687255859375, 0.83642578125, 0.985595703125, 1.134765625, 1.283935546875, 1.43310546875, 1.582275390625, 1.7314453125, 1.880615234375, 2.02978515625, 2.178955078125, 2.328125, 2.477294921875, 2.62646484375, 2.775634765625, 2.9248046875, 3.073974609375, 3.22314453125, 3.372314453125, 3.521484375, 3.670654296875, 3.81982421875, 3.968994140625, 4.1181640625, 4.267333984375, 4.41650390625, 4.565673828125, 4.71484375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 8.0, 17.0, 15.0, 16.0, 19.0, 21.0, 28.0, 26.0, 38.0, 26.0, 40.0, 49.0, 38.0, 32.0, 52.0, 39.0, 49.0, 38.0, 48.0, 43.0, 40.0, 34.0, 41.0, 38.0, 43.0, 31.0, 16.0, 27.0, 13.0, 18.0, 7.0, 10.0, 8.0, 5.0, 11.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.271484375, -3.175506591796875, -3.07952880859375, -2.983551025390625, -2.8875732421875, -2.791595458984375, -2.69561767578125, -2.599639892578125, -2.503662109375, -2.407684326171875, -2.31170654296875, -2.215728759765625, -2.1197509765625, -2.023773193359375, -1.92779541015625, -1.831817626953125, -1.73583984375, -1.639862060546875, -1.54388427734375, -1.447906494140625, -1.3519287109375, -1.255950927734375, -1.15997314453125, -1.063995361328125, -0.968017578125, -0.872039794921875, -0.77606201171875, -0.680084228515625, -0.5841064453125, -0.488128662109375, -0.39215087890625, -0.296173095703125, -0.2001953125, -0.104217529296875, -0.00823974609375, 0.087738037109375, 0.1837158203125, 0.279693603515625, 0.37567138671875, 0.471649169921875, 0.567626953125, 0.663604736328125, 0.75958251953125, 0.855560302734375, 0.9515380859375, 1.047515869140625, 1.14349365234375, 1.239471435546875, 1.33544921875, 1.431427001953125, 1.52740478515625, 1.623382568359375, 1.7193603515625, 1.815338134765625, 1.91131591796875, 2.007293701171875, 2.103271484375, 2.199249267578125, 2.29522705078125, 2.391204833984375, 2.4871826171875, 2.583160400390625, 2.67913818359375, 2.775115966796875, 2.87109375]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 13.0, 16.0, 28.0, 27.0, 47.0, 67.0, 98.0, 159.0, 195.0, 354.0, 542.0, 858.0, 1336.0, 2265.0, 3787.0, 6321.0, 10573.0, 17449.0, 29972.0, 50559.0, 85677.0, 134924.0, 180383.0, 179871.0, 134459.0, 84977.0, 50242.0, 29424.0, 17702.0, 10349.0, 6125.0, 3733.0, 2325.0, 1389.0, 832.0, 498.0, 335.0, 214.0, 132.0, 97.0, 58.0, 31.0, 36.0, 21.0, 20.0, 6.0, 9.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.804901123046875, -2.71722412109375, -2.629547119140625, -2.5418701171875, -2.454193115234375, -2.36651611328125, -2.278839111328125, -2.191162109375, -2.103485107421875, -2.01580810546875, -1.928131103515625, -1.8404541015625, -1.752777099609375, -1.66510009765625, -1.577423095703125, -1.48974609375, -1.402069091796875, -1.31439208984375, -1.226715087890625, -1.1390380859375, -1.051361083984375, -0.96368408203125, -0.876007080078125, -0.788330078125, -0.700653076171875, -0.61297607421875, -0.525299072265625, -0.4376220703125, -0.349945068359375, -0.26226806640625, -0.174591064453125, -0.0869140625, 0.000762939453125, 0.08843994140625, 0.176116943359375, 0.2637939453125, 0.351470947265625, 0.43914794921875, 0.526824951171875, 0.614501953125, 0.702178955078125, 0.78985595703125, 0.877532958984375, 0.9652099609375, 1.052886962890625, 1.14056396484375, 1.228240966796875, 1.31591796875, 1.403594970703125, 1.49127197265625, 1.578948974609375, 1.6666259765625, 1.754302978515625, 1.84197998046875, 1.929656982421875, 2.017333984375, 2.105010986328125, 2.19268798828125, 2.280364990234375, 2.3680419921875, 2.455718994140625, 2.54339599609375, 2.631072998046875, 2.71875]}, "gradients/decoder.bert.encoder.layer.5.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 9.0, 4.0, 20.0, 23.0, 31.0, 45.0, 41.0, 73.0, 78.0, 123.0, 109.0, 101.0, 87.0, 73.0, 53.0, 41.0, 28.0, 15.0, 11.0, 14.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0007257461547851562, -0.00070919468998909, -0.0006926432251930237, -0.0006760917603969574, -0.0006595402956008911, -0.0006429888308048248, -0.0006264373660087585, -0.0006098859012126923, -0.000593334436416626, -0.0005767829716205597, -0.0005602315068244934, -0.0005436800420284271, -0.0005271285772323608, -0.0005105771124362946, -0.0004940256476402283, -0.000477474182844162, -0.0004609227180480957, -0.0004443712532520294, -0.00042781978845596313, -0.00041126832365989685, -0.00039471685886383057, -0.0003781653940677643, -0.000361613929271698, -0.0003450624644756317, -0.00032851099967956543, -0.00031195953488349915, -0.00029540807008743286, -0.0002788566052913666, -0.0002623051404953003, -0.000245753675699234, -0.00022920221090316772, -0.00021265074610710144, -0.00019609928131103516, -0.00017954781651496887, -0.0001629963517189026, -0.0001464448869228363, -0.00012989342212677002, -0.00011334195733070374, -9.679049253463745e-05, -8.023902773857117e-05, -6.368756294250488e-05, -4.71360981464386e-05, -3.0584633350372314e-05, -1.403316855430603e-05, 2.518296241760254e-06, 1.9069761037826538e-05, 3.562122583389282e-05, 5.2172690629959106e-05, 6.872415542602539e-05, 8.527562022209167e-05, 0.00010182708501815796, 0.00011837854981422424, 0.00013493001461029053, 0.0001514814794063568, 0.0001680329442024231, 0.00018458440899848938, 0.00020113587379455566, 0.00021768733859062195, 0.00023423880338668823, 0.0002507902681827545, 0.0002673417329788208, 0.0002838931977748871, 0.00030044466257095337, 0.00031699612736701965, 0.00033354759216308594]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 1.0, 9.0, 13.0, 15.0, 24.0, 28.0, 37.0, 58.0, 83.0, 115.0, 187.0, 241.0, 364.0, 518.0, 745.0, 1063.0, 1677.0, 2717.0, 4129.0, 6904.0, 11707.0, 19952.0, 34439.0, 59247.0, 97491.0, 147145.0, 182001.0, 168438.0, 121741.0, 76860.0, 45198.0, 26272.0, 15101.0, 8984.0, 5507.0, 3204.0, 2084.0, 1360.0, 885.0, 630.0, 426.0, 267.0, 207.0, 147.0, 111.0, 60.0, 47.0, 40.0, 29.0, 18.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.607421875, -2.519775390625, -2.43212890625, -2.344482421875, -2.2568359375, -2.169189453125, -2.08154296875, -1.993896484375, -1.90625, -1.818603515625, -1.73095703125, -1.643310546875, -1.5556640625, -1.468017578125, -1.38037109375, -1.292724609375, -1.205078125, -1.117431640625, -1.02978515625, -0.942138671875, -0.8544921875, -0.766845703125, -0.67919921875, -0.591552734375, -0.50390625, -0.416259765625, -0.32861328125, -0.240966796875, -0.1533203125, -0.065673828125, 0.02197265625, 0.109619140625, 0.197265625, 0.284912109375, 0.37255859375, 0.460205078125, 0.5478515625, 0.635498046875, 0.72314453125, 0.810791015625, 0.8984375, 0.986083984375, 1.07373046875, 1.161376953125, 1.2490234375, 1.336669921875, 1.42431640625, 1.511962890625, 1.599609375, 1.687255859375, 1.77490234375, 1.862548828125, 1.9501953125, 2.037841796875, 2.12548828125, 2.213134765625, 2.30078125, 2.388427734375, 2.47607421875, 2.563720703125, 2.6513671875, 2.739013671875, 2.82666015625, 2.914306640625, 3.001953125]}, "gradients/decoder.bert.encoder.layer.5.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 8.0, 8.0, 8.0, 9.0, 13.0, 18.0, 16.0, 16.0, 28.0, 26.0, 37.0, 45.0, 51.0, 36.0, 51.0, 51.0, 52.0, 65.0, 53.0, 43.0, 41.0, 43.0, 30.0, 33.0, 29.0, 23.0, 29.0, 20.0, 22.0, 13.0, 17.0, 6.0, 9.0, 10.0, 1.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-0.7255859375, -0.7011795043945312, -0.6767730712890625, -0.6523666381835938, -0.627960205078125, -0.6035537719726562, -0.5791473388671875, -0.5547409057617188, -0.53033447265625, -0.5059280395507812, -0.4815216064453125, -0.45711517333984375, -0.432708740234375, -0.40830230712890625, -0.3838958740234375, -0.35948944091796875, -0.3350830078125, -0.31067657470703125, -0.2862701416015625, -0.26186370849609375, -0.237457275390625, -0.21305084228515625, -0.1886444091796875, -0.16423797607421875, -0.13983154296875, -0.11542510986328125, -0.0910186767578125, -0.06661224365234375, -0.042205810546875, -0.01779937744140625, 0.0066070556640625, 0.03101348876953125, 0.055419921875, 0.07982635498046875, 0.1042327880859375, 0.12863922119140625, 0.153045654296875, 0.17745208740234375, 0.2018585205078125, 0.22626495361328125, 0.25067138671875, 0.27507781982421875, 0.2994842529296875, 0.32389068603515625, 0.348297119140625, 0.37270355224609375, 0.3971099853515625, 0.42151641845703125, 0.4459228515625, 0.47032928466796875, 0.4947357177734375, 0.5191421508789062, 0.543548583984375, 0.5679550170898438, 0.5923614501953125, 0.6167678833007812, 0.64117431640625, 0.6655807495117188, 0.6899871826171875, 0.7143936157226562, 0.738800048828125, 0.7632064819335938, 0.7876129150390625, 0.8120193481445312, 0.83642578125]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 12.0, 10.0, 27.0, 38.0, 31.0, 37.0, 50.0, 68.0, 76.0, 84.0, 85.0, 75.0, 61.0, 57.0, 55.0, 57.0, 45.0, 26.0, 21.0, 18.0, 18.0, 10.0, 5.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.24628734588623, -9.950932502746582, -9.655576705932617, -9.360221862792969, -9.064866065979004, -8.769511222839355, -8.47415542602539, -8.178800582885742, -7.8834452629089355, -7.588089942932129, -7.292734622955322, -6.997379302978516, -6.702024459838867, -6.406668663024902, -6.111313819885254, -5.815958499908447, -5.520603179931641, -5.225247859954834, -4.929892539978027, -4.634537220001221, -4.339181900024414, -4.043827056884766, -3.748471736907959, -3.4531164169311523, -3.1577610969543457, -2.862405776977539, -2.5670504570007324, -2.271695375442505, -1.9763400554656982, -1.6809847354888916, -1.3856295347213745, -1.0902743339538574, -0.7949199676513672, -0.4995647072792053, -0.20420944690704346, 0.09114581346511841, 0.3865010738372803, 0.6818563938140869, 0.977211594581604, 1.272566795349121, 1.5679221153259277, 1.8632774353027344, 2.158632755279541, 2.4539878368377686, 2.749343156814575, 3.044698476791382, 3.3400535583496094, 3.635408878326416, 3.9307641983032227, 4.226119518280029, 4.521474838256836, 4.816830158233643, 5.112185478210449, 5.407540321350098, 5.702895641326904, 5.998250961303711, 6.293606281280518, 6.588961601257324, 6.884316921234131, 7.1796722412109375, 7.475027084350586, 7.770382881164551, 8.0657377243042, 8.361093521118164, 8.656448364257812]}, "gradients/decoder.bert.encoder.layer.4.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 9.0, 9.0, 9.0, 15.0, 20.0, 14.0, 28.0, 15.0, 22.0, 25.0, 37.0, 32.0, 38.0, 44.0, 56.0, 28.0, 40.0, 37.0, 34.0, 38.0, 41.0, 30.0, 40.0, 42.0, 42.0, 29.0, 26.0, 21.0, 28.0, 24.0, 24.0, 10.0, 11.0, 11.0, 7.0, 16.0, 6.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9239768981933594, -3.804469347000122, -3.6849617958068848, -3.5654542446136475, -3.44594669342041, -3.326439380645752, -3.2069315910339355, -3.0874242782592773, -2.96791672706604, -2.8484091758728027, -2.7289016246795654, -2.609394073486328, -2.489886522293091, -2.3703789710998535, -2.2508716583251953, -2.131364107131958, -2.0118565559387207, -1.8923490047454834, -1.772841453552246, -1.6533339023590088, -1.533826470375061, -1.4143189191818237, -1.2948113679885864, -1.1753039360046387, -1.0557961463928223, -0.936288595199585, -0.8167811036109924, -0.6972735524177551, -0.5777660608291626, -0.4582585096359253, -0.338750958442688, -0.21924346685409546, -0.09973597526550293, 0.019771553575992584, 0.1392790824174881, 0.2587866187095642, 0.3782941401004791, 0.49780166149139404, 0.6173092126846313, 0.7368167042732239, 0.8563242554664612, 0.9758318066596985, 1.095339298248291, 1.2148468494415283, 1.3343544006347656, 1.453861951828003, 1.5733695030212402, 1.692876935005188, 1.8123844861984253, 1.9318920373916626, 2.0513994693756104, 2.1709070205688477, 2.290414571762085, 2.4099221229553223, 2.5294296741485596, 2.648937225341797, 2.768444776535034, 2.8879523277282715, 3.007459878921509, 3.126967430114746, 3.2464749813079834, 3.3659825325012207, 3.485489845275879, 3.604997396469116, 3.7245049476623535]}, "gradients/decoder.bert.encoder.layer.4.output.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 7.0, 3.0, 8.0, 9.0, 14.0, 20.0, 31.0, 37.0, 61.0, 77.0, 107.0, 150.0, 223.0, 291.0, 451.0, 617.0, 940.0, 1371.0, 1972.0, 3029.0, 4739.0, 7350.0, 11924.0, 19351.0, 32823.0, 57676.0, 106448.0, 207877.0, 424379.0, 787195.0, 982918.0, 721523.0, 389529.0, 196682.0, 101068.0, 54841.0, 30738.0, 18364.0, 10899.0, 6698.0, 4113.0, 2701.0, 1721.0, 1091.0, 742.0, 453.0, 308.0, 264.0, 150.0, 113.0, 63.0, 44.0, 28.0, 22.0, 17.0, 8.0, 10.0, 4.0, 3.0, 3.0, 1.0], "bins": [-6.46875, -6.2752685546875, -6.081787109375, -5.8883056640625, -5.69482421875, -5.5013427734375, -5.307861328125, -5.1143798828125, -4.9208984375, -4.7274169921875, -4.533935546875, -4.3404541015625, -4.14697265625, -3.9534912109375, -3.760009765625, -3.5665283203125, -3.373046875, -3.1795654296875, -2.986083984375, -2.7926025390625, -2.59912109375, -2.4056396484375, -2.212158203125, -2.0186767578125, -1.8251953125, -1.6317138671875, -1.438232421875, -1.2447509765625, -1.05126953125, -0.8577880859375, -0.664306640625, -0.4708251953125, -0.27734375, -0.0838623046875, 0.109619140625, 0.3031005859375, 0.49658203125, 0.6900634765625, 0.883544921875, 1.0770263671875, 1.2705078125, 1.4639892578125, 1.657470703125, 1.8509521484375, 2.04443359375, 2.2379150390625, 2.431396484375, 2.6248779296875, 2.818359375, 3.0118408203125, 3.205322265625, 3.3988037109375, 3.59228515625, 3.7857666015625, 3.979248046875, 4.1727294921875, 4.3662109375, 4.5596923828125, 4.753173828125, 4.9466552734375, 5.14013671875, 5.3336181640625, 5.527099609375, 5.7205810546875, 5.9140625]}, "gradients/decoder.bert.encoder.layer.4.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 6.0, 9.0, 3.0, 14.0, 12.0, 16.0, 15.0, 18.0, 20.0, 24.0, 25.0, 29.0, 28.0, 24.0, 36.0, 42.0, 39.0, 31.0, 47.0, 47.0, 46.0, 43.0, 41.0, 43.0, 40.0, 36.0, 39.0, 30.0, 23.0, 28.0, 19.0, 25.0, 21.0, 9.0, 11.0, 19.0, 11.0, 4.0, 5.0, 7.0, 4.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.99609375, -3.88427734375, -3.7724609375, -3.66064453125, -3.548828125, -3.43701171875, -3.3251953125, -3.21337890625, -3.1015625, -2.98974609375, -2.8779296875, -2.76611328125, -2.654296875, -2.54248046875, -2.4306640625, -2.31884765625, -2.20703125, -2.09521484375, -1.9833984375, -1.87158203125, -1.759765625, -1.64794921875, -1.5361328125, -1.42431640625, -1.3125, -1.20068359375, -1.0888671875, -0.97705078125, -0.865234375, -0.75341796875, -0.6416015625, -0.52978515625, -0.41796875, -0.30615234375, -0.1943359375, -0.08251953125, 0.029296875, 0.14111328125, 0.2529296875, 0.36474609375, 0.4765625, 0.58837890625, 0.7001953125, 0.81201171875, 0.923828125, 1.03564453125, 1.1474609375, 1.25927734375, 1.37109375, 1.48291015625, 1.5947265625, 1.70654296875, 1.818359375, 1.93017578125, 2.0419921875, 2.15380859375, 2.265625, 2.37744140625, 2.4892578125, 2.60107421875, 2.712890625, 2.82470703125, 2.9365234375, 3.04833984375, 3.16015625]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 12.0, 15.0, 13.0, 25.0, 28.0, 50.0, 73.0, 115.0, 164.0, 228.0, 363.0, 556.0, 834.0, 1284.0, 2089.0, 3413.0, 5844.0, 9992.0, 17945.0, 33616.0, 64398.0, 132007.0, 282463.0, 608761.0, 1078765.0, 978982.0, 506131.0, 234500.0, 110668.0, 54696.0, 28570.0, 15682.0, 8684.0, 5143.0, 3079.0, 1853.0, 1116.0, 734.0, 477.0, 316.0, 203.0, 126.0, 98.0, 55.0, 40.0, 21.0, 15.0, 15.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.1484375, -8.8614501953125, -8.574462890625, -8.2874755859375, -8.00048828125, -7.7135009765625, -7.426513671875, -7.1395263671875, -6.8525390625, -6.5655517578125, -6.278564453125, -5.9915771484375, -5.70458984375, -5.4176025390625, -5.130615234375, -4.8436279296875, -4.556640625, -4.2696533203125, -3.982666015625, -3.6956787109375, -3.40869140625, -3.1217041015625, -2.834716796875, -2.5477294921875, -2.2607421875, -1.9737548828125, -1.686767578125, -1.3997802734375, -1.11279296875, -0.8258056640625, -0.538818359375, -0.2518310546875, 0.03515625, 0.3221435546875, 0.609130859375, 0.8961181640625, 1.18310546875, 1.4700927734375, 1.757080078125, 2.0440673828125, 2.3310546875, 2.6180419921875, 2.905029296875, 3.1920166015625, 3.47900390625, 3.7659912109375, 4.052978515625, 4.3399658203125, 4.626953125, 4.9139404296875, 5.200927734375, 5.4879150390625, 5.77490234375, 6.0618896484375, 6.348876953125, 6.6358642578125, 6.9228515625, 7.2098388671875, 7.496826171875, 7.7838134765625, 8.07080078125, 8.3577880859375, 8.644775390625, 8.9317626953125, 9.21875]}, "gradients/decoder.bert.encoder.layer.4.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 3.0, 3.0, 9.0, 18.0, 17.0, 33.0, 34.0, 46.0, 44.0, 86.0, 86.0, 131.0, 192.0, 209.0, 238.0, 302.0, 355.0, 340.0, 308.0, 303.0, 266.0, 218.0, 199.0, 152.0, 111.0, 103.0, 70.0, 37.0, 40.0, 30.0, 21.0, 22.0, 13.0, 7.0, 6.0, 3.0, 4.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.422119140625, -2.33447265625, -2.246826171875, -2.1591796875, -2.071533203125, -1.98388671875, -1.896240234375, -1.80859375, -1.720947265625, -1.63330078125, -1.545654296875, -1.4580078125, -1.370361328125, -1.28271484375, -1.195068359375, -1.107421875, -1.019775390625, -0.93212890625, -0.844482421875, -0.7568359375, -0.669189453125, -0.58154296875, -0.493896484375, -0.40625, -0.318603515625, -0.23095703125, -0.143310546875, -0.0556640625, 0.031982421875, 0.11962890625, 0.207275390625, 0.294921875, 0.382568359375, 0.47021484375, 0.557861328125, 0.6455078125, 0.733154296875, 0.82080078125, 0.908447265625, 0.99609375, 1.083740234375, 1.17138671875, 1.259033203125, 1.3466796875, 1.434326171875, 1.52197265625, 1.609619140625, 1.697265625, 1.784912109375, 1.87255859375, 1.960205078125, 2.0478515625, 2.135498046875, 2.22314453125, 2.310791015625, 2.3984375, 2.486083984375, 2.57373046875, 2.661376953125, 2.7490234375, 2.836669921875, 2.92431640625, 3.011962890625, 3.099609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 5.0, 7.0, 15.0, 12.0, 22.0, 25.0, 28.0, 36.0, 40.0, 39.0, 60.0, 45.0, 80.0, 60.0, 61.0, 62.0, 47.0, 54.0, 50.0, 54.0, 42.0, 31.0, 28.0, 20.0, 8.0, 15.0, 11.0, 10.0, 8.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.099714279174805, -9.812762260437012, -9.525810241699219, -9.238858222961426, -8.951906204223633, -8.66495418548584, -8.378002166748047, -8.091050148010254, -7.804098129272461, -7.517146110534668, -7.230194091796875, -6.943242073059082, -6.656290054321289, -6.369338035583496, -6.082386016845703, -5.79543399810791, -5.508482456207275, -5.221530437469482, -4.9345784187316895, -4.6476263999938965, -4.3606743812561035, -4.0737223625183105, -3.7867705821990967, -3.4998185634613037, -3.2128665447235107, -2.9259145259857178, -2.638962507247925, -2.352010726928711, -2.065058708190918, -1.7781065702438354, -1.491154670715332, -1.204202651977539, -0.9172506332397461, -0.6302986145019531, -0.34334665536880493, -0.05639469623565674, 0.23055732250213623, 0.5175093412399292, 0.8044612407684326, 1.0914132595062256, 1.3783652782440186, 1.6653172969818115, 1.9522693157196045, 2.2392210960388184, 2.5261731147766113, 2.8131251335144043, 3.1000771522521973, 3.3870291709899902, 3.673981189727783, 3.960933208465576, 4.247885227203369, 4.534837245941162, 4.821789264678955, 5.108741283416748, 5.395692825317383, 5.682644844055176, 5.969596862792969, 6.256548881530762, 6.543500900268555, 6.830452919006348, 7.117404937744141, 7.404356956481934, 7.691308975219727, 7.9782609939575195, 8.265213012695312]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 2.0, 9.0, 3.0, 5.0, 7.0, 3.0, 6.0, 5.0, 15.0, 10.0, 9.0, 14.0, 20.0, 12.0, 30.0, 29.0, 28.0, 25.0, 32.0, 38.0, 38.0, 36.0, 33.0, 48.0, 46.0, 42.0, 34.0, 44.0, 36.0, 33.0, 32.0, 24.0, 26.0, 29.0, 18.0, 25.0, 24.0, 17.0, 22.0, 13.0, 15.0, 13.0, 10.0, 8.0, 9.0, 8.0, 6.0, 8.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.151684284210205, -4.021500587463379, -3.891317367553711, -3.761133909225464, -3.630950450897217, -3.5007667541503906, -3.3705832958221436, -3.2403998374938965, -3.1102163791656494, -2.9800329208374023, -2.8498494625091553, -2.719666004180908, -2.589482307434082, -2.459299087524414, -2.329115390777588, -2.198931932449341, -2.0687484741210938, -1.9385650157928467, -1.8083815574645996, -1.678197979927063, -1.548014521598816, -1.4178310632705688, -1.2876474857330322, -1.1574640274047852, -1.027280569076538, -0.897097110748291, -0.7669135928153992, -0.6367300748825073, -0.5065466165542603, -0.3763631582260132, -0.24617964029312134, -0.11599612236022949, 0.014186859130859375, 0.14437034726142883, 0.2745538353919983, 0.40473732352256775, 0.5349208116531372, 0.6651042699813843, 0.7952877879142761, 0.925471305847168, 1.055654764175415, 1.185838222503662, 1.3160216808319092, 1.4462052583694458, 1.5763887166976929, 1.70657217502594, 1.8367557525634766, 1.9669392108917236, 2.0971226692199707, 2.2273061275482178, 2.357489585876465, 2.487673044204712, 2.617856502532959, 2.748040199279785, 2.8782236576080322, 3.0084071159362793, 3.1385905742645264, 3.2687740325927734, 3.3989574909210205, 3.5291409492492676, 3.6593246459960938, 3.7895078659057617, 3.919691562652588, 4.049875259399414, 4.180058479309082]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 6.0, 2.0, 10.0, 6.0, 19.0, 26.0, 42.0, 44.0, 62.0, 108.0, 158.0, 213.0, 268.0, 441.0, 581.0, 846.0, 1275.0, 1816.0, 2732.0, 4201.0, 6381.0, 10235.0, 15982.0, 25995.0, 42906.0, 70851.0, 114449.0, 163230.0, 181465.0, 147856.0, 98468.0, 60346.0, 36313.0, 22060.0, 13696.0, 8754.0, 5533.0, 3530.0, 2448.0, 1635.0, 1135.0, 728.0, 539.0, 356.0, 227.0, 149.0, 124.0, 106.0, 60.0, 47.0, 39.0, 27.0, 11.0, 14.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.5869140625, -0.5681838989257812, -0.5494537353515625, -0.5307235717773438, -0.511993408203125, -0.49326324462890625, -0.4745330810546875, -0.45580291748046875, -0.43707275390625, -0.41834259033203125, -0.3996124267578125, -0.38088226318359375, -0.362152099609375, -0.34342193603515625, -0.3246917724609375, -0.30596160888671875, -0.2872314453125, -0.26850128173828125, -0.2497711181640625, -0.23104095458984375, -0.212310791015625, -0.19358062744140625, -0.1748504638671875, -0.15612030029296875, -0.13739013671875, -0.11865997314453125, -0.0999298095703125, -0.08119964599609375, -0.062469482421875, -0.04373931884765625, -0.0250091552734375, -0.00627899169921875, 0.012451171875, 0.03118133544921875, 0.0499114990234375, 0.06864166259765625, 0.087371826171875, 0.10610198974609375, 0.1248321533203125, 0.14356231689453125, 0.16229248046875, 0.18102264404296875, 0.1997528076171875, 0.21848297119140625, 0.237213134765625, 0.25594329833984375, 0.2746734619140625, 0.29340362548828125, 0.3121337890625, 0.33086395263671875, 0.3495941162109375, 0.36832427978515625, 0.387054443359375, 0.40578460693359375, 0.4245147705078125, 0.44324493408203125, 0.46197509765625, 0.48070526123046875, 0.4994354248046875, 0.5181655883789062, 0.536895751953125, 0.5556259155273438, 0.5743560791015625, 0.5930862426757812, 0.61181640625]}, "gradients/decoder.bert.encoder.layer.4.crossattention.output.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 7.0, 5.0, 7.0, 4.0, 8.0, 9.0, 8.0, 11.0, 15.0, 19.0, 17.0, 26.0, 33.0, 24.0, 32.0, 32.0, 31.0, 42.0, 52.0, 37.0, 38.0, 40.0, 40.0, 31.0, 36.0, 33.0, 51.0, 33.0, 28.0, 29.0, 29.0, 25.0, 25.0, 19.0, 15.0, 18.0, 10.0, 15.0, 8.0, 6.0, 8.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.7890625, -4.63934326171875, -4.4896240234375, -4.33990478515625, -4.190185546875, -4.04046630859375, -3.8907470703125, -3.74102783203125, -3.59130859375, -3.44158935546875, -3.2918701171875, -3.14215087890625, -2.992431640625, -2.84271240234375, -2.6929931640625, -2.54327392578125, -2.3935546875, -2.24383544921875, -2.0941162109375, -1.94439697265625, -1.794677734375, -1.64495849609375, -1.4952392578125, -1.34552001953125, -1.19580078125, -1.04608154296875, -0.8963623046875, -0.74664306640625, -0.596923828125, -0.44720458984375, -0.2974853515625, -0.14776611328125, 0.001953125, 0.15167236328125, 0.3013916015625, 0.45111083984375, 0.600830078125, 0.75054931640625, 0.9002685546875, 1.04998779296875, 1.19970703125, 1.34942626953125, 1.4991455078125, 1.64886474609375, 1.798583984375, 1.94830322265625, 2.0980224609375, 2.24774169921875, 2.3974609375, 2.54718017578125, 2.6968994140625, 2.84661865234375, 2.996337890625, 3.14605712890625, 3.2957763671875, 3.44549560546875, 3.59521484375, 3.74493408203125, 3.8946533203125, 4.04437255859375, 4.194091796875, 4.34381103515625, 4.4935302734375, 4.64324951171875, 4.79296875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 7.0, 8.0, 18.0, 22.0, 11.0, 36.0, 46.0, 55.0, 98.0, 138.0, 160.0, 268.0, 396.0, 651.0, 998.0, 1736.0, 2881.0, 5357.0, 10900.0, 25517.0, 179614.0, 750312.0, 38827.0, 14608.0, 6812.0, 3675.0, 2056.0, 1149.0, 777.0, 422.0, 300.0, 204.0, 151.0, 99.0, 79.0, 49.0, 36.0, 26.0, 11.0, 11.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.037109375, -1.97381591796875, -1.9105224609375, -1.84722900390625, -1.783935546875, -1.72064208984375, -1.6573486328125, -1.59405517578125, -1.53076171875, -1.46746826171875, -1.4041748046875, -1.34088134765625, -1.277587890625, -1.21429443359375, -1.1510009765625, -1.08770751953125, -1.0244140625, -0.96112060546875, -0.8978271484375, -0.83453369140625, -0.771240234375, -0.70794677734375, -0.6446533203125, -0.58135986328125, -0.51806640625, -0.45477294921875, -0.3914794921875, -0.32818603515625, -0.264892578125, -0.20159912109375, -0.1383056640625, -0.07501220703125, -0.01171875, 0.05157470703125, 0.1148681640625, 0.17816162109375, 0.241455078125, 0.30474853515625, 0.3680419921875, 0.43133544921875, 0.49462890625, 0.55792236328125, 0.6212158203125, 0.68450927734375, 0.747802734375, 0.81109619140625, 0.8743896484375, 0.93768310546875, 1.0009765625, 1.06427001953125, 1.1275634765625, 1.19085693359375, 1.254150390625, 1.31744384765625, 1.3807373046875, 1.44403076171875, 1.50732421875, 1.57061767578125, 1.6339111328125, 1.69720458984375, 1.760498046875, 1.82379150390625, 1.8870849609375, 1.95037841796875, 2.013671875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 4.0, 11.0, 5.0, 11.0, 10.0, 14.0, 16.0, 22.0, 30.0, 23.0, 26.0, 28.0, 29.0, 48.0, 33.0, 39.0, 40.0, 52.0, 43.0, 41.0, 48.0, 38.0, 38.0, 47.0, 37.0, 40.0, 35.0, 23.0, 30.0, 29.0, 23.0, 18.0, 19.0, 10.0, 10.0, 11.0, 5.0, 3.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3984375, -3.2872314453125, -3.176025390625, -3.0648193359375, -2.95361328125, -2.8424072265625, -2.731201171875, -2.6199951171875, -2.5087890625, -2.3975830078125, -2.286376953125, -2.1751708984375, -2.06396484375, -1.9527587890625, -1.841552734375, -1.7303466796875, -1.619140625, -1.5079345703125, -1.396728515625, -1.2855224609375, -1.17431640625, -1.0631103515625, -0.951904296875, -0.8406982421875, -0.7294921875, -0.6182861328125, -0.507080078125, -0.3958740234375, -0.28466796875, -0.1734619140625, -0.062255859375, 0.0489501953125, 0.16015625, 0.2713623046875, 0.382568359375, 0.4937744140625, 0.60498046875, 0.7161865234375, 0.827392578125, 0.9385986328125, 1.0498046875, 1.1610107421875, 1.272216796875, 1.3834228515625, 1.49462890625, 1.6058349609375, 1.717041015625, 1.8282470703125, 1.939453125, 2.0506591796875, 2.161865234375, 2.2730712890625, 2.38427734375, 2.4954833984375, 2.606689453125, 2.7178955078125, 2.8291015625, 2.9403076171875, 3.051513671875, 3.1627197265625, 3.27392578125, 3.3851318359375, 3.496337890625, 3.6075439453125, 3.71875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 10.0, 10.0, 15.0, 14.0, 25.0, 41.0, 49.0, 67.0, 93.0, 146.0, 225.0, 313.0, 469.0, 794.0, 1199.0, 1960.0, 3468.0, 6175.0, 11469.0, 24630.0, 238272.0, 702039.0, 28225.0, 12712.0, 6578.0, 3704.0, 2114.0, 1348.0, 783.0, 500.0, 315.0, 238.0, 161.0, 112.0, 81.0, 55.0, 32.0, 37.0, 19.0, 10.0, 9.0, 7.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4335823059082031, -0.41916656494140625, -0.4047508239746094, -0.3903350830078125, -0.3759193420410156, -0.36150360107421875, -0.3470878601074219, -0.332672119140625, -0.3182563781738281, -0.30384063720703125, -0.2894248962402344, -0.2750091552734375, -0.2605934143066406, -0.24617767333984375, -0.23176193237304688, -0.21734619140625, -0.20293045043945312, -0.18851470947265625, -0.17409896850585938, -0.1596832275390625, -0.14526748657226562, -0.13085174560546875, -0.11643600463867188, -0.102020263671875, -0.08760452270507812, -0.07318878173828125, -0.058773040771484375, -0.0443572998046875, -0.029941558837890625, -0.01552581787109375, -0.001110076904296875, 0.0133056640625, 0.027721405029296875, 0.04213714599609375, 0.056552886962890625, 0.0709686279296875, 0.08538436889648438, 0.09980010986328125, 0.11421585083007812, 0.128631591796875, 0.14304733276367188, 0.15746307373046875, 0.17187881469726562, 0.1862945556640625, 0.20071029663085938, 0.21512603759765625, 0.22954177856445312, 0.24395751953125, 0.2583732604980469, 0.27278900146484375, 0.2872047424316406, 0.3016204833984375, 0.3160362243652344, 0.33045196533203125, 0.3448677062988281, 0.359283447265625, 0.3736991882324219, 0.38811492919921875, 0.4025306701660156, 0.4169464111328125, 0.4313621520996094, 0.44577789306640625, 0.4601936340332031, 0.474609375]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.key.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 4.0, 3.0, 12.0, 12.0, 12.0, 25.0, 20.0, 22.0, 22.0, 30.0, 19.0, 21.0, 34.0, 22.0, 37.0, 34.0, 41.0, 50.0, 61.0, 35.0, 41.0, 34.0, 33.0, 34.0, 46.0, 23.0, 36.0, 33.0, 28.0, 22.0, 19.0, 17.0, 13.0, 17.0, 15.0, 8.0, 8.0, 4.0, 9.0, 9.0, 6.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.6987323760986328e-05, -1.6470439732074738e-05, -1.5953555703163147e-05, -1.5436671674251556e-05, -1.4919787645339966e-05, -1.4402903616428375e-05, -1.3886019587516785e-05, -1.3369135558605194e-05, -1.2852251529693604e-05, -1.2335367500782013e-05, -1.1818483471870422e-05, -1.1301599442958832e-05, -1.0784715414047241e-05, -1.026783138513565e-05, -9.75094735622406e-06, -9.23406332731247e-06, -8.717179298400879e-06, -8.200295269489288e-06, -7.683411240577698e-06, -7.166527211666107e-06, -6.649643182754517e-06, -6.132759153842926e-06, -5.6158751249313354e-06, -5.098991096019745e-06, -4.582107067108154e-06, -4.065223038196564e-06, -3.548339009284973e-06, -3.0314549803733826e-06, -2.514570951461792e-06, -1.9976869225502014e-06, -1.4808028936386108e-06, -9.639188647270203e-07, -4.470348358154297e-07, 6.984919309616089e-08, 5.867332220077515e-07, 1.103617250919342e-06, 1.6205012798309326e-06, 2.137385308742523e-06, 2.6542693376541138e-06, 3.1711533665657043e-06, 3.688037395477295e-06, 4.2049214243888855e-06, 4.721805453300476e-06, 5.238689482212067e-06, 5.755573511123657e-06, 6.272457540035248e-06, 6.789341568946838e-06, 7.306225597858429e-06, 7.82310962677002e-06, 8.33999365568161e-06, 8.8568776845932e-06, 9.373761713504791e-06, 9.890645742416382e-06, 1.0407529771327972e-05, 1.0924413800239563e-05, 1.1441297829151154e-05, 1.1958181858062744e-05, 1.2475065886974335e-05, 1.2991949915885925e-05, 1.3508833944797516e-05, 1.4025717973709106e-05, 1.4542602002620697e-05, 1.5059486031532288e-05, 1.5576370060443878e-05, 1.609325408935547e-05]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 8.0, 17.0, 12.0, 18.0, 24.0, 32.0, 39.0, 75.0, 93.0, 114.0, 196.0, 232.0, 383.0, 574.0, 990.0, 1698.0, 3086.0, 6042.0, 12936.0, 29452.0, 73571.0, 184243.0, 330250.0, 235627.0, 97502.0, 38291.0, 16435.0, 7595.0, 3792.0, 2024.0, 1065.0, 697.0, 435.0, 289.0, 200.0, 136.0, 111.0, 79.0, 54.0, 34.0, 26.0, 24.0, 17.0, 8.0, 8.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.272705078125, -0.2635078430175781, -0.25431060791015625, -0.24511337280273438, -0.2359161376953125, -0.22671890258789062, -0.21752166748046875, -0.20832443237304688, -0.199127197265625, -0.18992996215820312, -0.18073272705078125, -0.17153549194335938, -0.1623382568359375, -0.15314102172851562, -0.14394378662109375, -0.13474655151367188, -0.12554931640625, -0.11635208129882812, -0.10715484619140625, -0.09795761108398438, -0.0887603759765625, -0.07956314086914062, -0.07036590576171875, -0.061168670654296875, -0.051971435546875, -0.042774200439453125, -0.03357696533203125, -0.024379730224609375, -0.0151824951171875, -0.005985260009765625, 0.00321197509765625, 0.012409210205078125, 0.0216064453125, 0.030803680419921875, 0.04000091552734375, 0.049198150634765625, 0.0583953857421875, 0.06759262084960938, 0.07678985595703125, 0.08598709106445312, 0.095184326171875, 0.10438156127929688, 0.11357879638671875, 0.12277603149414062, 0.1319732666015625, 0.14117050170898438, 0.15036773681640625, 0.15956497192382812, 0.16876220703125, 0.17795944213867188, 0.18715667724609375, 0.19635391235351562, 0.2055511474609375, 0.21474838256835938, 0.22394561767578125, 0.23314285278320312, 0.242340087890625, 0.2515373229980469, 0.26073455810546875, 0.2699317932128906, 0.2791290283203125, 0.2883262634277344, 0.29752349853515625, 0.3067207336425781, 0.31591796875]}, "gradients/decoder.bert.encoder.layer.4.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 8.0, 5.0, 13.0, 20.0, 22.0, 26.0, 54.0, 67.0, 99.0, 106.0, 115.0, 124.0, 94.0, 83.0, 46.0, 47.0, 25.0, 15.0, 13.0, 2.0, 7.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061859130859375, -0.05942106246948242, -0.056982994079589844, -0.054544925689697266, -0.05210685729980469, -0.04966878890991211, -0.04723072052001953, -0.04479265213012695, -0.042354583740234375, -0.0399165153503418, -0.03747844696044922, -0.03504037857055664, -0.03260231018066406, -0.030164241790771484, -0.027726173400878906, -0.025288105010986328, -0.02285003662109375, -0.020411968231201172, -0.017973899841308594, -0.015535831451416016, -0.013097763061523438, -0.01065969467163086, -0.008221626281738281, -0.005783557891845703, -0.003345489501953125, -0.0009074211120605469, 0.0015306472778320312, 0.003968715667724609, 0.0064067840576171875, 0.008844852447509766, 0.011282920837402344, 0.013720989227294922, 0.0161590576171875, 0.018597126007080078, 0.021035194396972656, 0.023473262786865234, 0.025911331176757812, 0.02834939956665039, 0.03078746795654297, 0.03322553634643555, 0.035663604736328125, 0.0381016731262207, 0.04053974151611328, 0.04297780990600586, 0.04541587829589844, 0.047853946685791016, 0.050292015075683594, 0.05273008346557617, 0.05516815185546875, 0.05760622024536133, 0.060044288635253906, 0.062482357025146484, 0.06492042541503906, 0.06735849380493164, 0.06979656219482422, 0.0722346305847168, 0.07467269897460938, 0.07711076736450195, 0.07954883575439453, 0.08198690414428711, 0.08442497253417969, 0.08686304092407227, 0.08930110931396484, 0.09173917770385742, 0.09417724609375]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 6.0, 10.0, 16.0, 14.0, 31.0, 28.0, 31.0, 41.0, 35.0, 56.0, 46.0, 87.0, 55.0, 64.0, 63.0, 51.0, 46.0, 61.0, 46.0, 53.0, 28.0, 31.0, 17.0, 11.0, 12.0, 11.0, 10.0, 10.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.182402610778809, -9.894397735595703, -9.606393814086914, -9.318388938903809, -9.030384063720703, -8.742380142211914, -8.454375267028809, -8.166370391845703, -7.878365993499756, -7.590361595153809, -7.302356719970703, -7.014352321624756, -6.726347923278809, -6.438343048095703, -6.150338649749756, -5.862334251403809, -5.574329376220703, -5.286324977874756, -4.99832010269165, -4.710315704345703, -4.422310829162598, -4.13430643081665, -3.846302032470703, -3.5582973957061768, -3.2702927589416504, -2.982288122177124, -2.6942834854125977, -2.4062790870666504, -2.118274450302124, -1.8302698135375977, -1.5422652959823608, -1.254260778427124, -0.9662561416625977, -0.6782515645027161, -0.3902469873428345, -0.10224241018295288, 0.1857621669769287, 0.4737668037414551, 0.7617713212966919, 1.0497758388519287, 1.337780475616455, 1.6257851123809814, 1.9137896299362183, 2.201794147491455, 2.4897987842559814, 2.777803421020508, 3.065807819366455, 3.3538124561309814, 3.641817092895508, 3.929821729660034, 4.2178263664245605, 4.505830764770508, 4.793835639953613, 5.0818400382995605, 5.369844436645508, 5.657849311828613, 5.9458537101745605, 6.233858108520508, 6.521862983703613, 6.8098673820495605, 7.097871780395508, 7.385876655578613, 7.6738810539245605, 7.961885452270508, 8.249890327453613]}, "gradients/decoder.bert.encoder.layer.4.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 1.0, 2.0, 9.0, 3.0, 4.0, 8.0, 3.0, 6.0, 6.0, 16.0, 10.0, 10.0, 11.0, 20.0, 16.0, 29.0, 33.0, 25.0, 24.0, 36.0, 34.0, 38.0, 39.0, 34.0, 46.0, 45.0, 43.0, 34.0, 44.0, 34.0, 33.0, 33.0, 22.0, 28.0, 26.0, 19.0, 28.0, 21.0, 17.0, 21.0, 12.0, 13.0, 15.0, 9.0, 10.0, 12.0, 6.0, 6.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.1361870765686035, -4.00673770904541, -3.877288818359375, -3.7478396892547607, -3.6183905601501465, -3.488941192626953, -3.359492063522339, -3.2300429344177246, -3.1005938053131104, -2.971144676208496, -2.841695547103882, -2.7122464179992676, -2.582797050476074, -2.453348159790039, -2.3238987922668457, -2.1944496631622314, -2.065000534057617, -1.935551404953003, -1.8061022758483887, -1.6766530275344849, -1.5472038984298706, -1.4177547693252563, -1.2883055210113525, -1.1588563919067383, -1.029407262802124, -0.8999581336975098, -0.7705089449882507, -0.6410597562789917, -0.5116106271743774, -0.3821614980697632, -0.25271230936050415, -0.12326312065124512, 0.006186008453369141, 0.1356351673603058, 0.26508432626724243, 0.3945334851741791, 0.5239826440811157, 0.65343177318573, 0.782880961894989, 0.912330150604248, 1.0417792797088623, 1.1712284088134766, 1.3006775379180908, 1.4301267862319946, 1.5595759153366089, 1.6890250444412231, 1.818474292755127, 1.9479234218597412, 2.0773725509643555, 2.2068216800689697, 2.336270809173584, 2.4657199382781982, 2.5951690673828125, 2.724618434906006, 2.85406756401062, 2.9835166931152344, 3.1129658222198486, 3.242414951324463, 3.371864080429077, 3.5013132095336914, 3.6307625770568848, 3.76021146774292, 3.8896608352661133, 4.019109725952148, 4.148559093475342]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 19.0, 25.0, 33.0, 42.0, 64.0, 57.0, 114.0, 175.0, 268.0, 406.0, 712.0, 1014.0, 1707.0, 2667.0, 4659.0, 7978.0, 13929.0, 25387.0, 45505.0, 79442.0, 127644.0, 174814.0, 185014.0, 148215.0, 96972.0, 57415.0, 32039.0, 17849.0, 9801.0, 5817.0, 3311.0, 2002.0, 1195.0, 729.0, 492.0, 352.0, 215.0, 133.0, 89.0, 85.0, 52.0, 30.0, 19.0, 20.0, 8.0, 12.0, 5.0, 9.0, 3.0, 1.0, 2.0, 0.0, 4.0], "bins": [-7.02734375, -6.815673828125, -6.60400390625, -6.392333984375, -6.1806640625, -5.968994140625, -5.75732421875, -5.545654296875, -5.333984375, -5.122314453125, -4.91064453125, -4.698974609375, -4.4873046875, -4.275634765625, -4.06396484375, -3.852294921875, -3.640625, -3.428955078125, -3.21728515625, -3.005615234375, -2.7939453125, -2.582275390625, -2.37060546875, -2.158935546875, -1.947265625, -1.735595703125, -1.52392578125, -1.312255859375, -1.1005859375, -0.888916015625, -0.67724609375, -0.465576171875, -0.25390625, -0.042236328125, 0.16943359375, 0.381103515625, 0.5927734375, 0.804443359375, 1.01611328125, 1.227783203125, 1.439453125, 1.651123046875, 1.86279296875, 2.074462890625, 2.2861328125, 2.497802734375, 2.70947265625, 2.921142578125, 3.1328125, 3.344482421875, 3.55615234375, 3.767822265625, 3.9794921875, 4.191162109375, 4.40283203125, 4.614501953125, 4.826171875, 5.037841796875, 5.24951171875, 5.461181640625, 5.6728515625, 5.884521484375, 6.09619140625, 6.307861328125, 6.51953125]}, "gradients/decoder.bert.encoder.layer.4.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 6.0, 9.0, 15.0, 7.0, 9.0, 11.0, 12.0, 18.0, 11.0, 13.0, 22.0, 26.0, 29.0, 20.0, 42.0, 35.0, 29.0, 33.0, 40.0, 36.0, 41.0, 48.0, 41.0, 47.0, 33.0, 40.0, 32.0, 30.0, 32.0, 27.0, 35.0, 35.0, 22.0, 22.0, 18.0, 13.0, 11.0, 7.0, 8.0, 12.0, 7.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75390625, -4.598388671875, -4.44287109375, -4.287353515625, -4.1318359375, -3.976318359375, -3.82080078125, -3.665283203125, -3.509765625, -3.354248046875, -3.19873046875, -3.043212890625, -2.8876953125, -2.732177734375, -2.57666015625, -2.421142578125, -2.265625, -2.110107421875, -1.95458984375, -1.799072265625, -1.6435546875, -1.488037109375, -1.33251953125, -1.177001953125, -1.021484375, -0.865966796875, -0.71044921875, -0.554931640625, -0.3994140625, -0.243896484375, -0.08837890625, 0.067138671875, 0.22265625, 0.378173828125, 0.53369140625, 0.689208984375, 0.8447265625, 1.000244140625, 1.15576171875, 1.311279296875, 1.466796875, 1.622314453125, 1.77783203125, 1.933349609375, 2.0888671875, 2.244384765625, 2.39990234375, 2.555419921875, 2.7109375, 2.866455078125, 3.02197265625, 3.177490234375, 3.3330078125, 3.488525390625, 3.64404296875, 3.799560546875, 3.955078125, 4.110595703125, 4.26611328125, 4.421630859375, 4.5771484375, 4.732666015625, 4.88818359375, 5.043701171875, 5.19921875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 9.0, 3.0, 12.0, 12.0, 26.0, 38.0, 41.0, 83.0, 117.0, 166.0, 240.0, 440.0, 670.0, 1071.0, 1735.0, 2806.0, 4538.0, 7433.0, 12606.0, 20684.0, 35068.0, 58236.0, 92629.0, 135269.0, 166747.0, 163167.0, 127013.0, 84877.0, 53045.0, 31620.0, 19023.0, 11494.0, 6874.0, 4020.0, 2524.0, 1553.0, 985.0, 605.0, 355.0, 255.0, 145.0, 113.0, 64.0, 54.0, 38.0, 18.0, 14.0, 8.0, 2.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.16796875, -5.9683837890625, -5.768798828125, -5.5692138671875, -5.36962890625, -5.1700439453125, -4.970458984375, -4.7708740234375, -4.5712890625, -4.3717041015625, -4.172119140625, -3.9725341796875, -3.77294921875, -3.5733642578125, -3.373779296875, -3.1741943359375, -2.974609375, -2.7750244140625, -2.575439453125, -2.3758544921875, -2.17626953125, -1.9766845703125, -1.777099609375, -1.5775146484375, -1.3779296875, -1.1783447265625, -0.978759765625, -0.7791748046875, -0.57958984375, -0.3800048828125, -0.180419921875, 0.0191650390625, 0.21875, 0.4183349609375, 0.617919921875, 0.8175048828125, 1.01708984375, 1.2166748046875, 1.416259765625, 1.6158447265625, 1.8154296875, 2.0150146484375, 2.214599609375, 2.4141845703125, 2.61376953125, 2.8133544921875, 3.012939453125, 3.2125244140625, 3.412109375, 3.6116943359375, 3.811279296875, 4.0108642578125, 4.21044921875, 4.4100341796875, 4.609619140625, 4.8092041015625, 5.0087890625, 5.2083740234375, 5.407958984375, 5.6075439453125, 5.80712890625, 6.0067138671875, 6.206298828125, 6.4058837890625, 6.60546875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 5.0, 10.0, 15.0, 14.0, 30.0, 19.0, 27.0, 27.0, 27.0, 31.0, 42.0, 33.0, 42.0, 38.0, 54.0, 32.0, 51.0, 54.0, 53.0, 45.0, 38.0, 37.0, 30.0, 36.0, 38.0, 29.0, 23.0, 31.0, 14.0, 11.0, 7.0, 10.0, 8.0, 5.0, 6.0, 4.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.105865478515625, -2.99688720703125, -2.887908935546875, -2.7789306640625, -2.669952392578125, -2.56097412109375, -2.451995849609375, -2.343017578125, -2.234039306640625, -2.12506103515625, -2.016082763671875, -1.9071044921875, -1.798126220703125, -1.68914794921875, -1.580169677734375, -1.47119140625, -1.362213134765625, -1.25323486328125, -1.144256591796875, -1.0352783203125, -0.926300048828125, -0.81732177734375, -0.708343505859375, -0.599365234375, -0.490386962890625, -0.38140869140625, -0.272430419921875, -0.1634521484375, -0.054473876953125, 0.05450439453125, 0.163482666015625, 0.2724609375, 0.381439208984375, 0.49041748046875, 0.599395751953125, 0.7083740234375, 0.817352294921875, 0.92633056640625, 1.035308837890625, 1.144287109375, 1.253265380859375, 1.36224365234375, 1.471221923828125, 1.5802001953125, 1.689178466796875, 1.79815673828125, 1.907135009765625, 2.01611328125, 2.125091552734375, 2.23406982421875, 2.343048095703125, 2.4520263671875, 2.561004638671875, 2.66998291015625, 2.778961181640625, 2.887939453125, 2.996917724609375, 3.10589599609375, 3.214874267578125, 3.3238525390625, 3.432830810546875, 3.54180908203125, 3.650787353515625, 3.759765625]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 13.0, 17.0, 32.0, 26.0, 65.0, 83.0, 97.0, 175.0, 212.0, 340.0, 494.0, 752.0, 1098.0, 1646.0, 2646.0, 4428.0, 7786.0, 14356.0, 28377.0, 55497.0, 106157.0, 179049.0, 224345.0, 184406.0, 112044.0, 58383.0, 29914.0, 15389.0, 8034.0, 4672.0, 2737.0, 1777.0, 1129.0, 764.0, 514.0, 334.0, 250.0, 150.0, 131.0, 74.0, 51.0, 35.0, 29.0, 21.0, 11.0, 7.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.57421875, -4.43365478515625, -4.2930908203125, -4.15252685546875, -4.011962890625, -3.87139892578125, -3.7308349609375, -3.59027099609375, -3.44970703125, -3.30914306640625, -3.1685791015625, -3.02801513671875, -2.887451171875, -2.74688720703125, -2.6063232421875, -2.46575927734375, -2.3251953125, -2.18463134765625, -2.0440673828125, -1.90350341796875, -1.762939453125, -1.62237548828125, -1.4818115234375, -1.34124755859375, -1.20068359375, -1.06011962890625, -0.9195556640625, -0.77899169921875, -0.638427734375, -0.49786376953125, -0.3572998046875, -0.21673583984375, -0.076171875, 0.06439208984375, 0.2049560546875, 0.34552001953125, 0.486083984375, 0.62664794921875, 0.7672119140625, 0.90777587890625, 1.04833984375, 1.18890380859375, 1.3294677734375, 1.47003173828125, 1.610595703125, 1.75115966796875, 1.8917236328125, 2.03228759765625, 2.1728515625, 2.31341552734375, 2.4539794921875, 2.59454345703125, 2.735107421875, 2.87567138671875, 3.0162353515625, 3.15679931640625, 3.29736328125, 3.43792724609375, 3.5784912109375, 3.71905517578125, 3.859619140625, 4.00018310546875, 4.1407470703125, 4.28131103515625, 4.421875]}, "gradients/decoder.bert.encoder.layer.4.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 14.0, 10.0, 14.0, 25.0, 25.0, 34.0, 47.0, 41.0, 40.0, 58.0, 71.0, 83.0, 83.0, 74.0, 69.0, 40.0, 49.0, 43.0, 39.0, 24.0, 24.0, 16.0, 11.0, 8.0, 11.0, 7.0, 5.0, 4.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005197525024414062, -0.0005041398108005524, -0.0004885271191596985, -0.0004729144275188446, -0.0004573017358779907, -0.00044168904423713684, -0.00042607635259628296, -0.0004104636609554291, -0.0003948509693145752, -0.0003792382776737213, -0.00036362558603286743, -0.00034801289439201355, -0.00033240020275115967, -0.0003167875111103058, -0.0003011748194694519, -0.000285562127828598, -0.00026994943618774414, -0.00025433674454689026, -0.00023872405290603638, -0.0002231113612651825, -0.0002074986696243286, -0.00019188597798347473, -0.00017627328634262085, -0.00016066059470176697, -0.00014504790306091309, -0.0001294352114200592, -0.00011382251977920532, -9.820982813835144e-05, -8.259713649749756e-05, -6.698444485664368e-05, -5.1371753215789795e-05, -3.575906157493591e-05, -2.014636993408203e-05, -4.533678293228149e-06, 1.1079013347625732e-05, 2.6691704988479614e-05, 4.2304396629333496e-05, 5.791708827018738e-05, 7.352977991104126e-05, 8.914247155189514e-05, 0.00010475516319274902, 0.0001203678548336029, 0.0001359805464744568, 0.00015159323811531067, 0.00016720592975616455, 0.00018281862139701843, 0.00019843131303787231, 0.0002140440046787262, 0.00022965669631958008, 0.00024526938796043396, 0.00026088207960128784, 0.0002764947712421417, 0.0002921074628829956, 0.0003077201545238495, 0.00032333284616470337, 0.00033894553780555725, 0.00035455822944641113, 0.000370170921087265, 0.0003857836127281189, 0.0004013963043689728, 0.00041700899600982666, 0.00043262168765068054, 0.0004482343792915344, 0.0004638470709323883, 0.0004794597625732422]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 7.0, 19.0, 27.0, 30.0, 49.0, 88.0, 107.0, 150.0, 247.0, 416.0, 715.0, 1137.0, 2080.0, 3430.0, 6237.0, 11128.0, 20595.0, 37928.0, 69040.0, 119976.0, 180420.0, 204659.0, 161519.0, 101581.0, 57202.0, 31049.0, 17123.0, 9342.0, 5015.0, 2944.0, 1638.0, 1028.0, 567.0, 374.0, 239.0, 159.0, 93.0, 54.0, 47.0, 40.0, 16.0, 5.0, 9.0, 9.0, 3.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.46875, -4.334716796875, -4.20068359375, -4.066650390625, -3.9326171875, -3.798583984375, -3.66455078125, -3.530517578125, -3.396484375, -3.262451171875, -3.12841796875, -2.994384765625, -2.8603515625, -2.726318359375, -2.59228515625, -2.458251953125, -2.32421875, -2.190185546875, -2.05615234375, -1.922119140625, -1.7880859375, -1.654052734375, -1.52001953125, -1.385986328125, -1.251953125, -1.117919921875, -0.98388671875, -0.849853515625, -0.7158203125, -0.581787109375, -0.44775390625, -0.313720703125, -0.1796875, -0.045654296875, 0.08837890625, 0.222412109375, 0.3564453125, 0.490478515625, 0.62451171875, 0.758544921875, 0.892578125, 1.026611328125, 1.16064453125, 1.294677734375, 1.4287109375, 1.562744140625, 1.69677734375, 1.830810546875, 1.96484375, 2.098876953125, 2.23291015625, 2.366943359375, 2.5009765625, 2.635009765625, 2.76904296875, 2.903076171875, 3.037109375, 3.171142578125, 3.30517578125, 3.439208984375, 3.5732421875, 3.707275390625, 3.84130859375, 3.975341796875, 4.109375]}, "gradients/decoder.bert.encoder.layer.4.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 8.0, 10.0, 13.0, 9.0, 19.0, 26.0, 31.0, 29.0, 45.0, 33.0, 65.0, 71.0, 55.0, 76.0, 95.0, 71.0, 53.0, 52.0, 46.0, 45.0, 32.0, 31.0, 24.0, 20.0, 6.0, 9.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.442626953125, -1.39990234375, -1.357177734375, -1.314453125, -1.271728515625, -1.22900390625, -1.186279296875, -1.1435546875, -1.100830078125, -1.05810546875, -1.015380859375, -0.97265625, -0.929931640625, -0.88720703125, -0.844482421875, -0.8017578125, -0.759033203125, -0.71630859375, -0.673583984375, -0.630859375, -0.588134765625, -0.54541015625, -0.502685546875, -0.4599609375, -0.417236328125, -0.37451171875, -0.331787109375, -0.2890625, -0.246337890625, -0.20361328125, -0.160888671875, -0.1181640625, -0.075439453125, -0.03271484375, 0.010009765625, 0.052734375, 0.095458984375, 0.13818359375, 0.180908203125, 0.2236328125, 0.266357421875, 0.30908203125, 0.351806640625, 0.39453125, 0.437255859375, 0.47998046875, 0.522705078125, 0.5654296875, 0.608154296875, 0.65087890625, 0.693603515625, 0.736328125, 0.779052734375, 0.82177734375, 0.864501953125, 0.9072265625, 0.949951171875, 0.99267578125, 1.035400390625, 1.078125, 1.120849609375, 1.16357421875, 1.206298828125, 1.2490234375]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 1.0, 2.0, 2.0, 10.0, 6.0, 12.0, 15.0, 10.0, 28.0, 28.0, 28.0, 33.0, 43.0, 52.0, 60.0, 58.0, 68.0, 83.0, 56.0, 57.0, 41.0, 56.0, 46.0, 51.0, 30.0, 29.0, 21.0, 18.0, 18.0, 7.0, 10.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.874255180358887, -10.578197479248047, -10.282139778137207, -9.986083030700684, -9.690025329589844, -9.393967628479004, -9.097909927368164, -8.801852226257324, -8.505794525146484, -8.209736824035645, -7.913679599761963, -7.617621898651123, -7.321564674377441, -7.025506973266602, -6.729449272155762, -6.433391571044922, -6.137334823608398, -5.841277122497559, -5.545219898223877, -5.249162197113037, -4.9531049728393555, -4.657047271728516, -4.360989570617676, -4.064931869506836, -3.7688746452331543, -3.4728171825408936, -3.176759719848633, -2.880702018737793, -2.5846445560455322, -2.2885870933532715, -1.9925295114517212, -1.696471929550171, -1.4004154205322266, -1.1043579578399658, -0.8083003759384155, -0.51224285364151, -0.2161853313446045, 0.07987213134765625, 0.37592971324920654, 0.6719872951507568, 0.9680447578430176, 1.2641022205352783, 1.5601598024368286, 1.856217384338379, 2.1522748470306396, 2.4483323097229004, 2.7443900108337402, 3.040447473526001, 3.3365049362182617, 3.6325623989105225, 3.928619861602783, 4.224677562713623, 4.520734786987305, 4.8167924880981445, 5.112850189208984, 5.408907890319824, 5.704965114593506, 6.001022815704346, 6.297080039978027, 6.593137741088867, 6.889195442199707, 7.185252666473389, 7.4813103675842285, 7.77736759185791, 8.07342529296875]}, "gradients/decoder.bert.encoder.layer.3.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 8.0, 2.0, 4.0, 7.0, 11.0, 6.0, 8.0, 10.0, 6.0, 18.0, 19.0, 25.0, 22.0, 22.0, 20.0, 34.0, 36.0, 31.0, 36.0, 39.0, 29.0, 36.0, 50.0, 34.0, 39.0, 37.0, 31.0, 38.0, 33.0, 27.0, 40.0, 25.0, 27.0, 27.0, 24.0, 16.0, 23.0, 19.0, 14.0, 13.0, 16.0, 9.0, 9.0, 5.0, 7.0, 5.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.142911911010742, -4.009039402008057, -3.87516713142395, -3.7412946224212646, -3.607422351837158, -3.4735498428344727, -3.339677333831787, -3.2058050632476807, -3.071932792663574, -2.9380602836608887, -2.8041880130767822, -2.6703155040740967, -2.5364432334899902, -2.4025707244873047, -2.268698215484619, -2.1348259449005127, -2.000953435897827, -1.8670810461044312, -1.7332086563110352, -1.5993361473083496, -1.4654638767242432, -1.3315913677215576, -1.1977189779281616, -1.0638465881347656, -0.9299741983413696, -0.7961018085479736, -0.6622294187545776, -0.5283569693565369, -0.39448457956314087, -0.2606121897697449, -0.1267397403717041, 0.0071326494216918945, 0.1410050392150879, 0.2748774290084839, 0.40874984860420227, 0.5426222681999207, 0.6764946579933167, 0.8103670477867126, 0.9442394971847534, 1.0781118869781494, 1.2119842767715454, 1.3458566665649414, 1.4797290563583374, 1.6136014461517334, 1.747473955154419, 1.8813462257385254, 2.015218734741211, 2.1490912437438965, 2.282963514328003, 2.4168360233306885, 2.550708293914795, 2.6845808029174805, 2.818453073501587, 2.9523255825042725, 3.086197853088379, 3.2200703620910645, 3.35394287109375, 3.4878153800964355, 3.621687650680542, 3.7555601596832275, 3.889432430267334, 4.0233049392700195, 4.157177448272705, 4.291049957275391, 4.424921989440918]}, "gradients/decoder.bert.encoder.layer.3.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 10.0, 5.0, 9.0, 16.0, 22.0, 32.0, 27.0, 62.0, 73.0, 86.0, 150.0, 204.0, 299.0, 450.0, 663.0, 979.0, 1325.0, 1994.0, 3184.0, 4951.0, 7593.0, 12099.0, 19811.0, 33513.0, 59410.0, 110323.0, 215070.0, 432020.0, 779920.0, 964544.0, 718553.0, 392933.0, 197792.0, 102662.0, 54736.0, 31188.0, 18141.0, 11046.0, 6529.0, 4201.0, 2636.0, 1789.0, 1159.0, 679.0, 480.0, 321.0, 215.0, 122.0, 106.0, 53.0, 36.0, 22.0, 14.0, 14.0, 8.0, 6.0, 6.0, 2.0, 2.0], "bins": [-8.328125, -8.086181640625, -7.84423828125, -7.602294921875, -7.3603515625, -7.118408203125, -6.87646484375, -6.634521484375, -6.392578125, -6.150634765625, -5.90869140625, -5.666748046875, -5.4248046875, -5.182861328125, -4.94091796875, -4.698974609375, -4.45703125, -4.215087890625, -3.97314453125, -3.731201171875, -3.4892578125, -3.247314453125, -3.00537109375, -2.763427734375, -2.521484375, -2.279541015625, -2.03759765625, -1.795654296875, -1.5537109375, -1.311767578125, -1.06982421875, -0.827880859375, -0.5859375, -0.343994140625, -0.10205078125, 0.139892578125, 0.3818359375, 0.623779296875, 0.86572265625, 1.107666015625, 1.349609375, 1.591552734375, 1.83349609375, 2.075439453125, 2.3173828125, 2.559326171875, 2.80126953125, 3.043212890625, 3.28515625, 3.527099609375, 3.76904296875, 4.010986328125, 4.2529296875, 4.494873046875, 4.73681640625, 4.978759765625, 5.220703125, 5.462646484375, 5.70458984375, 5.946533203125, 6.1884765625, 6.430419921875, 6.67236328125, 6.914306640625, 7.15625]}, "gradients/decoder.bert.encoder.layer.3.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 2.0, 10.0, 6.0, 7.0, 8.0, 10.0, 21.0, 16.0, 16.0, 32.0, 22.0, 30.0, 27.0, 28.0, 32.0, 43.0, 36.0, 43.0, 33.0, 49.0, 41.0, 50.0, 42.0, 22.0, 41.0, 40.0, 31.0, 28.0, 36.0, 31.0, 10.0, 28.0, 19.0, 19.0, 17.0, 22.0, 10.0, 9.0, 6.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.7890625, -4.65057373046875, -4.5120849609375, -4.37359619140625, -4.235107421875, -4.09661865234375, -3.9581298828125, -3.81964111328125, -3.68115234375, -3.54266357421875, -3.4041748046875, -3.26568603515625, -3.127197265625, -2.98870849609375, -2.8502197265625, -2.71173095703125, -2.5732421875, -2.43475341796875, -2.2962646484375, -2.15777587890625, -2.019287109375, -1.88079833984375, -1.7423095703125, -1.60382080078125, -1.46533203125, -1.32684326171875, -1.1883544921875, -1.04986572265625, -0.911376953125, -0.77288818359375, -0.6343994140625, -0.49591064453125, -0.357421875, -0.21893310546875, -0.0804443359375, 0.05804443359375, 0.196533203125, 0.33502197265625, 0.4735107421875, 0.61199951171875, 0.75048828125, 0.88897705078125, 1.0274658203125, 1.16595458984375, 1.304443359375, 1.44293212890625, 1.5814208984375, 1.71990966796875, 1.8583984375, 1.99688720703125, 2.1353759765625, 2.27386474609375, 2.412353515625, 2.55084228515625, 2.6893310546875, 2.82781982421875, 2.96630859375, 3.10479736328125, 3.2432861328125, 3.38177490234375, 3.520263671875, 3.65875244140625, 3.7972412109375, 3.93572998046875, 4.07421875]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 7.0, 4.0, 17.0, 19.0, 29.0, 34.0, 43.0, 63.0, 109.0, 187.0, 238.0, 344.0, 507.0, 824.0, 1332.0, 2191.0, 3676.0, 6625.0, 11721.0, 21771.0, 41167.0, 81328.0, 165938.0, 346884.0, 709091.0, 1100995.0, 851249.0, 431657.0, 206066.0, 99782.0, 50291.0, 26501.0, 14321.0, 7879.0, 4516.0, 2560.0, 1613.0, 991.0, 595.0, 357.0, 254.0, 163.0, 111.0, 75.0, 59.0, 33.0, 27.0, 9.0, 9.0, 5.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0], "bins": [-11.7890625, -11.427978515625, -11.06689453125, -10.705810546875, -10.3447265625, -9.983642578125, -9.62255859375, -9.261474609375, -8.900390625, -8.539306640625, -8.17822265625, -7.817138671875, -7.4560546875, -7.094970703125, -6.73388671875, -6.372802734375, -6.01171875, -5.650634765625, -5.28955078125, -4.928466796875, -4.5673828125, -4.206298828125, -3.84521484375, -3.484130859375, -3.123046875, -2.761962890625, -2.40087890625, -2.039794921875, -1.6787109375, -1.317626953125, -0.95654296875, -0.595458984375, -0.234375, 0.126708984375, 0.48779296875, 0.848876953125, 1.2099609375, 1.571044921875, 1.93212890625, 2.293212890625, 2.654296875, 3.015380859375, 3.37646484375, 3.737548828125, 4.0986328125, 4.459716796875, 4.82080078125, 5.181884765625, 5.54296875, 5.904052734375, 6.26513671875, 6.626220703125, 6.9873046875, 7.348388671875, 7.70947265625, 8.070556640625, 8.431640625, 8.792724609375, 9.15380859375, 9.514892578125, 9.8759765625, 10.237060546875, 10.59814453125, 10.959228515625, 11.3203125]}, "gradients/decoder.bert.encoder.layer.3.intermediate.dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 12.0, 5.0, 12.0, 14.0, 16.0, 33.0, 31.0, 48.0, 36.0, 61.0, 83.0, 90.0, 98.0, 121.0, 157.0, 179.0, 207.0, 223.0, 266.0, 239.0, 276.0, 259.0, 257.0, 214.0, 200.0, 188.0, 163.0, 106.0, 102.0, 81.0, 60.0, 62.0, 33.0, 25.0, 24.0, 20.0, 8.0, 17.0, 7.0, 11.0, 9.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.479583740234375, -2.38885498046875, -2.298126220703125, -2.2073974609375, -2.116668701171875, -2.02593994140625, -1.935211181640625, -1.844482421875, -1.753753662109375, -1.66302490234375, -1.572296142578125, -1.4815673828125, -1.390838623046875, -1.30010986328125, -1.209381103515625, -1.11865234375, -1.027923583984375, -0.93719482421875, -0.846466064453125, -0.7557373046875, -0.665008544921875, -0.57427978515625, -0.483551025390625, -0.392822265625, -0.302093505859375, -0.21136474609375, -0.120635986328125, -0.0299072265625, 0.060821533203125, 0.15155029296875, 0.242279052734375, 0.3330078125, 0.423736572265625, 0.51446533203125, 0.605194091796875, 0.6959228515625, 0.786651611328125, 0.87738037109375, 0.968109130859375, 1.058837890625, 1.149566650390625, 1.24029541015625, 1.331024169921875, 1.4217529296875, 1.512481689453125, 1.60321044921875, 1.693939208984375, 1.78466796875, 1.875396728515625, 1.96612548828125, 2.056854248046875, 2.1475830078125, 2.238311767578125, 2.32904052734375, 2.419769287109375, 2.510498046875, 2.601226806640625, 2.69195556640625, 2.782684326171875, 2.8734130859375, 2.964141845703125, 3.05487060546875, 3.145599365234375, 3.236328125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 1.0, 4.0, 5.0, 8.0, 6.0, 6.0, 12.0, 11.0, 18.0, 20.0, 26.0, 36.0, 28.0, 31.0, 39.0, 52.0, 51.0, 60.0, 63.0, 70.0, 51.0, 64.0, 49.0, 59.0, 49.0, 19.0, 22.0, 28.0, 29.0, 16.0, 16.0, 15.0, 4.0, 4.0, 10.0, 5.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.572054862976074, -11.243688583374023, -10.915321350097656, -10.586955070495605, -10.258587837219238, -9.930221557617188, -9.60185432434082, -9.27348804473877, -8.945120811462402, -8.616754531860352, -8.288387298583984, -7.960020542144775, -7.631653785705566, -7.303287029266357, -6.974920272827148, -6.646553993225098, -6.318187236785889, -5.98982048034668, -5.661453723907471, -5.333086967468262, -5.004720211029053, -4.676353454589844, -4.347987174987793, -4.019619941711426, -3.691253423690796, -3.362886667251587, -3.034519910812378, -2.706153392791748, -2.377786636352539, -2.04941987991333, -1.721053123474121, -1.392686367034912, -1.0643196105957031, -0.7359528541564941, -0.40758615732192993, -0.07921946048736572, 0.24914729595184326, 0.5775140523910522, 0.9058806896209717, 1.2342474460601807, 1.5626142024993896, 1.8909809589385986, 2.2193477153778076, 2.5477142333984375, 2.8760809898376465, 3.2044477462768555, 3.5328145027160645, 3.8611812591552734, 4.189548015594482, 4.517914772033691, 4.8462815284729, 5.174648284912109, 5.503015041351318, 5.831381797790527, 6.159748077392578, 6.488115310668945, 6.816481590270996, 7.144848346710205, 7.473215103149414, 7.801581859588623, 8.129948616027832, 8.458314895629883, 8.78668212890625, 9.1150484085083, 9.443415641784668]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 8.0, 8.0, 5.0, 4.0, 14.0, 13.0, 18.0, 20.0, 16.0, 16.0, 24.0, 18.0, 22.0, 34.0, 25.0, 23.0, 27.0, 34.0, 33.0, 43.0, 41.0, 33.0, 33.0, 36.0, 29.0, 30.0, 28.0, 34.0, 35.0, 28.0, 21.0, 30.0, 19.0, 18.0, 13.0, 23.0, 18.0, 16.0, 16.0, 11.0, 15.0, 9.0, 12.0, 10.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-5.13959264755249, -4.986419677734375, -4.83324670791626, -4.6800737380981445, -4.5269012451171875, -4.373728275299072, -4.220555305480957, -4.067382335662842, -3.9142093658447266, -3.7610363960266113, -3.607863664627075, -3.45469069480896, -3.3015177249908447, -3.1483449935913086, -2.9951720237731934, -2.841999053955078, -2.688826322555542, -2.5356533527374268, -2.3824806213378906, -2.2293076515197754, -2.07613468170166, -1.9229618310928345, -1.7697889804840088, -1.6166160106658936, -1.4634431600570679, -1.3102703094482422, -1.157097339630127, -1.0039244890213013, -0.8507515788078308, -0.6975786685943604, -0.5444058179855347, -0.39123284816741943, -0.23805999755859375, -0.08488710224628448, 0.06828579306602478, 0.22145867347717285, 0.3746315836906433, 0.5278044939041138, 0.6809773445129395, 0.8341503143310547, 0.9873231649398804, 1.140496015548706, 1.2936689853668213, 1.446841835975647, 1.6000146865844727, 1.753187656402588, 1.9063605070114136, 2.0595335960388184, 2.2127063274383545, 2.3658792972564697, 2.519052028656006, 2.672224998474121, 2.8253979682922363, 2.9785709381103516, 3.1317436695098877, 3.284916639328003, 3.438089370727539, 3.5912623405456543, 3.7444350719451904, 3.8976080417633057, 4.050780773162842, 4.203953742980957, 4.357126712799072, 4.5102996826171875, 4.663472652435303]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 6.0, 14.0, 29.0, 40.0, 49.0, 92.0, 110.0, 173.0, 253.0, 470.0, 630.0, 1037.0, 1560.0, 2389.0, 4061.0, 6665.0, 11178.0, 18844.0, 32728.0, 56465.0, 96404.0, 156026.0, 202654.0, 177368.0, 115041.0, 68073.0, 39233.0, 22682.0, 13437.0, 7867.0, 4834.0, 2965.0, 1765.0, 1146.0, 781.0, 493.0, 300.0, 227.0, 149.0, 101.0, 64.0, 43.0, 26.0, 19.0, 18.0, 13.0, 6.0, 8.0, 4.0, 2.0, 1.0], "bins": [-0.91796875, -0.8922348022460938, -0.8665008544921875, -0.8407669067382812, -0.815032958984375, -0.7892990112304688, -0.7635650634765625, -0.7378311157226562, -0.71209716796875, -0.6863632202148438, -0.6606292724609375, -0.6348953247070312, -0.609161376953125, -0.5834274291992188, -0.5576934814453125, -0.5319595336914062, -0.5062255859375, -0.48049163818359375, -0.4547576904296875, -0.42902374267578125, -0.403289794921875, -0.37755584716796875, -0.3518218994140625, -0.32608795166015625, -0.30035400390625, -0.27462005615234375, -0.2488861083984375, -0.22315216064453125, -0.197418212890625, -0.17168426513671875, -0.1459503173828125, -0.12021636962890625, -0.094482421875, -0.06874847412109375, -0.0430145263671875, -0.01728057861328125, 0.008453369140625, 0.03418731689453125, 0.0599212646484375, 0.08565521240234375, 0.11138916015625, 0.13712310791015625, 0.1628570556640625, 0.18859100341796875, 0.214324951171875, 0.24005889892578125, 0.2657928466796875, 0.29152679443359375, 0.3172607421875, 0.34299468994140625, 0.3687286376953125, 0.39446258544921875, 0.420196533203125, 0.44593048095703125, 0.4716644287109375, 0.49739837646484375, 0.52313232421875, 0.5488662719726562, 0.5746002197265625, 0.6003341674804688, 0.626068115234375, 0.6518020629882812, 0.6775360107421875, 0.7032699584960938, 0.72900390625]}, "gradients/decoder.bert.encoder.layer.3.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 6.0, 8.0, 7.0, 8.0, 13.0, 12.0, 11.0, 22.0, 28.0, 23.0, 27.0, 19.0, 42.0, 30.0, 43.0, 32.0, 41.0, 43.0, 44.0, 37.0, 48.0, 37.0, 38.0, 42.0, 49.0, 33.0, 22.0, 30.0, 29.0, 23.0, 22.0, 20.0, 18.0, 17.0, 17.0, 10.0, 4.0, 10.0, 8.0, 4.0, 9.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-7.5234375, -7.3131103515625, -7.102783203125, -6.8924560546875, -6.68212890625, -6.4718017578125, -6.261474609375, -6.0511474609375, -5.8408203125, -5.6304931640625, -5.420166015625, -5.2098388671875, -4.99951171875, -4.7891845703125, -4.578857421875, -4.3685302734375, -4.158203125, -3.9478759765625, -3.737548828125, -3.5272216796875, -3.31689453125, -3.1065673828125, -2.896240234375, -2.6859130859375, -2.4755859375, -2.2652587890625, -2.054931640625, -1.8446044921875, -1.63427734375, -1.4239501953125, -1.213623046875, -1.0032958984375, -0.79296875, -0.5826416015625, -0.372314453125, -0.1619873046875, 0.04833984375, 0.2586669921875, 0.468994140625, 0.6793212890625, 0.8896484375, 1.0999755859375, 1.310302734375, 1.5206298828125, 1.73095703125, 1.9412841796875, 2.151611328125, 2.3619384765625, 2.572265625, 2.7825927734375, 2.992919921875, 3.2032470703125, 3.41357421875, 3.6239013671875, 3.834228515625, 4.0445556640625, 4.2548828125, 4.4652099609375, 4.675537109375, 4.8858642578125, 5.09619140625, 5.3065185546875, 5.516845703125, 5.7271728515625, 5.9375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 8.0, 3.0, 8.0, 10.0, 19.0, 22.0, 27.0, 53.0, 53.0, 83.0, 106.0, 139.0, 264.0, 351.0, 526.0, 802.0, 1377.0, 2189.0, 4128.0, 7812.0, 16988.0, 50588.0, 816532.0, 102395.0, 22325.0, 9926.0, 4868.0, 2684.0, 1497.0, 941.0, 558.0, 425.0, 267.0, 162.0, 132.0, 81.0, 55.0, 41.0, 37.0, 23.0, 19.0, 9.0, 8.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4512939453125, -2.371337890625, -2.2913818359375, -2.21142578125, -2.1314697265625, -2.051513671875, -1.9715576171875, -1.8916015625, -1.8116455078125, -1.731689453125, -1.6517333984375, -1.57177734375, -1.4918212890625, -1.411865234375, -1.3319091796875, -1.251953125, -1.1719970703125, -1.092041015625, -1.0120849609375, -0.93212890625, -0.8521728515625, -0.772216796875, -0.6922607421875, -0.6123046875, -0.5323486328125, -0.452392578125, -0.3724365234375, -0.29248046875, -0.2125244140625, -0.132568359375, -0.0526123046875, 0.02734375, 0.1072998046875, 0.187255859375, 0.2672119140625, 0.34716796875, 0.4271240234375, 0.507080078125, 0.5870361328125, 0.6669921875, 0.7469482421875, 0.826904296875, 0.9068603515625, 0.98681640625, 1.0667724609375, 1.146728515625, 1.2266845703125, 1.306640625, 1.3865966796875, 1.466552734375, 1.5465087890625, 1.62646484375, 1.7064208984375, 1.786376953125, 1.8663330078125, 1.9462890625, 2.0262451171875, 2.106201171875, 2.1861572265625, 2.26611328125, 2.3460693359375, 2.426025390625, 2.5059814453125, 2.5859375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.value.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 1.0, 7.0, 6.0, 5.0, 6.0, 7.0, 11.0, 13.0, 15.0, 9.0, 11.0, 20.0, 16.0, 23.0, 29.0, 24.0, 35.0, 36.0, 33.0, 40.0, 44.0, 33.0, 38.0, 36.0, 45.0, 30.0, 28.0, 40.0, 38.0, 28.0, 24.0, 38.0, 33.0, 31.0, 33.0, 22.0, 24.0, 15.0, 10.0, 7.0, 14.0, 7.0, 3.0, 7.0, 8.0, 5.0, 5.0, 1.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.03515625, -3.90655517578125, -3.7779541015625, -3.64935302734375, -3.520751953125, -3.39215087890625, -3.2635498046875, -3.13494873046875, -3.00634765625, -2.87774658203125, -2.7491455078125, -2.62054443359375, -2.491943359375, -2.36334228515625, -2.2347412109375, -2.10614013671875, -1.9775390625, -1.84893798828125, -1.7203369140625, -1.59173583984375, -1.463134765625, -1.33453369140625, -1.2059326171875, -1.07733154296875, -0.94873046875, -0.82012939453125, -0.6915283203125, -0.56292724609375, -0.434326171875, -0.30572509765625, -0.1771240234375, -0.04852294921875, 0.080078125, 0.20867919921875, 0.3372802734375, 0.46588134765625, 0.594482421875, 0.72308349609375, 0.8516845703125, 0.98028564453125, 1.10888671875, 1.23748779296875, 1.3660888671875, 1.49468994140625, 1.623291015625, 1.75189208984375, 1.8804931640625, 2.00909423828125, 2.1376953125, 2.26629638671875, 2.3948974609375, 2.52349853515625, 2.652099609375, 2.78070068359375, 2.9093017578125, 3.03790283203125, 3.16650390625, 3.29510498046875, 3.4237060546875, 3.55230712890625, 3.680908203125, 3.80950927734375, 3.9381103515625, 4.06671142578125, 4.1953125]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 9.0, 11.0, 9.0, 13.0, 18.0, 35.0, 55.0, 65.0, 118.0, 153.0, 248.0, 414.0, 706.0, 1324.0, 2252.0, 4563.0, 9439.0, 21576.0, 117965.0, 836681.0, 29034.0, 11716.0, 5515.0, 2841.0, 1541.0, 847.0, 481.0, 293.0, 196.0, 114.0, 98.0, 65.0, 47.0, 36.0, 23.0, 10.0, 12.0, 5.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.66845703125, -0.6476669311523438, -0.6268768310546875, -0.6060867309570312, -0.585296630859375, -0.5645065307617188, -0.5437164306640625, -0.5229263305664062, -0.50213623046875, -0.48134613037109375, -0.4605560302734375, -0.43976593017578125, -0.418975830078125, -0.39818572998046875, -0.3773956298828125, -0.35660552978515625, -0.3358154296875, -0.31502532958984375, -0.2942352294921875, -0.27344512939453125, -0.252655029296875, -0.23186492919921875, -0.2110748291015625, -0.19028472900390625, -0.16949462890625, -0.14870452880859375, -0.1279144287109375, -0.10712432861328125, -0.086334228515625, -0.06554412841796875, -0.0447540283203125, -0.02396392822265625, -0.003173828125, 0.01761627197265625, 0.0384063720703125, 0.05919647216796875, 0.079986572265625, 0.10077667236328125, 0.1215667724609375, 0.14235687255859375, 0.16314697265625, 0.18393707275390625, 0.2047271728515625, 0.22551727294921875, 0.246307373046875, 0.26709747314453125, 0.2878875732421875, 0.30867767333984375, 0.3294677734375, 0.35025787353515625, 0.3710479736328125, 0.39183807373046875, 0.412628173828125, 0.43341827392578125, 0.4542083740234375, 0.47499847412109375, 0.49578857421875, 0.5165786743164062, 0.5373687744140625, 0.5581588745117188, 0.578948974609375, 0.5997390747070312, 0.6205291748046875, 0.6413192749023438, 0.662109375]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 7.0, 15.0, 17.0, 13.0, 21.0, 24.0, 25.0, 25.0, 46.0, 46.0, 48.0, 49.0, 45.0, 57.0, 57.0, 42.0, 41.0, 59.0, 43.0, 43.0, 46.0, 42.0, 27.0, 23.0, 12.0, 17.0, 18.0, 19.0, 10.0, 11.0, 9.0, 9.0, 4.0, 5.0, 3.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5153160095214844e-05, -2.4388544261455536e-05, -2.3623928427696228e-05, -2.285931259393692e-05, -2.2094696760177612e-05, -2.1330080926418304e-05, -2.0565465092658997e-05, -1.980084925889969e-05, -1.903623342514038e-05, -1.8271617591381073e-05, -1.7507001757621765e-05, -1.6742385923862457e-05, -1.597777009010315e-05, -1.5213154256343842e-05, -1.4448538422584534e-05, -1.3683922588825226e-05, -1.2919306755065918e-05, -1.215469092130661e-05, -1.1390075087547302e-05, -1.0625459253787994e-05, -9.860843420028687e-06, -9.096227586269379e-06, -8.33161175251007e-06, -7.566995918750763e-06, -6.802380084991455e-06, -6.037764251232147e-06, -5.273148417472839e-06, -4.5085325837135315e-06, -3.7439167499542236e-06, -2.9793009161949158e-06, -2.214685082435608e-06, -1.4500692486763e-06, -6.854534149169922e-07, 7.916241884231567e-08, 8.437782526016235e-07, 1.6083940863609314e-06, 2.3730099201202393e-06, 3.137625753879547e-06, 3.902241587638855e-06, 4.666857421398163e-06, 5.431473255157471e-06, 6.1960890889167786e-06, 6.9607049226760864e-06, 7.725320756435394e-06, 8.489936590194702e-06, 9.25455242395401e-06, 1.0019168257713318e-05, 1.0783784091472626e-05, 1.1548399925231934e-05, 1.2313015758991241e-05, 1.307763159275055e-05, 1.3842247426509857e-05, 1.4606863260269165e-05, 1.5371479094028473e-05, 1.613609492778778e-05, 1.690071076154709e-05, 1.7665326595306396e-05, 1.8429942429065704e-05, 1.9194558262825012e-05, 1.995917409658432e-05, 2.0723789930343628e-05, 2.1488405764102936e-05, 2.2253021597862244e-05, 2.301763743162155e-05, 2.378225326538086e-05]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 9.0, 4.0, 8.0, 17.0, 26.0, 49.0, 51.0, 99.0, 124.0, 219.0, 365.0, 535.0, 767.0, 1373.0, 2315.0, 3917.0, 7228.0, 13765.0, 28143.0, 62424.0, 146939.0, 294495.0, 262961.0, 120809.0, 51378.0, 23819.0, 11801.0, 6078.0, 3493.0, 1993.0, 1196.0, 775.0, 474.0, 322.0, 195.0, 131.0, 92.0, 59.0, 36.0, 25.0, 11.0, 4.0, 9.0, 7.0, 9.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32421875, -0.3133697509765625, -0.302520751953125, -0.2916717529296875, -0.28082275390625, -0.2699737548828125, -0.259124755859375, -0.2482757568359375, -0.2374267578125, -0.2265777587890625, -0.215728759765625, -0.2048797607421875, -0.19403076171875, -0.1831817626953125, -0.172332763671875, -0.1614837646484375, -0.150634765625, -0.1397857666015625, -0.128936767578125, -0.1180877685546875, -0.10723876953125, -0.0963897705078125, -0.085540771484375, -0.0746917724609375, -0.0638427734375, -0.0529937744140625, -0.042144775390625, -0.0312957763671875, -0.02044677734375, -0.0095977783203125, 0.001251220703125, 0.0121002197265625, 0.02294921875, 0.0337982177734375, 0.044647216796875, 0.0554962158203125, 0.06634521484375, 0.0771942138671875, 0.088043212890625, 0.0988922119140625, 0.1097412109375, 0.1205902099609375, 0.131439208984375, 0.1422882080078125, 0.15313720703125, 0.1639862060546875, 0.174835205078125, 0.1856842041015625, 0.196533203125, 0.2073822021484375, 0.218231201171875, 0.2290802001953125, 0.23992919921875, 0.2507781982421875, 0.261627197265625, 0.2724761962890625, 0.2833251953125, 0.2941741943359375, 0.305023193359375, 0.3158721923828125, 0.32672119140625, 0.3375701904296875, 0.348419189453125, 0.3592681884765625, 0.3701171875]}, "gradients/decoder.bert.encoder.layer.3.crossattention.self.query.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 6.0, 3.0, 10.0, 6.0, 9.0, 8.0, 22.0, 12.0, 20.0, 17.0, 31.0, 29.0, 39.0, 61.0, 57.0, 71.0, 71.0, 61.0, 68.0, 62.0, 55.0, 48.0, 47.0, 37.0, 29.0, 24.0, 23.0, 15.0, 7.0, 10.0, 10.0, 6.0, 5.0, 7.0, 0.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0751953125, -0.07299518585205078, -0.07079505920410156, -0.06859493255615234, -0.06639480590820312, -0.0641946792602539, -0.06199455261230469, -0.05979442596435547, -0.05759429931640625, -0.05539417266845703, -0.05319404602050781, -0.050993919372558594, -0.048793792724609375, -0.046593666076660156, -0.04439353942871094, -0.04219341278076172, -0.0399932861328125, -0.03779315948486328, -0.03559303283691406, -0.033392906188964844, -0.031192779541015625, -0.028992652893066406, -0.026792526245117188, -0.02459239959716797, -0.02239227294921875, -0.02019214630126953, -0.017992019653320312, -0.015791893005371094, -0.013591766357421875, -0.011391639709472656, -0.009191513061523438, -0.006991386413574219, -0.004791259765625, -0.0025911331176757812, -0.0003910064697265625, 0.0018091201782226562, 0.004009246826171875, 0.006209373474121094, 0.008409500122070312, 0.010609626770019531, 0.01280975341796875, 0.015009880065917969, 0.017210006713867188, 0.019410133361816406, 0.021610260009765625, 0.023810386657714844, 0.026010513305664062, 0.02821063995361328, 0.0304107666015625, 0.03261089324951172, 0.03481101989746094, 0.037011146545410156, 0.039211273193359375, 0.041411399841308594, 0.04361152648925781, 0.04581165313720703, 0.04801177978515625, 0.05021190643310547, 0.05241203308105469, 0.054612159729003906, 0.056812286376953125, 0.059012413024902344, 0.06121253967285156, 0.06341266632080078, 0.06561279296875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 9.0, 13.0, 10.0, 19.0, 27.0, 28.0, 33.0, 27.0, 36.0, 56.0, 46.0, 62.0, 50.0, 73.0, 59.0, 55.0, 57.0, 55.0, 57.0, 31.0, 24.0, 21.0, 27.0, 20.0, 16.0, 16.0, 10.0, 4.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.313261985778809, -10.98647403717041, -10.659685134887695, -10.332897186279297, -10.006109237670898, -9.6793212890625, -9.352532386779785, -9.025744438171387, -8.698955535888672, -8.372167587280273, -8.045378684997559, -7.71859073638916, -7.391802787780762, -7.065014362335205, -6.738225936889648, -6.41143798828125, -6.084650039672852, -5.757861614227295, -5.4310736656188965, -5.10428524017334, -4.777497291564941, -4.450708866119385, -4.123920440673828, -3.7971322536468506, -3.470344066619873, -3.1435558795928955, -2.816767692565918, -2.4899792671203613, -2.163191080093384, -1.8364028930664062, -1.5096145868301392, -1.182826280593872, -0.8560390472412109, -0.5292508006095886, -0.2024625539779663, 0.124325692653656, 0.4511139392852783, 0.7779021263122559, 1.104690432548523, 1.43147873878479, 1.7582669258117676, 2.085055112838745, 2.4118432998657227, 2.7386317253112793, 3.065419912338257, 3.3922080993652344, 3.718996524810791, 4.045784950256348, 4.372572898864746, 4.699361324310303, 5.026149272918701, 5.352937698364258, 5.679725646972656, 6.006514072418213, 6.3333024978637695, 6.660090446472168, 6.986878871917725, 7.313667297363281, 7.64045524597168, 7.967243671417236, 8.294032096862793, 8.620820045471191, 8.94760799407959, 9.274396896362305, 9.601184844970703]}, "gradients/decoder.bert.encoder.layer.3.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 7.0, 9.0, 5.0, 2.0, 15.0, 12.0, 19.0, 21.0, 17.0, 13.0, 21.0, 20.0, 25.0, 28.0, 26.0, 22.0, 30.0, 30.0, 37.0, 42.0, 38.0, 36.0, 33.0, 36.0, 29.0, 34.0, 22.0, 34.0, 36.0, 28.0, 21.0, 27.0, 25.0, 16.0, 14.0, 22.0, 15.0, 19.0, 20.0, 8.0, 15.0, 11.0, 10.0, 12.0, 6.0, 9.0, 3.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0], "bins": [-5.119045257568359, -4.966975212097168, -4.814905166625977, -4.662835121154785, -4.510765075683594, -4.358695030212402, -4.206624984741211, -4.0545549392700195, -3.9024851322174072, -3.750415086746216, -3.5983450412750244, -3.446274995803833, -3.2942051887512207, -3.1421351432800293, -2.990065097808838, -2.8379950523376465, -2.685925006866455, -2.5338549613952637, -2.3817849159240723, -2.229714870452881, -2.0776448249816895, -1.9255748987197876, -1.7735049724578857, -1.6214349269866943, -1.469364881515503, -1.3172948360443115, -1.1652247905731201, -1.0131548643112183, -0.8610848188400269, -0.7090147733688354, -0.5569447875022888, -0.4048748016357422, -0.2528042793273926, -0.10073426365852356, 0.05133575201034546, 0.20340576767921448, 0.3554757833480835, 0.5075458288192749, 0.6596158146858215, 0.8116858005523682, 0.9637558460235596, 1.115825891494751, 1.2678959369659424, 1.4199658632278442, 1.5720359086990356, 1.724105954170227, 1.876175880432129, 2.0282459259033203, 2.1803159713745117, 2.332386016845703, 2.4844560623168945, 2.636526107788086, 2.7885961532592773, 2.9406661987304688, 3.092736005783081, 3.2448060512542725, 3.396876096725464, 3.5489461421966553, 3.7010161876678467, 3.853086233139038, 4.00515604019165, 4.157226085662842, 4.309296131134033, 4.461366176605225, 4.613436222076416]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 6.0, 4.0, 11.0, 11.0, 18.0, 28.0, 32.0, 46.0, 80.0, 136.0, 219.0, 374.0, 593.0, 1094.0, 1967.0, 3370.0, 6079.0, 11233.0, 19925.0, 35497.0, 62672.0, 104269.0, 155483.0, 187211.0, 168896.0, 119638.0, 73788.0, 42559.0, 23549.0, 13176.0, 7212.0, 4024.0, 2235.0, 1310.0, 729.0, 415.0, 250.0, 171.0, 84.0, 50.0, 36.0, 22.0, 21.0, 14.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.92620849609375, -6.6844482421875, -6.44268798828125, -6.200927734375, -5.95916748046875, -5.7174072265625, -5.47564697265625, -5.23388671875, -4.99212646484375, -4.7503662109375, -4.50860595703125, -4.266845703125, -4.02508544921875, -3.7833251953125, -3.54156494140625, -3.2998046875, -3.05804443359375, -2.8162841796875, -2.57452392578125, -2.332763671875, -2.09100341796875, -1.8492431640625, -1.60748291015625, -1.36572265625, -1.12396240234375, -0.8822021484375, -0.64044189453125, -0.398681640625, -0.15692138671875, 0.0848388671875, 0.32659912109375, 0.568359375, 0.81011962890625, 1.0518798828125, 1.29364013671875, 1.535400390625, 1.77716064453125, 2.0189208984375, 2.26068115234375, 2.50244140625, 2.74420166015625, 2.9859619140625, 3.22772216796875, 3.469482421875, 3.71124267578125, 3.9530029296875, 4.19476318359375, 4.4365234375, 4.67828369140625, 4.9200439453125, 5.16180419921875, 5.403564453125, 5.64532470703125, 5.8870849609375, 6.12884521484375, 6.37060546875, 6.61236572265625, 6.8541259765625, 7.09588623046875, 7.337646484375, 7.57940673828125, 7.8211669921875, 8.06292724609375, 8.3046875]}, "gradients/decoder.bert.encoder.layer.3.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 6.0, 12.0, 7.0, 8.0, 7.0, 7.0, 16.0, 14.0, 27.0, 26.0, 19.0, 26.0, 28.0, 30.0, 37.0, 39.0, 37.0, 33.0, 34.0, 43.0, 44.0, 34.0, 33.0, 48.0, 34.0, 25.0, 30.0, 32.0, 27.0, 29.0, 27.0, 25.0, 18.0, 21.0, 8.0, 20.0, 15.0, 17.0, 14.0, 7.0, 15.0, 5.0, 6.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0], "bins": [-6.8671875, -6.67791748046875, -6.4886474609375, -6.29937744140625, -6.110107421875, -5.92083740234375, -5.7315673828125, -5.54229736328125, -5.35302734375, -5.16375732421875, -4.9744873046875, -4.78521728515625, -4.595947265625, -4.40667724609375, -4.2174072265625, -4.02813720703125, -3.8388671875, -3.64959716796875, -3.4603271484375, -3.27105712890625, -3.081787109375, -2.89251708984375, -2.7032470703125, -2.51397705078125, -2.32470703125, -2.13543701171875, -1.9461669921875, -1.75689697265625, -1.567626953125, -1.37835693359375, -1.1890869140625, -0.99981689453125, -0.810546875, -0.62127685546875, -0.4320068359375, -0.24273681640625, -0.053466796875, 0.13580322265625, 0.3250732421875, 0.51434326171875, 0.70361328125, 0.89288330078125, 1.0821533203125, 1.27142333984375, 1.460693359375, 1.64996337890625, 1.8392333984375, 2.02850341796875, 2.2177734375, 2.40704345703125, 2.5963134765625, 2.78558349609375, 2.974853515625, 3.16412353515625, 3.3533935546875, 3.54266357421875, 3.73193359375, 3.92120361328125, 4.1104736328125, 4.29974365234375, 4.489013671875, 4.67828369140625, 4.8675537109375, 5.05682373046875, 5.24609375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 18.0, 34.0, 48.0, 63.0, 109.0, 165.0, 276.0, 400.0, 716.0, 1155.0, 1851.0, 3214.0, 5309.0, 9093.0, 15274.0, 26332.0, 44347.0, 72750.0, 109939.0, 149336.0, 166615.0, 149622.0, 110471.0, 72296.0, 44598.0, 26383.0, 15645.0, 9049.0, 5433.0, 3067.0, 1904.0, 1165.0, 687.0, 440.0, 281.0, 187.0, 103.0, 46.0, 36.0, 29.0, 21.0, 17.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.21246337890625, -6.9835205078125, -6.75457763671875, -6.525634765625, -6.29669189453125, -6.0677490234375, -5.83880615234375, -5.60986328125, -5.38092041015625, -5.1519775390625, -4.92303466796875, -4.694091796875, -4.46514892578125, -4.2362060546875, -4.00726318359375, -3.7783203125, -3.54937744140625, -3.3204345703125, -3.09149169921875, -2.862548828125, -2.63360595703125, -2.4046630859375, -2.17572021484375, -1.94677734375, -1.71783447265625, -1.4888916015625, -1.25994873046875, -1.031005859375, -0.80206298828125, -0.5731201171875, -0.34417724609375, -0.115234375, 0.11370849609375, 0.3426513671875, 0.57159423828125, 0.800537109375, 1.02947998046875, 1.2584228515625, 1.48736572265625, 1.71630859375, 1.94525146484375, 2.1741943359375, 2.40313720703125, 2.632080078125, 2.86102294921875, 3.0899658203125, 3.31890869140625, 3.5478515625, 3.77679443359375, 4.0057373046875, 4.23468017578125, 4.463623046875, 4.69256591796875, 4.9215087890625, 5.15045166015625, 5.37939453125, 5.60833740234375, 5.8372802734375, 6.06622314453125, 6.295166015625, 6.52410888671875, 6.7530517578125, 6.98199462890625, 7.2109375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 12.0, 12.0, 21.0, 19.0, 20.0, 26.0, 34.0, 25.0, 23.0, 35.0, 52.0, 39.0, 42.0, 53.0, 47.0, 48.0, 53.0, 30.0, 41.0, 39.0, 40.0, 37.0, 38.0, 29.0, 36.0, 19.0, 20.0, 15.0, 14.0, 12.0, 14.0, 6.0, 7.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.14453125, -3.99932861328125, -3.8541259765625, -3.70892333984375, -3.563720703125, -3.41851806640625, -3.2733154296875, -3.12811279296875, -2.98291015625, -2.83770751953125, -2.6925048828125, -2.54730224609375, -2.402099609375, -2.25689697265625, -2.1116943359375, -1.96649169921875, -1.8212890625, -1.67608642578125, -1.5308837890625, -1.38568115234375, -1.240478515625, -1.09527587890625, -0.9500732421875, -0.80487060546875, -0.65966796875, -0.51446533203125, -0.3692626953125, -0.22406005859375, -0.078857421875, 0.06634521484375, 0.2115478515625, 0.35675048828125, 0.501953125, 0.64715576171875, 0.7923583984375, 0.93756103515625, 1.082763671875, 1.22796630859375, 1.3731689453125, 1.51837158203125, 1.66357421875, 1.80877685546875, 1.9539794921875, 2.09918212890625, 2.244384765625, 2.38958740234375, 2.5347900390625, 2.67999267578125, 2.8251953125, 2.97039794921875, 3.1156005859375, 3.26080322265625, 3.406005859375, 3.55120849609375, 3.6964111328125, 3.84161376953125, 3.98681640625, 4.13201904296875, 4.2772216796875, 4.42242431640625, 4.567626953125, 4.71282958984375, 4.8580322265625, 5.00323486328125, 5.1484375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 8.0, 12.0, 21.0, 31.0, 42.0, 45.0, 92.0, 124.0, 200.0, 327.0, 432.0, 655.0, 1007.0, 1561.0, 2324.0, 3715.0, 5504.0, 8906.0, 14205.0, 23116.0, 38822.0, 64578.0, 104458.0, 152241.0, 178155.0, 158649.0, 111552.0, 69447.0, 41606.0, 24913.0, 15100.0, 9473.0, 5980.0, 3899.0, 2519.0, 1598.0, 1109.0, 754.0, 478.0, 330.0, 211.0, 121.0, 81.0, 49.0, 42.0, 30.0, 18.0, 12.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.841796875, -3.711883544921875, -3.58197021484375, -3.452056884765625, -3.3221435546875, -3.192230224609375, -3.06231689453125, -2.932403564453125, -2.802490234375, -2.672576904296875, -2.54266357421875, -2.412750244140625, -2.2828369140625, -2.152923583984375, -2.02301025390625, -1.893096923828125, -1.76318359375, -1.633270263671875, -1.50335693359375, -1.373443603515625, -1.2435302734375, -1.113616943359375, -0.98370361328125, -0.853790283203125, -0.723876953125, -0.593963623046875, -0.46405029296875, -0.334136962890625, -0.2042236328125, -0.074310302734375, 0.05560302734375, 0.185516357421875, 0.3154296875, 0.445343017578125, 0.57525634765625, 0.705169677734375, 0.8350830078125, 0.964996337890625, 1.09490966796875, 1.224822998046875, 1.354736328125, 1.484649658203125, 1.61456298828125, 1.744476318359375, 1.8743896484375, 2.004302978515625, 2.13421630859375, 2.264129638671875, 2.39404296875, 2.523956298828125, 2.65386962890625, 2.783782958984375, 2.9136962890625, 3.043609619140625, 3.17352294921875, 3.303436279296875, 3.433349609375, 3.563262939453125, 3.69317626953125, 3.823089599609375, 3.9530029296875, 4.082916259765625, 4.21282958984375, 4.342742919921875, 4.47265625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 4.0, 5.0, 11.0, 9.0, 11.0, 10.0, 19.0, 15.0, 24.0, 21.0, 40.0, 39.0, 57.0, 69.0, 67.0, 60.0, 85.0, 56.0, 58.0, 63.0, 53.0, 52.0, 28.0, 26.0, 29.0, 10.0, 10.0, 11.0, 12.0, 2.0, 5.0, 2.0, 5.0, 9.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044417381286621094, -0.0004290081560611725, -0.00041384249925613403, -0.0003986768424510956, -0.00038351118564605713, -0.0003683455288410187, -0.0003531798720359802, -0.00033801421523094177, -0.0003228485584259033, -0.00030768290162086487, -0.0002925172448158264, -0.00027735158801078796, -0.0002621859312057495, -0.00024702027440071106, -0.0002318546175956726, -0.00021668896079063416, -0.0002015233039855957, -0.00018635764718055725, -0.0001711919903755188, -0.00015602633357048035, -0.0001408606767654419, -0.00012569501996040344, -0.00011052936315536499, -9.536370635032654e-05, -8.019804954528809e-05, -6.503239274024963e-05, -4.986673593521118e-05, -3.470107913017273e-05, -1.9535422325134277e-05, -4.369765520095825e-06, 1.0795891284942627e-05, 2.596154808998108e-05, 4.112720489501953e-05, 5.6292861700057983e-05, 7.145851850509644e-05, 8.662417531013489e-05, 0.00010178983211517334, 0.00011695548892021179, 0.00013212114572525024, 0.0001472868025302887, 0.00016245245933532715, 0.0001776181161403656, 0.00019278377294540405, 0.0002079494297504425, 0.00022311508655548096, 0.0002382807433605194, 0.00025344640016555786, 0.0002686120569705963, 0.00028377771377563477, 0.0002989433705806732, 0.00031410902738571167, 0.0003292746841907501, 0.0003444403409957886, 0.000359605997800827, 0.0003747716546058655, 0.00038993731141090393, 0.0004051029682159424, 0.00042026862502098083, 0.0004354342818260193, 0.00045059993863105774, 0.0004657655954360962, 0.00048093125224113464, 0.0004960969090461731, 0.0005112625658512115, 0.00052642822265625]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 7.0, 14.0, 13.0, 27.0, 30.0, 34.0, 62.0, 107.0, 152.0, 239.0, 347.0, 480.0, 733.0, 1084.0, 1682.0, 2468.0, 3764.0, 5687.0, 9102.0, 14129.0, 22737.0, 37551.0, 62621.0, 99865.0, 143623.0, 171579.0, 158655.0, 117086.0, 74692.0, 44953.0, 27425.0, 16827.0, 10654.0, 6884.0, 4489.0, 2919.0, 1957.0, 1255.0, 889.0, 546.0, 393.0, 270.0, 173.0, 119.0, 77.0, 44.0, 35.0, 23.0, 16.0, 15.0, 4.0, 4.0, 4.0, 5.0, 1.0, 4.0, 3.0], "bins": [-4.2734375, -4.1427001953125, -4.011962890625, -3.8812255859375, -3.75048828125, -3.6197509765625, -3.489013671875, -3.3582763671875, -3.2275390625, -3.0968017578125, -2.966064453125, -2.8353271484375, -2.70458984375, -2.5738525390625, -2.443115234375, -2.3123779296875, -2.181640625, -2.0509033203125, -1.920166015625, -1.7894287109375, -1.65869140625, -1.5279541015625, -1.397216796875, -1.2664794921875, -1.1357421875, -1.0050048828125, -0.874267578125, -0.7435302734375, -0.61279296875, -0.4820556640625, -0.351318359375, -0.2205810546875, -0.08984375, 0.0408935546875, 0.171630859375, 0.3023681640625, 0.43310546875, 0.5638427734375, 0.694580078125, 0.8253173828125, 0.9560546875, 1.0867919921875, 1.217529296875, 1.3482666015625, 1.47900390625, 1.6097412109375, 1.740478515625, 1.8712158203125, 2.001953125, 2.1326904296875, 2.263427734375, 2.3941650390625, 2.52490234375, 2.6556396484375, 2.786376953125, 2.9171142578125, 3.0478515625, 3.1785888671875, 3.309326171875, 3.4400634765625, 3.57080078125, 3.7015380859375, 3.832275390625, 3.9630126953125, 4.09375]}, "gradients/decoder.bert.encoder.layer.3.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 9.0, 8.0, 8.0, 18.0, 18.0, 13.0, 18.0, 17.0, 23.0, 15.0, 28.0, 26.0, 33.0, 37.0, 53.0, 51.0, 52.0, 52.0, 52.0, 41.0, 48.0, 39.0, 49.0, 41.0, 26.0, 33.0, 24.0, 22.0, 25.0, 16.0, 14.0, 13.0, 17.0, 9.0, 8.0, 10.0, 7.0, 1.0, 8.0, 3.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.138671875, -1.1033935546875, -1.068115234375, -1.0328369140625, -0.99755859375, -0.9622802734375, -0.927001953125, -0.8917236328125, -0.8564453125, -0.8211669921875, -0.785888671875, -0.7506103515625, -0.71533203125, -0.6800537109375, -0.644775390625, -0.6094970703125, -0.57421875, -0.5389404296875, -0.503662109375, -0.4683837890625, -0.43310546875, -0.3978271484375, -0.362548828125, -0.3272705078125, -0.2919921875, -0.2567138671875, -0.221435546875, -0.1861572265625, -0.15087890625, -0.1156005859375, -0.080322265625, -0.0450439453125, -0.009765625, 0.0255126953125, 0.060791015625, 0.0960693359375, 0.13134765625, 0.1666259765625, 0.201904296875, 0.2371826171875, 0.2724609375, 0.3077392578125, 0.343017578125, 0.3782958984375, 0.41357421875, 0.4488525390625, 0.484130859375, 0.5194091796875, 0.5546875, 0.5899658203125, 0.625244140625, 0.6605224609375, 0.69580078125, 0.7310791015625, 0.766357421875, 0.8016357421875, 0.8369140625, 0.8721923828125, 0.907470703125, 0.9427490234375, 0.97802734375, 1.0133056640625, 1.048583984375, 1.0838623046875, 1.119140625]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 3.0, 3.0, 5.0, 11.0, 12.0, 8.0, 20.0, 11.0, 26.0, 26.0, 27.0, 23.0, 34.0, 35.0, 53.0, 47.0, 57.0, 59.0, 64.0, 47.0, 61.0, 63.0, 55.0, 45.0, 28.0, 34.0, 29.0, 24.0, 17.0, 12.0, 10.0, 12.0, 14.0, 4.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.41679859161377, -11.084955215454102, -10.753110885620117, -10.42126750946045, -10.089423179626465, -9.757579803466797, -9.425735473632812, -9.093892097473145, -8.762048721313477, -8.430205345153809, -8.098361015319824, -7.766517639160156, -7.43467378616333, -7.102829933166504, -6.770986080169678, -6.439142227172852, -6.107298374176025, -5.775454521179199, -5.443610668182373, -5.111766815185547, -4.779923439025879, -4.448079586029053, -4.116235733032227, -3.7843921184539795, -3.4525482654571533, -3.120704412460327, -2.78886079788208, -2.457016944885254, -2.1251730918884277, -1.7933294773101807, -1.4614856243133545, -1.1296420097351074, -0.7977981567382812, -0.46595439314842224, -0.13411062955856323, 0.19773316383361816, 0.5295768976211548, 0.8614206314086914, 1.1932644844055176, 1.5251080989837646, 1.8569519519805908, 2.188795804977417, 2.520639419555664, 2.8524832725524902, 3.1843271255493164, 3.5161707401275635, 3.8480145931243896, 4.179858207702637, 4.511702060699463, 4.843545913696289, 5.175389766693115, 5.507233619689941, 5.839076995849609, 6.1709208488464355, 6.502764701843262, 6.83460807800293, 7.166452407836914, 7.49829626083374, 7.830140113830566, 8.161983489990234, 8.493827819824219, 8.825671195983887, 9.157514572143555, 9.489358901977539, 9.821202278137207]}, "gradients/decoder.bert.encoder.layer.2.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 5.0, 1.0, 10.0, 6.0, 6.0, 5.0, 20.0, 18.0, 18.0, 22.0, 24.0, 27.0, 33.0, 31.0, 37.0, 35.0, 36.0, 30.0, 31.0, 37.0, 30.0, 36.0, 51.0, 35.0, 43.0, 33.0, 47.0, 29.0, 33.0, 22.0, 24.0, 23.0, 19.0, 34.0, 20.0, 15.0, 18.0, 8.0, 7.0, 9.0, 2.0, 10.0, 4.0, 3.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.380634307861328, -6.1947736740112305, -6.008913040161133, -5.823052406311035, -5.6371917724609375, -5.45133113861084, -5.265470504760742, -5.0796098709106445, -4.893749237060547, -4.707888603210449, -4.522027969360352, -4.336167335510254, -4.150306701660156, -3.9644460678100586, -3.77858567237854, -3.5927250385284424, -3.406864643096924, -3.221004009246826, -3.0351433753967285, -2.849282741546631, -2.663422107696533, -2.4775614738464355, -2.291701078414917, -2.1058404445648193, -1.9199798107147217, -1.734119176864624, -1.5482585430145264, -1.3623980283737183, -1.1765373945236206, -0.990676760673523, -0.8048162460327148, -0.6189556121826172, -0.43309497833251953, -0.24723437428474426, -0.061373770236968994, 0.12448680400848389, 0.31034743785858154, 0.4962080717086792, 0.6820685863494873, 0.867929220199585, 1.0537898540496826, 1.2396504878997803, 1.425511121749878, 1.611371636390686, 1.7972322702407837, 1.9830929040908813, 2.1689534187316895, 2.354814052581787, 2.5406746864318848, 2.7265353202819824, 2.91239595413208, 3.0982565879821777, 3.2841172218322754, 3.469977855682373, 3.6558382511138916, 3.8416988849639893, 4.027559280395508, 4.2134199142456055, 4.399280548095703, 4.585141181945801, 4.771001815795898, 4.956862449645996, 5.142723083496094, 5.328583717346191, 5.514444351196289]}, "gradients/decoder.bert.encoder.layer.2.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 9.0, 4.0, 11.0, 15.0, 21.0, 31.0, 54.0, 64.0, 87.0, 125.0, 213.0, 296.0, 488.0, 697.0, 1075.0, 1804.0, 2888.0, 4842.0, 8173.0, 14624.0, 26999.0, 52506.0, 110249.0, 248436.0, 582123.0, 1091528.0, 1051196.0, 547900.0, 236433.0, 105534.0, 50073.0, 25167.0, 13317.0, 7149.0, 4223.0, 2433.0, 1412.0, 794.0, 478.0, 324.0, 203.0, 120.0, 81.0, 32.0, 25.0, 10.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.671875, -13.2916259765625, -12.911376953125, -12.5311279296875, -12.15087890625, -11.7706298828125, -11.390380859375, -11.0101318359375, -10.6298828125, -10.2496337890625, -9.869384765625, -9.4891357421875, -9.10888671875, -8.7286376953125, -8.348388671875, -7.9681396484375, -7.587890625, -7.2076416015625, -6.827392578125, -6.4471435546875, -6.06689453125, -5.6866455078125, -5.306396484375, -4.9261474609375, -4.5458984375, -4.1656494140625, -3.785400390625, -3.4051513671875, -3.02490234375, -2.6446533203125, -2.264404296875, -1.8841552734375, -1.50390625, -1.1236572265625, -0.743408203125, -0.3631591796875, 0.01708984375, 0.3973388671875, 0.777587890625, 1.1578369140625, 1.5380859375, 1.9183349609375, 2.298583984375, 2.6788330078125, 3.05908203125, 3.4393310546875, 3.819580078125, 4.1998291015625, 4.580078125, 4.9603271484375, 5.340576171875, 5.7208251953125, 6.10107421875, 6.4813232421875, 6.861572265625, 7.2418212890625, 7.6220703125, 8.0023193359375, 8.382568359375, 8.7628173828125, 9.14306640625, 9.5233154296875, 9.903564453125, 10.2838134765625, 10.6640625]}, "gradients/decoder.bert.encoder.layer.2.output.dense.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 9.0, 12.0, 14.0, 13.0, 13.0, 11.0, 14.0, 21.0, 26.0, 29.0, 25.0, 32.0, 42.0, 33.0, 35.0, 30.0, 35.0, 39.0, 46.0, 42.0, 37.0, 35.0, 38.0, 30.0, 27.0, 27.0, 31.0, 25.0, 19.0, 25.0, 23.0, 22.0, 18.0, 12.0, 11.0, 14.0, 13.0, 8.0, 5.0, 8.0, 5.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.2828369140625, -5.120361328125, -4.9578857421875, -4.79541015625, -4.6329345703125, -4.470458984375, -4.3079833984375, -4.1455078125, -3.9830322265625, -3.820556640625, -3.6580810546875, -3.49560546875, -3.3331298828125, -3.170654296875, -3.0081787109375, -2.845703125, -2.6832275390625, -2.520751953125, -2.3582763671875, -2.19580078125, -2.0333251953125, -1.870849609375, -1.7083740234375, -1.5458984375, -1.3834228515625, -1.220947265625, -1.0584716796875, -0.89599609375, -0.7335205078125, -0.571044921875, -0.4085693359375, -0.24609375, -0.0836181640625, 0.078857421875, 0.2413330078125, 0.40380859375, 0.5662841796875, 0.728759765625, 0.8912353515625, 1.0537109375, 1.2161865234375, 1.378662109375, 1.5411376953125, 1.70361328125, 1.8660888671875, 2.028564453125, 2.1910400390625, 2.353515625, 2.5159912109375, 2.678466796875, 2.8409423828125, 3.00341796875, 3.1658935546875, 3.328369140625, 3.4908447265625, 3.6533203125, 3.8157958984375, 3.978271484375, 4.1407470703125, 4.30322265625, 4.4656982421875, 4.628173828125, 4.7906494140625, 4.953125]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 8.0, 6.0, 12.0, 20.0, 32.0, 56.0, 73.0, 124.0, 192.0, 303.0, 480.0, 780.0, 1281.0, 2081.0, 3533.0, 6419.0, 11118.0, 21092.0, 39984.0, 79870.0, 166077.0, 358955.0, 748727.0, 1125971.0, 837055.0, 410500.0, 190017.0, 91025.0, 45022.0, 23714.0, 12904.0, 6999.0, 3882.0, 2381.0, 1409.0, 837.0, 458.0, 351.0, 214.0, 111.0, 77.0, 46.0, 32.0, 20.0, 15.0, 12.0, 6.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0], "bins": [-16.59375, -16.114013671875, -15.63427734375, -15.154541015625, -14.6748046875, -14.195068359375, -13.71533203125, -13.235595703125, -12.755859375, -12.276123046875, -11.79638671875, -11.316650390625, -10.8369140625, -10.357177734375, -9.87744140625, -9.397705078125, -8.91796875, -8.438232421875, -7.95849609375, -7.478759765625, -6.9990234375, -6.519287109375, -6.03955078125, -5.559814453125, -5.080078125, -4.600341796875, -4.12060546875, -3.640869140625, -3.1611328125, -2.681396484375, -2.20166015625, -1.721923828125, -1.2421875, -0.762451171875, -0.28271484375, 0.197021484375, 0.6767578125, 1.156494140625, 1.63623046875, 2.115966796875, 2.595703125, 3.075439453125, 3.55517578125, 4.034912109375, 4.5146484375, 4.994384765625, 5.47412109375, 5.953857421875, 6.43359375, 6.913330078125, 7.39306640625, 7.872802734375, 8.3525390625, 8.832275390625, 9.31201171875, 9.791748046875, 10.271484375, 10.751220703125, 11.23095703125, 11.710693359375, 12.1904296875, 12.670166015625, 13.14990234375, 13.629638671875, 14.109375]}, "gradients/decoder.bert.encoder.layer.2.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 5.0, 8.0, 13.0, 14.0, 16.0, 34.0, 34.0, 28.0, 52.0, 72.0, 94.0, 121.0, 137.0, 151.0, 183.0, 223.0, 272.0, 299.0, 313.0, 263.0, 266.0, 262.0, 206.0, 198.0, 167.0, 140.0, 125.0, 80.0, 62.0, 52.0, 35.0, 32.0, 26.0, 16.0, 21.0, 12.0, 11.0, 10.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.0792236328125, -3.947509765625, -3.8157958984375, -3.68408203125, -3.5523681640625, -3.420654296875, -3.2889404296875, -3.1572265625, -3.0255126953125, -2.893798828125, -2.7620849609375, -2.63037109375, -2.4986572265625, -2.366943359375, -2.2352294921875, -2.103515625, -1.9718017578125, -1.840087890625, -1.7083740234375, -1.57666015625, -1.4449462890625, -1.313232421875, -1.1815185546875, -1.0498046875, -0.9180908203125, -0.786376953125, -0.6546630859375, -0.52294921875, -0.3912353515625, -0.259521484375, -0.1278076171875, 0.00390625, 0.1356201171875, 0.267333984375, 0.3990478515625, 0.53076171875, 0.6624755859375, 0.794189453125, 0.9259033203125, 1.0576171875, 1.1893310546875, 1.321044921875, 1.4527587890625, 1.58447265625, 1.7161865234375, 1.847900390625, 1.9796142578125, 2.111328125, 2.2430419921875, 2.374755859375, 2.5064697265625, 2.63818359375, 2.7698974609375, 2.901611328125, 3.0333251953125, 3.1650390625, 3.2967529296875, 3.428466796875, 3.5601806640625, 3.69189453125, 3.8236083984375, 3.955322265625, 4.0870361328125, 4.21875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 8.0, 13.0, 11.0, 13.0, 18.0, 26.0, 16.0, 37.0, 43.0, 32.0, 50.0, 48.0, 58.0, 68.0, 59.0, 66.0, 68.0, 48.0, 37.0, 59.0, 40.0, 39.0, 23.0, 25.0, 17.0, 19.0, 11.0, 8.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-17.37887191772461, -16.9278564453125, -16.47684097290039, -16.02582550048828, -15.574809074401855, -15.123793601989746, -14.672778129577637, -14.221762657165527, -13.770747184753418, -13.319731712341309, -12.8687162399292, -12.417699813842773, -11.966684341430664, -11.515668869018555, -11.064653396606445, -10.613637924194336, -10.162622451782227, -9.711606979370117, -9.260591506958008, -8.809576034545898, -8.358559608459473, -7.907544136047363, -7.456528663635254, -7.0055131912231445, -6.554496765136719, -6.103481292724609, -5.652465343475342, -5.201449871063232, -4.750434398651123, -4.2994184494018555, -3.848402976989746, -3.3973875045776367, -2.9463720321655273, -2.495356321334839, -2.0443408489227295, -1.593325138092041, -1.142309546470642, -0.6912939548492432, -0.2402782440185547, 0.2107372283935547, 0.6617529392242432, 1.112768530845642, 1.563784122467041, 2.0147998332977295, 2.465815544128418, 2.9168310165405273, 3.367846727371216, 3.818862199783325, 4.269877910614014, 4.720893383026123, 5.171909332275391, 5.6229248046875, 6.073940277099609, 6.524955749511719, 6.975971698760986, 7.426987171173096, 7.878003120422363, 8.329018592834473, 8.780034065246582, 9.231050491333008, 9.682065963745117, 10.133081436157227, 10.584096908569336, 11.035112380981445, 11.486127853393555]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 5.0, 6.0, 4.0, 7.0, 8.0, 11.0, 11.0, 18.0, 18.0, 18.0, 12.0, 18.0, 22.0, 24.0, 37.0, 29.0, 29.0, 41.0, 34.0, 33.0, 36.0, 28.0, 33.0, 33.0, 39.0, 31.0, 41.0, 34.0, 42.0, 34.0, 31.0, 28.0, 21.0, 24.0, 19.0, 17.0, 15.0, 16.0, 20.0, 8.0, 11.0, 10.0, 12.0, 10.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0], "bins": [-7.343834400177002, -7.12726354598999, -6.910693168640137, -6.694122314453125, -6.4775519371032715, -6.26098108291626, -6.044410705566406, -5.8278398513793945, -5.611269474029541, -5.394698619842529, -5.178128242492676, -4.961557388305664, -4.7449870109558105, -4.528416156768799, -4.311845779418945, -4.095274925231934, -3.878704309463501, -3.6621336936950684, -3.4455630779266357, -3.228992462158203, -3.0124218463897705, -2.795851230621338, -2.579280376434326, -2.3627099990844727, -2.146139144897461, -1.9295685291290283, -1.7129979133605957, -1.496427297592163, -1.2798566818237305, -1.0632859468460083, -0.8467153310775757, -0.6301447153091431, -0.41357421875, -0.1970035880804062, 0.019567042589187622, 0.23613768815994263, 0.45270830392837524, 0.6692789793014526, 0.8858495950698853, 1.1024202108383179, 1.3189908266067505, 1.535561442375183, 1.7521320581436157, 1.968702793121338, 2.1852734088897705, 2.401844024658203, 2.6184146404266357, 2.8349852561950684, 3.051555871963501, 3.2681264877319336, 3.484697103500366, 3.701267719268799, 3.9178383350372314, 4.134408950805664, 4.350979804992676, 4.567550182342529, 4.784121036529541, 5.000691890716553, 5.217262268066406, 5.433833122253418, 5.6504034996032715, 5.866974353790283, 6.083544731140137, 6.300115585327148, 6.516685962677002]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 1.0, 7.0, 8.0, 17.0, 26.0, 27.0, 43.0, 64.0, 102.0, 175.0, 210.0, 316.0, 468.0, 685.0, 1092.0, 1593.0, 2548.0, 3999.0, 6271.0, 9946.0, 16721.0, 27556.0, 45570.0, 75839.0, 121276.0, 172044.0, 183135.0, 142427.0, 92294.0, 56112.0, 33848.0, 20600.0, 12627.0, 7567.0, 4736.0, 3000.0, 1975.0, 1211.0, 767.0, 512.0, 370.0, 231.0, 169.0, 124.0, 85.0, 55.0, 33.0, 29.0, 23.0, 13.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.91796875, -0.8875732421875, -0.857177734375, -0.8267822265625, -0.79638671875, -0.7659912109375, -0.735595703125, -0.7052001953125, -0.6748046875, -0.6444091796875, -0.614013671875, -0.5836181640625, -0.55322265625, -0.5228271484375, -0.492431640625, -0.4620361328125, -0.431640625, -0.4012451171875, -0.370849609375, -0.3404541015625, -0.31005859375, -0.2796630859375, -0.249267578125, -0.2188720703125, -0.1884765625, -0.1580810546875, -0.127685546875, -0.0972900390625, -0.06689453125, -0.0364990234375, -0.006103515625, 0.0242919921875, 0.0546875, 0.0850830078125, 0.115478515625, 0.1458740234375, 0.17626953125, 0.2066650390625, 0.237060546875, 0.2674560546875, 0.2978515625, 0.3282470703125, 0.358642578125, 0.3890380859375, 0.41943359375, 0.4498291015625, 0.480224609375, 0.5106201171875, 0.541015625, 0.5714111328125, 0.601806640625, 0.6322021484375, 0.66259765625, 0.6929931640625, 0.723388671875, 0.7537841796875, 0.7841796875, 0.8145751953125, 0.844970703125, 0.8753662109375, 0.90576171875, 0.9361572265625, 0.966552734375, 0.9969482421875, 1.02734375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 6.0, 4.0, 4.0, 16.0, 15.0, 17.0, 25.0, 16.0, 29.0, 25.0, 31.0, 33.0, 42.0, 30.0, 48.0, 42.0, 51.0, 44.0, 51.0, 40.0, 47.0, 41.0, 44.0, 53.0, 34.0, 28.0, 30.0, 23.0, 26.0, 24.0, 15.0, 19.0, 12.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5078125, -10.1968994140625, -9.885986328125, -9.5750732421875, -9.26416015625, -8.9532470703125, -8.642333984375, -8.3314208984375, -8.0205078125, -7.7095947265625, -7.398681640625, -7.0877685546875, -6.77685546875, -6.4659423828125, -6.155029296875, -5.8441162109375, -5.533203125, -5.2222900390625, -4.911376953125, -4.6004638671875, -4.28955078125, -3.9786376953125, -3.667724609375, -3.3568115234375, -3.0458984375, -2.7349853515625, -2.424072265625, -2.1131591796875, -1.80224609375, -1.4913330078125, -1.180419921875, -0.8695068359375, -0.55859375, -0.2476806640625, 0.063232421875, 0.3741455078125, 0.68505859375, 0.9959716796875, 1.306884765625, 1.6177978515625, 1.9287109375, 2.2396240234375, 2.550537109375, 2.8614501953125, 3.17236328125, 3.4832763671875, 3.794189453125, 4.1051025390625, 4.416015625, 4.7269287109375, 5.037841796875, 5.3487548828125, 5.65966796875, 5.9705810546875, 6.281494140625, 6.5924072265625, 6.9033203125, 7.2142333984375, 7.525146484375, 7.8360595703125, 8.14697265625, 8.4578857421875, 8.768798828125, 9.0797119140625, 9.390625]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 12.0, 14.0, 12.0, 25.0, 25.0, 41.0, 35.0, 59.0, 66.0, 104.0, 138.0, 213.0, 261.0, 402.0, 599.0, 870.0, 1377.0, 2170.0, 3759.0, 6720.0, 13175.0, 30256.0, 280944.0, 633917.0, 38925.0, 15295.0, 7669.0, 4309.0, 2452.0, 1553.0, 984.0, 621.0, 468.0, 280.0, 229.0, 156.0, 91.0, 89.0, 72.0, 36.0, 33.0, 27.0, 22.0, 14.0, 6.0, 7.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 4.0], "bins": [-2.84765625, -2.76416015625, -2.6806640625, -2.59716796875, -2.513671875, -2.43017578125, -2.3466796875, -2.26318359375, -2.1796875, -2.09619140625, -2.0126953125, -1.92919921875, -1.845703125, -1.76220703125, -1.6787109375, -1.59521484375, -1.51171875, -1.42822265625, -1.3447265625, -1.26123046875, -1.177734375, -1.09423828125, -1.0107421875, -0.92724609375, -0.84375, -0.76025390625, -0.6767578125, -0.59326171875, -0.509765625, -0.42626953125, -0.3427734375, -0.25927734375, -0.17578125, -0.09228515625, -0.0087890625, 0.07470703125, 0.158203125, 0.24169921875, 0.3251953125, 0.40869140625, 0.4921875, 0.57568359375, 0.6591796875, 0.74267578125, 0.826171875, 0.90966796875, 0.9931640625, 1.07666015625, 1.16015625, 1.24365234375, 1.3271484375, 1.41064453125, 1.494140625, 1.57763671875, 1.6611328125, 1.74462890625, 1.828125, 1.91162109375, 1.9951171875, 2.07861328125, 2.162109375, 2.24560546875, 2.3291015625, 2.41259765625, 2.49609375]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 11.0, 8.0, 9.0, 9.0, 13.0, 10.0, 13.0, 15.0, 22.0, 6.0, 26.0, 22.0, 31.0, 25.0, 25.0, 47.0, 48.0, 28.0, 38.0, 27.0, 40.0, 38.0, 39.0, 41.0, 40.0, 41.0, 44.0, 27.0, 30.0, 31.0, 29.0, 33.0, 19.0, 19.0, 17.0, 7.0, 19.0, 11.0, 19.0, 8.0, 4.0, 7.0, 2.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.26171875, -5.0987548828125, -4.935791015625, -4.7728271484375, -4.60986328125, -4.4468994140625, -4.283935546875, -4.1209716796875, -3.9580078125, -3.7950439453125, -3.632080078125, -3.4691162109375, -3.30615234375, -3.1431884765625, -2.980224609375, -2.8172607421875, -2.654296875, -2.4913330078125, -2.328369140625, -2.1654052734375, -2.00244140625, -1.8394775390625, -1.676513671875, -1.5135498046875, -1.3505859375, -1.1876220703125, -1.024658203125, -0.8616943359375, -0.69873046875, -0.5357666015625, -0.372802734375, -0.2098388671875, -0.046875, 0.1160888671875, 0.279052734375, 0.4420166015625, 0.60498046875, 0.7679443359375, 0.930908203125, 1.0938720703125, 1.2568359375, 1.4197998046875, 1.582763671875, 1.7457275390625, 1.90869140625, 2.0716552734375, 2.234619140625, 2.3975830078125, 2.560546875, 2.7235107421875, 2.886474609375, 3.0494384765625, 3.21240234375, 3.3753662109375, 3.538330078125, 3.7012939453125, 3.8642578125, 4.0272216796875, 4.190185546875, 4.3531494140625, 4.51611328125, 4.6790771484375, 4.842041015625, 5.0050048828125, 5.16796875]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 4.0, 15.0, 18.0, 29.0, 33.0, 55.0, 90.0, 117.0, 171.0, 253.0, 412.0, 611.0, 994.0, 1569.0, 2456.0, 4125.0, 6970.0, 12179.0, 23249.0, 98181.0, 823942.0, 33855.0, 16390.0, 9158.0, 5221.0, 3060.0, 1937.0, 1233.0, 767.0, 467.0, 339.0, 203.0, 139.0, 100.0, 54.0, 43.0, 31.0, 26.0, 19.0, 4.0, 11.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.465576171875, -0.4501762390136719, -0.43477630615234375, -0.4193763732910156, -0.4039764404296875, -0.3885765075683594, -0.37317657470703125, -0.3577766418457031, -0.342376708984375, -0.3269767761230469, -0.31157684326171875, -0.2961769104003906, -0.2807769775390625, -0.2653770446777344, -0.24997711181640625, -0.23457717895507812, -0.21917724609375, -0.20377731323242188, -0.18837738037109375, -0.17297744750976562, -0.1575775146484375, -0.14217758178710938, -0.12677764892578125, -0.11137771606445312, -0.095977783203125, -0.08057785034179688, -0.06517791748046875, -0.049777984619140625, -0.0343780517578125, -0.018978118896484375, -0.00357818603515625, 0.011821746826171875, 0.0272216796875, 0.042621612548828125, 0.05802154541015625, 0.07342147827148438, 0.0888214111328125, 0.10422134399414062, 0.11962127685546875, 0.13502120971679688, 0.150421142578125, 0.16582107543945312, 0.18122100830078125, 0.19662094116210938, 0.2120208740234375, 0.22742080688476562, 0.24282073974609375, 0.2582206726074219, 0.27362060546875, 0.2890205383300781, 0.30442047119140625, 0.3198204040527344, 0.3352203369140625, 0.3506202697753906, 0.36602020263671875, 0.3814201354980469, 0.396820068359375, 0.4122200012207031, 0.42761993408203125, 0.4430198669433594, 0.4584197998046875, 0.4738197326660156, 0.48921966552734375, 0.5046195983886719, 0.52001953125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 0.0, 2.0, 7.0, 7.0, 6.0, 9.0, 8.0, 10.0, 16.0, 23.0, 22.0, 16.0, 19.0, 22.0, 22.0, 32.0, 36.0, 45.0, 32.0, 43.0, 31.0, 34.0, 37.0, 53.0, 35.0, 48.0, 62.0, 35.0, 34.0, 25.0, 39.0, 36.0, 19.0, 19.0, 12.0, 19.0, 16.0, 10.0, 10.0, 9.0, 9.0, 6.0, 8.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.7583370208740234e-05, -1.7012469470500946e-05, -1.6441568732261658e-05, -1.587066799402237e-05, -1.529976725578308e-05, -1.4728866517543793e-05, -1.4157965779304504e-05, -1.3587065041065216e-05, -1.3016164302825928e-05, -1.244526356458664e-05, -1.1874362826347351e-05, -1.1303462088108063e-05, -1.0732561349868774e-05, -1.0161660611629486e-05, -9.590759873390198e-06, -9.01985913515091e-06, -8.448958396911621e-06, -7.878057658672333e-06, -7.3071569204330444e-06, -6.736256182193756e-06, -6.165355443954468e-06, -5.5944547057151794e-06, -5.023553967475891e-06, -4.452653229236603e-06, -3.8817524909973145e-06, -3.310851752758026e-06, -2.739951014518738e-06, -2.1690502762794495e-06, -1.5981495380401611e-06, -1.0272487998008728e-06, -4.5634806156158447e-07, 1.1455267667770386e-07, 6.854534149169922e-07, 1.2563541531562805e-06, 1.8272548913955688e-06, 2.398155629634857e-06, 2.9690563678741455e-06, 3.539957106113434e-06, 4.110857844352722e-06, 4.6817585825920105e-06, 5.252659320831299e-06, 5.823560059070587e-06, 6.3944607973098755e-06, 6.965361535549164e-06, 7.536262273788452e-06, 8.10716301202774e-06, 8.678063750267029e-06, 9.248964488506317e-06, 9.819865226745605e-06, 1.0390765964984894e-05, 1.0961666703224182e-05, 1.153256744146347e-05, 1.2103468179702759e-05, 1.2674368917942047e-05, 1.3245269656181335e-05, 1.3816170394420624e-05, 1.4387071132659912e-05, 1.49579718708992e-05, 1.552887260913849e-05, 1.6099773347377777e-05, 1.6670674085617065e-05, 1.7241574823856354e-05, 1.7812475562095642e-05, 1.838337630033493e-05, 1.895427703857422e-05]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 19.0, 20.0, 40.0, 47.0, 65.0, 121.0, 148.0, 251.0, 414.0, 726.0, 1065.0, 1753.0, 2887.0, 4837.0, 7960.0, 13180.0, 21982.0, 37826.0, 63538.0, 104205.0, 156781.0, 189929.0, 162804.0, 110136.0, 68472.0, 40116.0, 23640.0, 13861.0, 8478.0, 5084.0, 3160.0, 1912.0, 1134.0, 680.0, 416.0, 315.0, 181.0, 124.0, 92.0, 55.0, 24.0, 17.0, 15.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.24658203125, -0.23923492431640625, -0.2318878173828125, -0.22454071044921875, -0.217193603515625, -0.20984649658203125, -0.2024993896484375, -0.19515228271484375, -0.18780517578125, -0.18045806884765625, -0.1731109619140625, -0.16576385498046875, -0.158416748046875, -0.15106964111328125, -0.1437225341796875, -0.13637542724609375, -0.1290283203125, -0.12168121337890625, -0.1143341064453125, -0.10698699951171875, -0.099639892578125, -0.09229278564453125, -0.0849456787109375, -0.07759857177734375, -0.07025146484375, -0.06290435791015625, -0.0555572509765625, -0.04821014404296875, -0.040863037109375, -0.03351593017578125, -0.0261688232421875, -0.01882171630859375, -0.011474609375, -0.00412750244140625, 0.0032196044921875, 0.01056671142578125, 0.017913818359375, 0.02526092529296875, 0.0326080322265625, 0.03995513916015625, 0.04730224609375, 0.05464935302734375, 0.0619964599609375, 0.06934356689453125, 0.076690673828125, 0.08403778076171875, 0.0913848876953125, 0.09873199462890625, 0.1060791015625, 0.11342620849609375, 0.1207733154296875, 0.12812042236328125, 0.135467529296875, 0.14281463623046875, 0.1501617431640625, 0.15750885009765625, 0.16485595703125, 0.17220306396484375, 0.1795501708984375, 0.18689727783203125, 0.194244384765625, 0.20159149169921875, 0.2089385986328125, 0.21628570556640625, 0.2236328125]}, "gradients/decoder.bert.encoder.layer.2.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 7.0, 7.0, 13.0, 20.0, 19.0, 22.0, 26.0, 35.0, 52.0, 56.0, 56.0, 65.0, 52.0, 63.0, 69.0, 56.0, 50.0, 52.0, 43.0, 31.0, 42.0, 27.0, 24.0, 18.0, 16.0, 19.0, 11.0, 12.0, 3.0, 4.0, 8.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08172607421875, -0.07924365997314453, -0.07676124572753906, -0.0742788314819336, -0.07179641723632812, -0.06931400299072266, -0.06683158874511719, -0.06434917449951172, -0.06186676025390625, -0.05938434600830078, -0.05690193176269531, -0.054419517517089844, -0.051937103271484375, -0.049454689025878906, -0.04697227478027344, -0.04448986053466797, -0.0420074462890625, -0.03952503204345703, -0.03704261779785156, -0.034560203552246094, -0.032077789306640625, -0.029595375061035156, -0.027112960815429688, -0.02463054656982422, -0.02214813232421875, -0.01966571807861328, -0.017183303833007812, -0.014700889587402344, -0.012218475341796875, -0.009736061096191406, -0.0072536468505859375, -0.004771232604980469, -0.002288818359375, 0.00019359588623046875, 0.0026760101318359375, 0.005158424377441406, 0.007640838623046875, 0.010123252868652344, 0.012605667114257812, 0.015088081359863281, 0.01757049560546875, 0.02005290985107422, 0.022535324096679688, 0.025017738342285156, 0.027500152587890625, 0.029982566833496094, 0.03246498107910156, 0.03494739532470703, 0.0374298095703125, 0.03991222381591797, 0.04239463806152344, 0.044877052307128906, 0.047359466552734375, 0.049841880798339844, 0.05232429504394531, 0.05480670928955078, 0.05728912353515625, 0.05977153778076172, 0.06225395202636719, 0.06473636627197266, 0.06721878051757812, 0.0697011947631836, 0.07218360900878906, 0.07466602325439453, 0.0771484375]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 1.0, 6.0, 9.0, 7.0, 11.0, 11.0, 15.0, 16.0, 21.0, 20.0, 29.0, 38.0, 37.0, 51.0, 41.0, 59.0, 60.0, 69.0, 53.0, 73.0, 56.0, 40.0, 56.0, 44.0, 40.0, 25.0, 27.0, 22.0, 14.0, 13.0, 11.0, 8.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-17.484338760375977, -17.033742904663086, -16.583148956298828, -16.132553100585938, -15.681957244873047, -15.231362342834473, -14.780767440795898, -14.330171585083008, -13.879576683044434, -13.42898178100586, -12.978385925292969, -12.527791023254395, -12.07719612121582, -11.62660026550293, -11.176005363464355, -10.725410461425781, -10.27481460571289, -9.824219703674316, -9.373623847961426, -8.923028945922852, -8.472433090209961, -8.021838188171387, -7.5712432861328125, -7.12064790725708, -6.670052528381348, -6.219457149505615, -5.768861770629883, -5.318266868591309, -4.867671489715576, -4.417076110839844, -3.9664809703826904, -3.515885829925537, -3.0652894973754883, -2.614694118499756, -2.1640989780426025, -1.7135037183761597, -1.2629084587097168, -0.8123130798339844, -0.36171793937683105, 0.08887720108032227, 0.5394725799560547, 0.9900678396224976, 1.4406630992889404, 1.8912583589553833, 2.341853618621826, 2.7924489974975586, 3.243044137954712, 3.6936392784118652, 4.144234657287598, 4.59483003616333, 5.0454254150390625, 5.496020317077637, 5.946615695953369, 6.397211074829102, 6.847805976867676, 7.298401355743408, 7.748996734619141, 8.199591636657715, 8.650187492370605, 9.10078239440918, 9.55137825012207, 10.001973152160645, 10.452568054199219, 10.90316390991211, 11.353758811950684]}, "gradients/decoder.bert.encoder.layer.2.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 4.0, 5.0, 6.0, 5.0, 6.0, 9.0, 11.0, 8.0, 16.0, 19.0, 18.0, 13.0, 17.0, 22.0, 25.0, 33.0, 34.0, 27.0, 36.0, 38.0, 36.0, 31.0, 31.0, 34.0, 30.0, 35.0, 34.0, 43.0, 32.0, 44.0, 33.0, 29.0, 35.0, 19.0, 24.0, 22.0, 16.0, 15.0, 15.0, 20.0, 7.0, 14.0, 10.0, 11.0, 12.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0], "bins": [-7.346375942230225, -7.1301188468933105, -6.913861274719238, -6.697604179382324, -6.48134708404541, -6.265089511871338, -6.048832416534424, -5.832574844360352, -5.6163177490234375, -5.400060653686523, -5.183803081512451, -4.967545986175537, -4.751288890838623, -4.535031318664551, -4.318774223327637, -4.102517127990723, -3.8862597942352295, -3.6700024604797363, -3.4537453651428223, -3.237488031387329, -3.021230697631836, -2.804973602294922, -2.5887162685394287, -2.3724589347839355, -2.1562018394470215, -1.9399446249008179, -1.7236872911453247, -1.507430076599121, -1.291172742843628, -1.0749155282974243, -0.8586583137512207, -0.6424009799957275, -0.4261436462402344, -0.20988638699054718, 0.006370872259140015, 0.22262811660766602, 0.4388853907585144, 0.6551426649093628, 0.8713998794555664, 1.0876572132110596, 1.3039144277572632, 1.5201716423034668, 1.73642897605896, 1.9526861906051636, 2.168943405151367, 2.3852007389068604, 2.6014580726623535, 2.8177151679992676, 3.0339725017547607, 3.250229835510254, 3.466486930847168, 3.682744264602661, 3.8990015983581543, 4.115258693695068, 4.331516265869141, 4.547773361206055, 4.764030456542969, 4.980287551879883, 5.196545124053955, 5.412802219390869, 5.629059314727783, 5.8453168869018555, 6.0615739822387695, 6.277831077575684, 6.494088649749756]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 7.0, 12.0, 9.0, 15.0, 27.0, 38.0, 54.0, 95.0, 171.0, 216.0, 327.0, 537.0, 832.0, 1340.0, 2107.0, 3418.0, 5432.0, 9032.0, 14908.0, 24689.0, 40779.0, 66387.0, 102621.0, 142483.0, 163895.0, 152142.0, 116363.0, 77741.0, 47921.0, 29417.0, 17544.0, 10856.0, 6448.0, 3930.0, 2448.0, 1617.0, 945.0, 643.0, 399.0, 242.0, 150.0, 110.0, 70.0, 53.0, 28.0, 18.0, 15.0, 8.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0], "bins": [-8.9140625, -8.6492919921875, -8.384521484375, -8.1197509765625, -7.85498046875, -7.5902099609375, -7.325439453125, -7.0606689453125, -6.7958984375, -6.5311279296875, -6.266357421875, -6.0015869140625, -5.73681640625, -5.4720458984375, -5.207275390625, -4.9425048828125, -4.677734375, -4.4129638671875, -4.148193359375, -3.8834228515625, -3.61865234375, -3.3538818359375, -3.089111328125, -2.8243408203125, -2.5595703125, -2.2947998046875, -2.030029296875, -1.7652587890625, -1.50048828125, -1.2357177734375, -0.970947265625, -0.7061767578125, -0.44140625, -0.1766357421875, 0.088134765625, 0.3529052734375, 0.61767578125, 0.8824462890625, 1.147216796875, 1.4119873046875, 1.6767578125, 1.9415283203125, 2.206298828125, 2.4710693359375, 2.73583984375, 3.0006103515625, 3.265380859375, 3.5301513671875, 3.794921875, 4.0596923828125, 4.324462890625, 4.5892333984375, 4.85400390625, 5.1187744140625, 5.383544921875, 5.6483154296875, 5.9130859375, 6.1778564453125, 6.442626953125, 6.7073974609375, 6.97216796875, 7.2369384765625, 7.501708984375, 7.7664794921875, 8.03125]}, "gradients/decoder.bert.encoder.layer.2.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 5.0, 7.0, 3.0, 12.0, 4.0, 6.0, 11.0, 11.0, 23.0, 17.0, 18.0, 21.0, 24.0, 33.0, 34.0, 32.0, 33.0, 24.0, 34.0, 41.0, 29.0, 46.0, 49.0, 33.0, 38.0, 32.0, 35.0, 35.0, 29.0, 29.0, 35.0, 24.0, 28.0, 23.0, 22.0, 15.0, 18.0, 9.0, 14.0, 9.0, 11.0, 7.0, 9.0, 2.0, 5.0, 8.0, 5.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 3.0], "bins": [-7.91796875, -7.6763916015625, -7.434814453125, -7.1932373046875, -6.95166015625, -6.7100830078125, -6.468505859375, -6.2269287109375, -5.9853515625, -5.7437744140625, -5.502197265625, -5.2606201171875, -5.01904296875, -4.7774658203125, -4.535888671875, -4.2943115234375, -4.052734375, -3.8111572265625, -3.569580078125, -3.3280029296875, -3.08642578125, -2.8448486328125, -2.603271484375, -2.3616943359375, -2.1201171875, -1.8785400390625, -1.636962890625, -1.3953857421875, -1.15380859375, -0.9122314453125, -0.670654296875, -0.4290771484375, -0.1875, 0.0540771484375, 0.295654296875, 0.5372314453125, 0.77880859375, 1.0203857421875, 1.261962890625, 1.5035400390625, 1.7451171875, 1.9866943359375, 2.228271484375, 2.4698486328125, 2.71142578125, 2.9530029296875, 3.194580078125, 3.4361572265625, 3.677734375, 3.9193115234375, 4.160888671875, 4.4024658203125, 4.64404296875, 4.8856201171875, 5.127197265625, 5.3687744140625, 5.6103515625, 5.8519287109375, 6.093505859375, 6.3350830078125, 6.57666015625, 6.8182373046875, 7.059814453125, 7.3013916015625, 7.54296875]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 13.0, 17.0, 27.0, 48.0, 88.0, 178.0, 286.0, 424.0, 826.0, 1364.0, 2463.0, 4261.0, 7702.0, 14269.0, 25728.0, 46444.0, 82109.0, 133880.0, 181475.0, 187777.0, 146015.0, 93441.0, 53451.0, 29680.0, 16181.0, 9036.0, 4965.0, 2734.0, 1529.0, 884.0, 507.0, 324.0, 180.0, 90.0, 63.0, 36.0, 17.0, 17.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.9962158203125, -9.664306640625, -9.3323974609375, -9.00048828125, -8.6685791015625, -8.336669921875, -8.0047607421875, -7.6728515625, -7.3409423828125, -7.009033203125, -6.6771240234375, -6.34521484375, -6.0133056640625, -5.681396484375, -5.3494873046875, -5.017578125, -4.6856689453125, -4.353759765625, -4.0218505859375, -3.68994140625, -3.3580322265625, -3.026123046875, -2.6942138671875, -2.3623046875, -2.0303955078125, -1.698486328125, -1.3665771484375, -1.03466796875, -0.7027587890625, -0.370849609375, -0.0389404296875, 0.29296875, 0.6248779296875, 0.956787109375, 1.2886962890625, 1.62060546875, 1.9525146484375, 2.284423828125, 2.6163330078125, 2.9482421875, 3.2801513671875, 3.612060546875, 3.9439697265625, 4.27587890625, 4.6077880859375, 4.939697265625, 5.2716064453125, 5.603515625, 5.9354248046875, 6.267333984375, 6.5992431640625, 6.93115234375, 7.2630615234375, 7.594970703125, 7.9268798828125, 8.2587890625, 8.5906982421875, 8.922607421875, 9.2545166015625, 9.58642578125, 9.9183349609375, 10.250244140625, 10.5821533203125, 10.9140625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 7.0, 2.0, 6.0, 6.0, 15.0, 15.0, 7.0, 14.0, 12.0, 19.0, 22.0, 31.0, 30.0, 31.0, 39.0, 38.0, 24.0, 35.0, 36.0, 34.0, 47.0, 42.0, 52.0, 50.0, 42.0, 38.0, 32.0, 28.0, 36.0, 34.0, 27.0, 14.0, 22.0, 30.0, 21.0, 10.0, 7.0, 10.0, 9.0, 11.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.76654052734375, -4.5877685546875, -4.40899658203125, -4.230224609375, -4.05145263671875, -3.8726806640625, -3.69390869140625, -3.51513671875, -3.33636474609375, -3.1575927734375, -2.97882080078125, -2.800048828125, -2.62127685546875, -2.4425048828125, -2.26373291015625, -2.0849609375, -1.90618896484375, -1.7274169921875, -1.54864501953125, -1.369873046875, -1.19110107421875, -1.0123291015625, -0.83355712890625, -0.65478515625, -0.47601318359375, -0.2972412109375, -0.11846923828125, 0.060302734375, 0.23907470703125, 0.4178466796875, 0.59661865234375, 0.775390625, 0.95416259765625, 1.1329345703125, 1.31170654296875, 1.490478515625, 1.66925048828125, 1.8480224609375, 2.02679443359375, 2.20556640625, 2.38433837890625, 2.5631103515625, 2.74188232421875, 2.920654296875, 3.09942626953125, 3.2781982421875, 3.45697021484375, 3.6357421875, 3.81451416015625, 3.9932861328125, 4.17205810546875, 4.350830078125, 4.52960205078125, 4.7083740234375, 4.88714599609375, 5.06591796875, 5.24468994140625, 5.4234619140625, 5.60223388671875, 5.781005859375, 5.95977783203125, 6.1385498046875, 6.31732177734375, 6.49609375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 6.0, 15.0, 35.0, 31.0, 65.0, 80.0, 128.0, 196.0, 321.0, 494.0, 820.0, 1156.0, 1854.0, 2959.0, 4857.0, 8694.0, 14560.0, 25172.0, 42976.0, 71320.0, 110362.0, 152835.0, 172268.0, 152630.0, 110268.0, 71044.0, 42230.0, 24970.0, 14510.0, 8396.0, 4997.0, 3020.0, 1935.0, 1203.0, 719.0, 501.0, 285.0, 217.0, 137.0, 93.0, 61.0, 49.0, 23.0, 20.0, 16.0, 6.0, 4.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.87109375, -4.7164306640625, -4.561767578125, -4.4071044921875, -4.25244140625, -4.0977783203125, -3.943115234375, -3.7884521484375, -3.6337890625, -3.4791259765625, -3.324462890625, -3.1697998046875, -3.01513671875, -2.8604736328125, -2.705810546875, -2.5511474609375, -2.396484375, -2.2418212890625, -2.087158203125, -1.9324951171875, -1.77783203125, -1.6231689453125, -1.468505859375, -1.3138427734375, -1.1591796875, -1.0045166015625, -0.849853515625, -0.6951904296875, -0.54052734375, -0.3858642578125, -0.231201171875, -0.0765380859375, 0.078125, 0.2327880859375, 0.387451171875, 0.5421142578125, 0.69677734375, 0.8514404296875, 1.006103515625, 1.1607666015625, 1.3154296875, 1.4700927734375, 1.624755859375, 1.7794189453125, 1.93408203125, 2.0887451171875, 2.243408203125, 2.3980712890625, 2.552734375, 2.7073974609375, 2.862060546875, 3.0167236328125, 3.17138671875, 3.3260498046875, 3.480712890625, 3.6353759765625, 3.7900390625, 3.9447021484375, 4.099365234375, 4.2540283203125, 4.40869140625, 4.5633544921875, 4.718017578125, 4.8726806640625, 5.02734375]}, "gradients/decoder.bert.encoder.layer.2.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 7.0, 8.0, 15.0, 13.0, 19.0, 15.0, 28.0, 27.0, 32.0, 58.0, 58.0, 41.0, 51.0, 83.0, 55.0, 56.0, 54.0, 61.0, 32.0, 43.0, 40.0, 33.0, 36.0, 22.0, 16.0, 10.0, 10.0, 16.0, 9.0, 8.0, 9.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005822181701660156, -0.0005652531981468201, -0.0005482882261276245, -0.000531323254108429, -0.0005143582820892334, -0.0004973933100700378, -0.0004804283380508423, -0.00046346336603164673, -0.00044649839401245117, -0.0004295334219932556, -0.00041256844997406006, -0.0003956034779548645, -0.00037863850593566895, -0.0003616735339164734, -0.00034470856189727783, -0.0003277435898780823, -0.0003107786178588867, -0.00029381364583969116, -0.0002768486738204956, -0.00025988370180130005, -0.0002429187297821045, -0.00022595375776290894, -0.00020898878574371338, -0.00019202381372451782, -0.00017505884170532227, -0.0001580938696861267, -0.00014112889766693115, -0.0001241639256477356, -0.00010719895362854004, -9.023398160934448e-05, -7.326900959014893e-05, -5.630403757095337e-05, -3.933906555175781e-05, -2.2374093532562256e-05, -5.409121513366699e-06, 1.1555850505828857e-05, 2.8520822525024414e-05, 4.548579454421997e-05, 6.245076656341553e-05, 7.941573858261108e-05, 9.638071060180664e-05, 0.0001133456826210022, 0.00013031065464019775, 0.0001472756266593933, 0.00016424059867858887, 0.00018120557069778442, 0.00019817054271697998, 0.00021513551473617554, 0.0002321004867553711, 0.00024906545877456665, 0.0002660304307937622, 0.00028299540281295776, 0.0002999603748321533, 0.0003169253468513489, 0.00033389031887054443, 0.00035085529088974, 0.00036782026290893555, 0.0003847852349281311, 0.00040175020694732666, 0.0004187151789665222, 0.0004356801509857178, 0.00045264512300491333, 0.0004696100950241089, 0.00048657506704330444, 0.0005035400390625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 14.0, 13.0, 10.0, 25.0, 30.0, 50.0, 81.0, 98.0, 153.0, 244.0, 312.0, 492.0, 786.0, 1106.0, 1841.0, 2763.0, 4324.0, 6721.0, 10682.0, 16942.0, 27009.0, 42369.0, 64631.0, 94083.0, 125514.0, 145516.0, 141430.0, 115895.0, 84974.0, 57735.0, 37662.0, 23999.0, 14980.0, 9402.0, 5797.0, 3761.0, 2443.0, 1569.0, 1041.0, 685.0, 467.0, 285.0, 198.0, 138.0, 89.0, 66.0, 44.0, 37.0, 24.0, 7.0, 10.0, 9.0, 4.0, 4.0, 1.0], "bins": [-4.90625, -4.7655029296875, -4.624755859375, -4.4840087890625, -4.34326171875, -4.2025146484375, -4.061767578125, -3.9210205078125, -3.7802734375, -3.6395263671875, -3.498779296875, -3.3580322265625, -3.21728515625, -3.0765380859375, -2.935791015625, -2.7950439453125, -2.654296875, -2.5135498046875, -2.372802734375, -2.2320556640625, -2.09130859375, -1.9505615234375, -1.809814453125, -1.6690673828125, -1.5283203125, -1.3875732421875, -1.246826171875, -1.1060791015625, -0.96533203125, -0.8245849609375, -0.683837890625, -0.5430908203125, -0.40234375, -0.2615966796875, -0.120849609375, 0.0198974609375, 0.16064453125, 0.3013916015625, 0.442138671875, 0.5828857421875, 0.7236328125, 0.8643798828125, 1.005126953125, 1.1458740234375, 1.28662109375, 1.4273681640625, 1.568115234375, 1.7088623046875, 1.849609375, 1.9903564453125, 2.131103515625, 2.2718505859375, 2.41259765625, 2.5533447265625, 2.694091796875, 2.8348388671875, 2.9755859375, 3.1163330078125, 3.257080078125, 3.3978271484375, 3.53857421875, 3.6793212890625, 3.820068359375, 3.9608154296875, 4.1015625]}, "gradients/decoder.bert.encoder.layer.2.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 13.0, 10.0, 8.0, 12.0, 15.0, 11.0, 23.0, 21.0, 23.0, 22.0, 29.0, 30.0, 30.0, 38.0, 59.0, 48.0, 45.0, 45.0, 48.0, 36.0, 42.0, 43.0, 41.0, 43.0, 43.0, 37.0, 30.0, 24.0, 22.0, 25.0, 11.0, 21.0, 6.0, 11.0, 10.0, 11.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.4775390625, -1.4342803955078125, -1.391021728515625, -1.3477630615234375, -1.30450439453125, -1.2612457275390625, -1.217987060546875, -1.1747283935546875, -1.1314697265625, -1.0882110595703125, -1.044952392578125, -1.0016937255859375, -0.95843505859375, -0.9151763916015625, -0.871917724609375, -0.8286590576171875, -0.785400390625, -0.7421417236328125, -0.698883056640625, -0.6556243896484375, -0.61236572265625, -0.5691070556640625, -0.525848388671875, -0.4825897216796875, -0.4393310546875, -0.3960723876953125, -0.352813720703125, -0.3095550537109375, -0.26629638671875, -0.2230377197265625, -0.179779052734375, -0.1365203857421875, -0.09326171875, -0.0500030517578125, -0.006744384765625, 0.0365142822265625, 0.07977294921875, 0.1230316162109375, 0.166290283203125, 0.2095489501953125, 0.2528076171875, 0.2960662841796875, 0.339324951171875, 0.3825836181640625, 0.42584228515625, 0.4691009521484375, 0.512359619140625, 0.5556182861328125, 0.598876953125, 0.6421356201171875, 0.685394287109375, 0.7286529541015625, 0.77191162109375, 0.8151702880859375, 0.858428955078125, 0.9016876220703125, 0.9449462890625, 0.9882049560546875, 1.031463623046875, 1.0747222900390625, 1.11798095703125, 1.1612396240234375, 1.204498291015625, 1.2477569580078125, 1.291015625]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 9.0, 9.0, 13.0, 19.0, 21.0, 19.0, 22.0, 21.0, 29.0, 32.0, 48.0, 58.0, 64.0, 42.0, 57.0, 77.0, 59.0, 52.0, 45.0, 60.0, 44.0, 27.0, 36.0, 23.0, 23.0, 12.0, 14.0, 22.0, 7.0, 6.0, 4.0, 8.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-17.58538246154785, -17.135787963867188, -16.686193466186523, -16.23659896850586, -15.787004470825195, -15.337409973144531, -14.887815475463867, -14.438220977783203, -13.988626480102539, -13.539031982421875, -13.089437484741211, -12.639842987060547, -12.190248489379883, -11.740653991699219, -11.291059494018555, -10.84146499633789, -10.391870498657227, -9.942276000976562, -9.492681503295898, -9.043087005615234, -8.59349250793457, -8.143898010253906, -7.694303512573242, -7.244709014892578, -6.795114517211914, -6.34552001953125, -5.895925521850586, -5.446331024169922, -4.996736526489258, -4.547142028808594, -4.09754753112793, -3.6479530334472656, -3.198357582092285, -2.748763084411621, -2.299168586730957, -1.849574089050293, -1.399979591369629, -0.9503850936889648, -0.5007905960083008, -0.05119609832763672, 0.39839839935302734, 0.8479928970336914, 1.2975873947143555, 1.7471818923950195, 2.1967763900756836, 2.6463708877563477, 3.0959653854370117, 3.545559883117676, 3.99515438079834, 4.444748878479004, 4.894343376159668, 5.343937873840332, 5.793532371520996, 6.24312686920166, 6.692721366882324, 7.142315864562988, 7.591910362243652, 8.041504859924316, 8.49109935760498, 8.940693855285645, 9.390288352966309, 9.839882850646973, 10.289477348327637, 10.7390718460083, 11.188666343688965]}, "gradients/decoder.bert.encoder.layer.1.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 10.0, 13.0, 10.0, 12.0, 12.0, 20.0, 26.0, 18.0, 20.0, 24.0, 27.0, 30.0, 28.0, 38.0, 36.0, 43.0, 36.0, 41.0, 38.0, 42.0, 36.0, 39.0, 40.0, 50.0, 25.0, 29.0, 28.0, 26.0, 23.0, 24.0, 19.0, 16.0, 20.0, 13.0, 13.0, 7.0, 12.0, 7.0, 7.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.953724384307861, -7.707611560821533, -7.461498737335205, -7.215385913848877, -6.969273090362549, -6.723160266876221, -6.477047443389893, -6.2309346199035645, -5.984821796417236, -5.738708972930908, -5.49259614944458, -5.246483325958252, -5.000370502471924, -4.754257678985596, -4.508144855499268, -4.2620320320129395, -4.015919208526611, -3.769806385040283, -3.523693561553955, -3.277580738067627, -3.031467914581299, -2.7853550910949707, -2.5392422676086426, -2.2931294441223145, -2.0470166206359863, -1.8009037971496582, -1.55479097366333, -1.308678150177002, -1.0625653266906738, -0.8164525032043457, -0.5703396797180176, -0.32422685623168945, -0.07811403274536133, 0.1679987907409668, 0.4141116142272949, 0.660224437713623, 0.9063372611999512, 1.1524500846862793, 1.3985629081726074, 1.6446757316589355, 1.8907885551452637, 2.136901378631592, 2.38301420211792, 2.629127025604248, 2.875239849090576, 3.1213526725769043, 3.3674654960632324, 3.6135783195495605, 3.8596911430358887, 4.105803966522217, 4.351916790008545, 4.598029613494873, 4.844142436981201, 5.090255260467529, 5.336368083953857, 5.5824809074401855, 5.828593730926514, 6.074706554412842, 6.32081937789917, 6.566932201385498, 6.813045024871826, 7.059157848358154, 7.305270671844482, 7.5513834953308105, 7.797496318817139]}, "gradients/decoder.bert.encoder.layer.1.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 10.0, 9.0, 15.0, 11.0, 30.0, 30.0, 76.0, 68.0, 104.0, 179.0, 239.0, 333.0, 558.0, 780.0, 1191.0, 1792.0, 2729.0, 4202.0, 6833.0, 11256.0, 19449.0, 34943.0, 66782.0, 137725.0, 299143.0, 635918.0, 1037037.0, 941644.0, 515907.0, 237344.0, 111658.0, 55538.0, 29473.0, 16077.0, 9503.0, 5779.0, 3524.0, 2242.0, 1456.0, 894.0, 614.0, 427.0, 266.0, 164.0, 118.0, 68.0, 48.0, 35.0, 30.0, 12.0, 8.0, 1.0, 3.0, 4.0, 2.0, 2.0], "bins": [-15.8984375, -15.4422607421875, -14.986083984375, -14.5299072265625, -14.07373046875, -13.6175537109375, -13.161376953125, -12.7052001953125, -12.2490234375, -11.7928466796875, -11.336669921875, -10.8804931640625, -10.42431640625, -9.9681396484375, -9.511962890625, -9.0557861328125, -8.599609375, -8.1434326171875, -7.687255859375, -7.2310791015625, -6.77490234375, -6.3187255859375, -5.862548828125, -5.4063720703125, -4.9501953125, -4.4940185546875, -4.037841796875, -3.5816650390625, -3.12548828125, -2.6693115234375, -2.213134765625, -1.7569580078125, -1.30078125, -0.8446044921875, -0.388427734375, 0.0677490234375, 0.52392578125, 0.9801025390625, 1.436279296875, 1.8924560546875, 2.3486328125, 2.8048095703125, 3.260986328125, 3.7171630859375, 4.17333984375, 4.6295166015625, 5.085693359375, 5.5418701171875, 5.998046875, 6.4542236328125, 6.910400390625, 7.3665771484375, 7.82275390625, 8.2789306640625, 8.735107421875, 9.1912841796875, 9.6474609375, 10.1036376953125, 10.559814453125, 11.0159912109375, 11.47216796875, 11.9283447265625, 12.384521484375, 12.8406982421875, 13.296875]}, "gradients/decoder.bert.encoder.layer.1.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 9.0, 8.0, 7.0, 12.0, 12.0, 16.0, 13.0, 20.0, 17.0, 10.0, 22.0, 22.0, 36.0, 29.0, 34.0, 47.0, 35.0, 44.0, 40.0, 41.0, 50.0, 48.0, 46.0, 42.0, 41.0, 31.0, 29.0, 38.0, 30.0, 24.0, 23.0, 22.0, 19.0, 8.0, 13.0, 11.0, 8.0, 6.0, 8.0, 5.0, 4.0, 5.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-8.421875, -8.17510986328125, -7.9283447265625, -7.68157958984375, -7.434814453125, -7.18804931640625, -6.9412841796875, -6.69451904296875, -6.44775390625, -6.20098876953125, -5.9542236328125, -5.70745849609375, -5.460693359375, -5.21392822265625, -4.9671630859375, -4.72039794921875, -4.4736328125, -4.22686767578125, -3.9801025390625, -3.73333740234375, -3.486572265625, -3.23980712890625, -2.9930419921875, -2.74627685546875, -2.49951171875, -2.25274658203125, -2.0059814453125, -1.75921630859375, -1.512451171875, -1.26568603515625, -1.0189208984375, -0.77215576171875, -0.525390625, -0.27862548828125, -0.0318603515625, 0.21490478515625, 0.461669921875, 0.70843505859375, 0.9552001953125, 1.20196533203125, 1.44873046875, 1.69549560546875, 1.9422607421875, 2.18902587890625, 2.435791015625, 2.68255615234375, 2.9293212890625, 3.17608642578125, 3.4228515625, 3.66961669921875, 3.9163818359375, 4.16314697265625, 4.409912109375, 4.65667724609375, 4.9034423828125, 5.15020751953125, 5.39697265625, 5.64373779296875, 5.8905029296875, 6.13726806640625, 6.384033203125, 6.63079833984375, 6.8775634765625, 7.12432861328125, 7.37109375]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 6.0, 10.0, 11.0, 11.0, 28.0, 40.0, 70.0, 98.0, 131.0, 155.0, 270.0, 362.0, 565.0, 747.0, 1184.0, 1742.0, 2706.0, 4479.0, 7181.0, 12200.0, 21397.0, 38227.0, 71384.0, 138100.0, 281038.0, 567213.0, 962885.0, 952815.0, 556992.0, 275062.0, 136733.0, 69928.0, 37858.0, 20995.0, 12239.0, 7228.0, 4362.0, 2689.0, 1681.0, 1165.0, 722.0, 502.0, 336.0, 236.0, 159.0, 114.0, 73.0, 46.0, 29.0, 31.0, 21.0, 7.0, 13.0, 3.0, 7.0, 3.0, 2.0, 1.0, 3.0], "bins": [-18.90625, -18.315185546875, -17.72412109375, -17.133056640625, -16.5419921875, -15.950927734375, -15.35986328125, -14.768798828125, -14.177734375, -13.586669921875, -12.99560546875, -12.404541015625, -11.8134765625, -11.222412109375, -10.63134765625, -10.040283203125, -9.44921875, -8.858154296875, -8.26708984375, -7.676025390625, -7.0849609375, -6.493896484375, -5.90283203125, -5.311767578125, -4.720703125, -4.129638671875, -3.53857421875, -2.947509765625, -2.3564453125, -1.765380859375, -1.17431640625, -0.583251953125, 0.0078125, 0.598876953125, 1.18994140625, 1.781005859375, 2.3720703125, 2.963134765625, 3.55419921875, 4.145263671875, 4.736328125, 5.327392578125, 5.91845703125, 6.509521484375, 7.1005859375, 7.691650390625, 8.28271484375, 8.873779296875, 9.46484375, 10.055908203125, 10.64697265625, 11.238037109375, 11.8291015625, 12.420166015625, 13.01123046875, 13.602294921875, 14.193359375, 14.784423828125, 15.37548828125, 15.966552734375, 16.5576171875, 17.148681640625, 17.73974609375, 18.330810546875, 18.921875]}, "gradients/decoder.bert.encoder.layer.1.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 6.0, 4.0, 3.0, 5.0, 7.0, 13.0, 10.0, 16.0, 29.0, 28.0, 33.0, 55.0, 60.0, 79.0, 107.0, 115.0, 161.0, 188.0, 229.0, 227.0, 280.0, 287.0, 304.0, 251.0, 243.0, 223.0, 214.0, 173.0, 155.0, 112.0, 103.0, 85.0, 70.0, 43.0, 30.0, 29.0, 24.0, 21.0, 12.0, 14.0, 7.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.4921875, -5.31744384765625, -5.1427001953125, -4.96795654296875, -4.793212890625, -4.61846923828125, -4.4437255859375, -4.26898193359375, -4.09423828125, -3.91949462890625, -3.7447509765625, -3.57000732421875, -3.395263671875, -3.22052001953125, -3.0457763671875, -2.87103271484375, -2.6962890625, -2.52154541015625, -2.3468017578125, -2.17205810546875, -1.997314453125, -1.82257080078125, -1.6478271484375, -1.47308349609375, -1.29833984375, -1.12359619140625, -0.9488525390625, -0.77410888671875, -0.599365234375, -0.42462158203125, -0.2498779296875, -0.07513427734375, 0.099609375, 0.27435302734375, 0.4490966796875, 0.62384033203125, 0.798583984375, 0.97332763671875, 1.1480712890625, 1.32281494140625, 1.49755859375, 1.67230224609375, 1.8470458984375, 2.02178955078125, 2.196533203125, 2.37127685546875, 2.5460205078125, 2.72076416015625, 2.8955078125, 3.07025146484375, 3.2449951171875, 3.41973876953125, 3.594482421875, 3.76922607421875, 3.9439697265625, 4.11871337890625, 4.29345703125, 4.46820068359375, 4.6429443359375, 4.81768798828125, 4.992431640625, 5.16717529296875, 5.3419189453125, 5.51666259765625, 5.69140625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 3.0, 3.0, 5.0, 11.0, 16.0, 14.0, 20.0, 23.0, 40.0, 39.0, 42.0, 71.0, 64.0, 73.0, 85.0, 58.0, 69.0, 68.0, 47.0, 56.0, 40.0, 35.0, 23.0, 16.0, 16.0, 15.0, 14.0, 14.0, 4.0, 1.0, 7.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.666440963745117, -22.970821380615234, -22.27520179748535, -21.57958221435547, -20.88396453857422, -20.188344955444336, -19.492725372314453, -18.79710578918457, -18.101486206054688, -17.405866622924805, -16.710247039794922, -16.014629364013672, -15.319009780883789, -14.623390197753906, -13.927770614624023, -13.23215103149414, -12.53653335571289, -11.840913772583008, -11.145295143127441, -10.449675559997559, -9.754056930541992, -9.05843734741211, -8.362817764282227, -7.667198657989502, -6.971579551696777, -6.275960445404053, -5.580341339111328, -4.884721755981445, -4.189102649688721, -3.493483543395996, -2.7978639602661133, -2.1022448539733887, -1.4066276550292969, -0.7110084295272827, -0.015389204025268555, 0.6802301406860352, 1.3758492469787598, 2.0714683532714844, 2.767087936401367, 3.462707042694092, 4.158326148986816, 4.853945255279541, 5.549564361572266, 6.245183944702148, 6.940803050994873, 7.636422157287598, 8.33204174041748, 9.027660369873047, 9.72327995300293, 10.418899536132812, 11.114518165588379, 11.810137748718262, 12.505756378173828, 13.201375961303711, 13.896995544433594, 14.592615127563477, 15.288233757019043, 15.983853340148926, 16.679471969604492, 17.375091552734375, 18.070711135864258, 18.76633071899414, 19.46194839477539, 20.157567977905273, 20.853187561035156]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 10.0, 16.0, 2.0, 8.0, 9.0, 10.0, 19.0, 21.0, 12.0, 19.0, 22.0, 28.0, 32.0, 33.0, 31.0, 39.0, 39.0, 33.0, 47.0, 38.0, 34.0, 36.0, 48.0, 33.0, 46.0, 39.0, 29.0, 27.0, 24.0, 29.0, 33.0, 21.0, 23.0, 18.0, 13.0, 8.0, 11.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-9.95065975189209, -9.642020225524902, -9.333381652832031, -9.024742126464844, -8.716102600097656, -8.407463073730469, -8.098823547363281, -7.79018497467041, -7.481545448303223, -7.172905921936035, -6.864266872406006, -6.555627822875977, -6.246988296508789, -5.938348770141602, -5.629709720611572, -5.321070671081543, -5.0124311447143555, -4.703791618347168, -4.395152568817139, -4.086513519287109, -3.777873992919922, -3.4692347049713135, -3.160595417022705, -2.8519561290740967, -2.5433168411254883, -2.23467755317688, -1.9260382652282715, -1.617398977279663, -1.3087596893310547, -1.0001204013824463, -0.6914811134338379, -0.3828418254852295, -0.0742034912109375, 0.2344357967376709, 0.5430750846862793, 0.8517143726348877, 1.160353660583496, 1.4689929485321045, 1.777632236480713, 2.0862715244293213, 2.3949108123779297, 2.703550100326538, 3.0121893882751465, 3.320828676223755, 3.6294679641723633, 3.9381072521209717, 4.24674654006958, 4.555385589599609, 4.864025115966797, 5.172664642333984, 5.481303691864014, 5.789942741394043, 6.0985822677612305, 6.407221794128418, 6.715860843658447, 7.024499893188477, 7.333139419555664, 7.641778945922852, 7.950417995452881, 8.25905704498291, 8.567696571350098, 8.876336097717285, 9.184974670410156, 9.493614196777344, 9.802253723144531]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 12.0, 17.0, 21.0, 18.0, 31.0, 38.0, 63.0, 85.0, 112.0, 194.0, 248.0, 350.0, 505.0, 777.0, 1111.0, 1745.0, 2516.0, 3873.0, 6105.0, 9765.0, 15929.0, 26572.0, 45568.0, 79688.0, 136007.0, 200244.0, 196743.0, 131516.0, 76686.0, 44003.0, 25536.0, 15416.0, 9493.0, 5883.0, 3840.0, 2512.0, 1681.0, 1128.0, 774.0, 572.0, 359.0, 241.0, 172.0, 126.0, 78.0, 61.0, 48.0, 33.0, 21.0, 13.0, 12.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-1.4287109375, -1.3840179443359375, -1.339324951171875, -1.2946319580078125, -1.24993896484375, -1.2052459716796875, -1.160552978515625, -1.1158599853515625, -1.0711669921875, -1.0264739990234375, -0.981781005859375, -0.9370880126953125, -0.89239501953125, -0.8477020263671875, -0.803009033203125, -0.7583160400390625, -0.713623046875, -0.6689300537109375, -0.624237060546875, -0.5795440673828125, -0.53485107421875, -0.4901580810546875, -0.445465087890625, -0.4007720947265625, -0.3560791015625, -0.3113861083984375, -0.266693115234375, -0.2220001220703125, -0.17730712890625, -0.1326141357421875, -0.087921142578125, -0.0432281494140625, 0.00146484375, 0.0461578369140625, 0.090850830078125, 0.1355438232421875, 0.18023681640625, 0.2249298095703125, 0.269622802734375, 0.3143157958984375, 0.3590087890625, 0.4037017822265625, 0.448394775390625, 0.4930877685546875, 0.53778076171875, 0.5824737548828125, 0.627166748046875, 0.6718597412109375, 0.716552734375, 0.7612457275390625, 0.805938720703125, 0.8506317138671875, 0.89532470703125, 0.9400177001953125, 0.984710693359375, 1.0294036865234375, 1.0740966796875, 1.1187896728515625, 1.163482666015625, 1.2081756591796875, 1.25286865234375, 1.2975616455078125, 1.342254638671875, 1.3869476318359375, 1.431640625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.output.dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 8.0, 5.0, 7.0, 6.0, 8.0, 9.0, 12.0, 21.0, 21.0, 21.0, 21.0, 22.0, 36.0, 33.0, 30.0, 38.0, 49.0, 50.0, 48.0, 40.0, 55.0, 47.0, 36.0, 39.0, 38.0, 38.0, 27.0, 36.0, 18.0, 29.0, 25.0, 17.0, 17.0, 14.0, 17.0, 10.0, 5.0, 10.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.162109375, -10.79296875, -10.423828125, -10.0546875, -9.685546875, -9.31640625, -8.947265625, -8.578125, -8.208984375, -7.83984375, -7.470703125, -7.1015625, -6.732421875, -6.36328125, -5.994140625, -5.625, -5.255859375, -4.88671875, -4.517578125, -4.1484375, -3.779296875, -3.41015625, -3.041015625, -2.671875, -2.302734375, -1.93359375, -1.564453125, -1.1953125, -0.826171875, -0.45703125, -0.087890625, 0.28125, 0.650390625, 1.01953125, 1.388671875, 1.7578125, 2.126953125, 2.49609375, 2.865234375, 3.234375, 3.603515625, 3.97265625, 4.341796875, 4.7109375, 5.080078125, 5.44921875, 5.818359375, 6.1875, 6.556640625, 6.92578125, 7.294921875, 7.6640625, 8.033203125, 8.40234375, 8.771484375, 9.140625, 9.509765625, 9.87890625, 10.248046875, 10.6171875, 10.986328125, 11.35546875, 11.724609375, 12.09375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 10.0, 10.0, 14.0, 18.0, 28.0, 51.0, 70.0, 102.0, 138.0, 200.0, 372.0, 594.0, 989.0, 1758.0, 3606.0, 7583.0, 19085.0, 95487.0, 852141.0, 41233.0, 13283.0, 5621.0, 2684.0, 1443.0, 813.0, 479.0, 247.0, 157.0, 130.0, 70.0, 50.0, 36.0, 18.0, 14.0, 9.0, 10.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.91241455078125, -4.7388916015625, -4.56536865234375, -4.391845703125, -4.21832275390625, -4.0447998046875, -3.87127685546875, -3.69775390625, -3.52423095703125, -3.3507080078125, -3.17718505859375, -3.003662109375, -2.83013916015625, -2.6566162109375, -2.48309326171875, -2.3095703125, -2.13604736328125, -1.9625244140625, -1.78900146484375, -1.615478515625, -1.44195556640625, -1.2684326171875, -1.09490966796875, -0.92138671875, -0.74786376953125, -0.5743408203125, -0.40081787109375, -0.227294921875, -0.05377197265625, 0.1197509765625, 0.29327392578125, 0.466796875, 0.64031982421875, 0.8138427734375, 0.98736572265625, 1.160888671875, 1.33441162109375, 1.5079345703125, 1.68145751953125, 1.85498046875, 2.02850341796875, 2.2020263671875, 2.37554931640625, 2.549072265625, 2.72259521484375, 2.8961181640625, 3.06964111328125, 3.2431640625, 3.41668701171875, 3.5902099609375, 3.76373291015625, 3.937255859375, 4.11077880859375, 4.2843017578125, 4.45782470703125, 4.63134765625, 4.80487060546875, 4.9783935546875, 5.15191650390625, 5.325439453125, 5.49896240234375, 5.6724853515625, 5.84600830078125, 6.01953125]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.value.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 8.0, 4.0, 5.0, 18.0, 10.0, 24.0, 15.0, 22.0, 18.0, 26.0, 23.0, 41.0, 30.0, 33.0, 33.0, 34.0, 51.0, 47.0, 53.0, 39.0, 43.0, 47.0, 34.0, 41.0, 36.0, 36.0, 41.0, 12.0, 23.0, 26.0, 18.0, 25.0, 21.0, 9.0, 6.0, 11.0, 11.0, 5.0, 5.0, 6.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30859375, -7.06488037109375, -6.8211669921875, -6.57745361328125, -6.333740234375, -6.09002685546875, -5.8463134765625, -5.60260009765625, -5.35888671875, -5.11517333984375, -4.8714599609375, -4.62774658203125, -4.384033203125, -4.14031982421875, -3.8966064453125, -3.65289306640625, -3.4091796875, -3.16546630859375, -2.9217529296875, -2.67803955078125, -2.434326171875, -2.19061279296875, -1.9468994140625, -1.70318603515625, -1.45947265625, -1.21575927734375, -0.9720458984375, -0.72833251953125, -0.484619140625, -0.24090576171875, 0.0028076171875, 0.24652099609375, 0.490234375, 0.73394775390625, 0.9776611328125, 1.22137451171875, 1.465087890625, 1.70880126953125, 1.9525146484375, 2.19622802734375, 2.43994140625, 2.68365478515625, 2.9273681640625, 3.17108154296875, 3.414794921875, 3.65850830078125, 3.9022216796875, 4.14593505859375, 4.3896484375, 4.63336181640625, 4.8770751953125, 5.12078857421875, 5.364501953125, 5.60821533203125, 5.8519287109375, 6.09564208984375, 6.33935546875, 6.58306884765625, 6.8267822265625, 7.07049560546875, 7.314208984375, 7.55792236328125, 7.8016357421875, 8.04534912109375, 8.2890625]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 10.0, 16.0, 13.0, 27.0, 29.0, 60.0, 78.0, 118.0, 186.0, 248.0, 400.0, 615.0, 912.0, 1514.0, 2380.0, 4220.0, 7382.0, 14189.0, 30082.0, 751396.0, 182100.0, 24412.0, 12132.0, 6397.0, 3654.0, 2121.0, 1340.0, 821.0, 531.0, 367.0, 257.0, 168.0, 117.0, 82.0, 52.0, 33.0, 26.0, 16.0, 19.0, 11.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.87255859375, -0.8460235595703125, -0.819488525390625, -0.7929534912109375, -0.76641845703125, -0.7398834228515625, -0.713348388671875, -0.6868133544921875, -0.6602783203125, -0.6337432861328125, -0.607208251953125, -0.5806732177734375, -0.55413818359375, -0.5276031494140625, -0.501068115234375, -0.4745330810546875, -0.447998046875, -0.4214630126953125, -0.394927978515625, -0.3683929443359375, -0.34185791015625, -0.3153228759765625, -0.288787841796875, -0.2622528076171875, -0.2357177734375, -0.2091827392578125, -0.182647705078125, -0.1561126708984375, -0.12957763671875, -0.1030426025390625, -0.076507568359375, -0.0499725341796875, -0.0234375, 0.0030975341796875, 0.029632568359375, 0.0561676025390625, 0.08270263671875, 0.1092376708984375, 0.135772705078125, 0.1623077392578125, 0.1888427734375, 0.2153778076171875, 0.241912841796875, 0.2684478759765625, 0.29498291015625, 0.3215179443359375, 0.348052978515625, 0.3745880126953125, 0.401123046875, 0.4276580810546875, 0.454193115234375, 0.4807281494140625, 0.50726318359375, 0.5337982177734375, 0.560333251953125, 0.5868682861328125, 0.6134033203125, 0.6399383544921875, 0.666473388671875, 0.6930084228515625, 0.71954345703125, 0.7460784912109375, 0.772613525390625, 0.7991485595703125, 0.82568359375]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 4.0, 3.0, 7.0, 7.0, 12.0, 14.0, 16.0, 15.0, 19.0, 34.0, 24.0, 26.0, 39.0, 45.0, 50.0, 51.0, 54.0, 46.0, 42.0, 54.0, 45.0, 41.0, 45.0, 57.0, 42.0, 35.0, 24.0, 22.0, 16.0, 21.0, 20.0, 11.0, 15.0, 10.0, 5.0, 7.0, 4.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2470951080322266e-05, -2.1656975150108337e-05, -2.084299921989441e-05, -2.002902328968048e-05, -1.9215047359466553e-05, -1.8401071429252625e-05, -1.7587095499038696e-05, -1.6773119568824768e-05, -1.595914363861084e-05, -1.5145167708396912e-05, -1.4331191778182983e-05, -1.3517215847969055e-05, -1.2703239917755127e-05, -1.1889263987541199e-05, -1.107528805732727e-05, -1.0261312127113342e-05, -9.447336196899414e-06, -8.633360266685486e-06, -7.819384336471558e-06, -7.005408406257629e-06, -6.191432476043701e-06, -5.377456545829773e-06, -4.563480615615845e-06, -3.7495046854019165e-06, -2.9355287551879883e-06, -2.12155282497406e-06, -1.3075768947601318e-06, -4.936009645462036e-07, 3.203749656677246e-07, 1.1343508958816528e-06, 1.948326826095581e-06, 2.7623027563095093e-06, 3.5762786865234375e-06, 4.390254616737366e-06, 5.204230546951294e-06, 6.018206477165222e-06, 6.83218240737915e-06, 7.646158337593079e-06, 8.460134267807007e-06, 9.274110198020935e-06, 1.0088086128234863e-05, 1.0902062058448792e-05, 1.171603798866272e-05, 1.2530013918876648e-05, 1.3343989849090576e-05, 1.4157965779304504e-05, 1.4971941709518433e-05, 1.578591763973236e-05, 1.659989356994629e-05, 1.7413869500160217e-05, 1.8227845430374146e-05, 1.9041821360588074e-05, 1.9855797290802002e-05, 2.066977322101593e-05, 2.148374915122986e-05, 2.2297725081443787e-05, 2.3111701011657715e-05, 2.3925676941871643e-05, 2.473965287208557e-05, 2.55536288022995e-05, 2.6367604732513428e-05, 2.7181580662727356e-05, 2.7995556592941284e-05, 2.8809532523155212e-05, 2.962350845336914e-05]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 4.0, 5.0, 4.0, 11.0, 13.0, 7.0, 25.0, 17.0, 37.0, 64.0, 115.0, 211.0, 363.0, 717.0, 1304.0, 2450.0, 4940.0, 9995.0, 21578.0, 47125.0, 102290.0, 205143.0, 281106.0, 193499.0, 94746.0, 43560.0, 20160.0, 9344.0, 4742.0, 2262.0, 1190.0, 647.0, 360.0, 171.0, 108.0, 78.0, 54.0, 31.0, 18.0, 12.0, 12.0, 10.0, 7.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.5087890625, -0.4920806884765625, -0.475372314453125, -0.4586639404296875, -0.44195556640625, -0.4252471923828125, -0.408538818359375, -0.3918304443359375, -0.3751220703125, -0.3584136962890625, -0.341705322265625, -0.3249969482421875, -0.30828857421875, -0.2915802001953125, -0.274871826171875, -0.2581634521484375, -0.241455078125, -0.2247467041015625, -0.208038330078125, -0.1913299560546875, -0.17462158203125, -0.1579132080078125, -0.141204833984375, -0.1244964599609375, -0.1077880859375, -0.0910797119140625, -0.074371337890625, -0.0576629638671875, -0.04095458984375, -0.0242462158203125, -0.007537841796875, 0.0091705322265625, 0.02587890625, 0.0425872802734375, 0.059295654296875, 0.0760040283203125, 0.09271240234375, 0.1094207763671875, 0.126129150390625, 0.1428375244140625, 0.1595458984375, 0.1762542724609375, 0.192962646484375, 0.2096710205078125, 0.22637939453125, 0.2430877685546875, 0.259796142578125, 0.2765045166015625, 0.293212890625, 0.3099212646484375, 0.326629638671875, 0.3433380126953125, 0.36004638671875, 0.3767547607421875, 0.393463134765625, 0.4101715087890625, 0.4268798828125, 0.4435882568359375, 0.460296630859375, 0.4770050048828125, 0.49371337890625, 0.5104217529296875, 0.527130126953125, 0.5438385009765625, 0.560546875]}, "gradients/decoder.bert.encoder.layer.1.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 9.0, 10.0, 5.0, 15.0, 14.0, 23.0, 35.0, 28.0, 43.0, 64.0, 69.0, 60.0, 71.0, 75.0, 90.0, 69.0, 72.0, 64.0, 39.0, 32.0, 22.0, 24.0, 16.0, 19.0, 10.0, 3.0, 3.0, 4.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.186187744140625, -0.18048095703125, -0.174774169921875, -0.1690673828125, -0.163360595703125, -0.15765380859375, -0.151947021484375, -0.146240234375, -0.140533447265625, -0.13482666015625, -0.129119873046875, -0.1234130859375, -0.117706298828125, -0.11199951171875, -0.106292724609375, -0.1005859375, -0.094879150390625, -0.08917236328125, -0.083465576171875, -0.0777587890625, -0.072052001953125, -0.06634521484375, -0.060638427734375, -0.054931640625, -0.049224853515625, -0.04351806640625, -0.037811279296875, -0.0321044921875, -0.026397705078125, -0.02069091796875, -0.014984130859375, -0.00927734375, -0.003570556640625, 0.00213623046875, 0.007843017578125, 0.0135498046875, 0.019256591796875, 0.02496337890625, 0.030670166015625, 0.036376953125, 0.042083740234375, 0.04779052734375, 0.053497314453125, 0.0592041015625, 0.064910888671875, 0.07061767578125, 0.076324462890625, 0.08203125, 0.087738037109375, 0.09344482421875, 0.099151611328125, 0.1048583984375, 0.110565185546875, 0.11627197265625, 0.121978759765625, 0.127685546875, 0.133392333984375, 0.13909912109375, 0.144805908203125, 0.1505126953125, 0.156219482421875, 0.16192626953125, 0.167633056640625, 0.17333984375]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 6.0, 13.0, 14.0, 14.0, 18.0, 25.0, 46.0, 36.0, 44.0, 69.0, 67.0, 73.0, 81.0, 64.0, 64.0, 65.0, 47.0, 59.0, 35.0, 37.0, 25.0, 13.0, 18.0, 13.0, 12.0, 14.0, 6.0, 2.0, 5.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.153614044189453, -23.462472915649414, -22.771333694458008, -22.08019256591797, -21.389053344726562, -20.697912216186523, -20.006771087646484, -19.315631866455078, -18.624492645263672, -17.933351516723633, -17.242212295532227, -16.551071166992188, -15.859931945800781, -15.168790817260742, -14.47765064239502, -13.786510467529297, -13.095369338989258, -12.404229164123535, -11.713088989257812, -11.021947860717773, -10.330808639526367, -9.639667510986328, -8.948527336120605, -8.257387161254883, -7.56624698638916, -6.8751068115234375, -6.183966636657715, -5.492825984954834, -4.801685810089111, -4.110545635223389, -3.419404983520508, -2.728264808654785, -2.0371227264404297, -1.3459824323654175, -0.6548421382904053, 0.036298274993896484, 0.7274384498596191, 1.4185786247253418, 2.1097192764282227, 2.8008594512939453, 3.491999626159668, 4.183139801025391, 4.874279975891113, 5.565420627593994, 6.256560802459717, 6.9477009773254395, 7.63884162902832, 8.329981803894043, 9.021121978759766, 9.712262153625488, 10.403402328491211, 11.09454345703125, 11.785682678222656, 12.476823806762695, 13.167963981628418, 13.85910415649414, 14.550244331359863, 15.241384506225586, 15.932524681091309, 16.62366485595703, 17.31480598449707, 18.005945205688477, 18.697086334228516, 19.388225555419922, 20.07936668395996]}, "gradients/decoder.bert.encoder.layer.1.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 6.0, 6.0, 20.0, 3.0, 6.0, 9.0, 13.0, 17.0, 21.0, 12.0, 19.0, 16.0, 33.0, 32.0, 35.0, 29.0, 37.0, 38.0, 38.0, 45.0, 39.0, 35.0, 33.0, 48.0, 36.0, 43.0, 41.0, 30.0, 28.0, 21.0, 35.0, 28.0, 22.0, 22.0, 19.0, 13.0, 9.0, 11.0, 10.0, 7.0, 7.0, 3.0, 5.0, 2.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.05845832824707, -9.748851776123047, -9.439245223999023, -9.129639625549316, -8.820033073425293, -8.51042652130127, -8.200819969177246, -7.891213417053223, -7.581607341766357, -7.272000789642334, -6.962394714355469, -6.652788162231445, -6.343181610107422, -6.033575534820557, -5.723968982696533, -5.414362907409668, -5.1047563552856445, -4.795149803161621, -4.485543727874756, -4.175937175750732, -3.866330862045288, -3.5567245483398438, -3.2471179962158203, -2.937511682510376, -2.6279053688049316, -2.3182990550994873, -2.008692741394043, -1.6990861892700195, -1.3894798755645752, -1.0798735618591309, -0.770267128944397, -0.4606606960296631, -0.15105533599853516, 0.15855103731155396, 0.46815741062164307, 0.7777637839317322, 1.0873701572418213, 1.3969764709472656, 1.7065829038619995, 2.0161893367767334, 2.3257956504821777, 2.635401964187622, 2.9450082778930664, 3.25461483001709, 3.564221143722534, 3.8738274574279785, 4.183434009552002, 4.493040084838867, 4.802646636962891, 5.112253189086914, 5.421859264373779, 5.731465816497803, 6.041071891784668, 6.350678443908691, 6.660284996032715, 6.969891548156738, 7.2794976234436035, 7.589104175567627, 7.898710250854492, 8.208316802978516, 8.517923355102539, 8.827529907226562, 9.13713550567627, 9.446742057800293, 9.756348609924316]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 16.0, 21.0, 22.0, 40.0, 65.0, 82.0, 119.0, 208.0, 311.0, 456.0, 658.0, 1022.0, 1477.0, 2237.0, 3447.0, 5261.0, 7790.0, 12128.0, 18322.0, 28694.0, 43800.0, 67374.0, 98738.0, 133001.0, 152243.0, 141185.0, 109757.0, 76332.0, 50160.0, 32374.0, 21059.0, 13701.0, 8941.0, 5796.0, 3911.0, 2580.0, 1708.0, 1120.0, 791.0, 540.0, 340.0, 224.0, 157.0, 113.0, 79.0, 40.0, 41.0, 20.0, 15.0, 18.0, 10.0, 3.0, 5.0, 1.0, 2.0], "bins": [-11.5390625, -11.1961669921875, -10.853271484375, -10.5103759765625, -10.16748046875, -9.8245849609375, -9.481689453125, -9.1387939453125, -8.7958984375, -8.4530029296875, -8.110107421875, -7.7672119140625, -7.42431640625, -7.0814208984375, -6.738525390625, -6.3956298828125, -6.052734375, -5.7098388671875, -5.366943359375, -5.0240478515625, -4.68115234375, -4.3382568359375, -3.995361328125, -3.6524658203125, -3.3095703125, -2.9666748046875, -2.623779296875, -2.2808837890625, -1.93798828125, -1.5950927734375, -1.252197265625, -0.9093017578125, -0.56640625, -0.2235107421875, 0.119384765625, 0.4622802734375, 0.80517578125, 1.1480712890625, 1.490966796875, 1.8338623046875, 2.1767578125, 2.5196533203125, 2.862548828125, 3.2054443359375, 3.54833984375, 3.8912353515625, 4.234130859375, 4.5770263671875, 4.919921875, 5.2628173828125, 5.605712890625, 5.9486083984375, 6.29150390625, 6.6343994140625, 6.977294921875, 7.3201904296875, 7.6630859375, 8.0059814453125, 8.348876953125, 8.6917724609375, 9.03466796875, 9.3775634765625, 9.720458984375, 10.0633544921875, 10.40625]}, "gradients/decoder.bert.encoder.layer.1.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 12.0, 10.0, 16.0, 10.0, 20.0, 14.0, 18.0, 25.0, 16.0, 36.0, 31.0, 42.0, 54.0, 39.0, 52.0, 38.0, 38.0, 53.0, 39.0, 45.0, 56.0, 44.0, 40.0, 40.0, 28.0, 24.0, 23.0, 28.0, 21.0, 17.0, 12.0, 10.0, 5.0, 6.0, 3.0, 7.0, 5.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8984375, -11.5035400390625, -11.108642578125, -10.7137451171875, -10.31884765625, -9.9239501953125, -9.529052734375, -9.1341552734375, -8.7392578125, -8.3443603515625, -7.949462890625, -7.5545654296875, -7.15966796875, -6.7647705078125, -6.369873046875, -5.9749755859375, -5.580078125, -5.1851806640625, -4.790283203125, -4.3953857421875, -4.00048828125, -3.6055908203125, -3.210693359375, -2.8157958984375, -2.4208984375, -2.0260009765625, -1.631103515625, -1.2362060546875, -0.84130859375, -0.4464111328125, -0.051513671875, 0.3433837890625, 0.73828125, 1.1331787109375, 1.528076171875, 1.9229736328125, 2.31787109375, 2.7127685546875, 3.107666015625, 3.5025634765625, 3.8974609375, 4.2923583984375, 4.687255859375, 5.0821533203125, 5.47705078125, 5.8719482421875, 6.266845703125, 6.6617431640625, 7.056640625, 7.4515380859375, 7.846435546875, 8.2413330078125, 8.63623046875, 9.0311279296875, 9.426025390625, 9.8209228515625, 10.2158203125, 10.6107177734375, 11.005615234375, 11.4005126953125, 11.79541015625, 12.1903076171875, 12.585205078125, 12.9801025390625, 13.375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 13.0, 15.0, 21.0, 34.0, 51.0, 104.0, 176.0, 253.0, 523.0, 852.0, 1557.0, 2753.0, 4992.0, 9427.0, 18472.0, 36812.0, 74367.0, 144065.0, 225440.0, 227839.0, 146876.0, 76077.0, 37661.0, 18724.0, 9701.0, 5163.0, 2923.0, 1562.0, 857.0, 482.0, 315.0, 162.0, 112.0, 70.0, 45.0, 34.0, 15.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.046875, -18.412353515625, -17.77783203125, -17.143310546875, -16.5087890625, -15.874267578125, -15.23974609375, -14.605224609375, -13.970703125, -13.336181640625, -12.70166015625, -12.067138671875, -11.4326171875, -10.798095703125, -10.16357421875, -9.529052734375, -8.89453125, -8.260009765625, -7.62548828125, -6.990966796875, -6.3564453125, -5.721923828125, -5.08740234375, -4.452880859375, -3.818359375, -3.183837890625, -2.54931640625, -1.914794921875, -1.2802734375, -0.645751953125, -0.01123046875, 0.623291015625, 1.2578125, 1.892333984375, 2.52685546875, 3.161376953125, 3.7958984375, 4.430419921875, 5.06494140625, 5.699462890625, 6.333984375, 6.968505859375, 7.60302734375, 8.237548828125, 8.8720703125, 9.506591796875, 10.14111328125, 10.775634765625, 11.41015625, 12.044677734375, 12.67919921875, 13.313720703125, 13.9482421875, 14.582763671875, 15.21728515625, 15.851806640625, 16.486328125, 17.120849609375, 17.75537109375, 18.389892578125, 19.0244140625, 19.658935546875, 20.29345703125, 20.927978515625, 21.5625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 3.0, 9.0, 8.0, 11.0, 13.0, 12.0, 23.0, 13.0, 20.0, 22.0, 26.0, 32.0, 35.0, 30.0, 33.0, 35.0, 35.0, 36.0, 36.0, 42.0, 56.0, 33.0, 30.0, 38.0, 43.0, 41.0, 25.0, 28.0, 32.0, 23.0, 30.0, 24.0, 14.0, 8.0, 16.0, 24.0, 13.0, 12.0, 8.0, 10.0, 8.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33984375, -7.10040283203125, -6.8609619140625, -6.62152099609375, -6.382080078125, -6.14263916015625, -5.9031982421875, -5.66375732421875, -5.42431640625, -5.18487548828125, -4.9454345703125, -4.70599365234375, -4.466552734375, -4.22711181640625, -3.9876708984375, -3.74822998046875, -3.5087890625, -3.26934814453125, -3.0299072265625, -2.79046630859375, -2.551025390625, -2.31158447265625, -2.0721435546875, -1.83270263671875, -1.59326171875, -1.35382080078125, -1.1143798828125, -0.87493896484375, -0.635498046875, -0.39605712890625, -0.1566162109375, 0.08282470703125, 0.322265625, 0.56170654296875, 0.8011474609375, 1.04058837890625, 1.280029296875, 1.51947021484375, 1.7589111328125, 1.99835205078125, 2.23779296875, 2.47723388671875, 2.7166748046875, 2.95611572265625, 3.195556640625, 3.43499755859375, 3.6744384765625, 3.91387939453125, 4.1533203125, 4.39276123046875, 4.6322021484375, 4.87164306640625, 5.111083984375, 5.35052490234375, 5.5899658203125, 5.82940673828125, 6.06884765625, 6.30828857421875, 6.5477294921875, 6.78717041015625, 7.026611328125, 7.26605224609375, 7.5054931640625, 7.74493408203125, 7.984375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 10.0, 13.0, 20.0, 23.0, 49.0, 81.0, 126.0, 170.0, 272.0, 415.0, 690.0, 1066.0, 1779.0, 2999.0, 5096.0, 9468.0, 18204.0, 38130.0, 85346.0, 187133.0, 291096.0, 214732.0, 100859.0, 44598.0, 21216.0, 10671.0, 5730.0, 3342.0, 1991.0, 1182.0, 722.0, 463.0, 313.0, 191.0, 137.0, 74.0, 49.0, 37.0, 21.0, 14.0, 6.0, 11.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -15.993896484375, -15.48779296875, -14.981689453125, -14.4755859375, -13.969482421875, -13.46337890625, -12.957275390625, -12.451171875, -11.945068359375, -11.43896484375, -10.932861328125, -10.4267578125, -9.920654296875, -9.41455078125, -8.908447265625, -8.40234375, -7.896240234375, -7.39013671875, -6.884033203125, -6.3779296875, -5.871826171875, -5.36572265625, -4.859619140625, -4.353515625, -3.847412109375, -3.34130859375, -2.835205078125, -2.3291015625, -1.822998046875, -1.31689453125, -0.810791015625, -0.3046875, 0.201416015625, 0.70751953125, 1.213623046875, 1.7197265625, 2.225830078125, 2.73193359375, 3.238037109375, 3.744140625, 4.250244140625, 4.75634765625, 5.262451171875, 5.7685546875, 6.274658203125, 6.78076171875, 7.286865234375, 7.79296875, 8.299072265625, 8.80517578125, 9.311279296875, 9.8173828125, 10.323486328125, 10.82958984375, 11.335693359375, 11.841796875, 12.347900390625, 12.85400390625, 13.360107421875, 13.8662109375, 14.372314453125, 14.87841796875, 15.384521484375, 15.890625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 15.0, 24.0, 38.0, 48.0, 66.0, 99.0, 112.0, 130.0, 125.0, 99.0, 67.0, 40.0, 39.0, 18.0, 14.0, 6.0, 5.0, 6.0, 5.0, 8.0, 0.0, 4.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0021152496337890625, -0.0020520389080047607, -0.001988828182220459, -0.0019256174564361572, -0.0018624067306518555, -0.0017991960048675537, -0.001735985279083252, -0.0016727745532989502, -0.0016095638275146484, -0.0015463531017303467, -0.001483142375946045, -0.0014199316501617432, -0.0013567209243774414, -0.0012935101985931396, -0.0012302994728088379, -0.0011670887470245361, -0.0011038780212402344, -0.0010406672954559326, -0.0009774565696716309, -0.0009142458438873291, -0.0008510351181030273, -0.0007878243923187256, -0.0007246136665344238, -0.0006614029407501221, -0.0005981922149658203, -0.0005349814891815186, -0.0004717707633972168, -0.00040856003761291504, -0.0003453493118286133, -0.0002821385860443115, -0.00021892786026000977, -0.000155717134475708, -9.250640869140625e-05, -2.9295682907104492e-05, 3.3915042877197266e-05, 9.712576866149902e-05, 0.00016033649444580078, 0.00022354722023010254, 0.0002867579460144043, 0.00034996867179870605, 0.0004131793975830078, 0.00047639012336730957, 0.0005396008491516113, 0.0006028115749359131, 0.0006660223007202148, 0.0007292330265045166, 0.0007924437522888184, 0.0008556544780731201, 0.0009188652038574219, 0.0009820759296417236, 0.0010452866554260254, 0.0011084973812103271, 0.001171708106994629, 0.0012349188327789307, 0.0012981295585632324, 0.0013613402843475342, 0.001424551010131836, 0.0014877617359161377, 0.0015509724617004395, 0.0016141831874847412, 0.001677393913269043, 0.0017406046390533447, 0.0018038153648376465, 0.0018670260906219482, 0.00193023681640625]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 10.0, 15.0, 10.0, 17.0, 28.0, 31.0, 40.0, 67.0, 102.0, 143.0, 213.0, 283.0, 395.0, 727.0, 1108.0, 1657.0, 2590.0, 4259.0, 7306.0, 13148.0, 24474.0, 46591.0, 93395.0, 179572.0, 251538.0, 197615.0, 106089.0, 53910.0, 27542.0, 14651.0, 8161.0, 4736.0, 2878.0, 1766.0, 1152.0, 777.0, 491.0, 329.0, 227.0, 176.0, 104.0, 70.0, 49.0, 30.0, 28.0, 24.0, 8.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-13.7421875, -13.3072509765625, -12.872314453125, -12.4373779296875, -12.00244140625, -11.5675048828125, -11.132568359375, -10.6976318359375, -10.2626953125, -9.8277587890625, -9.392822265625, -8.9578857421875, -8.52294921875, -8.0880126953125, -7.653076171875, -7.2181396484375, -6.783203125, -6.3482666015625, -5.913330078125, -5.4783935546875, -5.04345703125, -4.6085205078125, -4.173583984375, -3.7386474609375, -3.3037109375, -2.8687744140625, -2.433837890625, -1.9989013671875, -1.56396484375, -1.1290283203125, -0.694091796875, -0.2591552734375, 0.17578125, 0.6107177734375, 1.045654296875, 1.4805908203125, 1.91552734375, 2.3504638671875, 2.785400390625, 3.2203369140625, 3.6552734375, 4.0902099609375, 4.525146484375, 4.9600830078125, 5.39501953125, 5.8299560546875, 6.264892578125, 6.6998291015625, 7.134765625, 7.5697021484375, 8.004638671875, 8.4395751953125, 8.87451171875, 9.3094482421875, 9.744384765625, 10.1793212890625, 10.6142578125, 11.0491943359375, 11.484130859375, 11.9190673828125, 12.35400390625, 12.7889404296875, 13.223876953125, 13.6588134765625, 14.09375]}, "gradients/decoder.bert.encoder.layer.1.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 11.0, 11.0, 21.0, 22.0, 20.0, 31.0, 36.0, 58.0, 59.0, 68.0, 75.0, 98.0, 81.0, 82.0, 76.0, 52.0, 49.0, 37.0, 26.0, 16.0, 16.0, 11.0, 7.0, 11.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.67388916015625, -5.5274658203125, -5.38104248046875, -5.234619140625, -5.08819580078125, -4.9417724609375, -4.79534912109375, -4.64892578125, -4.50250244140625, -4.3560791015625, -4.20965576171875, -4.063232421875, -3.91680908203125, -3.7703857421875, -3.62396240234375, -3.4775390625, -3.33111572265625, -3.1846923828125, -3.03826904296875, -2.891845703125, -2.74542236328125, -2.5989990234375, -2.45257568359375, -2.30615234375, -2.15972900390625, -2.0133056640625, -1.86688232421875, -1.720458984375, -1.57403564453125, -1.4276123046875, -1.28118896484375, -1.134765625, -0.98834228515625, -0.8419189453125, -0.69549560546875, -0.549072265625, -0.40264892578125, -0.2562255859375, -0.10980224609375, 0.03662109375, 0.18304443359375, 0.3294677734375, 0.47589111328125, 0.622314453125, 0.76873779296875, 0.9151611328125, 1.06158447265625, 1.2080078125, 1.35443115234375, 1.5008544921875, 1.64727783203125, 1.793701171875, 1.94012451171875, 2.0865478515625, 2.23297119140625, 2.37939453125, 2.52581787109375, 2.6722412109375, 2.81866455078125, 2.965087890625, 3.11151123046875, 3.2579345703125, 3.40435791015625, 3.55078125]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 1.0, 4.0, 5.0, 16.0, 4.0, 10.0, 13.0, 21.0, 26.0, 33.0, 43.0, 46.0, 62.0, 65.0, 62.0, 82.0, 67.0, 73.0, 49.0, 65.0, 51.0, 45.0, 38.0, 35.0, 18.0, 22.0, 14.0, 7.0, 5.0, 7.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.947654724121094, -24.218374252319336, -23.489093780517578, -22.759815216064453, -22.030534744262695, -21.301254272460938, -20.57197380065918, -19.842693328857422, -19.113414764404297, -18.38413429260254, -17.65485382080078, -16.925575256347656, -16.1962947845459, -15.46701431274414, -14.737733840942383, -14.008454322814941, -13.279173851013184, -12.549893379211426, -11.820613861083984, -11.091333389282227, -10.362053871154785, -9.632773399353027, -8.903493881225586, -8.174213409423828, -7.4449334144592285, -6.715653419494629, -5.986373424530029, -5.25709342956543, -4.527812957763672, -3.7985332012176514, -3.0692529678344727, -2.339972972869873, -1.6106929779052734, -0.881412923336029, -0.15213286876678467, 0.5771472454071045, 1.306427240371704, 2.0357072353363037, 2.7649874687194824, 3.494267463684082, 4.223547458648682, 4.952827453613281, 5.682107448577881, 6.4113874435424805, 7.140667915344238, 7.86994743347168, 8.599227905273438, 9.328508377075195, 10.057787895202637, 10.787068367004395, 11.516347885131836, 12.245628356933594, 12.974907875061035, 13.704188346862793, 14.433467864990234, 15.162748336791992, 15.89202880859375, 16.621309280395508, 17.350589752197266, 18.07986831665039, 18.80914878845215, 19.538429260253906, 20.267709732055664, 20.996990203857422, 21.726268768310547]}, "gradients/decoder.bert.encoder.layer.0.output.LayerNorm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 6.0, 6.0, 6.0, 5.0, 4.0, 5.0, 5.0, 4.0, 13.0, 14.0, 12.0, 14.0, 16.0, 15.0, 17.0, 22.0, 25.0, 27.0, 19.0, 28.0, 38.0, 38.0, 49.0, 46.0, 31.0, 30.0, 52.0, 45.0, 33.0, 33.0, 37.0, 38.0, 33.0, 27.0, 34.0, 20.0, 22.0, 21.0, 19.0, 21.0, 16.0, 12.0, 14.0, 8.0, 5.0, 5.0, 5.0, 7.0, 4.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.778368949890137, -10.42904281616211, -10.079717636108398, -9.730391502380371, -9.38106632232666, -9.031740188598633, -8.682415008544922, -8.333088874816895, -7.983763217926025, -7.634437561035156, -7.285111904144287, -6.935786247253418, -6.586460113525391, -6.23713493347168, -5.887808799743652, -5.538483142852783, -5.189157485961914, -4.839831829071045, -4.490506172180176, -4.141180038452148, -3.7918546199798584, -3.4425289630889893, -3.093203067779541, -2.743877410888672, -2.3945517539978027, -2.0452260971069336, -1.695900321006775, -1.3465745449066162, -0.9972488880157471, -0.6479232311248779, -0.2985973358154297, 0.05072832107543945, 0.4000539779663086, 0.7493796944618225, 1.0987054109573364, 1.4480311870574951, 1.7973568439483643, 2.1466825008392334, 2.4960083961486816, 2.845334053039551, 3.19465970993042, 3.543985366821289, 3.893311023712158, 4.242636680603027, 4.591962814331055, 4.941287994384766, 5.290614128112793, 5.639939785003662, 5.989265441894531, 6.3385910987854, 6.6879167556762695, 7.037242889404297, 7.386568069458008, 7.735894203186035, 8.085220336914062, 8.434545516967773, 8.783870697021484, 9.133196830749512, 9.482522010803223, 9.83184814453125, 10.181173324584961, 10.530499458312988, 10.879825592041016, 11.229150772094727, 11.578476905822754]}, "gradients/decoder.bert.encoder.layer.0.output.dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 6.0, 5.0, 2.0, 5.0, 8.0, 16.0, 19.0, 31.0, 39.0, 46.0, 68.0, 93.0, 131.0, 192.0, 284.0, 423.0, 622.0, 932.0, 1424.0, 2214.0, 3475.0, 6026.0, 10561.0, 20107.0, 42129.0, 95281.0, 244619.0, 649963.0, 1251706.0, 1068706.0, 477663.0, 178803.0, 71653.0, 31914.0, 15394.0, 8185.0, 4647.0, 2656.0, 1612.0, 987.0, 625.0, 345.0, 242.0, 161.0, 100.0, 57.0, 39.0, 23.0, 20.0, 17.0, 7.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.375, -25.61767578125, -24.8603515625, -24.10302734375, -23.345703125, -22.58837890625, -21.8310546875, -21.07373046875, -20.31640625, -19.55908203125, -18.8017578125, -18.04443359375, -17.287109375, -16.52978515625, -15.7724609375, -15.01513671875, -14.2578125, -13.50048828125, -12.7431640625, -11.98583984375, -11.228515625, -10.47119140625, -9.7138671875, -8.95654296875, -8.19921875, -7.44189453125, -6.6845703125, -5.92724609375, -5.169921875, -4.41259765625, -3.6552734375, -2.89794921875, -2.140625, -1.38330078125, -0.6259765625, 0.13134765625, 0.888671875, 1.64599609375, 2.4033203125, 3.16064453125, 3.91796875, 4.67529296875, 5.4326171875, 6.18994140625, 6.947265625, 7.70458984375, 8.4619140625, 9.21923828125, 9.9765625, 10.73388671875, 11.4912109375, 12.24853515625, 13.005859375, 13.76318359375, 14.5205078125, 15.27783203125, 16.03515625, 16.79248046875, 17.5498046875, 18.30712890625, 19.064453125, 19.82177734375, 20.5791015625, 21.33642578125, 22.09375]}, "gradients/decoder.bert.encoder.layer.0.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 2.0, 6.0, 5.0, 5.0, 4.0, 18.0, 4.0, 16.0, 21.0, 24.0, 20.0, 18.0, 30.0, 28.0, 24.0, 20.0, 33.0, 34.0, 37.0, 48.0, 44.0, 41.0, 46.0, 38.0, 38.0, 37.0, 45.0, 36.0, 38.0, 26.0, 37.0, 34.0, 16.0, 18.0, 20.0, 14.0, 17.0, 14.0, 6.0, 7.0, 7.0, 2.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.6015625, -12.219482421875, -11.83740234375, -11.455322265625, -11.0732421875, -10.691162109375, -10.30908203125, -9.927001953125, -9.544921875, -9.162841796875, -8.78076171875, -8.398681640625, -8.0166015625, -7.634521484375, -7.25244140625, -6.870361328125, -6.48828125, -6.106201171875, -5.72412109375, -5.342041015625, -4.9599609375, -4.577880859375, -4.19580078125, -3.813720703125, -3.431640625, -3.049560546875, -2.66748046875, -2.285400390625, -1.9033203125, -1.521240234375, -1.13916015625, -0.757080078125, -0.375, 0.007080078125, 0.38916015625, 0.771240234375, 1.1533203125, 1.535400390625, 1.91748046875, 2.299560546875, 2.681640625, 3.063720703125, 3.44580078125, 3.827880859375, 4.2099609375, 4.592041015625, 4.97412109375, 5.356201171875, 5.73828125, 6.120361328125, 6.50244140625, 6.884521484375, 7.2666015625, 7.648681640625, 8.03076171875, 8.412841796875, 8.794921875, 9.177001953125, 9.55908203125, 9.941162109375, 10.3232421875, 10.705322265625, 11.08740234375, 11.469482421875, 11.8515625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 7.0, 13.0, 19.0, 21.0, 64.0, 84.0, 134.0, 191.0, 305.0, 493.0, 760.0, 1199.0, 2016.0, 3254.0, 5983.0, 11249.0, 21931.0, 47053.0, 111589.0, 293156.0, 805060.0, 1468642.0, 876051.0, 322839.0, 120922.0, 50897.0, 23437.0, 11722.0, 6343.0, 3367.0, 2101.0, 1294.0, 753.0, 471.0, 308.0, 190.0, 123.0, 82.0, 52.0, 38.0, 17.0, 20.0, 14.0, 5.0, 4.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.78125, -40.57177734375, -39.3623046875, -38.15283203125, -36.943359375, -35.73388671875, -34.5244140625, -33.31494140625, -32.10546875, -30.89599609375, -29.6865234375, -28.47705078125, -27.267578125, -26.05810546875, -24.8486328125, -23.63916015625, -22.4296875, -21.22021484375, -20.0107421875, -18.80126953125, -17.591796875, -16.38232421875, -15.1728515625, -13.96337890625, -12.75390625, -11.54443359375, -10.3349609375, -9.12548828125, -7.916015625, -6.70654296875, -5.4970703125, -4.28759765625, -3.078125, -1.86865234375, -0.6591796875, 0.55029296875, 1.759765625, 2.96923828125, 4.1787109375, 5.38818359375, 6.59765625, 7.80712890625, 9.0166015625, 10.22607421875, 11.435546875, 12.64501953125, 13.8544921875, 15.06396484375, 16.2734375, 17.48291015625, 18.6923828125, 19.90185546875, 21.111328125, 22.32080078125, 23.5302734375, 24.73974609375, 25.94921875, 27.15869140625, 28.3681640625, 29.57763671875, 30.787109375, 31.99658203125, 33.2060546875, 34.41552734375, 35.625]}, "gradients/decoder.bert.encoder.layer.0.intermediate.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 10.0, 6.0, 4.0, 10.0, 9.0, 21.0, 26.0, 32.0, 34.0, 55.0, 62.0, 69.0, 98.0, 122.0, 158.0, 139.0, 222.0, 254.0, 277.0, 293.0, 300.0, 327.0, 279.0, 270.0, 206.0, 177.0, 147.0, 113.0, 82.0, 54.0, 44.0, 39.0, 28.0, 25.0, 20.0, 18.0, 13.0, 8.0, 6.0, 5.0, 6.0, 5.0, 0.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7734375, -8.5018310546875, -8.230224609375, -7.9586181640625, -7.68701171875, -7.4154052734375, -7.143798828125, -6.8721923828125, -6.6005859375, -6.3289794921875, -6.057373046875, -5.7857666015625, -5.51416015625, -5.2425537109375, -4.970947265625, -4.6993408203125, -4.427734375, -4.1561279296875, -3.884521484375, -3.6129150390625, -3.34130859375, -3.0697021484375, -2.798095703125, -2.5264892578125, -2.2548828125, -1.9832763671875, -1.711669921875, -1.4400634765625, -1.16845703125, -0.8968505859375, -0.625244140625, -0.3536376953125, -0.08203125, 0.1895751953125, 0.461181640625, 0.7327880859375, 1.00439453125, 1.2760009765625, 1.547607421875, 1.8192138671875, 2.0908203125, 2.3624267578125, 2.634033203125, 2.9056396484375, 3.17724609375, 3.4488525390625, 3.720458984375, 3.9920654296875, 4.263671875, 4.5352783203125, 4.806884765625, 5.0784912109375, 5.35009765625, 5.6217041015625, 5.893310546875, 6.1649169921875, 6.4365234375, 6.7081298828125, 6.979736328125, 7.2513427734375, 7.52294921875, 7.7945556640625, 8.066162109375, 8.3377685546875, 8.609375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 4.0, 10.0, 7.0, 14.0, 18.0, 18.0, 23.0, 25.0, 45.0, 55.0, 73.0, 69.0, 86.0, 89.0, 63.0, 84.0, 63.0, 73.0, 38.0, 30.0, 33.0, 27.0, 18.0, 14.0, 9.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.48189926147461, -42.149715423583984, -40.81753158569336, -39.4853515625, -38.153167724609375, -36.82098388671875, -35.488800048828125, -34.1566162109375, -32.824432373046875, -31.49224853515625, -30.160066604614258, -28.827882766723633, -27.49570083618164, -26.163516998291016, -24.83133316040039, -23.499149322509766, -22.166969299316406, -20.83478546142578, -19.50260353088379, -18.170419692993164, -16.838237762451172, -15.506053924560547, -14.173870086669922, -12.841687202453613, -11.509504318237305, -10.177321434020996, -8.845138549804688, -7.5129547119140625, -6.180771827697754, -4.848588943481445, -3.5164055824279785, -2.1842222213745117, -0.8520393371582031, 0.48014378547668457, 1.8123269081115723, 3.14451003074646, 4.476693153381348, 5.808876037597656, 7.141059398651123, 8.47324275970459, 9.805425643920898, 11.137608528137207, 12.469791412353516, 13.80197525024414, 15.13415813446045, 16.466341018676758, 17.798524856567383, 19.130706787109375, 20.462890625, 21.795074462890625, 23.127256393432617, 24.459440231323242, 25.791622161865234, 27.12380599975586, 28.455989837646484, 29.78817367553711, 31.1203556060791, 32.452537536621094, 33.78472137451172, 35.116905212402344, 36.44908905029297, 37.781272888183594, 39.11345291137695, 40.44563674926758, 41.7778205871582]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 10.0, 11.0, 10.0, 10.0, 14.0, 23.0, 26.0, 18.0, 31.0, 34.0, 31.0, 44.0, 35.0, 42.0, 48.0, 45.0, 49.0, 46.0, 48.0, 48.0, 43.0, 40.0, 31.0, 28.0, 33.0, 31.0, 29.0, 20.0, 20.0, 20.0, 13.0, 9.0, 7.0, 9.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.327486038208008, -19.72764778137207, -19.127809524536133, -18.527971267700195, -17.928131103515625, -17.328292846679688, -16.72845458984375, -16.128616333007812, -15.528778076171875, -14.928939819335938, -14.3291015625, -13.729262351989746, -13.129424095153809, -12.529585838317871, -11.929746627807617, -11.32990837097168, -10.730070114135742, -10.130231857299805, -9.530393600463867, -8.930554389953613, -8.330716133117676, -7.730877876281738, -7.131039142608643, -6.531200408935547, -5.931362152099609, -5.331523895263672, -4.731685161590576, -4.1318464279174805, -3.532008171081543, -2.9321696758270264, -2.3323311805725098, -1.732492446899414, -1.1326560974121094, -0.5328176021575928, 0.06702089309692383, 0.6668593883514404, 1.266697883605957, 1.8665363788604736, 2.4663748741149902, 3.066213607788086, 3.6660518646240234, 4.265890121459961, 4.865728855133057, 5.465567588806152, 6.06540584564209, 6.665244102478027, 7.265082836151123, 7.864921569824219, 8.464759826660156, 9.064598083496094, 9.664436340332031, 10.264275550842285, 10.864113807678223, 11.46395206451416, 12.063791275024414, 12.663629531860352, 13.263467788696289, 13.863306045532227, 14.463144302368164, 15.062983512878418, 15.662821769714355, 16.26266098022461, 16.862499237060547, 17.462337493896484, 18.062175750732422]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 14.0, 15.0, 27.0, 34.0, 52.0, 74.0, 93.0, 119.0, 212.0, 353.0, 457.0, 729.0, 1087.0, 1670.0, 2507.0, 3925.0, 6105.0, 9554.0, 15934.0, 26600.0, 46321.0, 81192.0, 144783.0, 221323.0, 200613.0, 119909.0, 67479.0, 38294.0, 22320.0, 13353.0, 8425.0, 5290.0, 3418.0, 2078.0, 1378.0, 948.0, 612.0, 412.0, 260.0, 190.0, 121.0, 72.0, 57.0, 52.0, 31.0, 22.0, 14.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-2.62890625, -2.54632568359375, -2.4637451171875, -2.38116455078125, -2.298583984375, -2.21600341796875, -2.1334228515625, -2.05084228515625, -1.96826171875, -1.88568115234375, -1.8031005859375, -1.72052001953125, -1.637939453125, -1.55535888671875, -1.4727783203125, -1.39019775390625, -1.3076171875, -1.22503662109375, -1.1424560546875, -1.05987548828125, -0.977294921875, -0.89471435546875, -0.8121337890625, -0.72955322265625, -0.64697265625, -0.56439208984375, -0.4818115234375, -0.39923095703125, -0.316650390625, -0.23406982421875, -0.1514892578125, -0.06890869140625, 0.013671875, 0.09625244140625, 0.1788330078125, 0.26141357421875, 0.343994140625, 0.42657470703125, 0.5091552734375, 0.59173583984375, 0.67431640625, 0.75689697265625, 0.8394775390625, 0.92205810546875, 1.004638671875, 1.08721923828125, 1.1697998046875, 1.25238037109375, 1.3349609375, 1.41754150390625, 1.5001220703125, 1.58270263671875, 1.665283203125, 1.74786376953125, 1.8304443359375, 1.91302490234375, 1.99560546875, 2.07818603515625, 2.1607666015625, 2.24334716796875, 2.325927734375, 2.40850830078125, 2.4910888671875, 2.57366943359375, 2.65625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 11.0, 10.0, 9.0, 12.0, 21.0, 18.0, 22.0, 30.0, 22.0, 24.0, 19.0, 32.0, 42.0, 35.0, 51.0, 27.0, 36.0, 43.0, 50.0, 45.0, 41.0, 38.0, 44.0, 40.0, 29.0, 28.0, 33.0, 27.0, 23.0, 19.0, 16.0, 16.0, 14.0, 5.0, 13.0, 6.0, 7.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.984375, -19.35791015625, -18.7314453125, -18.10498046875, -17.478515625, -16.85205078125, -16.2255859375, -15.59912109375, -14.97265625, -14.34619140625, -13.7197265625, -13.09326171875, -12.466796875, -11.84033203125, -11.2138671875, -10.58740234375, -9.9609375, -9.33447265625, -8.7080078125, -8.08154296875, -7.455078125, -6.82861328125, -6.2021484375, -5.57568359375, -4.94921875, -4.32275390625, -3.6962890625, -3.06982421875, -2.443359375, -1.81689453125, -1.1904296875, -0.56396484375, 0.0625, 0.68896484375, 1.3154296875, 1.94189453125, 2.568359375, 3.19482421875, 3.8212890625, 4.44775390625, 5.07421875, 5.70068359375, 6.3271484375, 6.95361328125, 7.580078125, 8.20654296875, 8.8330078125, 9.45947265625, 10.0859375, 10.71240234375, 11.3388671875, 11.96533203125, 12.591796875, 13.21826171875, 13.8447265625, 14.47119140625, 15.09765625, 15.72412109375, 16.3505859375, 16.97705078125, 17.603515625, 18.22998046875, 18.8564453125, 19.48291015625, 20.109375]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 16.0, 11.0, 16.0, 16.0, 24.0, 40.0, 58.0, 74.0, 113.0, 160.0, 232.0, 380.0, 512.0, 824.0, 1294.0, 2251.0, 4143.0, 7679.0, 17034.0, 53417.0, 838213.0, 81577.0, 20076.0, 9061.0, 4555.0, 2570.0, 1541.0, 882.0, 554.0, 384.0, 243.0, 170.0, 118.0, 101.0, 56.0, 43.0, 35.0, 24.0, 10.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0], "bins": [-8.5546875, -8.3209228515625, -8.087158203125, -7.8533935546875, -7.61962890625, -7.3858642578125, -7.152099609375, -6.9183349609375, -6.6845703125, -6.4508056640625, -6.217041015625, -5.9832763671875, -5.74951171875, -5.5157470703125, -5.281982421875, -5.0482177734375, -4.814453125, -4.5806884765625, -4.346923828125, -4.1131591796875, -3.87939453125, -3.6456298828125, -3.411865234375, -3.1781005859375, -2.9443359375, -2.7105712890625, -2.476806640625, -2.2430419921875, -2.00927734375, -1.7755126953125, -1.541748046875, -1.3079833984375, -1.07421875, -0.8404541015625, -0.606689453125, -0.3729248046875, -0.13916015625, 0.0946044921875, 0.328369140625, 0.5621337890625, 0.7958984375, 1.0296630859375, 1.263427734375, 1.4971923828125, 1.73095703125, 1.9647216796875, 2.198486328125, 2.4322509765625, 2.666015625, 2.8997802734375, 3.133544921875, 3.3673095703125, 3.60107421875, 3.8348388671875, 4.068603515625, 4.3023681640625, 4.5361328125, 4.7698974609375, 5.003662109375, 5.2374267578125, 5.47119140625, 5.7049560546875, 5.938720703125, 6.1724853515625, 6.40625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.value.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 7.0, 12.0, 12.0, 9.0, 14.0, 12.0, 18.0, 19.0, 25.0, 23.0, 32.0, 30.0, 33.0, 39.0, 33.0, 37.0, 44.0, 58.0, 48.0, 40.0, 48.0, 50.0, 40.0, 44.0, 36.0, 39.0, 34.0, 29.0, 17.0, 21.0, 15.0, 17.0, 14.0, 14.0, 7.0, 9.0, 5.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.578125, -13.171875, -12.765625, -12.359375, -11.953125, -11.546875, -11.140625, -10.734375, -10.328125, -9.921875, -9.515625, -9.109375, -8.703125, -8.296875, -7.890625, -7.484375, -7.078125, -6.671875, -6.265625, -5.859375, -5.453125, -5.046875, -4.640625, -4.234375, -3.828125, -3.421875, -3.015625, -2.609375, -2.203125, -1.796875, -1.390625, -0.984375, -0.578125, -0.171875, 0.234375, 0.640625, 1.046875, 1.453125, 1.859375, 2.265625, 2.671875, 3.078125, 3.484375, 3.890625, 4.296875, 4.703125, 5.109375, 5.515625, 5.921875, 6.328125, 6.734375, 7.140625, 7.546875, 7.953125, 8.359375, 8.765625, 9.171875, 9.578125, 9.984375, 10.390625, 10.796875, 11.203125, 11.609375, 12.015625, 12.421875]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 19.0, 14.0, 30.0, 33.0, 47.0, 69.0, 97.0, 140.0, 196.0, 384.0, 530.0, 837.0, 1356.0, 2229.0, 4160.0, 7858.0, 15736.0, 37813.0, 877374.0, 58803.0, 19653.0, 9415.0, 4925.0, 2670.0, 1615.0, 930.0, 568.0, 333.0, 247.0, 176.0, 93.0, 56.0, 48.0, 22.0, 27.0, 14.0, 14.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6708984375, -1.6240081787109375, -1.577117919921875, -1.5302276611328125, -1.48333740234375, -1.4364471435546875, -1.389556884765625, -1.3426666259765625, -1.2957763671875, -1.2488861083984375, -1.201995849609375, -1.1551055908203125, -1.10821533203125, -1.0613250732421875, -1.014434814453125, -0.9675445556640625, -0.920654296875, -0.8737640380859375, -0.826873779296875, -0.7799835205078125, -0.73309326171875, -0.6862030029296875, -0.639312744140625, -0.5924224853515625, -0.5455322265625, -0.4986419677734375, -0.451751708984375, -0.4048614501953125, -0.35797119140625, -0.3110809326171875, -0.264190673828125, -0.2173004150390625, -0.17041015625, -0.1235198974609375, -0.076629638671875, -0.0297393798828125, 0.01715087890625, 0.0640411376953125, 0.110931396484375, 0.1578216552734375, 0.2047119140625, 0.2516021728515625, 0.298492431640625, 0.3453826904296875, 0.39227294921875, 0.4391632080078125, 0.486053466796875, 0.5329437255859375, 0.579833984375, 0.6267242431640625, 0.673614501953125, 0.7205047607421875, 0.76739501953125, 0.8142852783203125, 0.861175537109375, 0.9080657958984375, 0.9549560546875, 1.0018463134765625, 1.048736572265625, 1.0956268310546875, 1.14251708984375, 1.1894073486328125, 1.236297607421875, 1.2831878662109375, 1.330078125]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.key.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 1.0, 8.0, 2.0, 6.0, 11.0, 7.0, 26.0, 17.0, 27.0, 34.0, 34.0, 30.0, 40.0, 51.0, 48.0, 51.0, 52.0, 57.0, 63.0, 52.0, 50.0, 34.0, 48.0, 30.0, 46.0, 32.0, 21.0, 20.0, 16.0, 16.0, 16.0, 18.0, 7.0, 8.0, 4.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.8683414459228516e-05, -3.740284591913223e-05, -3.612227737903595e-05, -3.484170883893967e-05, -3.3561140298843384e-05, -3.22805717587471e-05, -3.100000321865082e-05, -2.9719434678554535e-05, -2.8438866138458252e-05, -2.715829759836197e-05, -2.5877729058265686e-05, -2.4597160518169403e-05, -2.331659197807312e-05, -2.2036023437976837e-05, -2.0755454897880554e-05, -1.947488635778427e-05, -1.8194317817687988e-05, -1.6913749277591705e-05, -1.5633180737495422e-05, -1.435261219739914e-05, -1.3072043657302856e-05, -1.1791475117206573e-05, -1.051090657711029e-05, -9.230338037014008e-06, -7.949769496917725e-06, -6.669200956821442e-06, -5.388632416725159e-06, -4.108063876628876e-06, -2.8274953365325928e-06, -1.5469267964363098e-06, -2.6635825634002686e-07, 1.014210283756256e-06, 2.294778823852539e-06, 3.575347363948822e-06, 4.855915904045105e-06, 6.136484444141388e-06, 7.417052984237671e-06, 8.697621524333954e-06, 9.978190064430237e-06, 1.125875860452652e-05, 1.2539327144622803e-05, 1.3819895684719086e-05, 1.5100464224815369e-05, 1.638103276491165e-05, 1.7661601305007935e-05, 1.8942169845104218e-05, 2.02227383852005e-05, 2.1503306925296783e-05, 2.2783875465393066e-05, 2.406444400548935e-05, 2.5345012545585632e-05, 2.6625581085681915e-05, 2.7906149625778198e-05, 2.918671816587448e-05, 3.0467286705970764e-05, 3.174785524606705e-05, 3.302842378616333e-05, 3.430899232625961e-05, 3.5589560866355896e-05, 3.687012940645218e-05, 3.815069794654846e-05, 3.9431266486644745e-05, 4.071183502674103e-05, 4.199240356683731e-05, 4.3272972106933594e-05]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 12.0, 13.0, 20.0, 37.0, 41.0, 69.0, 109.0, 175.0, 267.0, 415.0, 666.0, 1116.0, 1923.0, 3407.0, 6298.0, 11915.0, 23021.0, 45435.0, 92075.0, 175556.0, 252648.0, 205127.0, 112716.0, 55933.0, 27806.0, 14184.0, 7515.0, 4113.0, 2383.0, 1342.0, 832.0, 487.0, 279.0, 220.0, 114.0, 95.0, 49.0, 46.0, 34.0, 19.0, 10.0, 3.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.77490234375, -0.7511672973632812, -0.7274322509765625, -0.7036972045898438, -0.679962158203125, -0.6562271118164062, -0.6324920654296875, -0.6087570190429688, -0.58502197265625, -0.5612869262695312, -0.5375518798828125, -0.5138168334960938, -0.490081787109375, -0.46634674072265625, -0.4426116943359375, -0.41887664794921875, -0.3951416015625, -0.37140655517578125, -0.3476715087890625, -0.32393646240234375, -0.300201416015625, -0.27646636962890625, -0.2527313232421875, -0.22899627685546875, -0.20526123046875, -0.18152618408203125, -0.1577911376953125, -0.13405609130859375, -0.110321044921875, -0.08658599853515625, -0.0628509521484375, -0.03911590576171875, -0.015380859375, 0.00835418701171875, 0.0320892333984375, 0.05582427978515625, 0.079559326171875, 0.10329437255859375, 0.1270294189453125, 0.15076446533203125, 0.17449951171875, 0.19823455810546875, 0.2219696044921875, 0.24570465087890625, 0.269439697265625, 0.29317474365234375, 0.3169097900390625, 0.34064483642578125, 0.3643798828125, 0.38811492919921875, 0.4118499755859375, 0.43558502197265625, 0.459320068359375, 0.48305511474609375, 0.5067901611328125, 0.5305252075195312, 0.55426025390625, 0.5779953002929688, 0.6017303466796875, 0.6254653930664062, 0.649200439453125, 0.6729354858398438, 0.6966705322265625, 0.7204055786132812, 0.744140625]}, "gradients/decoder.bert.encoder.layer.0.crossattention.self.query.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 10.0, 5.0, 13.0, 14.0, 23.0, 22.0, 33.0, 52.0, 51.0, 58.0, 83.0, 81.0, 76.0, 61.0, 83.0, 57.0, 57.0, 52.0, 47.0, 33.0, 25.0, 23.0, 12.0, 10.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2119140625, -0.20371627807617188, -0.19551849365234375, -0.18732070922851562, -0.1791229248046875, -0.17092514038085938, -0.16272735595703125, -0.15452957153320312, -0.146331787109375, -0.13813400268554688, -0.12993621826171875, -0.12173843383789062, -0.1135406494140625, -0.10534286499023438, -0.09714508056640625, -0.08894729614257812, -0.08074951171875, -0.07255172729492188, -0.06435394287109375, -0.056156158447265625, -0.0479583740234375, -0.039760589599609375, -0.03156280517578125, -0.023365020751953125, -0.015167236328125, -0.006969451904296875, 0.00122833251953125, 0.009426116943359375, 0.0176239013671875, 0.025821685791015625, 0.03401947021484375, 0.042217254638671875, 0.0504150390625, 0.058612823486328125, 0.06681060791015625, 0.07500839233398438, 0.0832061767578125, 0.09140396118164062, 0.09960174560546875, 0.10779953002929688, 0.115997314453125, 0.12419509887695312, 0.13239288330078125, 0.14059066772460938, 0.1487884521484375, 0.15698623657226562, 0.16518402099609375, 0.17338180541992188, 0.18157958984375, 0.18977737426757812, 0.19797515869140625, 0.20617294311523438, 0.2143707275390625, 0.22256851196289062, 0.23076629638671875, 0.23896408081054688, 0.247161865234375, 0.2553596496582031, 0.26355743408203125, 0.2717552185058594, 0.2799530029296875, 0.2881507873535156, 0.29634857177734375, 0.3045463562011719, 0.312744140625]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 6.0, 10.0, 17.0, 16.0, 23.0, 21.0, 28.0, 51.0, 52.0, 86.0, 69.0, 88.0, 76.0, 79.0, 72.0, 63.0, 70.0, 31.0, 33.0, 33.0, 20.0, 17.0, 14.0, 6.0, 5.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.14012145996094, -41.805110931396484, -40.47010040283203, -39.135093688964844, -37.80008316040039, -36.46507263183594, -35.13006591796875, -33.7950553894043, -32.460044860839844, -31.12503433227539, -29.79002571105957, -28.45501708984375, -27.120006561279297, -25.784996032714844, -24.449987411499023, -23.114978790283203, -21.77996826171875, -20.444957733154297, -19.109949111938477, -17.774940490722656, -16.439929962158203, -15.104920387268066, -13.76991081237793, -12.434901237487793, -11.099891662597656, -9.76488208770752, -8.429872512817383, -7.094862937927246, -5.759853363037109, -4.424843788146973, -3.089834213256836, -1.7548246383666992, -0.4198188781738281, 0.9151906967163086, 2.2502002716064453, 3.585209846496582, 4.920219421386719, 6.2552289962768555, 7.590238571166992, 8.925248146057129, 10.260257720947266, 11.595267295837402, 12.930276870727539, 14.265286445617676, 15.600296020507812, 16.935306549072266, 18.270315170288086, 19.605323791503906, 20.94033432006836, 22.275344848632812, 23.610353469848633, 24.945362091064453, 26.280372619628906, 27.61538314819336, 28.95039176940918, 30.285400390625, 31.620410919189453, 32.955421447753906, 34.290428161621094, 35.62543869018555, 36.96044921875, 38.29545974731445, 39.630470275878906, 40.965476989746094, 42.30048751831055]}, "gradients/decoder.bert.encoder.layer.0.attention.output.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 10.0, 13.0, 10.0, 10.0, 11.0, 12.0, 23.0, 25.0, 21.0, 29.0, 33.0, 32.0, 40.0, 38.0, 43.0, 44.0, 47.0, 51.0, 46.0, 48.0, 49.0, 42.0, 36.0, 37.0, 27.0, 28.0, 35.0, 29.0, 21.0, 19.0, 22.0, 10.0, 12.0, 7.0, 10.0, 6.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.5731201171875, -19.966615676879883, -19.360111236572266, -18.75360679626465, -18.14710235595703, -17.540597915649414, -16.934093475341797, -16.327587127685547, -15.721083641052246, -15.114579200744629, -14.508074760437012, -13.901570320129395, -13.295064926147461, -12.688560485839844, -12.082056045532227, -11.47555160522461, -10.869047164916992, -10.262542724609375, -9.656038284301758, -9.04953384399414, -8.443029403686523, -7.836524486541748, -7.230019569396973, -6.6235151290893555, -6.017010688781738, -5.410506248474121, -4.804001808166504, -4.1974968910217285, -3.5909924507141113, -2.984488010406494, -2.377983331680298, -1.7714786529541016, -1.1649742126464844, -0.5584696531295776, 0.0480349063873291, 0.6545394659042358, 1.2610440254211426, 1.8675484657287598, 2.474053144454956, 3.0805578231811523, 3.6870622634887695, 4.293566703796387, 4.900071144104004, 5.506576061248779, 6.1130805015563965, 6.719584941864014, 7.326089859008789, 7.932594299316406, 8.539098739624023, 9.14560317993164, 9.752107620239258, 10.358612060546875, 10.965116500854492, 11.57162094116211, 12.178126335144043, 12.78463077545166, 13.391135215759277, 13.997639656066895, 14.604144096374512, 15.210648536682129, 15.817153930664062, 16.42365837097168, 17.030162811279297, 17.636667251586914, 18.24317169189453]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 6.0, 15.0, 17.0, 28.0, 49.0, 67.0, 88.0, 142.0, 188.0, 285.0, 413.0, 566.0, 777.0, 1192.0, 1792.0, 2631.0, 3779.0, 5997.0, 9123.0, 14755.0, 23935.0, 40241.0, 68816.0, 114528.0, 168787.0, 189364.0, 152537.0, 98586.0, 58525.0, 34310.0, 20429.0, 12606.0, 8035.0, 5292.0, 3368.0, 2352.0, 1606.0, 953.0, 770.0, 528.0, 350.0, 234.0, 162.0, 111.0, 80.0, 50.0, 39.0, 16.0, 12.0, 9.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.53125, -19.896484375, -19.26171875, -18.626953125, -17.9921875, -17.357421875, -16.72265625, -16.087890625, -15.453125, -14.818359375, -14.18359375, -13.548828125, -12.9140625, -12.279296875, -11.64453125, -11.009765625, -10.375, -9.740234375, -9.10546875, -8.470703125, -7.8359375, -7.201171875, -6.56640625, -5.931640625, -5.296875, -4.662109375, -4.02734375, -3.392578125, -2.7578125, -2.123046875, -1.48828125, -0.853515625, -0.21875, 0.416015625, 1.05078125, 1.685546875, 2.3203125, 2.955078125, 3.58984375, 4.224609375, 4.859375, 5.494140625, 6.12890625, 6.763671875, 7.3984375, 8.033203125, 8.66796875, 9.302734375, 9.9375, 10.572265625, 11.20703125, 11.841796875, 12.4765625, 13.111328125, 13.74609375, 14.380859375, 15.015625, 15.650390625, 16.28515625, 16.919921875, 17.5546875, 18.189453125, 18.82421875, 19.458984375, 20.09375]}, "gradients/decoder.bert.encoder.layer.0.attention.output.dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 5.0, 4.0, 5.0, 6.0, 12.0, 11.0, 22.0, 15.0, 21.0, 23.0, 25.0, 25.0, 24.0, 31.0, 39.0, 45.0, 41.0, 38.0, 51.0, 47.0, 62.0, 48.0, 43.0, 36.0, 51.0, 32.0, 29.0, 40.0, 30.0, 23.0, 18.0, 17.0, 18.0, 12.0, 10.0, 12.0, 8.0, 4.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0], "bins": [-23.953125, -23.32421875, -22.6953125, -22.06640625, -21.4375, -20.80859375, -20.1796875, -19.55078125, -18.921875, -18.29296875, -17.6640625, -17.03515625, -16.40625, -15.77734375, -15.1484375, -14.51953125, -13.890625, -13.26171875, -12.6328125, -12.00390625, -11.375, -10.74609375, -10.1171875, -9.48828125, -8.859375, -8.23046875, -7.6015625, -6.97265625, -6.34375, -5.71484375, -5.0859375, -4.45703125, -3.828125, -3.19921875, -2.5703125, -1.94140625, -1.3125, -0.68359375, -0.0546875, 0.57421875, 1.203125, 1.83203125, 2.4609375, 3.08984375, 3.71875, 4.34765625, 4.9765625, 5.60546875, 6.234375, 6.86328125, 7.4921875, 8.12109375, 8.75, 9.37890625, 10.0078125, 10.63671875, 11.265625, 11.89453125, 12.5234375, 13.15234375, 13.78125, 14.41015625, 15.0390625, 15.66796875, 16.296875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 8.0, 12.0, 12.0, 19.0, 30.0, 53.0, 70.0, 121.0, 169.0, 236.0, 362.0, 546.0, 814.0, 1245.0, 1936.0, 3051.0, 4913.0, 7861.0, 13112.0, 22049.0, 38202.0, 67804.0, 117949.0, 182642.0, 207099.0, 155486.0, 93811.0, 52769.0, 30238.0, 17677.0, 10581.0, 6392.0, 3951.0, 2550.0, 1662.0, 1108.0, 714.0, 431.0, 309.0, 189.0, 129.0, 79.0, 59.0, 35.0, 34.0, 15.0, 10.0, 4.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.328125, -27.392822265625, -26.45751953125, -25.522216796875, -24.5869140625, -23.651611328125, -22.71630859375, -21.781005859375, -20.845703125, -19.910400390625, -18.97509765625, -18.039794921875, -17.1044921875, -16.169189453125, -15.23388671875, -14.298583984375, -13.36328125, -12.427978515625, -11.49267578125, -10.557373046875, -9.6220703125, -8.686767578125, -7.75146484375, -6.816162109375, -5.880859375, -4.945556640625, -4.01025390625, -3.074951171875, -2.1396484375, -1.204345703125, -0.26904296875, 0.666259765625, 1.6015625, 2.536865234375, 3.47216796875, 4.407470703125, 5.3427734375, 6.278076171875, 7.21337890625, 8.148681640625, 9.083984375, 10.019287109375, 10.95458984375, 11.889892578125, 12.8251953125, 13.760498046875, 14.69580078125, 15.631103515625, 16.56640625, 17.501708984375, 18.43701171875, 19.372314453125, 20.3076171875, 21.242919921875, 22.17822265625, 23.113525390625, 24.048828125, 24.984130859375, 25.91943359375, 26.854736328125, 27.7900390625, 28.725341796875, 29.66064453125, 30.595947265625, 31.53125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.value.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 3.0, 8.0, 5.0, 10.0, 4.0, 6.0, 8.0, 11.0, 16.0, 17.0, 16.0, 17.0, 23.0, 35.0, 23.0, 50.0, 26.0, 35.0, 47.0, 45.0, 47.0, 40.0, 52.0, 33.0, 42.0, 36.0, 38.0, 35.0, 38.0, 34.0, 23.0, 19.0, 27.0, 27.0, 22.0, 11.0, 13.0, 11.0, 14.0, 12.0, 4.0, 6.0, 4.0, 4.0, 4.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3515625, -10.962158203125, -10.57275390625, -10.183349609375, -9.7939453125, -9.404541015625, -9.01513671875, -8.625732421875, -8.236328125, -7.846923828125, -7.45751953125, -7.068115234375, -6.6787109375, -6.289306640625, -5.89990234375, -5.510498046875, -5.12109375, -4.731689453125, -4.34228515625, -3.952880859375, -3.5634765625, -3.174072265625, -2.78466796875, -2.395263671875, -2.005859375, -1.616455078125, -1.22705078125, -0.837646484375, -0.4482421875, -0.058837890625, 0.33056640625, 0.719970703125, 1.109375, 1.498779296875, 1.88818359375, 2.277587890625, 2.6669921875, 3.056396484375, 3.44580078125, 3.835205078125, 4.224609375, 4.614013671875, 5.00341796875, 5.392822265625, 5.7822265625, 6.171630859375, 6.56103515625, 6.950439453125, 7.33984375, 7.729248046875, 8.11865234375, 8.508056640625, 8.8974609375, 9.286865234375, 9.67626953125, 10.065673828125, 10.455078125, 10.844482421875, 11.23388671875, 11.623291015625, 12.0126953125, 12.402099609375, 12.79150390625, 13.180908203125, 13.5703125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 6.0, 14.0, 11.0, 22.0, 26.0, 46.0, 60.0, 108.0, 141.0, 210.0, 294.0, 428.0, 687.0, 1093.0, 1664.0, 2731.0, 4531.0, 7720.0, 13522.0, 25709.0, 51235.0, 106695.0, 202641.0, 257463.0, 182316.0, 92094.0, 44456.0, 22573.0, 12034.0, 6938.0, 4072.0, 2591.0, 1522.0, 986.0, 633.0, 426.0, 265.0, 186.0, 128.0, 69.0, 65.0, 46.0, 31.0, 23.0, 14.0, 6.0, 6.0, 11.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.4052734375, -17.779296875, -17.1533203125, -16.52734375, -15.9013671875, -15.275390625, -14.6494140625, -14.0234375, -13.3974609375, -12.771484375, -12.1455078125, -11.51953125, -10.8935546875, -10.267578125, -9.6416015625, -9.015625, -8.3896484375, -7.763671875, -7.1376953125, -6.51171875, -5.8857421875, -5.259765625, -4.6337890625, -4.0078125, -3.3818359375, -2.755859375, -2.1298828125, -1.50390625, -0.8779296875, -0.251953125, 0.3740234375, 1.0, 1.6259765625, 2.251953125, 2.8779296875, 3.50390625, 4.1298828125, 4.755859375, 5.3818359375, 6.0078125, 6.6337890625, 7.259765625, 7.8857421875, 8.51171875, 9.1376953125, 9.763671875, 10.3896484375, 11.015625, 11.6416015625, 12.267578125, 12.8935546875, 13.51953125, 14.1455078125, 14.771484375, 15.3974609375, 16.0234375, 16.6494140625, 17.275390625, 17.9013671875, 18.52734375, 19.1533203125, 19.779296875, 20.4052734375, 21.03125]}, "gradients/decoder.bert.encoder.layer.0.attention.self.key.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 8.0, 7.0, 9.0, 18.0, 14.0, 19.0, 25.0, 22.0, 33.0, 44.0, 74.0, 92.0, 79.0, 82.0, 81.0, 72.0, 76.0, 57.0, 41.0, 28.0, 19.0, 19.0, 16.0, 10.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.0021779239177703857, -0.0021089911460876465, -0.0020400583744049072, -0.001971125602722168, -0.0019021928310394287, -0.0018332600593566895, -0.0017643272876739502, -0.001695394515991211, -0.0016264617443084717, -0.0015575289726257324, -0.0014885962009429932, -0.001419663429260254, -0.0013507306575775146, -0.0012817978858947754, -0.0012128651142120361, -0.0011439323425292969, -0.0010749995708465576, -0.0010060667991638184, -0.0009371340274810791, -0.0008682012557983398, -0.0007992684841156006, -0.0007303357124328613, -0.0006614029407501221, -0.0005924701690673828, -0.0005235373973846436, -0.0004546046257019043, -0.00038567185401916504, -0.0003167390823364258, -0.0002478063106536865, -0.00017887353897094727, -0.00010994076728820801, -4.100799560546875e-05, 2.7924776077270508e-05, 9.685754776000977e-05, 0.00016579031944274902, 0.00023472309112548828, 0.00030365586280822754, 0.0003725886344909668, 0.00044152140617370605, 0.0005104541778564453, 0.0005793869495391846, 0.0006483197212219238, 0.0007172524929046631, 0.0007861852645874023, 0.0008551180362701416, 0.0009240508079528809, 0.0009929835796356201, 0.0010619163513183594, 0.0011308491230010986, 0.0011997818946838379, 0.0012687146663665771, 0.0013376474380493164, 0.0014065802097320557, 0.001475512981414795, 0.0015444457530975342, 0.0016133785247802734, 0.0016823112964630127, 0.001751244068145752, 0.0018201768398284912, 0.0018891096115112305, 0.0019580423831939697, 0.002026975154876709, 0.0020959079265594482, 0.0021648406982421875]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 14.0, 21.0, 36.0, 50.0, 57.0, 99.0, 134.0, 168.0, 241.0, 367.0, 560.0, 803.0, 1291.0, 2093.0, 3475.0, 5592.0, 10330.0, 19105.0, 37284.0, 78492.0, 163228.0, 262228.0, 225455.0, 119018.0, 56119.0, 27500.0, 14619.0, 7982.0, 4504.0, 2762.0, 1691.0, 1088.0, 698.0, 424.0, 299.0, 236.0, 131.0, 99.0, 82.0, 52.0, 40.0, 23.0, 16.0, 14.0, 5.0, 5.0, 4.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.3125, -17.717529296875, -17.12255859375, -16.527587890625, -15.9326171875, -15.337646484375, -14.74267578125, -14.147705078125, -13.552734375, -12.957763671875, -12.36279296875, -11.767822265625, -11.1728515625, -10.577880859375, -9.98291015625, -9.387939453125, -8.79296875, -8.197998046875, -7.60302734375, -7.008056640625, -6.4130859375, -5.818115234375, -5.22314453125, -4.628173828125, -4.033203125, -3.438232421875, -2.84326171875, -2.248291015625, -1.6533203125, -1.058349609375, -0.46337890625, 0.131591796875, 0.7265625, 1.321533203125, 1.91650390625, 2.511474609375, 3.1064453125, 3.701416015625, 4.29638671875, 4.891357421875, 5.486328125, 6.081298828125, 6.67626953125, 7.271240234375, 7.8662109375, 8.461181640625, 9.05615234375, 9.651123046875, 10.24609375, 10.841064453125, 11.43603515625, 12.031005859375, 12.6259765625, 13.220947265625, 13.81591796875, 14.410888671875, 15.005859375, 15.600830078125, 16.19580078125, 16.790771484375, 17.3857421875, 17.980712890625, 18.57568359375, 19.170654296875, 19.765625]}, "gradients/decoder.bert.encoder.layer.0.attention.self.query.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 9.0, 13.0, 12.0, 8.0, 20.0, 20.0, 25.0, 22.0, 29.0, 31.0, 25.0, 49.0, 47.0, 59.0, 58.0, 56.0, 66.0, 50.0, 40.0, 39.0, 46.0, 38.0, 49.0, 31.0, 22.0, 23.0, 25.0, 11.0, 14.0, 9.0, 8.0, 2.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-3.939453125, -3.817626953125, -3.69580078125, -3.573974609375, -3.4521484375, -3.330322265625, -3.20849609375, -3.086669921875, -2.96484375, -2.843017578125, -2.72119140625, -2.599365234375, -2.4775390625, -2.355712890625, -2.23388671875, -2.112060546875, -1.990234375, -1.868408203125, -1.74658203125, -1.624755859375, -1.5029296875, -1.381103515625, -1.25927734375, -1.137451171875, -1.015625, -0.893798828125, -0.77197265625, -0.650146484375, -0.5283203125, -0.406494140625, -0.28466796875, -0.162841796875, -0.041015625, 0.080810546875, 0.20263671875, 0.324462890625, 0.4462890625, 0.568115234375, 0.68994140625, 0.811767578125, 0.93359375, 1.055419921875, 1.17724609375, 1.299072265625, 1.4208984375, 1.542724609375, 1.66455078125, 1.786376953125, 1.908203125, 2.030029296875, 2.15185546875, 2.273681640625, 2.3955078125, 2.517333984375, 2.63916015625, 2.760986328125, 2.8828125, 3.004638671875, 3.12646484375, 3.248291015625, 3.3701171875, 3.491943359375, 3.61376953125, 3.735595703125, 3.857421875]}, "gradients/decoder.bert.embeddings.LayerNorm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 8.0, 5.0, 4.0, 11.0, 16.0, 20.0, 25.0, 24.0, 29.0, 24.0, 49.0, 67.0, 68.0, 58.0, 69.0, 76.0, 72.0, 59.0, 50.0, 63.0, 43.0, 35.0, 31.0, 23.0, 22.0, 11.0, 11.0, 10.0, 5.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.53688430786133, -37.30178451538086, -36.06668472290039, -34.83158493041992, -33.59648513793945, -32.36138153076172, -31.126283645629883, -29.89118194580078, -28.656082153320312, -27.420982360839844, -26.185882568359375, -24.950782775878906, -23.715681076049805, -22.480581283569336, -21.245481491088867, -20.010379791259766, -18.77528190612793, -17.54018211364746, -16.305082321166992, -15.069981575012207, -13.834880828857422, -12.599781036376953, -11.364681243896484, -10.1295804977417, -8.89448070526123, -7.6593804359436035, -6.424280166625977, -5.189180374145508, -3.954080104827881, -2.718979835510254, -1.4838800430297852, -0.248779296875, 0.9863204956054688, 2.2214207649230957, 3.4565207958221436, 4.691620826721191, 5.926721096038818, 7.161821365356445, 8.396921157836914, 9.6320219039917, 10.867121696472168, 12.102221488952637, 13.337322235107422, 14.57242202758789, 15.80752182006836, 17.042621612548828, 18.277721405029297, 19.5128231048584, 20.747922897338867, 21.983022689819336, 23.218122482299805, 24.453224182128906, 25.688323974609375, 26.923423767089844, 28.158523559570312, 29.39362335205078, 30.62872314453125, 31.86382293701172, 33.09892272949219, 34.334022521972656, 35.569122314453125, 36.804222106933594, 38.03932189941406, 39.2744255065918, 40.509525299072266]}, "gradients/decoder.bert.embeddings.LayerNorm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 10.0, 6.0, 5.0, 13.0, 14.0, 10.0, 13.0, 14.0, 18.0, 26.0, 33.0, 25.0, 35.0, 41.0, 51.0, 53.0, 54.0, 51.0, 56.0, 46.0, 51.0, 47.0, 44.0, 41.0, 37.0, 25.0, 22.0, 24.0, 26.0, 17.0, 17.0, 15.0, 13.0, 9.0, 7.0, 5.0, 5.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.1720027923584, -27.324731826782227, -26.477462768554688, -25.630191802978516, -24.782920837402344, -23.935651779174805, -23.088380813598633, -22.241111755371094, -21.393840789794922, -20.54656982421875, -19.69930076599121, -18.85202980041504, -18.0047607421875, -17.157489776611328, -16.310218811035156, -15.4629487991333, -14.615678787231445, -13.76840877532959, -12.921138763427734, -12.073867797851562, -11.226597785949707, -10.379327774047852, -9.53205680847168, -8.684786796569824, -7.837516784667969, -6.990246772766113, -6.1429762840271, -5.295705795288086, -4.4484357833862305, -3.601165771484375, -2.7538952827453613, -1.9066247940063477, -1.0593547821044922, -0.21208453178405762, 0.635185718536377, 1.4824559688568115, 2.329726219177246, 3.1769962310791016, 4.024266719818115, 4.871537208557129, 5.718807220458984, 6.56607723236084, 7.4133477210998535, 8.260618209838867, 9.107888221740723, 9.955158233642578, 10.80242919921875, 11.649699211120605, 12.496969223022461, 13.344239234924316, 14.191509246826172, 15.038780212402344, 15.8860502243042, 16.733320236206055, 17.580591201782227, 18.427860260009766, 19.275131225585938, 20.12240219116211, 20.96967124938965, 21.81694221496582, 22.66421127319336, 23.51148223876953, 24.358753204345703, 25.206024169921875, 26.053293228149414]}, "gradients/decoder.bert.embeddings.position_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 9.0, 11.0, 9.0, 14.0, 16.0, 19.0, 15.0, 24.0, 28.0, 25.0, 33.0, 63.0, 92.0, 184.0, 374.0, 682.0, 1439.0, 3415.0, 507871.0, 5862.0, 1996.0, 917.0, 457.0, 226.0, 115.0, 92.0, 66.0, 31.0, 24.0, 17.0, 20.0, 13.0, 13.0, 12.0, 10.0, 20.0, 6.0, 4.0, 4.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-774.417236328125, -752.728271484375, -731.0392456054688, -709.3502807617188, -687.6612548828125, -665.9722900390625, -644.2833251953125, -622.5942993164062, -600.9053344726562, -579.2163696289062, -557.52734375, -535.83837890625, -514.1493530273438, -492.46038818359375, -470.7713928222656, -449.0823974609375, -427.3934020996094, -405.70440673828125, -384.0154113769531, -362.326416015625, -340.637451171875, -318.9484558105469, -297.25946044921875, -275.57049560546875, -253.88148498535156, -232.19248962402344, -210.50350952148438, -188.81451416015625, -167.12551879882812, -145.43653869628906, -123.74754333496094, -102.05856323242188, -80.36956787109375, -58.680580139160156, -36.9915885925293, -15.302597045898438, 6.386390686035156, 28.07537841796875, 49.764373779296875, 71.45335388183594, 93.14234924316406, 114.83133697509766, 136.52032470703125, 158.20932006835938, 179.8983154296875, 201.58729553222656, 223.2762908935547, 244.96527099609375, 266.6542663574219, 288.34326171875, 310.0322570800781, 331.72125244140625, 353.41021728515625, 375.0992126464844, 396.7882080078125, 418.4771728515625, 440.16619873046875, 461.8551940917969, 483.544189453125, 505.233154296875, 526.9221801757812, 548.6111450195312, 570.3001708984375, 591.9891357421875, 613.6781005859375]}, "gradients/decoder.bert.embeddings.token_type_embeddings.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 8.0, 9.0, 7.0, 6.0, 8.0, 13.0, 13.0, 9.0, 16.0, 16.0, 26.0, 34.0, 24.0, 31.0, 43.0, 43.0, 49.0, 55.0, 51.0, 1080.0, 56.0, 50.0, 43.0, 46.0, 43.0, 40.0, 27.0, 22.0, 25.0, 22.0, 26.0, 13.0, 16.0, 13.0, 12.0, 5.0, 8.0, 2.0, 10.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-912.578857421875, -885.506103515625, -858.4334106445312, -831.3606567382812, -804.2879638671875, -777.2152099609375, -750.1424560546875, -723.0697021484375, -695.9970092773438, -668.9242553710938, -641.8515625, -614.77880859375, -587.7060546875, -560.6333618164062, -533.5606079101562, -506.4878845214844, -479.4151611328125, -452.3424377441406, -425.26971435546875, -398.19696044921875, -371.1242370605469, -344.051513671875, -316.978759765625, -289.9060363769531, -262.83331298828125, -235.76058959960938, -208.68785095214844, -181.6151123046875, -154.54238891601562, -127.46966552734375, -100.39692687988281, -73.32418823242188, -46.25140380859375, -19.178672790527344, 7.8940582275390625, 34.96678924560547, 62.039520263671875, 89.11224365234375, 116.18498229980469, 143.25772094726562, 170.3304443359375, 197.40316772460938, 224.4759063720703, 251.54864501953125, 278.6213684082031, 305.694091796875, 332.766845703125, 359.8395690917969, 386.91229248046875, 413.9850158691406, 441.0577392578125, 468.1304931640625, 495.2032165527344, 522.2759399414062, 549.3486938476562, 576.42138671875, 603.494140625, 630.56689453125, 657.6395874023438, 684.7123413085938, 711.7850341796875, 738.8577880859375, 765.9305419921875, 793.0032958984375, 820.0759887695312]}, "gradients/decoder.bert.embeddings.word_embeddings.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 6.0, 5.0, 14.0, 14.0, 20.0, 24.0, 32.0, 49.0, 68.0, 68.0, 83.0, 102.0, 143.0, 155.0, 200.0, 235.0, 320.0, 419.0, 521.0, 661.0, 958.0, 1068.0, 1451.0, 2004.0, 4214.0, 19206.0, 31198024.0, 10843.0, 4036.0, 3086.0, 2397.0, 1548.0, 1290.0, 607.0, 229.0, 100.0, 70.0, 56.0, 26.0, 29.0, 20.0, 21.0, 20.0, 15.0, 9.0, 12.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-880.484375, -855.5458984375, -830.6073608398438, -805.6688842773438, -780.7304077148438, -755.7919311523438, -730.8533935546875, -705.9149169921875, -680.9764404296875, -656.0379638671875, -631.0994262695312, -606.1609497070312, -581.2224731445312, -556.2839965820312, -531.345458984375, -506.406982421875, -481.4684753417969, -456.52996826171875, -431.59149169921875, -406.6529846191406, -381.7145080566406, -356.7760009765625, -331.8375244140625, -306.8990173339844, -281.96051025390625, -257.0220031738281, -232.08352661132812, -207.14501953125, -182.20654296875, -157.26803588867188, -132.3295440673828, -107.39105224609375, -82.45257568359375, -57.51408386230469, -32.57558822631836, -7.637092590332031, 17.30139923095703, 42.239891052246094, 67.17839050292969, 92.11688232421875, 117.05537414550781, 141.99386596679688, 166.93235778808594, 191.870849609375, 216.80935668945312, 241.74783325195312, 266.68634033203125, 291.62481689453125, 316.5633239746094, 341.5018310546875, 366.4403076171875, 391.3788146972656, 416.3172912597656, 441.25579833984375, 466.19427490234375, 491.1327819824219, 516.0712890625, 541.009765625, 565.9483032226562, 590.8867797851562, 615.8252563476562, 640.7637329101562, 665.7022705078125, 690.6407470703125, 715.5792236328125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 13.0, 9.0, 10.0, 12.0, 15.0, 27.0, 21.0, 40.0, 33.0, 42.0, 51.0, 56.0, 71.0, 91.0, 68.0, 74.0, 58.0, 57.0, 43.0, 30.0, 30.0, 21.0, 18.0, 21.0, 10.0, 8.0, 16.0, 8.0, 10.0, 6.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-515.4827270507812, -501.5868225097656, -487.6909484863281, -473.7950439453125, -459.899169921875, -446.0032653808594, -432.10736083984375, -418.21148681640625, -404.3155822753906, -390.419677734375, -376.5238037109375, -362.6278991699219, -348.7320251464844, -334.83612060546875, -320.94024658203125, -307.0443420410156, -293.1484375, -279.2525329589844, -265.3566589355469, -251.46075439453125, -237.5648651123047, -223.66897583007812, -209.77308654785156, -195.877197265625, -181.9813232421875, -168.08543395996094, -154.18954467773438, -140.29364013671875, -126.39775085449219, -112.50186157226562, -98.60597229003906, -84.71007537841797, -70.81417846679688, -56.91828536987305, -43.02239227294922, -29.126502990722656, -15.230609893798828, -1.334716796875, 12.561172485351562, 26.457069396972656, 40.35295867919922, 54.24885177612305, 68.14474487304688, 82.04063415527344, 95.9365234375, 109.8324203491211, 123.72830963134766, 137.62420654296875, 151.5200958251953, 165.41598510742188, 179.31187438964844, 193.207763671875, 207.10366821289062, 220.9995574951172, 234.89544677734375, 248.79135131835938, 262.6872253417969, 276.5831298828125, 290.47900390625, 304.3749084472656, 318.2707824707031, 332.16668701171875, 346.06256103515625, 359.9584655761719, 373.8543701171875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 12.0, 10.0, 16.0, 13.0, 19.0, 12.0, 25.0, 23.0, 24.0, 37.0, 33.0, 34.0, 54.0, 86.0, 75.0, 89.0, 71.0, 57.0, 39.0, 33.0, 33.0, 29.0, 32.0, 19.0, 16.0, 21.0, 7.0, 8.0, 11.0, 10.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-693.020751953125, -669.9324340820312, -646.8441772460938, -623.755859375, -600.6676025390625, -577.5792846679688, -554.490966796875, -531.4027099609375, -508.31439208984375, -485.2261047363281, -462.1378173828125, -439.04949951171875, -415.9612121582031, -392.8729248046875, -369.7846374511719, -346.69635009765625, -323.6080627441406, -300.519775390625, -277.4314880371094, -254.3431854248047, -231.2548828125, -208.16659545898438, -185.07830810546875, -161.99000549316406, -138.90171813964844, -115.81342315673828, -92.72512817382812, -69.6368408203125, -46.548545837402344, -23.460250854492188, -0.3719635009765625, 22.716339111328125, 45.80462646484375, 68.8929214477539, 91.98121643066406, 115.06950378417969, 138.15780639648438, 161.24609375, 184.33438110351562, 207.4226837158203, 230.51097106933594, 253.59925842285156, 276.68756103515625, 299.7758483886719, 322.8641357421875, 345.95245361328125, 369.04071044921875, 392.1290283203125, 415.2173156738281, 438.30560302734375, 461.3938903808594, 484.482177734375, 507.57049560546875, 530.6588134765625, 553.7470703125, 576.8353881835938, 599.9236450195312, 623.011962890625, 646.1002197265625, 669.1885375976562, 692.2767944335938, 715.3651123046875, 738.453369140625, 761.5416870117188, 784.6300048828125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 8.0, 24.0, 22.0, 39.0, 60.0, 98.0, 179.0, 255.0, 418.0, 686.0, 1021.0, 1681.0, 2668.0, 4259.0, 6588.0, 11093.0, 17703.0, 28708.0, 48592.0, 82383.0, 144257.0, 263641.0, 533397.0, 1477572.0, 771378.0, 356542.0, 187770.0, 103516.0, 59946.0, 34925.0, 20818.0, 12610.0, 7751.0, 4897.0, 3123.0, 1940.0, 1291.0, 789.0, 550.0, 353.0, 229.0, 181.0, 103.0, 59.0, 48.0, 35.0, 27.0, 13.0, 9.0, 10.0, 6.0, 9.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3046875, -9.979736328125, -9.65478515625, -9.329833984375, -9.0048828125, -8.679931640625, -8.35498046875, -8.030029296875, -7.705078125, -7.380126953125, -7.05517578125, -6.730224609375, -6.4052734375, -6.080322265625, -5.75537109375, -5.430419921875, -5.10546875, -4.780517578125, -4.45556640625, -4.130615234375, -3.8056640625, -3.480712890625, -3.15576171875, -2.830810546875, -2.505859375, -2.180908203125, -1.85595703125, -1.531005859375, -1.2060546875, -0.881103515625, -0.55615234375, -0.231201171875, 0.09375, 0.418701171875, 0.74365234375, 1.068603515625, 1.3935546875, 1.718505859375, 2.04345703125, 2.368408203125, 2.693359375, 3.018310546875, 3.34326171875, 3.668212890625, 3.9931640625, 4.318115234375, 4.64306640625, 4.968017578125, 5.29296875, 5.617919921875, 5.94287109375, 6.267822265625, 6.5927734375, 6.917724609375, 7.24267578125, 7.567626953125, 7.892578125, 8.217529296875, 8.54248046875, 8.867431640625, 9.1923828125, 9.517333984375, 9.84228515625, 10.167236328125, 10.4921875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 8.0, 3.0, 3.0, 8.0, 14.0, 10.0, 11.0, 14.0, 16.0, 14.0, 19.0, 28.0, 42.0, 34.0, 31.0, 31.0, 53.0, 51.0, 57.0, 54.0, 47.0, 69.0, 35.0, 50.0, 40.0, 35.0, 34.0, 31.0, 32.0, 24.0, 21.0, 21.0, 11.0, 8.0, 10.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.99755859375, -0.9640884399414062, -0.9306182861328125, -0.8971481323242188, -0.863677978515625, -0.8302078247070312, -0.7967376708984375, -0.7632675170898438, -0.72979736328125, -0.6963272094726562, -0.6628570556640625, -0.6293869018554688, -0.595916748046875, -0.5624465942382812, -0.5289764404296875, -0.49550628662109375, -0.4620361328125, -0.42856597900390625, -0.3950958251953125, -0.36162567138671875, -0.328155517578125, -0.29468536376953125, -0.2612152099609375, -0.22774505615234375, -0.19427490234375, -0.16080474853515625, -0.1273345947265625, -0.09386444091796875, -0.060394287109375, -0.02692413330078125, 0.0065460205078125, 0.04001617431640625, 0.073486328125, 0.10695648193359375, 0.1404266357421875, 0.17389678955078125, 0.207366943359375, 0.24083709716796875, 0.2743072509765625, 0.30777740478515625, 0.34124755859375, 0.37471771240234375, 0.4081878662109375, 0.44165802001953125, 0.475128173828125, 0.5085983276367188, 0.5420684814453125, 0.5755386352539062, 0.6090087890625, 0.6424789428710938, 0.6759490966796875, 0.7094192504882812, 0.742889404296875, 0.7763595581054688, 0.8098297119140625, 0.8432998657226562, 0.87677001953125, 0.9102401733398438, 0.9437103271484375, 0.9771804809570312, 1.010650634765625, 1.0441207885742188, 1.0775909423828125, 1.1110610961914062, 1.14453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 9.0, 3.0, 7.0, 11.0, 14.0, 17.0, 18.0, 26.0, 53.0, 68.0, 95.0, 204.0, 369.0, 723.0, 1691.0, 4430.0, 12890.0, 41263.0, 156289.0, 707722.0, 2228516.0, 798413.0, 174907.0, 44778.0, 13638.0, 4714.0, 1823.0, 779.0, 345.0, 175.0, 111.0, 54.0, 34.0, 26.0, 18.0, 17.0, 12.0, 12.0, 3.0, 2.0, 6.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.1328125, -14.6947021484375, -14.256591796875, -13.8184814453125, -13.38037109375, -12.9422607421875, -12.504150390625, -12.0660400390625, -11.6279296875, -11.1898193359375, -10.751708984375, -10.3135986328125, -9.87548828125, -9.4373779296875, -8.999267578125, -8.5611572265625, -8.123046875, -7.6849365234375, -7.246826171875, -6.8087158203125, -6.37060546875, -5.9324951171875, -5.494384765625, -5.0562744140625, -4.6181640625, -4.1800537109375, -3.741943359375, -3.3038330078125, -2.86572265625, -2.4276123046875, -1.989501953125, -1.5513916015625, -1.11328125, -0.6751708984375, -0.237060546875, 0.2010498046875, 0.63916015625, 1.0772705078125, 1.515380859375, 1.9534912109375, 2.3916015625, 2.8297119140625, 3.267822265625, 3.7059326171875, 4.14404296875, 4.5821533203125, 5.020263671875, 5.4583740234375, 5.896484375, 6.3345947265625, 6.772705078125, 7.2108154296875, 7.64892578125, 8.0870361328125, 8.525146484375, 8.9632568359375, 9.4013671875, 9.8394775390625, 10.277587890625, 10.7156982421875, 11.15380859375, 11.5919189453125, 12.030029296875, 12.4681396484375, 12.90625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 11.0, 14.0, 21.0, 17.0, 32.0, 31.0, 37.0, 46.0, 74.0, 78.0, 116.0, 144.0, 173.0, 214.0, 246.0, 286.0, 387.0, 474.0, 310.0, 281.0, 223.0, 203.0, 130.0, 117.0, 99.0, 71.0, 57.0, 41.0, 40.0, 27.0, 12.0, 16.0, 10.0, 10.0, 12.0, 3.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -4.0042724609375, -3.887451171875, -3.7706298828125, -3.65380859375, -3.5369873046875, -3.420166015625, -3.3033447265625, -3.1865234375, -3.0697021484375, -2.952880859375, -2.8360595703125, -2.71923828125, -2.6024169921875, -2.485595703125, -2.3687744140625, -2.251953125, -2.1351318359375, -2.018310546875, -1.9014892578125, -1.78466796875, -1.6678466796875, -1.551025390625, -1.4342041015625, -1.3173828125, -1.2005615234375, -1.083740234375, -0.9669189453125, -0.85009765625, -0.7332763671875, -0.616455078125, -0.4996337890625, -0.3828125, -0.2659912109375, -0.149169921875, -0.0323486328125, 0.08447265625, 0.2012939453125, 0.318115234375, 0.4349365234375, 0.5517578125, 0.6685791015625, 0.785400390625, 0.9022216796875, 1.01904296875, 1.1358642578125, 1.252685546875, 1.3695068359375, 1.486328125, 1.6031494140625, 1.719970703125, 1.8367919921875, 1.95361328125, 2.0704345703125, 2.187255859375, 2.3040771484375, 2.4208984375, 2.5377197265625, 2.654541015625, 2.7713623046875, 2.88818359375, 3.0050048828125, 3.121826171875, 3.2386474609375, 3.35546875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 11.0, 5.0, 5.0, 11.0, 18.0, 24.0, 23.0, 31.0, 38.0, 53.0, 61.0, 80.0, 82.0, 92.0, 73.0, 76.0, 55.0, 68.0, 51.0, 27.0, 26.0, 21.0, 20.0, 8.0, 8.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.129074096679688, -26.11540412902832, -25.101736068725586, -24.08806610107422, -23.074398040771484, -22.060728073120117, -21.04705810546875, -20.033390045166016, -19.01972198486328, -18.006052017211914, -16.99238395690918, -15.978713989257812, -14.965045928955078, -13.951375961303711, -12.93770694732666, -11.92403793334961, -10.910367965698242, -9.896698951721191, -8.88302993774414, -7.869360446929932, -6.855691432952881, -5.84202241897583, -4.828352928161621, -3.8146839141845703, -2.8010149002075195, -1.7873457670211792, -0.7736766338348389, 0.23999261856079102, 1.2536616325378418, 2.2673306465148926, 3.2810001373291016, 4.294669151306152, 5.308338165283203, 6.322007179260254, 7.335676193237305, 8.349346160888672, 9.363014221191406, 10.376684188842773, 11.390353202819824, 12.404022216796875, 13.417691230773926, 14.431360244750977, 15.445029258728027, 16.458698272705078, 17.472368240356445, 18.48603630065918, 19.499706268310547, 20.51337432861328, 21.52704429626465, 22.540714263916016, 23.55438232421875, 24.568052291870117, 25.58172035217285, 26.59539031982422, 27.609058380126953, 28.62272834777832, 29.636398315429688, 30.650068283081055, 31.66373634338379, 32.677406311035156, 33.69107437133789, 34.704742431640625, 35.718414306640625, 36.73208236694336, 37.745750427246094]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 1.0, 5.0, 5.0, 11.0, 8.0, 9.0, 16.0, 13.0, 20.0, 22.0, 34.0, 34.0, 40.0, 37.0, 35.0, 38.0, 48.0, 56.0, 47.0, 50.0, 50.0, 45.0, 30.0, 44.0, 43.0, 31.0, 32.0, 42.0, 35.0, 18.0, 18.0, 23.0, 10.0, 13.0, 10.0, 8.0, 6.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.053157806396484, -28.218116760253906, -27.383075714111328, -26.54803466796875, -25.712993621826172, -24.877952575683594, -24.042911529541016, -23.207868576049805, -22.372827529907227, -21.53778648376465, -20.70274543762207, -19.867704391479492, -19.032663345336914, -18.197620391845703, -17.362579345703125, -16.527538299560547, -15.692498207092285, -14.857457160949707, -14.022416114807129, -13.187374114990234, -12.352333068847656, -11.517292022705078, -10.6822509765625, -9.847209930419922, -9.012168884277344, -8.177127838134766, -7.342086315155029, -6.507045269012451, -5.672003746032715, -4.836962699890137, -4.001921653747559, -3.1668801307678223, -2.331838607788086, -1.4967973232269287, -0.661756157875061, 0.17328500747680664, 1.0083262920379639, 1.843367576599121, 2.678408622741699, 3.5134501457214355, 4.348491191864014, 5.183532238006592, 6.018573760986328, 6.853614807128906, 7.688655853271484, 8.523696899414062, 9.35873794555664, 10.193779945373535, 11.028820991516113, 11.863862037658691, 12.69890308380127, 13.533945083618164, 14.368986129760742, 15.20402717590332, 16.0390682220459, 16.874109268188477, 17.709150314331055, 18.544191360473633, 19.37923240661621, 20.21427345275879, 21.049314498901367, 21.884357452392578, 22.719398498535156, 23.554439544677734, 24.389480590820312]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 2.0, 11.0, 10.0, 15.0, 30.0, 31.0, 34.0, 65.0, 85.0, 147.0, 275.0, 448.0, 625.0, 1055.0, 1832.0, 3102.0, 5030.0, 8501.0, 14493.0, 25984.0, 48620.0, 102034.0, 232388.0, 306626.0, 149003.0, 67990.0, 34549.0, 18778.0, 10663.0, 6320.0, 3752.0, 2350.0, 1418.0, 860.0, 544.0, 316.0, 213.0, 131.0, 78.0, 40.0, 31.0, 38.0, 14.0, 7.0, 9.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-8.1953125, -7.9691162109375, -7.742919921875, -7.5167236328125, -7.29052734375, -7.0643310546875, -6.838134765625, -6.6119384765625, -6.3857421875, -6.1595458984375, -5.933349609375, -5.7071533203125, -5.48095703125, -5.2547607421875, -5.028564453125, -4.8023681640625, -4.576171875, -4.3499755859375, -4.123779296875, -3.8975830078125, -3.67138671875, -3.4451904296875, -3.218994140625, -2.9927978515625, -2.7666015625, -2.5404052734375, -2.314208984375, -2.0880126953125, -1.86181640625, -1.6356201171875, -1.409423828125, -1.1832275390625, -0.95703125, -0.7308349609375, -0.504638671875, -0.2784423828125, -0.05224609375, 0.1739501953125, 0.400146484375, 0.6263427734375, 0.8525390625, 1.0787353515625, 1.304931640625, 1.5311279296875, 1.75732421875, 1.9835205078125, 2.209716796875, 2.4359130859375, 2.662109375, 2.8883056640625, 3.114501953125, 3.3406982421875, 3.56689453125, 3.7930908203125, 4.019287109375, 4.2454833984375, 4.4716796875, 4.6978759765625, 4.924072265625, 5.1502685546875, 5.37646484375, 5.6026611328125, 5.828857421875, 6.0550537109375, 6.28125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 4.0, 3.0, 8.0, 13.0, 21.0, 20.0, 11.0, 20.0, 25.0, 29.0, 28.0, 32.0, 45.0, 55.0, 59.0, 60.0, 50.0, 44.0, 57.0, 47.0, 44.0, 75.0, 40.0, 37.0, 32.0, 21.0, 28.0, 23.0, 13.0, 15.0, 11.0, 12.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.39453125, -1.348419189453125, -1.30230712890625, -1.256195068359375, -1.2100830078125, -1.163970947265625, -1.11785888671875, -1.071746826171875, -1.025634765625, -0.979522705078125, -0.93341064453125, -0.887298583984375, -0.8411865234375, -0.795074462890625, -0.74896240234375, -0.702850341796875, -0.65673828125, -0.610626220703125, -0.56451416015625, -0.518402099609375, -0.4722900390625, -0.426177978515625, -0.38006591796875, -0.333953857421875, -0.287841796875, -0.241729736328125, -0.19561767578125, -0.149505615234375, -0.1033935546875, -0.057281494140625, -0.01116943359375, 0.034942626953125, 0.0810546875, 0.127166748046875, 0.17327880859375, 0.219390869140625, 0.2655029296875, 0.311614990234375, 0.35772705078125, 0.403839111328125, 0.449951171875, 0.496063232421875, 0.54217529296875, 0.588287353515625, 0.6343994140625, 0.680511474609375, 0.72662353515625, 0.772735595703125, 0.81884765625, 0.864959716796875, 0.91107177734375, 0.957183837890625, 1.0032958984375, 1.049407958984375, 1.09552001953125, 1.141632080078125, 1.187744140625, 1.233856201171875, 1.27996826171875, 1.326080322265625, 1.3721923828125, 1.418304443359375, 1.46441650390625, 1.510528564453125, 1.556640625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 3.0, 8.0, 6.0, 13.0, 19.0, 15.0, 28.0, 46.0, 66.0, 90.0, 145.0, 239.0, 414.0, 726.0, 1380.0, 2804.0, 6278.0, 15182.0, 42691.0, 152937.0, 536633.0, 203307.0, 53112.0, 18230.0, 7182.0, 3348.0, 1573.0, 825.0, 473.0, 276.0, 167.0, 108.0, 71.0, 46.0, 34.0, 24.0, 16.0, 12.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.54296875, -7.25933837890625, -6.9757080078125, -6.69207763671875, -6.408447265625, -6.12481689453125, -5.8411865234375, -5.55755615234375, -5.27392578125, -4.99029541015625, -4.7066650390625, -4.42303466796875, -4.139404296875, -3.85577392578125, -3.5721435546875, -3.28851318359375, -3.0048828125, -2.72125244140625, -2.4376220703125, -2.15399169921875, -1.870361328125, -1.58673095703125, -1.3031005859375, -1.01947021484375, -0.73583984375, -0.45220947265625, -0.1685791015625, 0.11505126953125, 0.398681640625, 0.68231201171875, 0.9659423828125, 1.24957275390625, 1.533203125, 1.81683349609375, 2.1004638671875, 2.38409423828125, 2.667724609375, 2.95135498046875, 3.2349853515625, 3.51861572265625, 3.80224609375, 4.08587646484375, 4.3695068359375, 4.65313720703125, 4.936767578125, 5.22039794921875, 5.5040283203125, 5.78765869140625, 6.0712890625, 6.35491943359375, 6.6385498046875, 6.92218017578125, 7.205810546875, 7.48944091796875, 7.7730712890625, 8.05670166015625, 8.34033203125, 8.62396240234375, 8.9075927734375, 9.19122314453125, 9.474853515625, 9.75848388671875, 10.0421142578125, 10.32574462890625, 10.609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 6.0, 6.0, 6.0, 9.0, 10.0, 12.0, 10.0, 19.0, 23.0, 16.0, 27.0, 28.0, 26.0, 42.0, 34.0, 33.0, 34.0, 42.0, 32.0, 34.0, 42.0, 42.0, 24.0, 40.0, 41.0, 34.0, 43.0, 32.0, 23.0, 36.0, 28.0, 24.0, 12.0, 18.0, 19.0, 11.0, 14.0, 15.0, 5.0, 7.0, 4.0, 11.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.93359375, -5.74249267578125, -5.5513916015625, -5.36029052734375, -5.169189453125, -4.97808837890625, -4.7869873046875, -4.59588623046875, -4.40478515625, -4.21368408203125, -4.0225830078125, -3.83148193359375, -3.640380859375, -3.44927978515625, -3.2581787109375, -3.06707763671875, -2.8759765625, -2.68487548828125, -2.4937744140625, -2.30267333984375, -2.111572265625, -1.92047119140625, -1.7293701171875, -1.53826904296875, -1.34716796875, -1.15606689453125, -0.9649658203125, -0.77386474609375, -0.582763671875, -0.39166259765625, -0.2005615234375, -0.00946044921875, 0.181640625, 0.37274169921875, 0.5638427734375, 0.75494384765625, 0.946044921875, 1.13714599609375, 1.3282470703125, 1.51934814453125, 1.71044921875, 1.90155029296875, 2.0926513671875, 2.28375244140625, 2.474853515625, 2.66595458984375, 2.8570556640625, 3.04815673828125, 3.2392578125, 3.43035888671875, 3.6214599609375, 3.81256103515625, 4.003662109375, 4.19476318359375, 4.3858642578125, 4.57696533203125, 4.76806640625, 4.95916748046875, 5.1502685546875, 5.34136962890625, 5.532470703125, 5.72357177734375, 5.9146728515625, 6.10577392578125, 6.296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 3.0, 4.0, 9.0, 6.0, 6.0, 12.0, 23.0, 32.0, 57.0, 78.0, 118.0, 228.0, 405.0, 797.0, 1804.0, 5222.0, 21943.0, 342291.0, 632683.0, 32172.0, 6457.0, 2125.0, 971.0, 449.0, 260.0, 141.0, 73.0, 55.0, 34.0, 31.0, 17.0, 14.0, 4.0, 12.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.296875, -15.73681640625, -15.1767578125, -14.61669921875, -14.056640625, -13.49658203125, -12.9365234375, -12.37646484375, -11.81640625, -11.25634765625, -10.6962890625, -10.13623046875, -9.576171875, -9.01611328125, -8.4560546875, -7.89599609375, -7.3359375, -6.77587890625, -6.2158203125, -5.65576171875, -5.095703125, -4.53564453125, -3.9755859375, -3.41552734375, -2.85546875, -2.29541015625, -1.7353515625, -1.17529296875, -0.615234375, -0.05517578125, 0.5048828125, 1.06494140625, 1.625, 2.18505859375, 2.7451171875, 3.30517578125, 3.865234375, 4.42529296875, 4.9853515625, 5.54541015625, 6.10546875, 6.66552734375, 7.2255859375, 7.78564453125, 8.345703125, 8.90576171875, 9.4658203125, 10.02587890625, 10.5859375, 11.14599609375, 11.7060546875, 12.26611328125, 12.826171875, 13.38623046875, 13.9462890625, 14.50634765625, 15.06640625, 15.62646484375, 16.1865234375, 16.74658203125, 17.306640625, 17.86669921875, 18.4267578125, 18.98681640625, 19.546875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 8.0, 8.0, 7.0, 17.0, 32.0, 42.0, 61.0, 87.0, 143.0, 144.0, 128.0, 107.0, 72.0, 45.0, 36.0, 23.0, 20.0, 7.0, 5.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007219314575195312, -0.0007022097706794739, -0.0006824880838394165, -0.0006627663969993591, -0.0006430447101593018, -0.0006233230233192444, -0.000603601336479187, -0.0005838796496391296, -0.0005641579627990723, -0.0005444362759590149, -0.0005247145891189575, -0.0005049929022789001, -0.0004852712154388428, -0.0004655495285987854, -0.00044582784175872803, -0.00042610615491867065, -0.0004063844680786133, -0.0003866627812385559, -0.00036694109439849854, -0.00034721940755844116, -0.0003274977207183838, -0.0003077760338783264, -0.00028805434703826904, -0.00026833266019821167, -0.0002486109733581543, -0.00022888928651809692, -0.00020916759967803955, -0.00018944591283798218, -0.0001697242259979248, -0.00015000253915786743, -0.00013028085231781006, -0.00011055916547775269, -9.083747863769531e-05, -7.111579179763794e-05, -5.1394104957580566e-05, -3.167241811752319e-05, -1.195073127746582e-05, 7.770955562591553e-06, 2.7492642402648926e-05, 4.72143292427063e-05, 6.693601608276367e-05, 8.665770292282104e-05, 0.00010637938976287842, 0.0001261010766029358, 0.00014582276344299316, 0.00016554445028305054, 0.0001852661371231079, 0.00020498782396316528, 0.00022470951080322266, 0.00024443119764328003, 0.0002641528844833374, 0.0002838745713233948, 0.00030359625816345215, 0.0003233179450035095, 0.0003430396318435669, 0.00036276131868362427, 0.00038248300552368164, 0.000402204692363739, 0.0004219263792037964, 0.00044164806604385376, 0.00046136975288391113, 0.0004810914397239685, 0.0005008131265640259, 0.0005205348134040833, 0.0005402565002441406]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 8.0, 11.0, 17.0, 20.0, 46.0, 70.0, 105.0, 156.0, 292.0, 544.0, 1010.0, 2167.0, 4860.0, 12847.0, 43382.0, 217307.0, 573739.0, 142609.0, 31684.0, 10003.0, 3897.0, 1797.0, 858.0, 501.0, 254.0, 141.0, 76.0, 48.0, 34.0, 31.0, 17.0, 12.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4375, -10.1339111328125, -9.830322265625, -9.5267333984375, -9.22314453125, -8.9195556640625, -8.615966796875, -8.3123779296875, -8.0087890625, -7.7052001953125, -7.401611328125, -7.0980224609375, -6.79443359375, -6.4908447265625, -6.187255859375, -5.8836669921875, -5.580078125, -5.2764892578125, -4.972900390625, -4.6693115234375, -4.36572265625, -4.0621337890625, -3.758544921875, -3.4549560546875, -3.1513671875, -2.8477783203125, -2.544189453125, -2.2406005859375, -1.93701171875, -1.6334228515625, -1.329833984375, -1.0262451171875, -0.72265625, -0.4190673828125, -0.115478515625, 0.1881103515625, 0.49169921875, 0.7952880859375, 1.098876953125, 1.4024658203125, 1.7060546875, 2.0096435546875, 2.313232421875, 2.6168212890625, 2.92041015625, 3.2239990234375, 3.527587890625, 3.8311767578125, 4.134765625, 4.4383544921875, 4.741943359375, 5.0455322265625, 5.34912109375, 5.6527099609375, 5.956298828125, 6.2598876953125, 6.5634765625, 6.8670654296875, 7.170654296875, 7.4742431640625, 7.77783203125, 8.0814208984375, 8.385009765625, 8.6885986328125, 8.9921875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 9.0, 11.0, 10.0, 22.0, 11.0, 31.0, 29.0, 39.0, 38.0, 49.0, 43.0, 72.0, 75.0, 82.0, 68.0, 71.0, 66.0, 55.0, 48.0, 32.0, 31.0, 15.0, 22.0, 16.0, 8.0, 8.0, 9.0, 8.0, 1.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.24725341796875, -4.0804443359375, -3.91363525390625, -3.746826171875, -3.58001708984375, -3.4132080078125, -3.24639892578125, -3.07958984375, -2.91278076171875, -2.7459716796875, -2.57916259765625, -2.412353515625, -2.24554443359375, -2.0787353515625, -1.91192626953125, -1.7451171875, -1.57830810546875, -1.4114990234375, -1.24468994140625, -1.077880859375, -0.91107177734375, -0.7442626953125, -0.57745361328125, -0.41064453125, -0.24383544921875, -0.0770263671875, 0.08978271484375, 0.256591796875, 0.42340087890625, 0.5902099609375, 0.75701904296875, 0.923828125, 1.09063720703125, 1.2574462890625, 1.42425537109375, 1.591064453125, 1.75787353515625, 1.9246826171875, 2.09149169921875, 2.25830078125, 2.42510986328125, 2.5919189453125, 2.75872802734375, 2.925537109375, 3.09234619140625, 3.2591552734375, 3.42596435546875, 3.5927734375, 3.75958251953125, 3.9263916015625, 4.09320068359375, 4.260009765625, 4.42681884765625, 4.5936279296875, 4.76043701171875, 4.92724609375, 5.09405517578125, 5.2608642578125, 5.42767333984375, 5.594482421875, 5.76129150390625, 5.9281005859375, 6.09490966796875, 6.26171875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 9.0, 12.0, 15.0, 13.0, 34.0, 54.0, 113.0, 203.0, 228.0, 143.0, 65.0, 48.0, 22.0, 16.0, 6.0, 8.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.15704345703125, -149.9176025390625, -146.67816162109375, -143.438720703125, -140.19927978515625, -136.9598388671875, -133.7203826904297, -130.48094177246094, -127.24150085449219, -124.00205993652344, -120.76261901855469, -117.5231704711914, -114.28372955322266, -111.0442886352539, -107.80484771728516, -104.56539916992188, -101.32595825195312, -98.08651733398438, -94.84707641601562, -91.60762786865234, -88.3681869506836, -85.12874603271484, -81.8893051147461, -78.64985656738281, -75.4104232788086, -72.17098236083984, -68.9315414428711, -65.69209289550781, -62.45265197753906, -59.21321105957031, -55.97377014160156, -52.73432540893555, -49.4948844909668, -46.25544357299805, -43.01599884033203, -39.77655792236328, -36.537113189697266, -33.297672271728516, -30.058229446411133, -26.81878662109375, -23.579343795776367, -20.339900970458984, -17.1004581451416, -13.861016273498535, -10.621573448181152, -7.382131576538086, -4.142688751220703, -0.9032459259033203, 2.3361968994140625, 5.575639724731445, 8.815082550048828, 12.054524421691895, 15.293967247009277, 18.533409118652344, 21.772851943969727, 25.01229476928711, 28.251737594604492, 31.491180419921875, 34.730621337890625, 37.97006607055664, 41.20950698852539, 44.448951721191406, 47.688392639160156, 50.927833557128906, 54.16727828979492]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 8.0, 10.0, 8.0, 13.0, 43.0, 86.0, 90.0, 128.0, 167.0, 136.0, 109.0, 67.0, 44.0, 27.0, 17.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-193.52972412109375, -188.77713012695312, -184.0245361328125, -179.27194213867188, -174.51934814453125, -169.76675415039062, -165.01416015625, -160.26156616210938, -155.50897216796875, -150.75637817382812, -146.0037841796875, -141.25119018554688, -136.49859619140625, -131.74600219726562, -126.99340057373047, -122.24080657958984, -117.48820495605469, -112.73561096191406, -107.98301696777344, -103.23042297363281, -98.47782897949219, -93.72523498535156, -88.9726333618164, -84.22003936767578, -79.46744537353516, -74.71485137939453, -69.9622573852539, -65.20966339111328, -60.45706558227539, -55.704471588134766, -50.951873779296875, -46.19927978515625, -41.446693420410156, -36.69409942626953, -31.941503524780273, -27.188907623291016, -22.43631362915039, -17.683719635009766, -12.931123733520508, -8.17852783203125, -3.425933837890625, 1.3266611099243164, 6.079256057739258, 10.8318510055542, 15.58444595336914, 20.337039947509766, 25.089635848999023, 29.84223175048828, 34.594825744628906, 39.34741973876953, 44.100013732910156, 48.85261154174805, 53.60520553588867, 58.3577995300293, 63.11039733886719, 67.86299133300781, 72.61558532714844, 77.36817932128906, 82.12077331542969, 86.87336730957031, 91.62596130371094, 96.37855529785156, 101.13115692138672, 105.88375091552734, 110.63634490966797]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 2.0, 7.0, 3.0, 9.0, 13.0, 18.0, 28.0, 35.0, 49.0, 70.0, 115.0, 172.0, 363.0, 758.0, 1585.0, 3460.0, 7893.0, 19224.0, 56255.0, 227910.0, 3425098.0, 337482.0, 72969.0, 24202.0, 9249.0, 3960.0, 1755.0, 797.0, 381.0, 180.0, 101.0, 56.0, 34.0, 10.0, 14.0, 10.0, 6.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.625, -42.5234375, -41.421875, -40.3203125, -39.21875, -38.1171875, -37.015625, -35.9140625, -34.8125, -33.7109375, -32.609375, -31.5078125, -30.40625, -29.3046875, -28.203125, -27.1015625, -26.0, -24.8984375, -23.796875, -22.6953125, -21.59375, -20.4921875, -19.390625, -18.2890625, -17.1875, -16.0859375, -14.984375, -13.8828125, -12.78125, -11.6796875, -10.578125, -9.4765625, -8.375, -7.2734375, -6.171875, -5.0703125, -3.96875, -2.8671875, -1.765625, -0.6640625, 0.4375, 1.5390625, 2.640625, 3.7421875, 4.84375, 5.9453125, 7.046875, 8.1484375, 9.25, 10.3515625, 11.453125, 12.5546875, 13.65625, 14.7578125, 15.859375, 16.9609375, 18.0625, 19.1640625, 20.265625, 21.3671875, 22.46875, 23.5703125, 24.671875, 25.7734375, 26.875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 9.0, 15.0, 18.0, 23.0, 30.0, 30.0, 37.0, 56.0, 74.0, 80.0, 74.0, 67.0, 67.0, 69.0, 68.0, 54.0, 55.0, 36.0, 35.0, 21.0, 14.0, 19.0, 6.0, 5.0, 5.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.708984375, -2.6436767578125, -2.578369140625, -2.5130615234375, -2.44775390625, -2.3824462890625, -2.317138671875, -2.2518310546875, -2.1865234375, -2.1212158203125, -2.055908203125, -1.9906005859375, -1.92529296875, -1.8599853515625, -1.794677734375, -1.7293701171875, -1.6640625, -1.5987548828125, -1.533447265625, -1.4681396484375, -1.40283203125, -1.3375244140625, -1.272216796875, -1.2069091796875, -1.1416015625, -1.0762939453125, -1.010986328125, -0.9456787109375, -0.88037109375, -0.8150634765625, -0.749755859375, -0.6844482421875, -0.619140625, -0.5538330078125, -0.488525390625, -0.4232177734375, -0.35791015625, -0.2926025390625, -0.227294921875, -0.1619873046875, -0.0966796875, -0.0313720703125, 0.033935546875, 0.0992431640625, 0.16455078125, 0.2298583984375, 0.295166015625, 0.3604736328125, 0.42578125, 0.4910888671875, 0.556396484375, 0.6217041015625, 0.68701171875, 0.7523193359375, 0.817626953125, 0.8829345703125, 0.9482421875, 1.0135498046875, 1.078857421875, 1.1441650390625, 1.20947265625, 1.2747802734375, 1.340087890625, 1.4053955078125, 1.470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 5.0, 9.0, 13.0, 17.0, 28.0, 54.0, 51.0, 80.0, 144.0, 193.0, 338.0, 506.0, 852.0, 1231.0, 2178.0, 3849.0, 7004.0, 14045.0, 29196.0, 67946.0, 186606.0, 732713.0, 2670402.0, 298521.0, 99016.0, 40082.0, 18553.0, 9098.0, 4830.0, 2529.0, 1564.0, 977.0, 607.0, 350.0, 259.0, 151.0, 81.0, 64.0, 49.0, 25.0, 21.0, 17.0, 12.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.6875, -20.044921875, -19.40234375, -18.759765625, -18.1171875, -17.474609375, -16.83203125, -16.189453125, -15.546875, -14.904296875, -14.26171875, -13.619140625, -12.9765625, -12.333984375, -11.69140625, -11.048828125, -10.40625, -9.763671875, -9.12109375, -8.478515625, -7.8359375, -7.193359375, -6.55078125, -5.908203125, -5.265625, -4.623046875, -3.98046875, -3.337890625, -2.6953125, -2.052734375, -1.41015625, -0.767578125, -0.125, 0.517578125, 1.16015625, 1.802734375, 2.4453125, 3.087890625, 3.73046875, 4.373046875, 5.015625, 5.658203125, 6.30078125, 6.943359375, 7.5859375, 8.228515625, 8.87109375, 9.513671875, 10.15625, 10.798828125, 11.44140625, 12.083984375, 12.7265625, 13.369140625, 14.01171875, 14.654296875, 15.296875, 15.939453125, 16.58203125, 17.224609375, 17.8671875, 18.509765625, 19.15234375, 19.794921875, 20.4375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 15.0, 11.0, 14.0, 16.0, 24.0, 34.0, 28.0, 54.0, 60.0, 78.0, 126.0, 175.0, 286.0, 1156.0, 1001.0, 279.0, 206.0, 113.0, 86.0, 59.0, 54.0, 43.0, 32.0, 35.0, 24.0, 16.0, 3.0, 9.0, 3.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.828125, -4.68609619140625, -4.5440673828125, -4.40203857421875, -4.260009765625, -4.11798095703125, -3.9759521484375, -3.83392333984375, -3.69189453125, -3.54986572265625, -3.4078369140625, -3.26580810546875, -3.123779296875, -2.98175048828125, -2.8397216796875, -2.69769287109375, -2.5556640625, -2.41363525390625, -2.2716064453125, -2.12957763671875, -1.987548828125, -1.84552001953125, -1.7034912109375, -1.56146240234375, -1.41943359375, -1.27740478515625, -1.1353759765625, -0.99334716796875, -0.851318359375, -0.70928955078125, -0.5672607421875, -0.42523193359375, -0.283203125, -0.14117431640625, 0.0008544921875, 0.14288330078125, 0.284912109375, 0.42694091796875, 0.5689697265625, 0.71099853515625, 0.85302734375, 0.99505615234375, 1.1370849609375, 1.27911376953125, 1.421142578125, 1.56317138671875, 1.7052001953125, 1.84722900390625, 1.9892578125, 2.13128662109375, 2.2733154296875, 2.41534423828125, 2.557373046875, 2.69940185546875, 2.8414306640625, 2.98345947265625, 3.12548828125, 3.26751708984375, 3.4095458984375, 3.55157470703125, 3.693603515625, 3.83563232421875, 3.9776611328125, 4.11968994140625, 4.26171875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 16.0, 37.0, 125.0, 273.0, 250.0, 169.0, 67.0, 33.0, 12.0, 10.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.41628646850586, -23.110261917114258, -20.804237365722656, -18.498210906982422, -16.192188262939453, -13.886162757873535, -11.580137252807617, -9.274112701416016, -6.968088150024414, -4.6620635986328125, -2.3560385704040527, -0.05001354217529297, 2.2560110092163086, 4.56203556060791, 6.868061065673828, 9.17408561706543, 11.480110168457031, 13.786134719848633, 16.092159271240234, 18.39818572998047, 20.704208374023438, 23.010234832763672, 25.316259384155273, 27.622283935546875, 29.928308486938477, 32.23433303833008, 34.54035949707031, 36.84638214111328, 39.152408599853516, 41.458431243896484, 43.76445770263672, 46.07048034667969, 48.376502990722656, 50.68252944946289, 52.98855209350586, 55.294578552246094, 57.60060119628906, 59.9066276550293, 62.21265411376953, 64.5186767578125, 66.82469940185547, 69.13072204589844, 71.43675231933594, 73.7427749633789, 76.04879760742188, 78.35482025146484, 80.66085052490234, 82.96687316894531, 85.27290344238281, 87.57892608642578, 89.88495635986328, 92.19097900390625, 94.49700164794922, 96.80302429199219, 99.10905456542969, 101.41507720947266, 103.72109985351562, 106.0271224975586, 108.3331527709961, 110.63917541503906, 112.94519805908203, 115.251220703125, 117.5572509765625, 119.86327362060547, 122.16929626464844]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 11.0, 6.0, 7.0, 11.0, 20.0, 10.0, 25.0, 20.0, 27.0, 27.0, 27.0, 43.0, 28.0, 41.0, 46.0, 55.0, 52.0, 57.0, 44.0, 44.0, 51.0, 54.0, 51.0, 30.0, 34.0, 33.0, 34.0, 25.0, 13.0, 14.0, 12.0, 14.0, 8.0, 2.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-21.712379455566406, -21.021015167236328, -20.329652786254883, -19.638288497924805, -18.94692611694336, -18.25556182861328, -17.564197540283203, -16.872833251953125, -16.18147087097168, -15.490107536315918, -14.798744201660156, -14.107379913330078, -13.416016578674316, -12.724653244018555, -12.033288955688477, -11.341925621032715, -10.650562286376953, -9.959198951721191, -9.26783561706543, -8.576471328735352, -7.88510799407959, -7.193744659423828, -6.502380847930908, -5.811017036437988, -5.119653701782227, -4.428290367126465, -3.736926555633545, -3.045562982559204, -2.3541994094848633, -1.6628358364105225, -0.9714722633361816, -0.2801084518432617, 0.4112548828125, 1.1026184558868408, 1.7939820289611816, 2.4853456020355225, 3.1767091751098633, 3.868072748184204, 4.559436321258545, 5.250800132751465, 5.942163467407227, 6.633526802062988, 7.324890613555908, 8.016254425048828, 8.70761775970459, 9.398981094360352, 10.09034538269043, 10.781708717346191, 11.473072052001953, 12.164435386657715, 12.855798721313477, 13.547163009643555, 14.238526344299316, 14.929889678955078, 15.621253967285156, 16.312618255615234, 17.00398063659668, 17.695344924926758, 18.386707305908203, 19.07807159423828, 19.76943588256836, 20.460798263549805, 21.152162551879883, 21.843524932861328, 22.534889221191406]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 6.0, 6.0, 16.0, 26.0, 27.0, 38.0, 72.0, 120.0, 179.0, 290.0, 400.0, 605.0, 992.0, 1531.0, 2453.0, 4067.0, 7288.0, 14040.0, 30030.0, 76133.0, 286752.0, 441064.0, 105337.0, 38389.0, 17233.0, 8677.0, 4931.0, 2865.0, 1729.0, 1162.0, 737.0, 464.0, 328.0, 182.0, 135.0, 82.0, 60.0, 28.0, 20.0, 15.0, 11.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0], "bins": [-23.25, -22.6405029296875, -22.031005859375, -21.4215087890625, -20.81201171875, -20.2025146484375, -19.593017578125, -18.9835205078125, -18.3740234375, -17.7645263671875, -17.155029296875, -16.5455322265625, -15.93603515625, -15.3265380859375, -14.717041015625, -14.1075439453125, -13.498046875, -12.8885498046875, -12.279052734375, -11.6695556640625, -11.06005859375, -10.4505615234375, -9.841064453125, -9.2315673828125, -8.6220703125, -8.0125732421875, -7.403076171875, -6.7935791015625, -6.18408203125, -5.5745849609375, -4.965087890625, -4.3555908203125, -3.74609375, -3.1365966796875, -2.527099609375, -1.9176025390625, -1.30810546875, -0.6986083984375, -0.089111328125, 0.5203857421875, 1.1298828125, 1.7393798828125, 2.348876953125, 2.9583740234375, 3.56787109375, 4.1773681640625, 4.786865234375, 5.3963623046875, 6.005859375, 6.6153564453125, 7.224853515625, 7.8343505859375, 8.44384765625, 9.0533447265625, 9.662841796875, 10.2723388671875, 10.8818359375, 11.4913330078125, 12.100830078125, 12.7103271484375, 13.31982421875, 13.9293212890625, 14.538818359375, 15.1483154296875, 15.7578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 3.0, 5.0, 7.0, 5.0, 7.0, 10.0, 12.0, 10.0, 10.0, 21.0, 20.0, 15.0, 16.0, 27.0, 23.0, 34.0, 39.0, 38.0, 47.0, 48.0, 49.0, 53.0, 46.0, 35.0, 37.0, 43.0, 37.0, 46.0, 37.0, 25.0, 30.0, 32.0, 23.0, 14.0, 19.0, 11.0, 6.0, 13.0, 7.0, 13.0, 3.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.296875, -1.254852294921875, -1.21282958984375, -1.170806884765625, -1.1287841796875, -1.086761474609375, -1.04473876953125, -1.002716064453125, -0.960693359375, -0.918670654296875, -0.87664794921875, -0.834625244140625, -0.7926025390625, -0.750579833984375, -0.70855712890625, -0.666534423828125, -0.62451171875, -0.582489013671875, -0.54046630859375, -0.498443603515625, -0.4564208984375, -0.414398193359375, -0.37237548828125, -0.330352783203125, -0.288330078125, -0.246307373046875, -0.20428466796875, -0.162261962890625, -0.1202392578125, -0.078216552734375, -0.03619384765625, 0.005828857421875, 0.0478515625, 0.089874267578125, 0.13189697265625, 0.173919677734375, 0.2159423828125, 0.257965087890625, 0.29998779296875, 0.342010498046875, 0.384033203125, 0.426055908203125, 0.46807861328125, 0.510101318359375, 0.5521240234375, 0.594146728515625, 0.63616943359375, 0.678192138671875, 0.72021484375, 0.762237548828125, 0.80426025390625, 0.846282958984375, 0.8883056640625, 0.930328369140625, 0.97235107421875, 1.014373779296875, 1.056396484375, 1.098419189453125, 1.14044189453125, 1.182464599609375, 1.2244873046875, 1.266510009765625, 1.30853271484375, 1.350555419921875, 1.392578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 6.0, 1.0, 4.0, 5.0, 1.0, 12.0, 9.0, 9.0, 13.0, 16.0, 94.0, 523.0, 16315.0, 1022282.0, 8688.0, 396.0, 74.0, 25.0, 15.0, 10.0, 15.0, 4.0, 6.0, 5.0, 4.0, 4.0, 6.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.3125, -101.6083984375, -97.904296875, -94.2001953125, -90.49609375, -86.7919921875, -83.087890625, -79.3837890625, -75.6796875, -71.9755859375, -68.271484375, -64.5673828125, -60.86328125, -57.1591796875, -53.455078125, -49.7509765625, -46.046875, -42.3427734375, -38.638671875, -34.9345703125, -31.23046875, -27.5263671875, -23.822265625, -20.1181640625, -16.4140625, -12.7099609375, -9.005859375, -5.3017578125, -1.59765625, 2.1064453125, 5.810546875, 9.5146484375, 13.21875, 16.9228515625, 20.626953125, 24.3310546875, 28.03515625, 31.7392578125, 35.443359375, 39.1474609375, 42.8515625, 46.5556640625, 50.259765625, 53.9638671875, 57.66796875, 61.3720703125, 65.076171875, 68.7802734375, 72.484375, 76.1884765625, 79.892578125, 83.5966796875, 87.30078125, 91.0048828125, 94.708984375, 98.4130859375, 102.1171875, 105.8212890625, 109.525390625, 113.2294921875, 116.93359375, 120.6376953125, 124.341796875, 128.0458984375, 131.75]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 10.0, 10.0, 18.0, 16.0, 22.0, 15.0, 26.0, 26.0, 32.0, 43.0, 32.0, 42.0, 49.0, 47.0, 48.0, 53.0, 51.0, 42.0, 60.0, 36.0, 35.0, 43.0, 32.0, 29.0, 26.0, 28.0, 18.0, 17.0, 18.0, 10.0, 14.0, 3.0, 6.0, 1.0, 5.0, 3.0, 1.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.84375, -6.606689453125, -6.36962890625, -6.132568359375, -5.8955078125, -5.658447265625, -5.42138671875, -5.184326171875, -4.947265625, -4.710205078125, -4.47314453125, -4.236083984375, -3.9990234375, -3.761962890625, -3.52490234375, -3.287841796875, -3.05078125, -2.813720703125, -2.57666015625, -2.339599609375, -2.1025390625, -1.865478515625, -1.62841796875, -1.391357421875, -1.154296875, -0.917236328125, -0.68017578125, -0.443115234375, -0.2060546875, 0.031005859375, 0.26806640625, 0.505126953125, 0.7421875, 0.979248046875, 1.21630859375, 1.453369140625, 1.6904296875, 1.927490234375, 2.16455078125, 2.401611328125, 2.638671875, 2.875732421875, 3.11279296875, 3.349853515625, 3.5869140625, 3.823974609375, 4.06103515625, 4.298095703125, 4.53515625, 4.772216796875, 5.00927734375, 5.246337890625, 5.4833984375, 5.720458984375, 5.95751953125, 6.194580078125, 6.431640625, 6.668701171875, 6.90576171875, 7.142822265625, 7.3798828125, 7.616943359375, 7.85400390625, 8.091064453125, 8.328125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 7.0, 8.0, 14.0, 10.0, 22.0, 51.0, 236.0, 4229.0, 1040773.0, 2883.0, 200.0, 43.0, 14.0, 15.0, 7.0, 14.0, 3.0, 4.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.375, -170.583984375, -164.79296875, -159.001953125, -153.2109375, -147.419921875, -141.62890625, -135.837890625, -130.046875, -124.255859375, -118.46484375, -112.673828125, -106.8828125, -101.091796875, -95.30078125, -89.509765625, -83.71875, -77.927734375, -72.13671875, -66.345703125, -60.5546875, -54.763671875, -48.97265625, -43.181640625, -37.390625, -31.599609375, -25.80859375, -20.017578125, -14.2265625, -8.435546875, -2.64453125, 3.146484375, 8.9375, 14.728515625, 20.51953125, 26.310546875, 32.1015625, 37.892578125, 43.68359375, 49.474609375, 55.265625, 61.056640625, 66.84765625, 72.638671875, 78.4296875, 84.220703125, 90.01171875, 95.802734375, 101.59375, 107.384765625, 113.17578125, 118.966796875, 124.7578125, 130.548828125, 136.33984375, 142.130859375, 147.921875, 153.712890625, 159.50390625, 165.294921875, 171.0859375, 176.876953125, 182.66796875, 188.458984375, 194.25]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 10.0, 12.0, 16.0, 13.0, 26.0, 38.0, 61.0, 77.0, 124.0, 169.0, 122.0, 99.0, 75.0, 54.0, 34.0, 12.0, 7.0, 9.0, 8.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007829666137695312, -0.0007590055465698242, -0.0007350444793701172, -0.0007110834121704102, -0.0006871223449707031, -0.0006631612777709961, -0.0006392002105712891, -0.000615239143371582, -0.000591278076171875, -0.000567317008972168, -0.0005433559417724609, -0.0005193948745727539, -0.0004954338073730469, -0.00047147274017333984, -0.0004475116729736328, -0.0004235506057739258, -0.00039958953857421875, -0.0003756284713745117, -0.0003516674041748047, -0.00032770633697509766, -0.0003037452697753906, -0.0002797842025756836, -0.00025582313537597656, -0.00023186206817626953, -0.0002079010009765625, -0.00018393993377685547, -0.00015997886657714844, -0.0001360177993774414, -0.00011205673217773438, -8.809566497802734e-05, -6.413459777832031e-05, -4.017353057861328e-05, -1.621246337890625e-05, 7.748603820800781e-06, 3.170967102050781e-05, 5.5670738220214844e-05, 7.963180541992188e-05, 0.0001035928726196289, 0.00012755393981933594, 0.00015151500701904297, 0.00017547607421875, 0.00019943714141845703, 0.00022339820861816406, 0.0002473592758178711, 0.0002713203430175781, 0.00029528141021728516, 0.0003192424774169922, 0.0003432035446166992, 0.00036716461181640625, 0.0003911256790161133, 0.0004150867462158203, 0.00043904781341552734, 0.0004630088806152344, 0.0004869699478149414, 0.0005109310150146484, 0.0005348920822143555, 0.0005588531494140625, 0.0005828142166137695, 0.0006067752838134766, 0.0006307363510131836, 0.0006546974182128906, 0.0006786584854125977, 0.0007026195526123047, 0.0007265806198120117, 0.0007505416870117188]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 9.0, 18.0, 6.0, 14.0, 27.0, 42.0, 54.0, 94.0, 117.0, 159.0, 240.0, 372.0, 540.0, 909.0, 1358.0, 2384.0, 4282.0, 8294.0, 20655.0, 87557.0, 688707.0, 179668.0, 30434.0, 10604.0, 5017.0, 2764.0, 1551.0, 931.0, 615.0, 356.0, 242.0, 167.0, 107.0, 77.0, 66.0, 35.0, 21.0, 14.0, 18.0, 5.0, 8.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-27.21875, -26.41015625, -25.6015625, -24.79296875, -23.984375, -23.17578125, -22.3671875, -21.55859375, -20.75, -19.94140625, -19.1328125, -18.32421875, -17.515625, -16.70703125, -15.8984375, -15.08984375, -14.28125, -13.47265625, -12.6640625, -11.85546875, -11.046875, -10.23828125, -9.4296875, -8.62109375, -7.8125, -7.00390625, -6.1953125, -5.38671875, -4.578125, -3.76953125, -2.9609375, -2.15234375, -1.34375, -0.53515625, 0.2734375, 1.08203125, 1.890625, 2.69921875, 3.5078125, 4.31640625, 5.125, 5.93359375, 6.7421875, 7.55078125, 8.359375, 9.16796875, 9.9765625, 10.78515625, 11.59375, 12.40234375, 13.2109375, 14.01953125, 14.828125, 15.63671875, 16.4453125, 17.25390625, 18.0625, 18.87109375, 19.6796875, 20.48828125, 21.296875, 22.10546875, 22.9140625, 23.72265625, 24.53125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 6.0, 1.0, 2.0, 6.0, 6.0, 9.0, 5.0, 17.0, 16.0, 21.0, 48.0, 46.0, 89.0, 119.0, 237.0, 119.0, 92.0, 48.0, 38.0, 16.0, 21.0, 13.0, 5.0, 5.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.578125, -17.0819091796875, -16.585693359375, -16.0894775390625, -15.59326171875, -15.0970458984375, -14.600830078125, -14.1046142578125, -13.6083984375, -13.1121826171875, -12.615966796875, -12.1197509765625, -11.62353515625, -11.1273193359375, -10.631103515625, -10.1348876953125, -9.638671875, -9.1424560546875, -8.646240234375, -8.1500244140625, -7.65380859375, -7.1575927734375, -6.661376953125, -6.1651611328125, -5.6689453125, -5.1727294921875, -4.676513671875, -4.1802978515625, -3.68408203125, -3.1878662109375, -2.691650390625, -2.1954345703125, -1.69921875, -1.2030029296875, -0.706787109375, -0.2105712890625, 0.28564453125, 0.7818603515625, 1.278076171875, 1.7742919921875, 2.2705078125, 2.7667236328125, 3.262939453125, 3.7591552734375, 4.25537109375, 4.7515869140625, 5.247802734375, 5.7440185546875, 6.240234375, 6.7364501953125, 7.232666015625, 7.7288818359375, 8.22509765625, 8.7213134765625, 9.217529296875, 9.7137451171875, 10.2099609375, 10.7061767578125, 11.202392578125, 11.6986083984375, 12.19482421875, 12.6910400390625, 13.187255859375, 13.6834716796875, 14.1796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 10.0, 11.0, 10.0, 16.0, 25.0, 48.0, 59.0, 73.0, 109.0, 123.0, 130.0, 116.0, 78.0, 74.0, 39.0, 26.0, 18.0, 13.0, 13.0, 7.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.41889953613281, -85.94677734375, -83.47464752197266, -81.00252532958984, -78.53040313720703, -76.05827331542969, -73.58615112304688, -71.11402893066406, -68.64190673828125, -66.16978454589844, -63.69765853881836, -61.22553253173828, -58.75341033935547, -56.28128433227539, -53.80915832519531, -51.3370361328125, -48.864906311035156, -46.39278030395508, -43.920658111572266, -41.44853210449219, -38.976409912109375, -36.5042839050293, -34.03215789794922, -31.560033798217773, -29.087909698486328, -26.615785598754883, -24.143661499023438, -21.67153549194336, -19.199411392211914, -16.72728729248047, -14.255162239074707, -11.783037185668945, -9.3109130859375, -6.8387885093688965, -4.366663932800293, -1.8945393562316895, 0.5775852203369141, 3.0497093200683594, 5.521834373474121, 7.993959426879883, 10.466083526611328, 12.938207626342773, 15.410332679748535, 17.882457733154297, 20.354581832885742, 22.826705932617188, 25.298831939697266, 27.77095603942871, 30.243080139160156, 32.715206146240234, 35.18732833862305, 37.659454345703125, 40.13157653808594, 42.603702545166016, 45.075828552246094, 47.547950744628906, 50.020076751708984, 52.49220275878906, 54.964324951171875, 57.43645095825195, 59.90857696533203, 62.380699157714844, 64.85282135009766, 67.324951171875, 69.79707336425781]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 6.0, 9.0, 6.0, 9.0, 5.0, 16.0, 14.0, 20.0, 21.0, 24.0, 27.0, 40.0, 44.0, 34.0, 57.0, 60.0, 57.0, 46.0, 56.0, 63.0, 48.0, 61.0, 39.0, 40.0, 34.0, 28.0, 25.0, 23.0, 16.0, 14.0, 9.0, 14.0, 3.0, 6.0, 3.0, 3.0, 5.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-49.00212097167969, -47.37638473510742, -45.750648498535156, -44.124916076660156, -42.49917984008789, -40.873443603515625, -39.24770736694336, -37.621971130371094, -35.996238708496094, -34.37050247192383, -32.74476623535156, -31.11903190612793, -29.493297576904297, -27.86756134033203, -26.241825103759766, -24.616090774536133, -22.990354537963867, -21.3646183013916, -19.73888397216797, -18.113147735595703, -16.48741340637207, -14.861677169799805, -13.235941886901855, -11.610206604003906, -9.984471321105957, -8.358736038208008, -6.733000755310059, -5.107264995574951, -3.481529712677002, -1.8557939529418945, -0.2300586700439453, 1.395676612854004, 3.021411895751953, 4.647147178649902, 6.272882461547852, 7.898618221282959, 9.52435302734375, 11.150089263916016, 12.775824546813965, 14.401559829711914, 16.027294158935547, 17.653030395507812, 19.278764724731445, 20.90450096130371, 22.530235290527344, 24.15597152709961, 25.781707763671875, 27.407442092895508, 29.033178329467773, 30.65891456604004, 32.28464889526367, 33.91038513183594, 35.5361213684082, 37.16185760498047, 38.78759002685547, 40.413326263427734, 42.0390625, 43.664798736572266, 45.29053497314453, 46.91626739501953, 48.5420036315918, 50.16773986816406, 51.79347610473633, 53.419212341308594, 55.044944763183594]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 5.0, 7.0, 9.0, 15.0, 16.0, 29.0, 33.0, 58.0, 96.0, 158.0, 182.0, 298.0, 486.0, 728.0, 1147.0, 1939.0, 3298.0, 5962.0, 11832.0, 27691.0, 85336.0, 1535081.0, 2377271.0, 87939.0, 28811.0, 12182.0, 5869.0, 3117.0, 1798.0, 1067.0, 669.0, 416.0, 215.0, 179.0, 111.0, 68.0, 63.0, 36.0, 19.0, 15.0, 10.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-44.15625, -42.962890625, -41.76953125, -40.576171875, -39.3828125, -38.189453125, -36.99609375, -35.802734375, -34.609375, -33.416015625, -32.22265625, -31.029296875, -29.8359375, -28.642578125, -27.44921875, -26.255859375, -25.0625, -23.869140625, -22.67578125, -21.482421875, -20.2890625, -19.095703125, -17.90234375, -16.708984375, -15.515625, -14.322265625, -13.12890625, -11.935546875, -10.7421875, -9.548828125, -8.35546875, -7.162109375, -5.96875, -4.775390625, -3.58203125, -2.388671875, -1.1953125, -0.001953125, 1.19140625, 2.384765625, 3.578125, 4.771484375, 5.96484375, 7.158203125, 8.3515625, 9.544921875, 10.73828125, 11.931640625, 13.125, 14.318359375, 15.51171875, 16.705078125, 17.8984375, 19.091796875, 20.28515625, 21.478515625, 22.671875, 23.865234375, 25.05859375, 26.251953125, 27.4453125, 28.638671875, 29.83203125, 31.025390625, 32.21875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 3.0, 5.0, 4.0, 7.0, 4.0, 13.0, 11.0, 5.0, 15.0, 10.0, 16.0, 17.0, 21.0, 23.0, 18.0, 17.0, 36.0, 37.0, 38.0, 42.0, 43.0, 45.0, 35.0, 42.0, 35.0, 43.0, 38.0, 43.0, 43.0, 36.0, 39.0, 32.0, 27.0, 21.0, 20.0, 23.0, 21.0, 9.0, 11.0, 8.0, 10.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2844696044921875, -1.243743896484375, -1.2030181884765625, -1.16229248046875, -1.1215667724609375, -1.080841064453125, -1.0401153564453125, -0.9993896484375, -0.9586639404296875, -0.917938232421875, -0.8772125244140625, -0.83648681640625, -0.7957611083984375, -0.755035400390625, -0.7143096923828125, -0.673583984375, -0.6328582763671875, -0.592132568359375, -0.5514068603515625, -0.51068115234375, -0.4699554443359375, -0.429229736328125, -0.3885040283203125, -0.3477783203125, -0.3070526123046875, -0.266326904296875, -0.2256011962890625, -0.18487548828125, -0.1441497802734375, -0.103424072265625, -0.0626983642578125, -0.02197265625, 0.0187530517578125, 0.059478759765625, 0.1002044677734375, 0.14093017578125, 0.1816558837890625, 0.222381591796875, 0.2631072998046875, 0.3038330078125, 0.3445587158203125, 0.385284423828125, 0.4260101318359375, 0.46673583984375, 0.5074615478515625, 0.548187255859375, 0.5889129638671875, 0.629638671875, 0.6703643798828125, 0.711090087890625, 0.7518157958984375, 0.79254150390625, 0.8332672119140625, 0.873992919921875, 0.9147186279296875, 0.9554443359375, 0.9961700439453125, 1.036895751953125, 1.0776214599609375, 1.11834716796875, 1.1590728759765625, 1.199798583984375, 1.2405242919921875, 1.28125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 2.0, 8.0, 12.0, 16.0, 24.0, 31.0, 34.0, 56.0, 106.0, 267.0, 1297.0, 17173.0, 3504416.0, 658125.0, 11186.0, 996.0, 234.0, 95.0, 42.0, 34.0, 32.0, 27.0, 11.0, 11.0, 9.0, 10.0, 7.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-94.875, -90.91015625, -86.9453125, -82.98046875, -79.015625, -75.05078125, -71.0859375, -67.12109375, -63.15625, -59.19140625, -55.2265625, -51.26171875, -47.296875, -43.33203125, -39.3671875, -35.40234375, -31.4375, -27.47265625, -23.5078125, -19.54296875, -15.578125, -11.61328125, -7.6484375, -3.68359375, 0.28125, 4.24609375, 8.2109375, 12.17578125, 16.140625, 20.10546875, 24.0703125, 28.03515625, 32.0, 35.96484375, 39.9296875, 43.89453125, 47.859375, 51.82421875, 55.7890625, 59.75390625, 63.71875, 67.68359375, 71.6484375, 75.61328125, 79.578125, 83.54296875, 87.5078125, 91.47265625, 95.4375, 99.40234375, 103.3671875, 107.33203125, 111.296875, 115.26171875, 119.2265625, 123.19140625, 127.15625, 131.12109375, 135.0859375, 139.05078125, 143.015625, 146.98046875, 150.9453125, 154.91015625, 158.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 12.0, 10.0, 10.0, 11.0, 16.0, 36.0, 22.0, 29.0, 50.0, 59.0, 95.0, 133.0, 171.0, 365.0, 1962.0, 398.0, 203.0, 140.0, 95.0, 46.0, 49.0, 34.0, 21.0, 16.0, 12.0, 24.0, 8.0, 9.0, 7.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.41015625, -5.2579345703125, -5.105712890625, -4.9534912109375, -4.80126953125, -4.6490478515625, -4.496826171875, -4.3446044921875, -4.1923828125, -4.0401611328125, -3.887939453125, -3.7357177734375, -3.58349609375, -3.4312744140625, -3.279052734375, -3.1268310546875, -2.974609375, -2.8223876953125, -2.670166015625, -2.5179443359375, -2.36572265625, -2.2135009765625, -2.061279296875, -1.9090576171875, -1.7568359375, -1.6046142578125, -1.452392578125, -1.3001708984375, -1.14794921875, -0.9957275390625, -0.843505859375, -0.6912841796875, -0.5390625, -0.3868408203125, -0.234619140625, -0.0823974609375, 0.06982421875, 0.2220458984375, 0.374267578125, 0.5264892578125, 0.6787109375, 0.8309326171875, 0.983154296875, 1.1353759765625, 1.28759765625, 1.4398193359375, 1.592041015625, 1.7442626953125, 1.896484375, 2.0487060546875, 2.200927734375, 2.3531494140625, 2.50537109375, 2.6575927734375, 2.809814453125, 2.9620361328125, 3.1142578125, 3.2664794921875, 3.418701171875, 3.5709228515625, 3.72314453125, 3.8753662109375, 4.027587890625, 4.1798095703125, 4.33203125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 5.0, 8.0, 14.0, 31.0, 47.0, 111.0, 184.0, 215.0, 187.0, 110.0, 45.0, 26.0, 16.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.04010009765625, -37.99589920043945, -35.951698303222656, -33.907493591308594, -31.863292694091797, -29.819091796875, -27.77488899230957, -25.73068618774414, -23.686485290527344, -21.642284393310547, -19.598081588745117, -17.553878784179688, -15.50967788696289, -13.465476036071777, -11.421274185180664, -9.37707233428955, -7.3328704833984375, -5.288668632507324, -3.244466781616211, -1.2002649307250977, 0.8439369201660156, 2.888138771057129, 4.932340621948242, 6.9765424728393555, 9.020744323730469, 11.064946174621582, 13.109148025512695, 15.153349876403809, 17.197551727294922, 19.24175262451172, 21.28595542907715, 23.330158233642578, 25.374359130859375, 27.418560028076172, 29.4627628326416, 31.50696563720703, 33.55116653442383, 35.595367431640625, 37.63957214355469, 39.683773040771484, 41.72797393798828, 43.77217483520508, 45.816375732421875, 47.86058044433594, 49.904781341552734, 51.94898223876953, 53.993186950683594, 56.03738784790039, 58.08158874511719, 60.125789642333984, 62.16999053955078, 64.21419525146484, 66.25839233398438, 68.30259704589844, 70.3468017578125, 72.39099884033203, 74.4352035522461, 76.47940826416016, 78.52360534667969, 80.56781005859375, 82.61201477050781, 84.65621185302734, 86.7004165649414, 88.74461364746094, 90.788818359375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 10.0, 9.0, 11.0, 17.0, 24.0, 38.0, 41.0, 44.0, 58.0, 56.0, 55.0, 67.0, 52.0, 68.0, 62.0, 50.0, 59.0, 40.0, 42.0, 37.0, 27.0, 28.0, 23.0, 15.0, 19.0, 10.0, 8.0, 1.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.928178787231445, -21.188501358032227, -20.448823928833008, -19.70914649963379, -18.96946907043457, -18.22979164123535, -17.490114212036133, -16.750436782836914, -16.010759353637695, -15.271081924438477, -14.531404495239258, -13.791727066040039, -13.05204963684082, -12.312372207641602, -11.572694778442383, -10.833017349243164, -10.093339920043945, -9.353662490844727, -8.613985061645508, -7.874307632446289, -7.13463020324707, -6.394952774047852, -5.655275344848633, -4.915597915649414, -4.175920486450195, -3.4362430572509766, -2.696565628051758, -1.956888198852539, -1.2172107696533203, -0.47753334045410156, 0.2621440887451172, 1.001821517944336, 1.7414970397949219, 2.4811744689941406, 3.2208518981933594, 3.960529327392578, 4.700206756591797, 5.439884185791016, 6.179561614990234, 6.919239044189453, 7.658916473388672, 8.39859390258789, 9.13827133178711, 9.877948760986328, 10.617626190185547, 11.357303619384766, 12.096981048583984, 12.836658477783203, 13.576335906982422, 14.31601333618164, 15.05569076538086, 15.795368194580078, 16.535045623779297, 17.274723052978516, 18.014400482177734, 18.754077911376953, 19.493755340576172, 20.23343276977539, 20.97311019897461, 21.712787628173828, 22.452465057373047, 23.192142486572266, 23.931819915771484, 24.671497344970703, 25.411174774169922]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 11.0, 6.0, 6.0, 11.0, 14.0, 8.0, 24.0, 22.0, 23.0, 20.0, 18.0, 37.0, 26.0, 36.0, 41.0, 63.0, 244.0, 2123.0, 22033.0, 367558.0, 608510.0, 43181.0, 3700.0, 444.0, 77.0, 35.0, 44.0, 34.0, 30.0, 31.0, 24.0, 18.0, 15.0, 13.0, 22.0, 11.0, 10.0, 3.0, 1.0, 9.0, 9.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-70.1875, -68.296875, -66.40625, -64.515625, -62.625, -60.734375, -58.84375, -56.953125, -55.0625, -53.171875, -51.28125, -49.390625, -47.5, -45.609375, -43.71875, -41.828125, -39.9375, -38.046875, -36.15625, -34.265625, -32.375, -30.484375, -28.59375, -26.703125, -24.8125, -22.921875, -21.03125, -19.140625, -17.25, -15.359375, -13.46875, -11.578125, -9.6875, -7.796875, -5.90625, -4.015625, -2.125, -0.234375, 1.65625, 3.546875, 5.4375, 7.328125, 9.21875, 11.109375, 13.0, 14.890625, 16.78125, 18.671875, 20.5625, 22.453125, 24.34375, 26.234375, 28.125, 30.015625, 31.90625, 33.796875, 35.6875, 37.578125, 39.46875, 41.359375, 43.25, 45.140625, 47.03125, 48.921875, 50.8125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 14.0, 25.0, 35.0, 69.0, 86.0, 109.0, 152.0, 146.0, 134.0, 110.0, 57.0, 34.0, 21.0, 9.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.435546875, -1.292327880859375, -1.14910888671875, -1.005889892578125, -0.8626708984375, -0.719451904296875, -0.57623291015625, -0.433013916015625, -0.289794921875, -0.146575927734375, -0.00335693359375, 0.139862060546875, 0.2830810546875, 0.426300048828125, 0.56951904296875, 0.712738037109375, 0.85595703125, 0.999176025390625, 1.14239501953125, 1.285614013671875, 1.4288330078125, 1.572052001953125, 1.71527099609375, 1.858489990234375, 2.001708984375, 2.144927978515625, 2.28814697265625, 2.431365966796875, 2.5745849609375, 2.717803955078125, 2.86102294921875, 3.004241943359375, 3.1474609375, 3.290679931640625, 3.43389892578125, 3.577117919921875, 3.7203369140625, 3.863555908203125, 4.00677490234375, 4.149993896484375, 4.293212890625, 4.436431884765625, 4.57965087890625, 4.722869873046875, 4.8660888671875, 5.009307861328125, 5.15252685546875, 5.295745849609375, 5.43896484375, 5.582183837890625, 5.72540283203125, 5.868621826171875, 6.0118408203125, 6.155059814453125, 6.29827880859375, 6.441497802734375, 6.584716796875, 6.727935791015625, 6.87115478515625, 7.014373779296875, 7.1575927734375, 7.300811767578125, 7.44403076171875, 7.587249755859375, 7.73046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 9.0, 6.0, 10.0, 13.0, 12.0, 15.0, 43.0, 54.0, 60.0, 103.0, 140.0, 161.0, 262.0, 394.0, 606.0, 904.0, 1463.0, 2569.0, 4270.0, 7750.0, 14447.0, 27949.0, 55181.0, 106608.0, 187590.0, 241053.0, 181821.0, 102935.0, 53010.0, 26877.0, 13895.0, 7456.0, 4226.0, 2444.0, 1470.0, 905.0, 556.0, 382.0, 272.0, 182.0, 155.0, 80.0, 64.0, 50.0, 23.0, 34.0, 18.0, 13.0, 10.0, 5.0, 5.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.3203125, -13.850341796875, -13.38037109375, -12.910400390625, -12.4404296875, -11.970458984375, -11.50048828125, -11.030517578125, -10.560546875, -10.090576171875, -9.62060546875, -9.150634765625, -8.6806640625, -8.210693359375, -7.74072265625, -7.270751953125, -6.80078125, -6.330810546875, -5.86083984375, -5.390869140625, -4.9208984375, -4.450927734375, -3.98095703125, -3.510986328125, -3.041015625, -2.571044921875, -2.10107421875, -1.631103515625, -1.1611328125, -0.691162109375, -0.22119140625, 0.248779296875, 0.71875, 1.188720703125, 1.65869140625, 2.128662109375, 2.5986328125, 3.068603515625, 3.53857421875, 4.008544921875, 4.478515625, 4.948486328125, 5.41845703125, 5.888427734375, 6.3583984375, 6.828369140625, 7.29833984375, 7.768310546875, 8.23828125, 8.708251953125, 9.17822265625, 9.648193359375, 10.1181640625, 10.588134765625, 11.05810546875, 11.528076171875, 11.998046875, 12.468017578125, 12.93798828125, 13.407958984375, 13.8779296875, 14.347900390625, 14.81787109375, 15.287841796875, 15.7578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 9.0, 6.0, 11.0, 15.0, 19.0, 11.0, 14.0, 27.0, 18.0, 21.0, 28.0, 31.0, 34.0, 43.0, 44.0, 32.0, 30.0, 43.0, 45.0, 34.0, 38.0, 46.0, 29.0, 45.0, 29.0, 44.0, 28.0, 35.0, 33.0, 27.0, 24.0, 22.0, 9.0, 14.0, 7.0, 10.0, 6.0, 1.0, 6.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.5089111328125, -8.205322265625, -7.9017333984375, -7.59814453125, -7.2945556640625, -6.990966796875, -6.6873779296875, -6.3837890625, -6.0802001953125, -5.776611328125, -5.4730224609375, -5.16943359375, -4.8658447265625, -4.562255859375, -4.2586669921875, -3.955078125, -3.6514892578125, -3.347900390625, -3.0443115234375, -2.74072265625, -2.4371337890625, -2.133544921875, -1.8299560546875, -1.5263671875, -1.2227783203125, -0.919189453125, -0.6156005859375, -0.31201171875, -0.0084228515625, 0.295166015625, 0.5987548828125, 0.90234375, 1.2059326171875, 1.509521484375, 1.8131103515625, 2.11669921875, 2.4202880859375, 2.723876953125, 3.0274658203125, 3.3310546875, 3.6346435546875, 3.938232421875, 4.2418212890625, 4.54541015625, 4.8489990234375, 5.152587890625, 5.4561767578125, 5.759765625, 6.0633544921875, 6.366943359375, 6.6705322265625, 6.97412109375, 7.2777099609375, 7.581298828125, 7.8848876953125, 8.1884765625, 8.4920654296875, 8.795654296875, 9.0992431640625, 9.40283203125, 9.7064208984375, 10.010009765625, 10.3135986328125, 10.6171875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 7.0, 17.0, 18.0, 21.0, 41.0, 42.0, 77.0, 104.0, 158.0, 255.0, 411.0, 662.0, 1251.0, 2291.0, 4532.0, 10023.0, 25797.0, 71400.0, 206698.0, 375768.0, 222574.0, 77899.0, 27547.0, 10705.0, 4753.0, 2337.0, 1217.0, 705.0, 449.0, 263.0, 171.0, 116.0, 74.0, 44.0, 36.0, 25.0, 13.0, 12.0, 9.0, 5.0, 9.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0], "bins": [-15.5390625, -15.101806640625, -14.66455078125, -14.227294921875, -13.7900390625, -13.352783203125, -12.91552734375, -12.478271484375, -12.041015625, -11.603759765625, -11.16650390625, -10.729248046875, -10.2919921875, -9.854736328125, -9.41748046875, -8.980224609375, -8.54296875, -8.105712890625, -7.66845703125, -7.231201171875, -6.7939453125, -6.356689453125, -5.91943359375, -5.482177734375, -5.044921875, -4.607666015625, -4.17041015625, -3.733154296875, -3.2958984375, -2.858642578125, -2.42138671875, -1.984130859375, -1.546875, -1.109619140625, -0.67236328125, -0.235107421875, 0.2021484375, 0.639404296875, 1.07666015625, 1.513916015625, 1.951171875, 2.388427734375, 2.82568359375, 3.262939453125, 3.7001953125, 4.137451171875, 4.57470703125, 5.011962890625, 5.44921875, 5.886474609375, 6.32373046875, 6.760986328125, 7.1982421875, 7.635498046875, 8.07275390625, 8.510009765625, 8.947265625, 9.384521484375, 9.82177734375, 10.259033203125, 10.6962890625, 11.133544921875, 11.57080078125, 12.008056640625, 12.4453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 8.0, 4.0, 2.0, 5.0, 11.0, 16.0, 17.0, 28.0, 32.0, 42.0, 64.0, 80.0, 93.0, 114.0, 117.0, 102.0, 66.0, 53.0, 34.0, 37.0, 19.0, 17.0, 12.0, 8.0, 5.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020732879638671875, -0.0019927024841308594, -0.0019121170043945312, -0.0018315315246582031, -0.001750946044921875, -0.0016703605651855469, -0.0015897750854492188, -0.0015091896057128906, -0.0014286041259765625, -0.0013480186462402344, -0.0012674331665039062, -0.0011868476867675781, -0.00110626220703125, -0.0010256767272949219, -0.0009450912475585938, -0.0008645057678222656, -0.0007839202880859375, -0.0007033348083496094, -0.0006227493286132812, -0.0005421638488769531, -0.000461578369140625, -0.0003809928894042969, -0.00030040740966796875, -0.00021982192993164062, -0.0001392364501953125, -5.8650970458984375e-05, 2.193450927734375e-05, 0.00010251998901367188, 0.00018310546875, 0.0002636909484863281, 0.00034427642822265625, 0.0004248619079589844, 0.0005054473876953125, 0.0005860328674316406, 0.0006666183471679688, 0.0007472038269042969, 0.000827789306640625, 0.0009083747863769531, 0.0009889602661132812, 0.0010695457458496094, 0.0011501312255859375, 0.0012307167053222656, 0.0013113021850585938, 0.0013918876647949219, 0.00147247314453125, 0.0015530586242675781, 0.0016336441040039062, 0.0017142295837402344, 0.0017948150634765625, 0.0018754005432128906, 0.0019559860229492188, 0.002036571502685547, 0.002117156982421875, 0.002197742462158203, 0.0022783279418945312, 0.0023589134216308594, 0.0024394989013671875, 0.0025200843811035156, 0.0026006698608398438, 0.002681255340576172, 0.0027618408203125, 0.002842426300048828, 0.0029230117797851562, 0.0030035972595214844, 0.0030841827392578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 3.0, 10.0, 9.0, 14.0, 31.0, 34.0, 50.0, 67.0, 127.0, 177.0, 305.0, 484.0, 851.0, 1506.0, 2955.0, 6069.0, 14789.0, 40602.0, 134706.0, 398756.0, 306603.0, 90785.0, 28476.0, 10663.0, 4861.0, 2340.0, 1318.0, 775.0, 418.0, 245.0, 167.0, 119.0, 61.0, 54.0, 27.0, 25.0, 15.0, 19.0, 7.0, 9.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.1943359375, -16.654296875, -16.1142578125, -15.57421875, -15.0341796875, -14.494140625, -13.9541015625, -13.4140625, -12.8740234375, -12.333984375, -11.7939453125, -11.25390625, -10.7138671875, -10.173828125, -9.6337890625, -9.09375, -8.5537109375, -8.013671875, -7.4736328125, -6.93359375, -6.3935546875, -5.853515625, -5.3134765625, -4.7734375, -4.2333984375, -3.693359375, -3.1533203125, -2.61328125, -2.0732421875, -1.533203125, -0.9931640625, -0.453125, 0.0869140625, 0.626953125, 1.1669921875, 1.70703125, 2.2470703125, 2.787109375, 3.3271484375, 3.8671875, 4.4072265625, 4.947265625, 5.4873046875, 6.02734375, 6.5673828125, 7.107421875, 7.6474609375, 8.1875, 8.7275390625, 9.267578125, 9.8076171875, 10.34765625, 10.8876953125, 11.427734375, 11.9677734375, 12.5078125, 13.0478515625, 13.587890625, 14.1279296875, 14.66796875, 15.2080078125, 15.748046875, 16.2880859375, 16.828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 9.0, 17.0, 18.0, 12.0, 36.0, 41.0, 45.0, 64.0, 68.0, 77.0, 67.0, 68.0, 94.0, 73.0, 46.0, 52.0, 46.0, 28.0, 26.0, 15.0, 22.0, 16.0, 9.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1953125, -7.914306640625, -7.63330078125, -7.352294921875, -7.0712890625, -6.790283203125, -6.50927734375, -6.228271484375, -5.947265625, -5.666259765625, -5.38525390625, -5.104248046875, -4.8232421875, -4.542236328125, -4.26123046875, -3.980224609375, -3.69921875, -3.418212890625, -3.13720703125, -2.856201171875, -2.5751953125, -2.294189453125, -2.01318359375, -1.732177734375, -1.451171875, -1.170166015625, -0.88916015625, -0.608154296875, -0.3271484375, -0.046142578125, 0.23486328125, 0.515869140625, 0.796875, 1.077880859375, 1.35888671875, 1.639892578125, 1.9208984375, 2.201904296875, 2.48291015625, 2.763916015625, 3.044921875, 3.325927734375, 3.60693359375, 3.887939453125, 4.1689453125, 4.449951171875, 4.73095703125, 5.011962890625, 5.29296875, 5.573974609375, 5.85498046875, 6.135986328125, 6.4169921875, 6.697998046875, 6.97900390625, 7.260009765625, 7.541015625, 7.822021484375, 8.10302734375, 8.384033203125, 8.6650390625, 8.946044921875, 9.22705078125, 9.508056640625, 9.7890625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 12.0, 33.0, 43.0, 82.0, 107.0, 153.0, 168.0, 153.0, 93.0, 62.0, 30.0, 23.0, 11.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-168.18307495117188, -162.0477294921875, -155.91236877441406, -149.7770233154297, -143.64166259765625, -137.50631713867188, -131.3709716796875, -125.2356185913086, -119.10026550292969, -112.96491241455078, -106.82955932617188, -100.6942138671875, -94.5588607788086, -88.42350769042969, -82.28816223144531, -76.1528091430664, -70.0174560546875, -63.882102966308594, -57.74675369262695, -51.61140441894531, -45.476051330566406, -39.3406982421875, -33.20534896850586, -27.06999969482422, -20.934646606445312, -14.799295425415039, -8.663944244384766, -2.528593063354492, 3.6067581176757812, 9.742109298706055, 15.877460479736328, 22.01280975341797, 28.148178100585938, 34.283531188964844, 40.418880462646484, 46.554229736328125, 52.68958282470703, 58.82493591308594, 64.96028137207031, 71.09563446044922, 77.23098754882812, 83.36634063720703, 89.50169372558594, 95.63703918457031, 101.77239227294922, 107.90774536132812, 114.0430908203125, 120.1784439086914, 126.31379699707031, 132.4491424560547, 138.58450317382812, 144.7198486328125, 150.85519409179688, 156.9905548095703, 163.1259002685547, 169.26126098632812, 175.3966064453125, 181.53195190429688, 187.6673126220703, 193.8026580810547, 199.93801879882812, 206.0733642578125, 212.20870971679688, 218.34405517578125, 224.4794158935547]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 12.0, 17.0, 22.0, 28.0, 28.0, 42.0, 46.0, 54.0, 43.0, 50.0, 63.0, 63.0, 70.0, 47.0, 57.0, 55.0, 47.0, 46.0, 35.0, 34.0, 21.0, 26.0, 24.0, 10.0, 7.0, 7.0, 9.0, 7.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.76068115234375, -89.60670471191406, -86.4527359008789, -83.29875946044922, -80.14479064941406, -76.99081420898438, -73.83683776855469, -70.68286895751953, -67.52890014648438, -64.37492370605469, -61.22095489501953, -58.066978454589844, -54.91300964355469, -51.759033203125, -48.60506057739258, -45.451087951660156, -42.29711151123047, -39.14313888549805, -35.989166259765625, -32.83518981933594, -29.68121910095215, -26.527246475219727, -23.373271942138672, -20.21929931640625, -17.065326690673828, -13.911354064941406, -10.757380485534668, -7.60340690612793, -4.449434280395508, -1.295461654663086, 1.8585128784179688, 5.012485504150391, 8.166458129882812, 11.320430755615234, 14.474404335021973, 17.62837791442871, 20.782350540161133, 23.936323165893555, 27.09029769897461, 30.24427032470703, 33.39824295043945, 36.552215576171875, 39.7061882019043, 42.86016082763672, 46.014137268066406, 49.16810607910156, 52.32208251953125, 55.47605514526367, 58.630027770996094, 61.784000396728516, 64.93797302246094, 68.09194946289062, 71.24591827392578, 74.39989471435547, 77.55386352539062, 80.70783996582031, 83.86181640625, 87.01579284667969, 90.16976165771484, 93.32373809814453, 96.47770690917969, 99.63168334960938, 102.78565979003906, 105.93962860107422, 109.09359741210938]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 14.0, 28.0, 59.0, 123.0, 449.0, 3360.0, 98816.0, 4068077.0, 20883.0, 1638.0, 414.0, 152.0, 84.0, 54.0, 27.0, 29.0, 22.0, 9.0, 11.0, 6.0, 7.0, 9.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.1875, -120.2431640625, -113.298828125, -106.3544921875, -99.41015625, -92.4658203125, -85.521484375, -78.5771484375, -71.6328125, -64.6884765625, -57.744140625, -50.7998046875, -43.85546875, -36.9111328125, -29.966796875, -23.0224609375, -16.078125, -9.1337890625, -2.189453125, 4.7548828125, 11.69921875, 18.6435546875, 25.587890625, 32.5322265625, 39.4765625, 46.4208984375, 53.365234375, 60.3095703125, 67.25390625, 74.1982421875, 81.142578125, 88.0869140625, 95.03125, 101.9755859375, 108.919921875, 115.8642578125, 122.80859375, 129.7529296875, 136.697265625, 143.6416015625, 150.5859375, 157.5302734375, 164.474609375, 171.4189453125, 178.36328125, 185.3076171875, 192.251953125, 199.1962890625, 206.140625, 213.0849609375, 220.029296875, 226.9736328125, 233.91796875, 240.8623046875, 247.806640625, 254.7509765625, 261.6953125, 268.6396484375, 275.583984375, 282.5283203125, 289.47265625, 296.4169921875, 303.361328125, 310.3056640625, 317.25]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 15.0, 30.0, 49.0, 68.0, 101.0, 127.0, 128.0, 122.0, 109.0, 101.0, 64.0, 40.0, 18.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3828125, -3.203125, -3.0234375, -2.84375, -2.6640625, -2.484375, -2.3046875, -2.125, -1.9453125, -1.765625, -1.5859375, -1.40625, -1.2265625, -1.046875, -0.8671875, -0.6875, -0.5078125, -0.328125, -0.1484375, 0.03125, 0.2109375, 0.390625, 0.5703125, 0.75, 0.9296875, 1.109375, 1.2890625, 1.46875, 1.6484375, 1.828125, 2.0078125, 2.1875, 2.3671875, 2.546875, 2.7265625, 2.90625, 3.0859375, 3.265625, 3.4453125, 3.625, 3.8046875, 3.984375, 4.1640625, 4.34375, 4.5234375, 4.703125, 4.8828125, 5.0625, 5.2421875, 5.421875, 5.6015625, 5.78125, 5.9609375, 6.140625, 6.3203125, 6.5, 6.6796875, 6.859375, 7.0390625, 7.21875, 7.3984375, 7.578125, 7.7578125, 7.9375, 8.1171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 12.0, 10.0, 4.0, 13.0, 32.0, 33.0, 56.0, 93.0, 209.0, 375.0, 593.0, 1277.0, 2629.0, 6459.0, 17289.0, 50495.0, 194083.0, 3083280.0, 672751.0, 112789.0, 32400.0, 11250.0, 4374.0, 1940.0, 900.0, 423.0, 220.0, 111.0, 62.0, 40.0, 28.0, 19.0, 6.0, 5.0, 5.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.125, -49.56689453125, -48.0087890625, -46.45068359375, -44.892578125, -43.33447265625, -41.7763671875, -40.21826171875, -38.66015625, -37.10205078125, -35.5439453125, -33.98583984375, -32.427734375, -30.86962890625, -29.3115234375, -27.75341796875, -26.1953125, -24.63720703125, -23.0791015625, -21.52099609375, -19.962890625, -18.40478515625, -16.8466796875, -15.28857421875, -13.73046875, -12.17236328125, -10.6142578125, -9.05615234375, -7.498046875, -5.93994140625, -4.3818359375, -2.82373046875, -1.265625, 0.29248046875, 1.8505859375, 3.40869140625, 4.966796875, 6.52490234375, 8.0830078125, 9.64111328125, 11.19921875, 12.75732421875, 14.3154296875, 15.87353515625, 17.431640625, 18.98974609375, 20.5478515625, 22.10595703125, 23.6640625, 25.22216796875, 26.7802734375, 28.33837890625, 29.896484375, 31.45458984375, 33.0126953125, 34.57080078125, 36.12890625, 37.68701171875, 39.2451171875, 40.80322265625, 42.361328125, 43.91943359375, 45.4775390625, 47.03564453125, 48.59375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 8.0, 9.0, 18.0, 21.0, 21.0, 32.0, 34.0, 35.0, 39.0, 60.0, 70.0, 88.0, 162.0, 310.0, 1434.0, 815.0, 263.0, 177.0, 114.0, 89.0, 55.0, 52.0, 36.0, 20.0, 17.0, 16.0, 17.0, 9.0, 7.0, 7.0, 4.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.8046875, -8.5662841796875, -8.327880859375, -8.0894775390625, -7.85107421875, -7.6126708984375, -7.374267578125, -7.1358642578125, -6.8974609375, -6.6590576171875, -6.420654296875, -6.1822509765625, -5.94384765625, -5.7054443359375, -5.467041015625, -5.2286376953125, -4.990234375, -4.7518310546875, -4.513427734375, -4.2750244140625, -4.03662109375, -3.7982177734375, -3.559814453125, -3.3214111328125, -3.0830078125, -2.8446044921875, -2.606201171875, -2.3677978515625, -2.12939453125, -1.8909912109375, -1.652587890625, -1.4141845703125, -1.17578125, -0.9373779296875, -0.698974609375, -0.4605712890625, -0.22216796875, 0.0162353515625, 0.254638671875, 0.4930419921875, 0.7314453125, 0.9698486328125, 1.208251953125, 1.4466552734375, 1.68505859375, 1.9234619140625, 2.161865234375, 2.4002685546875, 2.638671875, 2.8770751953125, 3.115478515625, 3.3538818359375, 3.59228515625, 3.8306884765625, 4.069091796875, 4.3074951171875, 4.5458984375, 4.7843017578125, 5.022705078125, 5.2611083984375, 5.49951171875, 5.7379150390625, 5.976318359375, 6.2147216796875, 6.453125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 14.0, 22.0, 44.0, 113.0, 209.0, 251.0, 178.0, 108.0, 26.0, 21.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.11924743652344, -76.93621826171875, -72.75318145751953, -68.57014465332031, -64.38711547851562, -60.20408248901367, -56.02104949951172, -51.838016510009766, -47.65498352050781, -43.47195053100586, -39.288917541503906, -35.10588455200195, -30.9228515625, -26.739818572998047, -22.556785583496094, -18.37375259399414, -14.190719604492188, -10.007686614990234, -5.824653625488281, -1.6416206359863281, 2.541412353515625, 6.724445343017578, 10.907478332519531, 15.090511322021484, 19.273544311523438, 23.45657730102539, 27.639610290527344, 31.822643280029297, 36.00567626953125, 40.1887092590332, 44.371742248535156, 48.55477523803711, 52.737823486328125, 56.92085647583008, 61.10388946533203, 65.28692626953125, 69.46995544433594, 73.65298461914062, 77.83602142333984, 82.01905822753906, 86.20208740234375, 90.38511657714844, 94.56815338134766, 98.75119018554688, 102.93421936035156, 107.11724853515625, 111.30028533935547, 115.48332214355469, 119.66635131835938, 123.84938049316406, 128.03240966796875, 132.2154541015625, 136.3984832763672, 140.58151245117188, 144.76455688476562, 148.9475860595703, 153.130615234375, 157.3136444091797, 161.49667358398438, 165.67971801757812, 169.8627471923828, 174.0457763671875, 178.22882080078125, 182.41184997558594, 186.59487915039062]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 8.0, 8.0, 22.0, 16.0, 11.0, 28.0, 29.0, 35.0, 39.0, 29.0, 31.0, 45.0, 39.0, 51.0, 74.0, 68.0, 63.0, 46.0, 52.0, 48.0, 39.0, 46.0, 29.0, 33.0, 30.0, 18.0, 16.0, 14.0, 4.0, 10.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-52.939788818359375, -51.66326904296875, -50.38675308227539, -49.110233306884766, -47.833717346191406, -46.55719757080078, -45.28068161010742, -44.0041618347168, -42.72764587402344, -41.45112609863281, -40.17461013793945, -38.89809036254883, -37.62157440185547, -36.345054626464844, -35.068538665771484, -33.79201889038086, -32.515499114990234, -31.238981246948242, -29.96246337890625, -28.685945510864258, -27.409427642822266, -26.13290786743164, -24.85638999938965, -23.579872131347656, -22.303354263305664, -21.026836395263672, -19.75031852722168, -18.473800659179688, -17.197280883789062, -15.920763969421387, -14.644245147705078, -13.367727279663086, -12.09121322631836, -10.814695358276367, -9.538177490234375, -8.261658668518066, -6.985140800476074, -5.708622932434082, -4.432104587554932, -3.1555862426757812, -1.879068374633789, -0.6025502681732178, 0.6739678382873535, 1.9504859447479248, 3.227004051208496, 4.503521919250488, 5.780040264129639, 7.056558609008789, 8.333076477050781, 9.609594345092773, 10.886112213134766, 12.162631034851074, 13.439148902893066, 14.715666770935059, 15.992185592651367, 17.26870346069336, 18.54522132873535, 19.821739196777344, 21.098257064819336, 22.374774932861328, 23.651294708251953, 24.927810668945312, 26.204330444335938, 27.48084831237793, 28.757366180419922]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 7.0, 8.0, 6.0, 10.0, 14.0, 11.0, 13.0, 13.0, 20.0, 23.0, 29.0, 40.0, 39.0, 72.0, 86.0, 157.0, 241.0, 399.0, 870.0, 2517.0, 11406.0, 79577.0, 533715.0, 361882.0, 46411.0, 7351.0, 1833.0, 690.0, 372.0, 230.0, 128.0, 96.0, 55.0, 42.0, 35.0, 33.0, 31.0, 23.0, 16.0, 8.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-44.71875, -43.2216796875, -41.724609375, -40.2275390625, -38.73046875, -37.2333984375, -35.736328125, -34.2392578125, -32.7421875, -31.2451171875, -29.748046875, -28.2509765625, -26.75390625, -25.2568359375, -23.759765625, -22.2626953125, -20.765625, -19.2685546875, -17.771484375, -16.2744140625, -14.77734375, -13.2802734375, -11.783203125, -10.2861328125, -8.7890625, -7.2919921875, -5.794921875, -4.2978515625, -2.80078125, -1.3037109375, 0.193359375, 1.6904296875, 3.1875, 4.6845703125, 6.181640625, 7.6787109375, 9.17578125, 10.6728515625, 12.169921875, 13.6669921875, 15.1640625, 16.6611328125, 18.158203125, 19.6552734375, 21.15234375, 22.6494140625, 24.146484375, 25.6435546875, 27.140625, 28.6376953125, 30.134765625, 31.6318359375, 33.12890625, 34.6259765625, 36.123046875, 37.6201171875, 39.1171875, 40.6142578125, 42.111328125, 43.6083984375, 45.10546875, 46.6025390625, 48.099609375, 49.5966796875, 51.09375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 13.0, 28.0, 55.0, 74.0, 117.0, 155.0, 140.0, 149.0, 110.0, 65.0, 47.0, 23.0, 13.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.296875, -6.0828857421875, -5.868896484375, -5.6549072265625, -5.44091796875, -5.2269287109375, -5.012939453125, -4.7989501953125, -4.5849609375, -4.3709716796875, -4.156982421875, -3.9429931640625, -3.72900390625, -3.5150146484375, -3.301025390625, -3.0870361328125, -2.873046875, -2.6590576171875, -2.445068359375, -2.2310791015625, -2.01708984375, -1.8031005859375, -1.589111328125, -1.3751220703125, -1.1611328125, -0.9471435546875, -0.733154296875, -0.5191650390625, -0.30517578125, -0.0911865234375, 0.122802734375, 0.3367919921875, 0.55078125, 0.7647705078125, 0.978759765625, 1.1927490234375, 1.40673828125, 1.6207275390625, 1.834716796875, 2.0487060546875, 2.2626953125, 2.4766845703125, 2.690673828125, 2.9046630859375, 3.11865234375, 3.3326416015625, 3.546630859375, 3.7606201171875, 3.974609375, 4.1885986328125, 4.402587890625, 4.6165771484375, 4.83056640625, 5.0445556640625, 5.258544921875, 5.4725341796875, 5.6865234375, 5.9005126953125, 6.114501953125, 6.3284912109375, 6.54248046875, 6.7564697265625, 6.970458984375, 7.1844482421875, 7.3984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 5.0, 7.0, 8.0, 7.0, 15.0, 19.0, 27.0, 38.0, 63.0, 81.0, 169.0, 247.0, 335.0, 547.0, 997.0, 1795.0, 3481.0, 7535.0, 18106.0, 47233.0, 131751.0, 336893.0, 308139.0, 117440.0, 42658.0, 16484.0, 6965.0, 3253.0, 1669.0, 924.0, 562.0, 368.0, 233.0, 151.0, 116.0, 67.0, 46.0, 37.0, 23.0, 22.0, 16.0, 9.0, 5.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-23.4375, -22.72607421875, -22.0146484375, -21.30322265625, -20.591796875, -19.88037109375, -19.1689453125, -18.45751953125, -17.74609375, -17.03466796875, -16.3232421875, -15.61181640625, -14.900390625, -14.18896484375, -13.4775390625, -12.76611328125, -12.0546875, -11.34326171875, -10.6318359375, -9.92041015625, -9.208984375, -8.49755859375, -7.7861328125, -7.07470703125, -6.36328125, -5.65185546875, -4.9404296875, -4.22900390625, -3.517578125, -2.80615234375, -2.0947265625, -1.38330078125, -0.671875, 0.03955078125, 0.7509765625, 1.46240234375, 2.173828125, 2.88525390625, 3.5966796875, 4.30810546875, 5.01953125, 5.73095703125, 6.4423828125, 7.15380859375, 7.865234375, 8.57666015625, 9.2880859375, 9.99951171875, 10.7109375, 11.42236328125, 12.1337890625, 12.84521484375, 13.556640625, 14.26806640625, 14.9794921875, 15.69091796875, 16.40234375, 17.11376953125, 17.8251953125, 18.53662109375, 19.248046875, 19.95947265625, 20.6708984375, 21.38232421875, 22.09375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 14.0, 13.0, 25.0, 21.0, 19.0, 20.0, 30.0, 23.0, 36.0, 40.0, 34.0, 41.0, 61.0, 43.0, 39.0, 44.0, 47.0, 52.0, 40.0, 33.0, 43.0, 30.0, 34.0, 31.0, 26.0, 23.0, 24.0, 15.0, 12.0, 12.0, 11.0, 8.0, 14.0, 4.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.3214111328125, -10.892822265625, -10.4642333984375, -10.03564453125, -9.6070556640625, -9.178466796875, -8.7498779296875, -8.3212890625, -7.8927001953125, -7.464111328125, -7.0355224609375, -6.60693359375, -6.1783447265625, -5.749755859375, -5.3211669921875, -4.892578125, -4.4639892578125, -4.035400390625, -3.6068115234375, -3.17822265625, -2.7496337890625, -2.321044921875, -1.8924560546875, -1.4638671875, -1.0352783203125, -0.606689453125, -0.1781005859375, 0.25048828125, 0.6790771484375, 1.107666015625, 1.5362548828125, 1.96484375, 2.3934326171875, 2.822021484375, 3.2506103515625, 3.67919921875, 4.1077880859375, 4.536376953125, 4.9649658203125, 5.3935546875, 5.8221435546875, 6.250732421875, 6.6793212890625, 7.10791015625, 7.5364990234375, 7.965087890625, 8.3936767578125, 8.822265625, 9.2508544921875, 9.679443359375, 10.1080322265625, 10.53662109375, 10.9652099609375, 11.393798828125, 11.8223876953125, 12.2509765625, 12.6795654296875, 13.108154296875, 13.5367431640625, 13.96533203125, 14.3939208984375, 14.822509765625, 15.2510986328125, 15.6796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 5.0, 10.0, 21.0, 13.0, 15.0, 37.0, 65.0, 79.0, 109.0, 159.0, 293.0, 591.0, 1170.0, 2746.0, 7550.0, 28130.0, 140546.0, 539039.0, 260361.0, 48638.0, 11981.0, 3838.0, 1525.0, 690.0, 363.0, 214.0, 119.0, 78.0, 62.0, 25.0, 16.0, 17.0, 13.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.53125, -20.910400390625, -20.28955078125, -19.668701171875, -19.0478515625, -18.427001953125, -17.80615234375, -17.185302734375, -16.564453125, -15.943603515625, -15.32275390625, -14.701904296875, -14.0810546875, -13.460205078125, -12.83935546875, -12.218505859375, -11.59765625, -10.976806640625, -10.35595703125, -9.735107421875, -9.1142578125, -8.493408203125, -7.87255859375, -7.251708984375, -6.630859375, -6.010009765625, -5.38916015625, -4.768310546875, -4.1474609375, -3.526611328125, -2.90576171875, -2.284912109375, -1.6640625, -1.043212890625, -0.42236328125, 0.198486328125, 0.8193359375, 1.440185546875, 2.06103515625, 2.681884765625, 3.302734375, 3.923583984375, 4.54443359375, 5.165283203125, 5.7861328125, 6.406982421875, 7.02783203125, 7.648681640625, 8.26953125, 8.890380859375, 9.51123046875, 10.132080078125, 10.7529296875, 11.373779296875, 11.99462890625, 12.615478515625, 13.236328125, 13.857177734375, 14.47802734375, 15.098876953125, 15.7197265625, 16.340576171875, 16.96142578125, 17.582275390625, 18.203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 4.0, 9.0, 14.0, 11.0, 13.0, 18.0, 19.0, 30.0, 29.0, 37.0, 35.0, 37.0, 55.0, 57.0, 74.0, 95.0, 73.0, 61.0, 57.0, 49.0, 35.0, 30.0, 29.0, 19.0, 24.0, 27.0, 10.0, 9.0, 10.0, 3.0, 4.0, 5.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001495361328125, -0.0014433115720748901, -0.0013912618160247803, -0.0013392120599746704, -0.0012871623039245605, -0.0012351125478744507, -0.0011830627918243408, -0.001131013035774231, -0.001078963279724121, -0.0010269135236740112, -0.0009748637676239014, -0.0009228140115737915, -0.0008707642555236816, -0.0008187144994735718, -0.0007666647434234619, -0.000714614987373352, -0.0006625652313232422, -0.0006105154752731323, -0.0005584657192230225, -0.0005064159631729126, -0.00045436620712280273, -0.00040231645107269287, -0.000350266695022583, -0.00029821693897247314, -0.0002461671829223633, -0.00019411742687225342, -0.00014206767082214355, -9.001791477203369e-05, -3.796815872192383e-05, 1.4081597328186035e-05, 6.61313533782959e-05, 0.00011818110942840576, 0.00017023086547851562, 0.0002222806215286255, 0.00027433037757873535, 0.0003263801336288452, 0.0003784298896789551, 0.00043047964572906494, 0.0004825294017791748, 0.0005345791578292847, 0.0005866289138793945, 0.0006386786699295044, 0.0006907284259796143, 0.0007427781820297241, 0.000794827938079834, 0.0008468776941299438, 0.0008989274501800537, 0.0009509772062301636, 0.0010030269622802734, 0.0010550767183303833, 0.0011071264743804932, 0.001159176230430603, 0.0012112259864807129, 0.0012632757425308228, 0.0013153254985809326, 0.0013673752546310425, 0.0014194250106811523, 0.0014714747667312622, 0.001523524522781372, 0.001575574278831482, 0.0016276240348815918, 0.0016796737909317017, 0.0017317235469818115, 0.0017837733030319214, 0.0018358230590820312]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 5.0, 7.0, 9.0, 25.0, 36.0, 71.0, 82.0, 203.0, 415.0, 955.0, 2558.0, 8391.0, 46375.0, 541848.0, 402948.0, 34355.0, 6693.0, 2103.0, 699.0, 355.0, 166.0, 89.0, 63.0, 39.0, 24.0, 9.0, 10.0, 4.0, 8.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.66162109375, -32.5732421875, -31.48486328125, -30.396484375, -29.30810546875, -28.2197265625, -27.13134765625, -26.04296875, -24.95458984375, -23.8662109375, -22.77783203125, -21.689453125, -20.60107421875, -19.5126953125, -18.42431640625, -17.3359375, -16.24755859375, -15.1591796875, -14.07080078125, -12.982421875, -11.89404296875, -10.8056640625, -9.71728515625, -8.62890625, -7.54052734375, -6.4521484375, -5.36376953125, -4.275390625, -3.18701171875, -2.0986328125, -1.01025390625, 0.078125, 1.16650390625, 2.2548828125, 3.34326171875, 4.431640625, 5.52001953125, 6.6083984375, 7.69677734375, 8.78515625, 9.87353515625, 10.9619140625, 12.05029296875, 13.138671875, 14.22705078125, 15.3154296875, 16.40380859375, 17.4921875, 18.58056640625, 19.6689453125, 20.75732421875, 21.845703125, 22.93408203125, 24.0224609375, 25.11083984375, 26.19921875, 27.28759765625, 28.3759765625, 29.46435546875, 30.552734375, 31.64111328125, 32.7294921875, 33.81787109375, 34.90625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 9.0, 4.0, 6.0, 11.0, 15.0, 18.0, 20.0, 23.0, 34.0, 35.0, 45.0, 65.0, 68.0, 82.0, 71.0, 85.0, 82.0, 61.0, 46.0, 36.0, 42.0, 27.0, 20.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 0.0, 6.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.484375, -9.21697998046875, -8.9495849609375, -8.68218994140625, -8.414794921875, -8.14739990234375, -7.8800048828125, -7.61260986328125, -7.34521484375, -7.07781982421875, -6.8104248046875, -6.54302978515625, -6.275634765625, -6.00823974609375, -5.7408447265625, -5.47344970703125, -5.2060546875, -4.93865966796875, -4.6712646484375, -4.40386962890625, -4.136474609375, -3.86907958984375, -3.6016845703125, -3.33428955078125, -3.06689453125, -2.79949951171875, -2.5321044921875, -2.26470947265625, -1.997314453125, -1.72991943359375, -1.4625244140625, -1.19512939453125, -0.927734375, -0.66033935546875, -0.3929443359375, -0.12554931640625, 0.141845703125, 0.40924072265625, 0.6766357421875, 0.94403076171875, 1.21142578125, 1.47882080078125, 1.7462158203125, 2.01361083984375, 2.281005859375, 2.54840087890625, 2.8157958984375, 3.08319091796875, 3.3505859375, 3.61798095703125, 3.8853759765625, 4.15277099609375, 4.420166015625, 4.68756103515625, 4.9549560546875, 5.22235107421875, 5.48974609375, 5.75714111328125, 6.0245361328125, 6.29193115234375, 6.559326171875, 6.82672119140625, 7.0941162109375, 7.36151123046875, 7.62890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 14.0, 15.0, 29.0, 43.0, 68.0, 121.0, 148.0, 154.0, 173.0, 92.0, 60.0, 31.0, 19.0, 13.0, 11.0, 6.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-212.89096069335938, -206.52386474609375, -200.15676879882812, -193.7896728515625, -187.42257690429688, -181.0554656982422, -174.68836975097656, -168.32127380371094, -161.9541778564453, -155.5870819091797, -149.21998596191406, -142.85289001464844, -136.48577880859375, -130.11868286132812, -123.7515869140625, -117.38449096679688, -111.01739501953125, -104.65029907226562, -98.283203125, -91.91609954833984, -85.54900360107422, -79.1819076538086, -72.81480407714844, -66.44770812988281, -60.08061218261719, -53.71351623535156, -47.34641647338867, -40.97931671142578, -34.612220764160156, -28.2451229095459, -21.87802505493164, -15.51092529296875, -9.143844604492188, -2.7767467498779297, 3.590351104736328, 9.957448959350586, 16.324546813964844, 22.6916446685791, 29.05874252319336, 35.42584228515625, 41.792938232421875, 48.1600341796875, 54.52713394165039, 60.89423370361328, 67.2613296508789, 73.62842559814453, 79.99552917480469, 86.36262512207031, 92.72972106933594, 99.09681701660156, 105.46391296386719, 111.83101654052734, 118.19811248779297, 124.5652084350586, 130.93231201171875, 137.29940795898438, 143.66650390625, 150.03359985351562, 156.40069580078125, 162.76779174804688, 169.1348876953125, 175.5019989013672, 181.8690948486328, 188.23619079589844, 194.60328674316406]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 11.0, 7.0, 13.0, 19.0, 19.0, 22.0, 24.0, 38.0, 38.0, 45.0, 55.0, 53.0, 66.0, 66.0, 62.0, 50.0, 54.0, 48.0, 41.0, 49.0, 37.0, 40.0, 24.0, 34.0, 13.0, 21.0, 13.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.28388977050781, -119.3560562133789, -115.42822265625, -111.50039672851562, -107.57256317138672, -103.64472961425781, -99.7168960571289, -95.7890625, -91.86123657226562, -87.93340301513672, -84.00556945800781, -80.07774353027344, -76.14990997314453, -72.22207641601562, -68.29424285888672, -64.36640930175781, -60.43857955932617, -56.510746002197266, -52.582916259765625, -48.65508270263672, -44.72725296020508, -40.79941940307617, -36.87158966064453, -32.943756103515625, -29.01592445373535, -25.088092803955078, -21.160261154174805, -17.23242950439453, -13.304596900939941, -9.376764297485352, -5.448932647705078, -1.5211009979248047, 2.4067306518554688, 6.334562301635742, 10.262393951416016, 14.190226554870605, 18.118057250976562, 22.04589080810547, 25.973722457885742, 29.901554107666016, 33.829383850097656, 37.75721740722656, 41.6850471496582, 45.61288070678711, 49.54071044921875, 53.468544006347656, 57.39637756347656, 61.3242073059082, 65.25204467773438, 69.17987823486328, 73.10771179199219, 77.03553771972656, 80.96337127685547, 84.89120483398438, 88.81903839111328, 92.74687194824219, 96.67469787597656, 100.60253143310547, 104.53036499023438, 108.45819091796875, 112.38602447509766, 116.31385803222656, 120.24169158935547, 124.16952514648438, 128.09735107421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 12.0, 17.0, 22.0, 37.0, 69.0, 98.0, 186.0, 339.0, 808.0, 2366.0, 10029.0, 69226.0, 3847943.0, 235919.0, 20484.0, 4198.0, 1260.0, 521.0, 245.0, 166.0, 101.0, 74.0, 39.0, 29.0, 26.0, 13.0, 15.0, 6.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-91.25, -88.54296875, -85.8359375, -83.12890625, -80.421875, -77.71484375, -75.0078125, -72.30078125, -69.59375, -66.88671875, -64.1796875, -61.47265625, -58.765625, -56.05859375, -53.3515625, -50.64453125, -47.9375, -45.23046875, -42.5234375, -39.81640625, -37.109375, -34.40234375, -31.6953125, -28.98828125, -26.28125, -23.57421875, -20.8671875, -18.16015625, -15.453125, -12.74609375, -10.0390625, -7.33203125, -4.625, -1.91796875, 0.7890625, 3.49609375, 6.203125, 8.91015625, 11.6171875, 14.32421875, 17.03125, 19.73828125, 22.4453125, 25.15234375, 27.859375, 30.56640625, 33.2734375, 35.98046875, 38.6875, 41.39453125, 44.1015625, 46.80859375, 49.515625, 52.22265625, 54.9296875, 57.63671875, 60.34375, 63.05078125, 65.7578125, 68.46484375, 71.171875, 73.87890625, 76.5859375, 79.29296875, 82.0]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 15.0, 16.0, 39.0, 47.0, 48.0, 60.0, 84.0, 91.0, 105.0, 91.0, 83.0, 70.0, 69.0, 55.0, 30.0, 33.0, 20.0, 9.0, 12.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75390625, -3.58984375, -3.42578125, -3.26171875, -3.09765625, -2.93359375, -2.76953125, -2.60546875, -2.44140625, -2.27734375, -2.11328125, -1.94921875, -1.78515625, -1.62109375, -1.45703125, -1.29296875, -1.12890625, -0.96484375, -0.80078125, -0.63671875, -0.47265625, -0.30859375, -0.14453125, 0.01953125, 0.18359375, 0.34765625, 0.51171875, 0.67578125, 0.83984375, 1.00390625, 1.16796875, 1.33203125, 1.49609375, 1.66015625, 1.82421875, 1.98828125, 2.15234375, 2.31640625, 2.48046875, 2.64453125, 2.80859375, 2.97265625, 3.13671875, 3.30078125, 3.46484375, 3.62890625, 3.79296875, 3.95703125, 4.12109375, 4.28515625, 4.44921875, 4.61328125, 4.77734375, 4.94140625, 5.10546875, 5.26953125, 5.43359375, 5.59765625, 5.76171875, 5.92578125, 6.08984375, 6.25390625, 6.41796875, 6.58203125, 6.74609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 1.0, 15.0, 22.0, 20.0, 37.0, 45.0, 65.0, 157.0, 573.0, 3845.0, 137995.0, 4027512.0, 21783.0, 1494.0, 325.0, 138.0, 64.0, 40.0, 50.0, 28.0, 23.0, 11.0, 15.0, 11.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.875, -142.828125, -137.78125, -132.734375, -127.6875, -122.640625, -117.59375, -112.546875, -107.5, -102.453125, -97.40625, -92.359375, -87.3125, -82.265625, -77.21875, -72.171875, -67.125, -62.078125, -57.03125, -51.984375, -46.9375, -41.890625, -36.84375, -31.796875, -26.75, -21.703125, -16.65625, -11.609375, -6.5625, -1.515625, 3.53125, 8.578125, 13.625, 18.671875, 23.71875, 28.765625, 33.8125, 38.859375, 43.90625, 48.953125, 54.0, 59.046875, 64.09375, 69.140625, 74.1875, 79.234375, 84.28125, 89.328125, 94.375, 99.421875, 104.46875, 109.515625, 114.5625, 119.609375, 124.65625, 129.703125, 134.75, 139.796875, 144.84375, 149.890625, 154.9375, 159.984375, 165.03125, 170.078125, 175.125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 7.0, 6.0, 11.0, 24.0, 52.0, 110.0, 283.0, 1353.0, 1748.0, 276.0, 102.0, 59.0, 23.0, 14.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5, -12.825927734375, -12.15185546875, -11.477783203125, -10.8037109375, -10.129638671875, -9.45556640625, -8.781494140625, -8.107421875, -7.433349609375, -6.75927734375, -6.085205078125, -5.4111328125, -4.737060546875, -4.06298828125, -3.388916015625, -2.71484375, -2.040771484375, -1.36669921875, -0.692626953125, -0.0185546875, 0.655517578125, 1.32958984375, 2.003662109375, 2.677734375, 3.351806640625, 4.02587890625, 4.699951171875, 5.3740234375, 6.048095703125, 6.72216796875, 7.396240234375, 8.0703125, 8.744384765625, 9.41845703125, 10.092529296875, 10.7666015625, 11.440673828125, 12.11474609375, 12.788818359375, 13.462890625, 14.136962890625, 14.81103515625, 15.485107421875, 16.1591796875, 16.833251953125, 17.50732421875, 18.181396484375, 18.85546875, 19.529541015625, 20.20361328125, 20.877685546875, 21.5517578125, 22.225830078125, 22.89990234375, 23.573974609375, 24.248046875, 24.922119140625, 25.59619140625, 26.270263671875, 26.9443359375, 27.618408203125, 28.29248046875, 28.966552734375, 29.640625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 11.0, 13.0, 26.0, 58.0, 87.0, 157.0, 197.0, 193.0, 117.0, 63.0, 44.0, 23.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.9610595703125, -169.48158264160156, -166.00210571289062, -162.52261352539062, -159.0431365966797, -155.56365966796875, -152.0841827392578, -148.60470581054688, -145.12522888183594, -141.645751953125, -138.16627502441406, -134.68679809570312, -131.20730590820312, -127.72782897949219, -124.24835205078125, -120.76887512207031, -117.28938293457031, -113.80990600585938, -110.3304214477539, -106.85094451904297, -103.37146759033203, -99.89198303222656, -96.41250610351562, -92.93302917480469, -89.45355224609375, -85.97407531738281, -82.49459075927734, -79.0151138305664, -75.53563690185547, -72.05615234375, -68.57667541503906, -65.09719848632812, -61.617713928222656, -58.13823318481445, -54.658756256103516, -51.17927551269531, -47.69979476928711, -44.220314025878906, -40.74083709716797, -37.261356353759766, -33.78187561035156, -30.302396774291992, -26.82291603088379, -23.34343719482422, -19.863956451416016, -16.384477615356445, -12.904998779296875, -9.425518035888672, -5.946041107177734, -2.4665615558624268, 1.0129179954528809, 4.492397308349609, 7.971877098083496, 11.451356887817383, 14.930835723876953, 18.410316467285156, 21.889795303344727, 25.369274139404297, 28.8487548828125, 32.32823181152344, 35.80771255493164, 39.287193298339844, 42.76667022705078, 46.24615478515625, 49.72563171386719]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 9.0, 5.0, 15.0, 18.0, 15.0, 20.0, 33.0, 32.0, 45.0, 45.0, 55.0, 54.0, 41.0, 57.0, 69.0, 74.0, 52.0, 50.0, 52.0, 37.0, 32.0, 23.0, 24.0, 21.0, 27.0, 26.0, 11.0, 8.0, 8.0, 10.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-46.37733840942383, -44.99847412109375, -43.619606018066406, -42.24074172973633, -40.86187744140625, -39.483009338378906, -38.10414505004883, -36.72528076171875, -35.346412658691406, -33.96754837036133, -32.588680267333984, -31.209815979003906, -29.830949783325195, -28.452083587646484, -27.073219299316406, -25.694353103637695, -24.315486907958984, -22.936620712280273, -21.557754516601562, -20.178890228271484, -18.800024032592773, -17.421157836914062, -16.042293548583984, -14.663427352905273, -13.284561157226562, -11.905694961547852, -10.526829719543457, -9.147964477539062, -7.769098281860352, -6.390232563018799, -5.011366844177246, -3.6325016021728516, -2.2536354064941406, -0.8747696876525879, 0.5040960311889648, 1.8829617500305176, 3.2618274688720703, 4.640693187713623, 6.019558906555176, 7.39842414855957, 8.777290344238281, 10.156156539916992, 11.535021781921387, 12.913887023925781, 14.292753219604492, 15.671619415283203, 17.05048370361328, 18.429349899291992, 19.808216094970703, 21.187082290649414, 22.565948486328125, 23.944812774658203, 25.323678970336914, 26.702545166015625, 28.081409454345703, 29.460275650024414, 30.839141845703125, 32.2180061340332, 33.59687423706055, 34.975738525390625, 36.35460662841797, 37.73347091674805, 39.112335205078125, 40.49120330810547, 41.87006759643555]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 6.0, 12.0, 17.0, 13.0, 31.0, 38.0, 49.0, 75.0, 112.0, 239.0, 396.0, 782.0, 1829.0, 5157.0, 21559.0, 123663.0, 539650.0, 290565.0, 49073.0, 9979.0, 2841.0, 1144.0, 508.0, 283.0, 165.0, 129.0, 62.0, 52.0, 38.0, 15.0, 11.0, 16.0, 8.0, 8.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.9375, -33.67822265625, -32.4189453125, -31.15966796875, -29.900390625, -28.64111328125, -27.3818359375, -26.12255859375, -24.86328125, -23.60400390625, -22.3447265625, -21.08544921875, -19.826171875, -18.56689453125, -17.3076171875, -16.04833984375, -14.7890625, -13.52978515625, -12.2705078125, -11.01123046875, -9.751953125, -8.49267578125, -7.2333984375, -5.97412109375, -4.71484375, -3.45556640625, -2.1962890625, -0.93701171875, 0.322265625, 1.58154296875, 2.8408203125, 4.10009765625, 5.359375, 6.61865234375, 7.8779296875, 9.13720703125, 10.396484375, 11.65576171875, 12.9150390625, 14.17431640625, 15.43359375, 16.69287109375, 17.9521484375, 19.21142578125, 20.470703125, 21.72998046875, 22.9892578125, 24.24853515625, 25.5078125, 26.76708984375, 28.0263671875, 29.28564453125, 30.544921875, 31.80419921875, 33.0634765625, 34.32275390625, 35.58203125, 36.84130859375, 38.1005859375, 39.35986328125, 40.619140625, 41.87841796875, 43.1376953125, 44.39697265625, 45.65625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 11.0, 6.0, 24.0, 30.0, 53.0, 62.0, 89.0, 87.0, 115.0, 117.0, 111.0, 78.0, 74.0, 52.0, 36.0, 17.0, 10.0, 12.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87109375, -5.662353515625, -5.45361328125, -5.244873046875, -5.0361328125, -4.827392578125, -4.61865234375, -4.409912109375, -4.201171875, -3.992431640625, -3.78369140625, -3.574951171875, -3.3662109375, -3.157470703125, -2.94873046875, -2.739990234375, -2.53125, -2.322509765625, -2.11376953125, -1.905029296875, -1.6962890625, -1.487548828125, -1.27880859375, -1.070068359375, -0.861328125, -0.652587890625, -0.44384765625, -0.235107421875, -0.0263671875, 0.182373046875, 0.39111328125, 0.599853515625, 0.80859375, 1.017333984375, 1.22607421875, 1.434814453125, 1.6435546875, 1.852294921875, 2.06103515625, 2.269775390625, 2.478515625, 2.687255859375, 2.89599609375, 3.104736328125, 3.3134765625, 3.522216796875, 3.73095703125, 3.939697265625, 4.1484375, 4.357177734375, 4.56591796875, 4.774658203125, 4.9833984375, 5.192138671875, 5.40087890625, 5.609619140625, 5.818359375, 6.027099609375, 6.23583984375, 6.444580078125, 6.6533203125, 6.862060546875, 7.07080078125, 7.279541015625, 7.48828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 9.0, 9.0, 14.0, 18.0, 20.0, 25.0, 31.0, 36.0, 49.0, 81.0, 100.0, 174.0, 226.0, 379.0, 594.0, 952.0, 1730.0, 3053.0, 6309.0, 13794.0, 32718.0, 83322.0, 203381.0, 332941.0, 215034.0, 89196.0, 35165.0, 14637.0, 6654.0, 3395.0, 1717.0, 982.0, 591.0, 377.0, 246.0, 167.0, 125.0, 80.0, 63.0, 45.0, 32.0, 15.0, 24.0, 9.0, 11.0, 10.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-18.0625, -17.48974609375, -16.9169921875, -16.34423828125, -15.771484375, -15.19873046875, -14.6259765625, -14.05322265625, -13.48046875, -12.90771484375, -12.3349609375, -11.76220703125, -11.189453125, -10.61669921875, -10.0439453125, -9.47119140625, -8.8984375, -8.32568359375, -7.7529296875, -7.18017578125, -6.607421875, -6.03466796875, -5.4619140625, -4.88916015625, -4.31640625, -3.74365234375, -3.1708984375, -2.59814453125, -2.025390625, -1.45263671875, -0.8798828125, -0.30712890625, 0.265625, 0.83837890625, 1.4111328125, 1.98388671875, 2.556640625, 3.12939453125, 3.7021484375, 4.27490234375, 4.84765625, 5.42041015625, 5.9931640625, 6.56591796875, 7.138671875, 7.71142578125, 8.2841796875, 8.85693359375, 9.4296875, 10.00244140625, 10.5751953125, 11.14794921875, 11.720703125, 12.29345703125, 12.8662109375, 13.43896484375, 14.01171875, 14.58447265625, 15.1572265625, 15.72998046875, 16.302734375, 16.87548828125, 17.4482421875, 18.02099609375, 18.59375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 8.0, 9.0, 5.0, 6.0, 8.0, 11.0, 10.0, 24.0, 20.0, 31.0, 28.0, 30.0, 31.0, 32.0, 38.0, 38.0, 47.0, 50.0, 49.0, 49.0, 38.0, 39.0, 51.0, 51.0, 37.0, 36.0, 31.0, 31.0, 28.0, 20.0, 20.0, 10.0, 19.0, 13.0, 10.0, 10.0, 5.0, 1.0, 6.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.9375, -14.44677734375, -13.9560546875, -13.46533203125, -12.974609375, -12.48388671875, -11.9931640625, -11.50244140625, -11.01171875, -10.52099609375, -10.0302734375, -9.53955078125, -9.048828125, -8.55810546875, -8.0673828125, -7.57666015625, -7.0859375, -6.59521484375, -6.1044921875, -5.61376953125, -5.123046875, -4.63232421875, -4.1416015625, -3.65087890625, -3.16015625, -2.66943359375, -2.1787109375, -1.68798828125, -1.197265625, -0.70654296875, -0.2158203125, 0.27490234375, 0.765625, 1.25634765625, 1.7470703125, 2.23779296875, 2.728515625, 3.21923828125, 3.7099609375, 4.20068359375, 4.69140625, 5.18212890625, 5.6728515625, 6.16357421875, 6.654296875, 7.14501953125, 7.6357421875, 8.12646484375, 8.6171875, 9.10791015625, 9.5986328125, 10.08935546875, 10.580078125, 11.07080078125, 11.5615234375, 12.05224609375, 12.54296875, 13.03369140625, 13.5244140625, 14.01513671875, 14.505859375, 14.99658203125, 15.4873046875, 15.97802734375, 16.46875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 3.0, 9.0, 13.0, 13.0, 29.0, 27.0, 41.0, 66.0, 114.0, 166.0, 306.0, 620.0, 1131.0, 2731.0, 7388.0, 24498.0, 97795.0, 365961.0, 394590.0, 111668.0, 27325.0, 8317.0, 3041.0, 1244.0, 614.0, 332.0, 185.0, 124.0, 70.0, 42.0, 22.0, 26.0, 18.0, 8.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.6171875, -12.24658203125, -11.8759765625, -11.50537109375, -11.134765625, -10.76416015625, -10.3935546875, -10.02294921875, -9.65234375, -9.28173828125, -8.9111328125, -8.54052734375, -8.169921875, -7.79931640625, -7.4287109375, -7.05810546875, -6.6875, -6.31689453125, -5.9462890625, -5.57568359375, -5.205078125, -4.83447265625, -4.4638671875, -4.09326171875, -3.72265625, -3.35205078125, -2.9814453125, -2.61083984375, -2.240234375, -1.86962890625, -1.4990234375, -1.12841796875, -0.7578125, -0.38720703125, -0.0166015625, 0.35400390625, 0.724609375, 1.09521484375, 1.4658203125, 1.83642578125, 2.20703125, 2.57763671875, 2.9482421875, 3.31884765625, 3.689453125, 4.06005859375, 4.4306640625, 4.80126953125, 5.171875, 5.54248046875, 5.9130859375, 6.28369140625, 6.654296875, 7.02490234375, 7.3955078125, 7.76611328125, 8.13671875, 8.50732421875, 8.8779296875, 9.24853515625, 9.619140625, 9.98974609375, 10.3603515625, 10.73095703125, 11.1015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 6.0, 5.0, 7.0, 6.0, 13.0, 18.0, 22.0, 53.0, 42.0, 57.0, 85.0, 96.0, 84.0, 128.0, 97.0, 64.0, 52.0, 46.0, 38.0, 16.0, 18.0, 17.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00231170654296875, -0.00224873423576355, -0.0021857619285583496, -0.0021227896213531494, -0.0020598173141479492, -0.001996845006942749, -0.0019338726997375488, -0.0018709003925323486, -0.0018079280853271484, -0.0017449557781219482, -0.001681983470916748, -0.0016190111637115479, -0.0015560388565063477, -0.0014930665493011475, -0.0014300942420959473, -0.001367121934890747, -0.0013041496276855469, -0.0012411773204803467, -0.0011782050132751465, -0.0011152327060699463, -0.001052260398864746, -0.000989288091659546, -0.0009263157844543457, -0.0008633434772491455, -0.0008003711700439453, -0.0007373988628387451, -0.0006744265556335449, -0.0006114542484283447, -0.0005484819412231445, -0.00048550963401794434, -0.00042253732681274414, -0.00035956501960754395, -0.00029659271240234375, -0.00023362040519714355, -0.00017064809799194336, -0.00010767579078674316, -4.470348358154297e-05, 1.8268823623657227e-05, 8.124113082885742e-05, 0.00014421343803405762, 0.0002071857452392578, 0.000270158052444458, 0.0003331303596496582, 0.0003961026668548584, 0.0004590749740600586, 0.0005220472812652588, 0.000585019588470459, 0.0006479918956756592, 0.0007109642028808594, 0.0007739365100860596, 0.0008369088172912598, 0.00089988112449646, 0.0009628534317016602, 0.0010258257389068604, 0.0010887980461120605, 0.0011517703533172607, 0.001214742660522461, 0.0012777149677276611, 0.0013406872749328613, 0.0014036595821380615, 0.0014666318893432617, 0.001529604196548462, 0.0015925765037536621, 0.0016555488109588623, 0.0017185211181640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 12.0, 18.0, 22.0, 37.0, 62.0, 79.0, 125.0, 246.0, 443.0, 880.0, 1727.0, 4279.0, 11922.0, 38277.0, 157413.0, 473758.0, 267175.0, 63416.0, 17569.0, 6216.0, 2487.0, 1107.0, 558.0, 256.0, 178.0, 98.0, 57.0, 44.0, 25.0, 19.0, 12.0, 11.0, 7.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-16.015625, -15.612060546875, -15.20849609375, -14.804931640625, -14.4013671875, -13.997802734375, -13.59423828125, -13.190673828125, -12.787109375, -12.383544921875, -11.97998046875, -11.576416015625, -11.1728515625, -10.769287109375, -10.36572265625, -9.962158203125, -9.55859375, -9.155029296875, -8.75146484375, -8.347900390625, -7.9443359375, -7.540771484375, -7.13720703125, -6.733642578125, -6.330078125, -5.926513671875, -5.52294921875, -5.119384765625, -4.7158203125, -4.312255859375, -3.90869140625, -3.505126953125, -3.1015625, -2.697998046875, -2.29443359375, -1.890869140625, -1.4873046875, -1.083740234375, -0.68017578125, -0.276611328125, 0.126953125, 0.530517578125, 0.93408203125, 1.337646484375, 1.7412109375, 2.144775390625, 2.54833984375, 2.951904296875, 3.35546875, 3.759033203125, 4.16259765625, 4.566162109375, 4.9697265625, 5.373291015625, 5.77685546875, 6.180419921875, 6.583984375, 6.987548828125, 7.39111328125, 7.794677734375, 8.1982421875, 8.601806640625, 9.00537109375, 9.408935546875, 9.8125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 5.0, 7.0, 8.0, 6.0, 11.0, 19.0, 18.0, 20.0, 13.0, 26.0, 39.0, 46.0, 67.0, 59.0, 54.0, 60.0, 70.0, 59.0, 59.0, 41.0, 54.0, 40.0, 37.0, 38.0, 26.0, 21.0, 17.0, 10.0, 14.0, 7.0, 8.0, 10.0, 3.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -6.0323486328125, -5.842041015625, -5.6517333984375, -5.46142578125, -5.2711181640625, -5.080810546875, -4.8905029296875, -4.7001953125, -4.5098876953125, -4.319580078125, -4.1292724609375, -3.93896484375, -3.7486572265625, -3.558349609375, -3.3680419921875, -3.177734375, -2.9874267578125, -2.797119140625, -2.6068115234375, -2.41650390625, -2.2261962890625, -2.035888671875, -1.8455810546875, -1.6552734375, -1.4649658203125, -1.274658203125, -1.0843505859375, -0.89404296875, -0.7037353515625, -0.513427734375, -0.3231201171875, -0.1328125, 0.0574951171875, 0.247802734375, 0.4381103515625, 0.62841796875, 0.8187255859375, 1.009033203125, 1.1993408203125, 1.3896484375, 1.5799560546875, 1.770263671875, 1.9605712890625, 2.15087890625, 2.3411865234375, 2.531494140625, 2.7218017578125, 2.912109375, 3.1024169921875, 3.292724609375, 3.4830322265625, 3.67333984375, 3.8636474609375, 4.053955078125, 4.2442626953125, 4.4345703125, 4.6248779296875, 4.815185546875, 5.0054931640625, 5.19580078125, 5.3861083984375, 5.576416015625, 5.7667236328125, 5.95703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 11.0, 27.0, 48.0, 68.0, 97.0, 147.0, 145.0, 157.0, 114.0, 67.0, 53.0, 26.0, 10.0, 10.0, 4.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.79756164550781, -117.58443450927734, -112.37130737304688, -107.1581802368164, -101.94505310058594, -96.73193359375, -91.51880645751953, -86.30567932128906, -81.0925521850586, -75.87942504882812, -70.66629791259766, -65.45317077636719, -60.240047454833984, -55.026920318603516, -49.81379699707031, -44.600669860839844, -39.387542724609375, -34.174415588378906, -28.96129035949707, -23.748165130615234, -18.535037994384766, -13.321910858154297, -8.108785629272461, -2.895660400390625, 2.3174667358398438, 7.530592918395996, 12.743719100952148, 17.956844329833984, 23.169971466064453, 28.383098602294922, 33.596221923828125, 38.809349060058594, 44.0224609375, 49.23558807373047, 54.44871520996094, 59.66183853149414, 64.87496948242188, 70.08808898925781, 75.30121612548828, 80.51434326171875, 85.72747039794922, 90.94059753417969, 96.15372467041016, 101.36685180664062, 106.57997131347656, 111.79310607910156, 117.0062255859375, 122.21935272216797, 127.43247985839844, 132.64559936523438, 137.85873413085938, 143.0718536376953, 148.2849884033203, 153.49810791015625, 158.71124267578125, 163.9243621826172, 169.13748168945312, 174.35060119628906, 179.56373596191406, 184.77685546875, 189.989990234375, 195.20310974121094, 200.41624450683594, 205.62936401367188, 210.84249877929688]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 8.0, 5.0, 10.0, 5.0, 18.0, 11.0, 25.0, 28.0, 34.0, 35.0, 42.0, 44.0, 47.0, 50.0, 71.0, 69.0, 48.0, 50.0, 60.0, 54.0, 50.0, 43.0, 34.0, 29.0, 29.0, 18.0, 18.0, 16.0, 12.0, 10.0, 5.0, 5.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.1722412109375, -100.70118713378906, -97.23013305664062, -93.75908660888672, -90.28803253173828, -86.81697845458984, -83.34593200683594, -79.8748779296875, -76.40382385253906, -72.93276977539062, -69.46171569824219, -65.99066925048828, -62.519615173339844, -59.048561096191406, -55.577510833740234, -52.10646057128906, -48.635406494140625, -45.16435241699219, -41.693302154541016, -38.222251892089844, -34.751197814941406, -31.2801456451416, -27.809093475341797, -24.338041305541992, -20.866989135742188, -17.395936965942383, -13.924884796142578, -10.453832626342773, -6.982780456542969, -3.511728286743164, -0.040676116943359375, 3.4303760528564453, 6.90142822265625, 10.372480392456055, 13.84353256225586, 17.314584732055664, 20.78563690185547, 24.256689071655273, 27.727741241455078, 31.198793411254883, 34.66984558105469, 38.140899658203125, 41.6119499206543, 45.08300018310547, 48.554054260253906, 52.025108337402344, 55.496158599853516, 58.96720886230469, 62.438262939453125, 65.90931701660156, 69.38037109375, 72.8514175415039, 76.32247161865234, 79.79352569580078, 83.26457214355469, 86.73562622070312, 90.20668029785156, 93.677734375, 97.14878845214844, 100.61983489990234, 104.09088897705078, 107.56194305419922, 111.03298950195312, 114.50404357910156, 117.97509765625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 15.0, 13.0, 23.0, 29.0, 33.0, 53.0, 82.0, 171.0, 291.0, 706.0, 2048.0, 7909.0, 49407.0, 3824029.0, 281664.0, 20788.0, 4437.0, 1406.0, 519.0, 269.0, 132.0, 84.0, 43.0, 33.0, 21.0, 13.0, 12.0, 10.0, 4.0, 5.0, 3.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -49.48486328125, -47.3134765625, -45.14208984375, -42.970703125, -40.79931640625, -38.6279296875, -36.45654296875, -34.28515625, -32.11376953125, -29.9423828125, -27.77099609375, -25.599609375, -23.42822265625, -21.2568359375, -19.08544921875, -16.9140625, -14.74267578125, -12.5712890625, -10.39990234375, -8.228515625, -6.05712890625, -3.8857421875, -1.71435546875, 0.45703125, 2.62841796875, 4.7998046875, 6.97119140625, 9.142578125, 11.31396484375, 13.4853515625, 15.65673828125, 17.828125, 19.99951171875, 22.1708984375, 24.34228515625, 26.513671875, 28.68505859375, 30.8564453125, 33.02783203125, 35.19921875, 37.37060546875, 39.5419921875, 41.71337890625, 43.884765625, 46.05615234375, 48.2275390625, 50.39892578125, 52.5703125, 54.74169921875, 56.9130859375, 59.08447265625, 61.255859375, 63.42724609375, 65.5986328125, 67.77001953125, 69.94140625, 72.11279296875, 74.2841796875, 76.45556640625, 78.626953125, 80.79833984375, 82.9697265625, 85.14111328125, 87.3125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 23.0, 43.0, 65.0, 69.0, 101.0, 114.0, 113.0, 132.0, 107.0, 84.0, 57.0, 33.0, 17.0, 11.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.35546875, -7.11444091796875, -6.8734130859375, -6.63238525390625, -6.391357421875, -6.15032958984375, -5.9093017578125, -5.66827392578125, -5.42724609375, -5.18621826171875, -4.9451904296875, -4.70416259765625, -4.463134765625, -4.22210693359375, -3.9810791015625, -3.74005126953125, -3.4990234375, -3.25799560546875, -3.0169677734375, -2.77593994140625, -2.534912109375, -2.29388427734375, -2.0528564453125, -1.81182861328125, -1.57080078125, -1.32977294921875, -1.0887451171875, -0.84771728515625, -0.606689453125, -0.36566162109375, -0.1246337890625, 0.11639404296875, 0.357421875, 0.59844970703125, 0.8394775390625, 1.08050537109375, 1.321533203125, 1.56256103515625, 1.8035888671875, 2.04461669921875, 2.28564453125, 2.52667236328125, 2.7677001953125, 3.00872802734375, 3.249755859375, 3.49078369140625, 3.7318115234375, 3.97283935546875, 4.2138671875, 4.45489501953125, 4.6959228515625, 4.93695068359375, 5.177978515625, 5.41900634765625, 5.6600341796875, 5.90106201171875, 6.14208984375, 6.38311767578125, 6.6241455078125, 6.86517333984375, 7.106201171875, 7.34722900390625, 7.5882568359375, 7.82928466796875, 8.0703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 5.0, 10.0, 24.0, 30.0, 28.0, 68.0, 82.0, 144.0, 220.0, 446.0, 871.0, 2105.0, 6579.0, 31736.0, 362594.0, 3661634.0, 105379.0, 15636.0, 3960.0, 1348.0, 588.0, 263.0, 162.0, 104.0, 65.0, 61.0, 29.0, 29.0, 17.0, 16.0, 16.0, 11.0, 9.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.625, -48.89599609375, -47.1669921875, -45.43798828125, -43.708984375, -41.97998046875, -40.2509765625, -38.52197265625, -36.79296875, -35.06396484375, -33.3349609375, -31.60595703125, -29.876953125, -28.14794921875, -26.4189453125, -24.68994140625, -22.9609375, -21.23193359375, -19.5029296875, -17.77392578125, -16.044921875, -14.31591796875, -12.5869140625, -10.85791015625, -9.12890625, -7.39990234375, -5.6708984375, -3.94189453125, -2.212890625, -0.48388671875, 1.2451171875, 2.97412109375, 4.703125, 6.43212890625, 8.1611328125, 9.89013671875, 11.619140625, 13.34814453125, 15.0771484375, 16.80615234375, 18.53515625, 20.26416015625, 21.9931640625, 23.72216796875, 25.451171875, 27.18017578125, 28.9091796875, 30.63818359375, 32.3671875, 34.09619140625, 35.8251953125, 37.55419921875, 39.283203125, 41.01220703125, 42.7412109375, 44.47021484375, 46.19921875, 47.92822265625, 49.6572265625, 51.38623046875, 53.115234375, 54.84423828125, 56.5732421875, 58.30224609375, 60.03125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 11.0, 11.0, 13.0, 26.0, 55.0, 79.0, 140.0, 340.0, 1772.0, 1001.0, 274.0, 128.0, 74.0, 40.0, 32.0, 19.0, 20.0, 11.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6328125, -9.2607421875, -8.888671875, -8.5166015625, -8.14453125, -7.7724609375, -7.400390625, -7.0283203125, -6.65625, -6.2841796875, -5.912109375, -5.5400390625, -5.16796875, -4.7958984375, -4.423828125, -4.0517578125, -3.6796875, -3.3076171875, -2.935546875, -2.5634765625, -2.19140625, -1.8193359375, -1.447265625, -1.0751953125, -0.703125, -0.3310546875, 0.041015625, 0.4130859375, 0.78515625, 1.1572265625, 1.529296875, 1.9013671875, 2.2734375, 2.6455078125, 3.017578125, 3.3896484375, 3.76171875, 4.1337890625, 4.505859375, 4.8779296875, 5.25, 5.6220703125, 5.994140625, 6.3662109375, 6.73828125, 7.1103515625, 7.482421875, 7.8544921875, 8.2265625, 8.5986328125, 8.970703125, 9.3427734375, 9.71484375, 10.0869140625, 10.458984375, 10.8310546875, 11.203125, 11.5751953125, 11.947265625, 12.3193359375, 12.69140625, 13.0634765625, 13.435546875, 13.8076171875, 14.1796875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 7.0, 24.0, 81.0, 226.0, 368.0, 200.0, 64.0, 28.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.130615234375, -159.07444763183594, -154.0182647705078, -148.96209716796875, -143.9059295654297, -138.84976196289062, -133.7935791015625, -128.73741149902344, -123.68123626708984, -118.62506103515625, -113.56889343261719, -108.5127182006836, -103.45654296875, -98.40037536621094, -93.34420013427734, -88.28802490234375, -83.23185729980469, -78.1756820678711, -73.11951446533203, -68.06333923339844, -63.00716781616211, -57.95099639892578, -52.89482116699219, -47.83864974975586, -42.78247833251953, -37.7263069152832, -32.670135498046875, -27.61396026611328, -22.557788848876953, -17.501617431640625, -12.445444107055664, -7.389270782470703, -2.3331146240234375, 2.723057746887207, 7.779230117797852, 12.835402488708496, 17.89157485961914, 22.94774627685547, 28.00391960144043, 33.06009292602539, 38.11626434326172, 43.17243576049805, 48.228607177734375, 53.28478240966797, 58.3409538269043, 63.397125244140625, 68.45330047607422, 73.50947570800781, 78.56564331054688, 83.62181854248047, 88.67798614501953, 93.73416137695312, 98.79032897949219, 103.84650421142578, 108.90267944335938, 113.95884704589844, 119.01502227783203, 124.07119750976562, 129.1273651123047, 134.18353271484375, 139.23971557617188, 144.29588317871094, 149.35205078125, 154.40823364257812, 159.4644012451172]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 13.0, 16.0, 17.0, 24.0, 23.0, 31.0, 27.0, 35.0, 46.0, 48.0, 52.0, 59.0, 56.0, 48.0, 43.0, 60.0, 56.0, 48.0, 49.0, 33.0, 30.0, 25.0, 24.0, 26.0, 20.0, 22.0, 9.0, 9.0, 9.0, 8.0, 3.0, 4.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-34.57499313354492, -33.52218246459961, -32.4693717956543, -31.416561126708984, -30.363750457763672, -29.31093978881836, -28.258127212524414, -27.2053165435791, -26.15250587463379, -25.099695205688477, -24.046884536743164, -22.99407386779785, -21.941261291503906, -20.888450622558594, -19.83563995361328, -18.78282928466797, -17.730018615722656, -16.677207946777344, -15.624397277832031, -14.571585655212402, -13.51877498626709, -12.465964317321777, -11.413152694702148, -10.360342025756836, -9.307531356811523, -8.254720687866211, -7.20190954208374, -6.1490983963012695, -5.096287727355957, -4.0434770584106445, -2.990665912628174, -1.9378547668457031, -0.8850479125976562, 0.16776299476623535, 1.220573902130127, 2.2733848094940186, 3.32619571685791, 4.379006385803223, 5.431817531585693, 6.484628677368164, 7.537439346313477, 8.590250015258789, 9.643060684204102, 10.69587230682373, 11.748682975769043, 12.801493644714355, 13.854305267333984, 14.907115936279297, 15.95992660522461, 17.012737274169922, 18.065547943115234, 19.118358612060547, 20.17116928100586, 21.223979949951172, 22.276792526245117, 23.32960319519043, 24.382413864135742, 25.435224533081055, 26.488035202026367, 27.54084587097168, 28.593658447265625, 29.646469116210938, 30.69927978515625, 31.752090454101562, 32.804901123046875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 8.0, 14.0, 22.0, 27.0, 36.0, 66.0, 120.0, 181.0, 321.0, 661.0, 1298.0, 3242.0, 10603.0, 47955.0, 276624.0, 547801.0, 125986.0, 23313.0, 6091.0, 2102.0, 926.0, 456.0, 234.0, 157.0, 94.0, 60.0, 45.0, 27.0, 19.0, 11.0, 8.0, 7.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.84375, -31.6396484375, -30.435546875, -29.2314453125, -28.02734375, -26.8232421875, -25.619140625, -24.4150390625, -23.2109375, -22.0068359375, -20.802734375, -19.5986328125, -18.39453125, -17.1904296875, -15.986328125, -14.7822265625, -13.578125, -12.3740234375, -11.169921875, -9.9658203125, -8.76171875, -7.5576171875, -6.353515625, -5.1494140625, -3.9453125, -2.7412109375, -1.537109375, -0.3330078125, 0.87109375, 2.0751953125, 3.279296875, 4.4833984375, 5.6875, 6.8916015625, 8.095703125, 9.2998046875, 10.50390625, 11.7080078125, 12.912109375, 14.1162109375, 15.3203125, 16.5244140625, 17.728515625, 18.9326171875, 20.13671875, 21.3408203125, 22.544921875, 23.7490234375, 24.953125, 26.1572265625, 27.361328125, 28.5654296875, 29.76953125, 30.9736328125, 32.177734375, 33.3818359375, 34.5859375, 35.7900390625, 36.994140625, 38.1982421875, 39.40234375, 40.6064453125, 41.810546875, 43.0146484375, 44.21875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 9.0, 18.0, 31.0, 45.0, 56.0, 82.0, 109.0, 111.0, 117.0, 110.0, 87.0, 75.0, 54.0, 40.0, 18.0, 12.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28125, -6.0513916015625, -5.821533203125, -5.5916748046875, -5.36181640625, -5.1319580078125, -4.902099609375, -4.6722412109375, -4.4423828125, -4.2125244140625, -3.982666015625, -3.7528076171875, -3.52294921875, -3.2930908203125, -3.063232421875, -2.8333740234375, -2.603515625, -2.3736572265625, -2.143798828125, -1.9139404296875, -1.68408203125, -1.4542236328125, -1.224365234375, -0.9945068359375, -0.7646484375, -0.5347900390625, -0.304931640625, -0.0750732421875, 0.15478515625, 0.3846435546875, 0.614501953125, 0.8443603515625, 1.07421875, 1.3040771484375, 1.533935546875, 1.7637939453125, 1.99365234375, 2.2235107421875, 2.453369140625, 2.6832275390625, 2.9130859375, 3.1429443359375, 3.372802734375, 3.6026611328125, 3.83251953125, 4.0623779296875, 4.292236328125, 4.5220947265625, 4.751953125, 4.9818115234375, 5.211669921875, 5.4415283203125, 5.67138671875, 5.9012451171875, 6.131103515625, 6.3609619140625, 6.5908203125, 6.8206787109375, 7.050537109375, 7.2803955078125, 7.51025390625, 7.7401123046875, 7.969970703125, 8.1998291015625, 8.4296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 15.0, 22.0, 22.0, 31.0, 35.0, 59.0, 78.0, 116.0, 175.0, 242.0, 408.0, 708.0, 1224.0, 2340.0, 4933.0, 11159.0, 28581.0, 77736.0, 209624.0, 370461.0, 211554.0, 78651.0, 28607.0, 11182.0, 4968.0, 2341.0, 1245.0, 684.0, 459.0, 279.0, 194.0, 129.0, 92.0, 47.0, 36.0, 25.0, 20.0, 15.0, 9.0, 8.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.74072265625, -14.1845703125, -13.62841796875, -13.072265625, -12.51611328125, -11.9599609375, -11.40380859375, -10.84765625, -10.29150390625, -9.7353515625, -9.17919921875, -8.623046875, -8.06689453125, -7.5107421875, -6.95458984375, -6.3984375, -5.84228515625, -5.2861328125, -4.72998046875, -4.173828125, -3.61767578125, -3.0615234375, -2.50537109375, -1.94921875, -1.39306640625, -0.8369140625, -0.28076171875, 0.275390625, 0.83154296875, 1.3876953125, 1.94384765625, 2.5, 3.05615234375, 3.6123046875, 4.16845703125, 4.724609375, 5.28076171875, 5.8369140625, 6.39306640625, 6.94921875, 7.50537109375, 8.0615234375, 8.61767578125, 9.173828125, 9.72998046875, 10.2861328125, 10.84228515625, 11.3984375, 11.95458984375, 12.5107421875, 13.06689453125, 13.623046875, 14.17919921875, 14.7353515625, 15.29150390625, 15.84765625, 16.40380859375, 16.9599609375, 17.51611328125, 18.072265625, 18.62841796875, 19.1845703125, 19.74072265625, 20.296875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 6.0, 11.0, 14.0, 9.0, 12.0, 18.0, 21.0, 17.0, 24.0, 39.0, 39.0, 29.0, 46.0, 35.0, 49.0, 62.0, 41.0, 57.0, 56.0, 43.0, 34.0, 45.0, 39.0, 36.0, 25.0, 17.0, 35.0, 28.0, 27.0, 8.0, 19.0, 14.0, 14.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3046875, -13.833984375, -13.36328125, -12.892578125, -12.421875, -11.951171875, -11.48046875, -11.009765625, -10.5390625, -10.068359375, -9.59765625, -9.126953125, -8.65625, -8.185546875, -7.71484375, -7.244140625, -6.7734375, -6.302734375, -5.83203125, -5.361328125, -4.890625, -4.419921875, -3.94921875, -3.478515625, -3.0078125, -2.537109375, -2.06640625, -1.595703125, -1.125, -0.654296875, -0.18359375, 0.287109375, 0.7578125, 1.228515625, 1.69921875, 2.169921875, 2.640625, 3.111328125, 3.58203125, 4.052734375, 4.5234375, 4.994140625, 5.46484375, 5.935546875, 6.40625, 6.876953125, 7.34765625, 7.818359375, 8.2890625, 8.759765625, 9.23046875, 9.701171875, 10.171875, 10.642578125, 11.11328125, 11.583984375, 12.0546875, 12.525390625, 12.99609375, 13.466796875, 13.9375, 14.408203125, 14.87890625, 15.349609375, 15.8203125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 8.0, 6.0, 2.0, 5.0, 7.0, 5.0, 4.0, 16.0, 26.0, 23.0, 36.0, 51.0, 62.0, 121.0, 223.0, 347.0, 611.0, 1265.0, 3037.0, 8332.0, 29202.0, 123858.0, 439001.0, 332363.0, 79479.0, 19811.0, 6095.0, 2232.0, 1040.0, 470.0, 276.0, 167.0, 106.0, 68.0, 57.0, 31.0, 23.0, 24.0, 12.0, 12.0, 6.0, 6.0, 6.0, 9.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0], "bins": [-10.546875, -10.225830078125, -9.90478515625, -9.583740234375, -9.2626953125, -8.941650390625, -8.62060546875, -8.299560546875, -7.978515625, -7.657470703125, -7.33642578125, -7.015380859375, -6.6943359375, -6.373291015625, -6.05224609375, -5.731201171875, -5.41015625, -5.089111328125, -4.76806640625, -4.447021484375, -4.1259765625, -3.804931640625, -3.48388671875, -3.162841796875, -2.841796875, -2.520751953125, -2.19970703125, -1.878662109375, -1.5576171875, -1.236572265625, -0.91552734375, -0.594482421875, -0.2734375, 0.047607421875, 0.36865234375, 0.689697265625, 1.0107421875, 1.331787109375, 1.65283203125, 1.973876953125, 2.294921875, 2.615966796875, 2.93701171875, 3.258056640625, 3.5791015625, 3.900146484375, 4.22119140625, 4.542236328125, 4.86328125, 5.184326171875, 5.50537109375, 5.826416015625, 6.1474609375, 6.468505859375, 6.78955078125, 7.110595703125, 7.431640625, 7.752685546875, 8.07373046875, 8.394775390625, 8.7158203125, 9.036865234375, 9.35791015625, 9.678955078125, 10.0]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 10.0, 15.0, 14.0, 10.0, 22.0, 33.0, 40.0, 53.0, 59.0, 60.0, 70.0, 78.0, 91.0, 71.0, 81.0, 50.0, 42.0, 39.0, 31.0, 23.0, 13.0, 18.0, 12.0, 8.0, 8.0, 6.0, 2.0, 7.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014743804931640625, -0.0014344602823257446, -0.0013945400714874268, -0.0013546198606491089, -0.001314699649810791, -0.0012747794389724731, -0.0012348592281341553, -0.0011949390172958374, -0.0011550188064575195, -0.0011150985956192017, -0.0010751783847808838, -0.001035258173942566, -0.000995337963104248, -0.0009554177522659302, -0.0009154975414276123, -0.0008755773305892944, -0.0008356571197509766, -0.0007957369089126587, -0.0007558166980743408, -0.000715896487236023, -0.0006759762763977051, -0.0006360560655593872, -0.0005961358547210693, -0.0005562156438827515, -0.0005162954330444336, -0.0004763752222061157, -0.00043645501136779785, -0.00039653480052948, -0.0003566145896911621, -0.00031669437885284424, -0.00027677416801452637, -0.0002368539571762085, -0.00019693374633789062, -0.00015701353549957275, -0.00011709332466125488, -7.717311382293701e-05, -3.725290298461914e-05, 2.6673078536987305e-06, 4.25875186920166e-05, 8.250772953033447e-05, 0.00012242794036865234, 0.00016234815120697021, 0.00020226836204528809, 0.00024218857288360596, 0.00028210878372192383, 0.0003220289945602417, 0.00036194920539855957, 0.00040186941623687744, 0.0004417896270751953, 0.0004817098379135132, 0.0005216300487518311, 0.0005615502595901489, 0.0006014704704284668, 0.0006413906812667847, 0.0006813108921051025, 0.0007212311029434204, 0.0007611513137817383, 0.0008010715246200562, 0.000840991735458374, 0.0008809119462966919, 0.0009208321571350098, 0.0009607523679733276, 0.0010006725788116455, 0.0010405927896499634, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 10.0, 19.0, 23.0, 27.0, 26.0, 79.0, 111.0, 173.0, 342.0, 592.0, 1171.0, 2240.0, 5011.0, 12955.0, 41201.0, 166137.0, 483733.0, 245848.0, 58999.0, 17626.0, 6381.0, 2796.0, 1407.0, 669.0, 400.0, 208.0, 128.0, 88.0, 53.0, 20.0, 23.0, 19.0, 13.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-12.53125, -12.189208984375, -11.84716796875, -11.505126953125, -11.1630859375, -10.821044921875, -10.47900390625, -10.136962890625, -9.794921875, -9.452880859375, -9.11083984375, -8.768798828125, -8.4267578125, -8.084716796875, -7.74267578125, -7.400634765625, -7.05859375, -6.716552734375, -6.37451171875, -6.032470703125, -5.6904296875, -5.348388671875, -5.00634765625, -4.664306640625, -4.322265625, -3.980224609375, -3.63818359375, -3.296142578125, -2.9541015625, -2.612060546875, -2.27001953125, -1.927978515625, -1.5859375, -1.243896484375, -0.90185546875, -0.559814453125, -0.2177734375, 0.124267578125, 0.46630859375, 0.808349609375, 1.150390625, 1.492431640625, 1.83447265625, 2.176513671875, 2.5185546875, 2.860595703125, 3.20263671875, 3.544677734375, 3.88671875, 4.228759765625, 4.57080078125, 4.912841796875, 5.2548828125, 5.596923828125, 5.93896484375, 6.281005859375, 6.623046875, 6.965087890625, 7.30712890625, 7.649169921875, 7.9912109375, 8.333251953125, 8.67529296875, 9.017333984375, 9.359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 5.0, 8.0, 9.0, 12.0, 19.0, 24.0, 33.0, 33.0, 42.0, 61.0, 56.0, 71.0, 85.0, 80.0, 72.0, 74.0, 60.0, 53.0, 36.0, 36.0, 22.0, 12.0, 16.0, 15.0, 10.0, 8.0, 10.0, 3.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.92279052734375, -5.7205810546875, -5.51837158203125, -5.316162109375, -5.11395263671875, -4.9117431640625, -4.70953369140625, -4.50732421875, -4.30511474609375, -4.1029052734375, -3.90069580078125, -3.698486328125, -3.49627685546875, -3.2940673828125, -3.09185791015625, -2.8896484375, -2.68743896484375, -2.4852294921875, -2.28302001953125, -2.080810546875, -1.87860107421875, -1.6763916015625, -1.47418212890625, -1.27197265625, -1.06976318359375, -0.8675537109375, -0.66534423828125, -0.463134765625, -0.26092529296875, -0.0587158203125, 0.14349365234375, 0.345703125, 0.54791259765625, 0.7501220703125, 0.95233154296875, 1.154541015625, 1.35675048828125, 1.5589599609375, 1.76116943359375, 1.96337890625, 2.16558837890625, 2.3677978515625, 2.57000732421875, 2.772216796875, 2.97442626953125, 3.1766357421875, 3.37884521484375, 3.5810546875, 3.78326416015625, 3.9854736328125, 4.18768310546875, 4.389892578125, 4.59210205078125, 4.7943115234375, 4.99652099609375, 5.19873046875, 5.40093994140625, 5.6031494140625, 5.80535888671875, 6.007568359375, 6.20977783203125, 6.4119873046875, 6.61419677734375, 6.81640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 14.0, 21.0, 58.0, 137.0, 237.0, 273.0, 159.0, 75.0, 22.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.6604919433594, -280.36700439453125, -271.0735168457031, -261.780029296875, -252.48654174804688, -243.19305419921875, -233.89956665039062, -224.6060791015625, -215.31259155273438, -206.01910400390625, -196.72561645507812, -187.43212890625, -178.13864135742188, -168.84515380859375, -159.55166625976562, -150.2581787109375, -140.96469116210938, -131.67120361328125, -122.37771606445312, -113.084228515625, -103.79074096679688, -94.49725341796875, -85.20376586914062, -75.9102783203125, -66.61679077148438, -57.32330322265625, -48.029815673828125, -38.736328125, -29.442840576171875, -20.14935302734375, -10.855865478515625, -1.5623779296875, 7.73114013671875, 17.024627685546875, 26.318115234375, 35.611602783203125, 44.90509033203125, 54.198577880859375, 63.4920654296875, 72.78555297851562, 82.07904052734375, 91.37252807617188, 100.666015625, 109.95950317382812, 119.25299072265625, 128.54647827148438, 137.8399658203125, 147.13345336914062, 156.42694091796875, 165.72042846679688, 175.013916015625, 184.30740356445312, 193.60089111328125, 202.89437866210938, 212.1878662109375, 221.48135375976562, 230.77484130859375, 240.06832885742188, 249.36181640625, 258.6553039550781, 267.94879150390625, 277.2422790527344, 286.5357666015625, 295.8292541503906, 305.12274169921875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 8.0, 3.0, 10.0, 14.0, 11.0, 24.0, 22.0, 18.0, 14.0, 36.0, 27.0, 36.0, 40.0, 43.0, 56.0, 51.0, 62.0, 53.0, 48.0, 33.0, 57.0, 47.0, 49.0, 46.0, 32.0, 24.0, 17.0, 25.0, 20.0, 14.0, 23.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-88.94471740722656, -86.02000427246094, -83.09529876708984, -80.17058563232422, -77.2458724975586, -74.32115936279297, -71.39645385742188, -68.47174072265625, -65.54702758789062, -62.622318267822266, -59.69760513305664, -56.77289581298828, -53.848182678222656, -50.9234733581543, -47.99876403808594, -45.07405090332031, -42.14934158325195, -39.224632263183594, -36.29991912841797, -33.37520980834961, -30.450496673583984, -27.525787353515625, -24.601076126098633, -21.67636489868164, -18.75165367126465, -15.826942443847656, -12.902231216430664, -9.977520942687988, -7.052809715270996, -4.128098487854004, -1.2033882141113281, 1.721323013305664, 4.646034240722656, 7.570745468139648, 10.49545669555664, 13.420166969299316, 16.344879150390625, 19.269588470458984, 22.194299697875977, 25.11901092529297, 28.04372215270996, 30.968433380126953, 33.89314270019531, 36.81785583496094, 39.7425651550293, 42.66727828979492, 45.59198760986328, 48.516700744628906, 51.441410064697266, 54.366119384765625, 57.29083251953125, 60.21554183959961, 63.140254974365234, 66.0649642944336, 68.98967742919922, 71.91438293457031, 74.83909606933594, 77.76380920410156, 80.68851470947266, 83.61322784423828, 86.5379409790039, 89.46265411376953, 92.38735961914062, 95.31207275390625, 98.23678588867188]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 4.0, 14.0, 16.0, 14.0, 14.0, 32.0, 63.0, 63.0, 118.0, 228.0, 412.0, 975.0, 2533.0, 8095.0, 36898.0, 504503.0, 3555053.0, 66350.0, 12475.0, 3636.0, 1377.0, 617.0, 295.0, 168.0, 94.0, 60.0, 42.0, 24.0, 20.0, 17.0, 20.0, 7.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-58.6875, -56.91748046875, -55.1474609375, -53.37744140625, -51.607421875, -49.83740234375, -48.0673828125, -46.29736328125, -44.52734375, -42.75732421875, -40.9873046875, -39.21728515625, -37.447265625, -35.67724609375, -33.9072265625, -32.13720703125, -30.3671875, -28.59716796875, -26.8271484375, -25.05712890625, -23.287109375, -21.51708984375, -19.7470703125, -17.97705078125, -16.20703125, -14.43701171875, -12.6669921875, -10.89697265625, -9.126953125, -7.35693359375, -5.5869140625, -3.81689453125, -2.046875, -0.27685546875, 1.4931640625, 3.26318359375, 5.033203125, 6.80322265625, 8.5732421875, 10.34326171875, 12.11328125, 13.88330078125, 15.6533203125, 17.42333984375, 19.193359375, 20.96337890625, 22.7333984375, 24.50341796875, 26.2734375, 28.04345703125, 29.8134765625, 31.58349609375, 33.353515625, 35.12353515625, 36.8935546875, 38.66357421875, 40.43359375, 42.20361328125, 43.9736328125, 45.74365234375, 47.513671875, 49.28369140625, 51.0537109375, 52.82373046875, 54.59375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 12.0, 31.0, 48.0, 56.0, 69.0, 82.0, 107.0, 139.0, 115.0, 107.0, 76.0, 53.0, 43.0, 21.0, 15.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.581298828125, -6.34228515625, -6.103271484375, -5.8642578125, -5.625244140625, -5.38623046875, -5.147216796875, -4.908203125, -4.669189453125, -4.43017578125, -4.191162109375, -3.9521484375, -3.713134765625, -3.47412109375, -3.235107421875, -2.99609375, -2.757080078125, -2.51806640625, -2.279052734375, -2.0400390625, -1.801025390625, -1.56201171875, -1.322998046875, -1.083984375, -0.844970703125, -0.60595703125, -0.366943359375, -0.1279296875, 0.111083984375, 0.35009765625, 0.589111328125, 0.828125, 1.067138671875, 1.30615234375, 1.545166015625, 1.7841796875, 2.023193359375, 2.26220703125, 2.501220703125, 2.740234375, 2.979248046875, 3.21826171875, 3.457275390625, 3.6962890625, 3.935302734375, 4.17431640625, 4.413330078125, 4.65234375, 4.891357421875, 5.13037109375, 5.369384765625, 5.6083984375, 5.847412109375, 6.08642578125, 6.325439453125, 6.564453125, 6.803466796875, 7.04248046875, 7.281494140625, 7.5205078125, 7.759521484375, 7.99853515625, 8.237548828125, 8.4765625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 10.0, 9.0, 21.0, 34.0, 44.0, 68.0, 158.0, 383.0, 929.0, 3324.0, 28035.0, 3989637.0, 161786.0, 6876.0, 1664.0, 691.0, 265.0, 142.0, 63.0, 42.0, 22.0, 20.0, 26.0, 19.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.125, -86.7509765625, -83.376953125, -80.0029296875, -76.62890625, -73.2548828125, -69.880859375, -66.5068359375, -63.1328125, -59.7587890625, -56.384765625, -53.0107421875, -49.63671875, -46.2626953125, -42.888671875, -39.5146484375, -36.140625, -32.7666015625, -29.392578125, -26.0185546875, -22.64453125, -19.2705078125, -15.896484375, -12.5224609375, -9.1484375, -5.7744140625, -2.400390625, 0.9736328125, 4.34765625, 7.7216796875, 11.095703125, 14.4697265625, 17.84375, 21.2177734375, 24.591796875, 27.9658203125, 31.33984375, 34.7138671875, 38.087890625, 41.4619140625, 44.8359375, 48.2099609375, 51.583984375, 54.9580078125, 58.33203125, 61.7060546875, 65.080078125, 68.4541015625, 71.828125, 75.2021484375, 78.576171875, 81.9501953125, 85.32421875, 88.6982421875, 92.072265625, 95.4462890625, 98.8203125, 102.1943359375, 105.568359375, 108.9423828125, 112.31640625, 115.6904296875, 119.064453125, 122.4384765625, 125.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 21.0, 61.0, 106.0, 300.0, 1576.0, 1503.0, 282.0, 115.0, 35.0, 26.0, 15.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.6875, -17.875, -17.0625, -16.25, -15.4375, -14.625, -13.8125, -13.0, -12.1875, -11.375, -10.5625, -9.75, -8.9375, -8.125, -7.3125, -6.5, -5.6875, -4.875, -4.0625, -3.25, -2.4375, -1.625, -0.8125, 0.0, 0.8125, 1.625, 2.4375, 3.25, 4.0625, 4.875, 5.6875, 6.5, 7.3125, 8.125, 8.9375, 9.75, 10.5625, 11.375, 12.1875, 13.0, 13.8125, 14.625, 15.4375, 16.25, 17.0625, 17.875, 18.6875, 19.5, 20.3125, 21.125, 21.9375, 22.75, 23.5625, 24.375, 25.1875, 26.0, 26.8125, 27.625, 28.4375, 29.25, 30.0625, 30.875, 31.6875, 32.5]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 16.0, 39.0, 111.0, 235.0, 289.0, 188.0, 75.0, 21.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-321.3175048828125, -314.67431640625, -308.0311584472656, -301.3879699707031, -294.7447814941406, -288.10162353515625, -281.45843505859375, -274.81524658203125, -268.17205810546875, -261.52886962890625, -254.8856964111328, -248.24252319335938, -241.59933471679688, -234.95616149902344, -228.31298828125, -221.6697998046875, -215.02664184570312, -208.3834686279297, -201.7402801513672, -195.09710693359375, -188.45391845703125, -181.8107452392578, -175.16757202148438, -168.52438354492188, -161.88119506835938, -155.23802185058594, -148.59483337402344, -141.95166015625, -135.3084716796875, -128.66529846191406, -122.0221176147461, -115.37893676757812, -108.73575592041016, -102.09257507324219, -95.44939422607422, -88.80621337890625, -82.16304016113281, -75.51985931396484, -68.87667846679688, -62.23350143432617, -55.5903205871582, -48.947139739990234, -42.30396270751953, -35.66078186035156, -29.017602920532227, -22.37442398071289, -15.731243133544922, -9.088066101074219, -2.44488525390625, 4.198294162750244, 10.841473579406738, 17.48465347290039, 24.127832412719727, 30.771011352539062, 37.41419219970703, 44.057369232177734, 50.7005500793457, 57.34373092651367, 63.986907958984375, 70.63008880615234, 77.27326965332031, 83.91644287109375, 90.55963134765625, 97.20280456542969, 103.84598541259766]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 6.0, 7.0, 16.0, 25.0, 37.0, 42.0, 59.0, 74.0, 75.0, 88.0, 94.0, 106.0, 97.0, 84.0, 61.0, 40.0, 34.0, 23.0, 14.0, 4.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-92.70051574707031, -89.85249328613281, -87.00447845458984, -84.15645599365234, -81.30844116210938, -78.46041870117188, -75.61239624023438, -72.76437377929688, -69.9163589477539, -67.0683364868164, -64.22032165527344, -61.37229919433594, -58.5242805480957, -55.67626190185547, -52.82823944091797, -49.980220794677734, -47.1322021484375, -44.284183502197266, -41.43616485595703, -38.58814239501953, -35.7401237487793, -32.89210510253906, -30.044084548950195, -27.196063995361328, -24.348045349121094, -21.50002670288086, -18.652006149291992, -15.803986549377441, -12.95596694946289, -10.10794734954834, -7.259927749633789, -4.411907196044922, -1.5638885498046875, 1.2841310501098633, 4.132150650024414, 6.980170249938965, 9.828189849853516, 12.676209449768066, 15.524229049682617, 18.372249603271484, 21.22026824951172, 24.068286895751953, 26.91630744934082, 29.764328002929688, 32.61234664916992, 35.460365295410156, 38.308387756347656, 41.15640640258789, 44.004425048828125, 46.85244369506836, 49.700462341308594, 52.548484802246094, 55.39650344848633, 58.24452209472656, 61.09254455566406, 63.9405632019043, 66.78858184814453, 69.63660430908203, 72.484619140625, 75.3326416015625, 78.1806640625, 81.02867889404297, 83.87670135498047, 86.72471618652344, 89.57273864746094]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 16.0, 26.0, 15.0, 25.0, 42.0, 69.0, 114.0, 143.0, 233.0, 411.0, 711.0, 1427.0, 3321.0, 11921.0, 66978.0, 540631.0, 361288.0, 46671.0, 8861.0, 2816.0, 1196.0, 614.0, 349.0, 223.0, 137.0, 107.0, 66.0, 40.0, 26.0, 15.0, 14.0, 15.0, 10.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.53125, -45.9931640625, -44.455078125, -42.9169921875, -41.37890625, -39.8408203125, -38.302734375, -36.7646484375, -35.2265625, -33.6884765625, -32.150390625, -30.6123046875, -29.07421875, -27.5361328125, -25.998046875, -24.4599609375, -22.921875, -21.3837890625, -19.845703125, -18.3076171875, -16.76953125, -15.2314453125, -13.693359375, -12.1552734375, -10.6171875, -9.0791015625, -7.541015625, -6.0029296875, -4.46484375, -2.9267578125, -1.388671875, 0.1494140625, 1.6875, 3.2255859375, 4.763671875, 6.3017578125, 7.83984375, 9.3779296875, 10.916015625, 12.4541015625, 13.9921875, 15.5302734375, 17.068359375, 18.6064453125, 20.14453125, 21.6826171875, 23.220703125, 24.7587890625, 26.296875, 27.8349609375, 29.373046875, 30.9111328125, 32.44921875, 33.9873046875, 35.525390625, 37.0634765625, 38.6015625, 40.1396484375, 41.677734375, 43.2158203125, 44.75390625, 46.2919921875, 47.830078125, 49.3681640625, 50.90625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 5.0, 8.0, 14.0, 27.0, 51.0, 53.0, 72.0, 100.0, 113.0, 113.0, 124.0, 95.0, 68.0, 63.0, 43.0, 13.0, 15.0, 11.0, 6.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.481201171875, -8.22802734375, -7.974853515625, -7.7216796875, -7.468505859375, -7.21533203125, -6.962158203125, -6.708984375, -6.455810546875, -6.20263671875, -5.949462890625, -5.6962890625, -5.443115234375, -5.18994140625, -4.936767578125, -4.68359375, -4.430419921875, -4.17724609375, -3.924072265625, -3.6708984375, -3.417724609375, -3.16455078125, -2.911376953125, -2.658203125, -2.405029296875, -2.15185546875, -1.898681640625, -1.6455078125, -1.392333984375, -1.13916015625, -0.885986328125, -0.6328125, -0.379638671875, -0.12646484375, 0.126708984375, 0.3798828125, 0.633056640625, 0.88623046875, 1.139404296875, 1.392578125, 1.645751953125, 1.89892578125, 2.152099609375, 2.4052734375, 2.658447265625, 2.91162109375, 3.164794921875, 3.41796875, 3.671142578125, 3.92431640625, 4.177490234375, 4.4306640625, 4.683837890625, 4.93701171875, 5.190185546875, 5.443359375, 5.696533203125, 5.94970703125, 6.202880859375, 6.4560546875, 6.709228515625, 6.96240234375, 7.215576171875, 7.46875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 13.0, 14.0, 12.0, 19.0, 40.0, 45.0, 56.0, 90.0, 130.0, 176.0, 269.0, 425.0, 616.0, 1107.0, 1995.0, 3765.0, 7498.0, 15630.0, 34122.0, 76985.0, 173919.0, 337401.0, 217274.0, 95672.0, 42288.0, 19216.0, 9193.0, 4633.0, 2471.0, 1267.0, 797.0, 476.0, 296.0, 180.0, 121.0, 93.0, 68.0, 53.0, 37.0, 22.0, 18.0, 12.0, 10.0, 12.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.546875, -11.1290283203125, -10.711181640625, -10.2933349609375, -9.87548828125, -9.4576416015625, -9.039794921875, -8.6219482421875, -8.2041015625, -7.7862548828125, -7.368408203125, -6.9505615234375, -6.53271484375, -6.1148681640625, -5.697021484375, -5.2791748046875, -4.861328125, -4.4434814453125, -4.025634765625, -3.6077880859375, -3.18994140625, -2.7720947265625, -2.354248046875, -1.9364013671875, -1.5185546875, -1.1007080078125, -0.682861328125, -0.2650146484375, 0.15283203125, 0.5706787109375, 0.988525390625, 1.4063720703125, 1.82421875, 2.2420654296875, 2.659912109375, 3.0777587890625, 3.49560546875, 3.9134521484375, 4.331298828125, 4.7491455078125, 5.1669921875, 5.5848388671875, 6.002685546875, 6.4205322265625, 6.83837890625, 7.2562255859375, 7.674072265625, 8.0919189453125, 8.509765625, 8.9276123046875, 9.345458984375, 9.7633056640625, 10.18115234375, 10.5989990234375, 11.016845703125, 11.4346923828125, 11.8525390625, 12.2703857421875, 12.688232421875, 13.1060791015625, 13.52392578125, 13.9417724609375, 14.359619140625, 14.7774658203125, 15.1953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 8.0, 8.0, 10.0, 17.0, 16.0, 23.0, 33.0, 33.0, 35.0, 49.0, 53.0, 42.0, 57.0, 43.0, 64.0, 68.0, 60.0, 46.0, 51.0, 43.0, 42.0, 38.0, 34.0, 20.0, 21.0, 29.0, 17.0, 12.0, 7.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15625, -19.597412109375, -19.03857421875, -18.479736328125, -17.9208984375, -17.362060546875, -16.80322265625, -16.244384765625, -15.685546875, -15.126708984375, -14.56787109375, -14.009033203125, -13.4501953125, -12.891357421875, -12.33251953125, -11.773681640625, -11.21484375, -10.656005859375, -10.09716796875, -9.538330078125, -8.9794921875, -8.420654296875, -7.86181640625, -7.302978515625, -6.744140625, -6.185302734375, -5.62646484375, -5.067626953125, -4.5087890625, -3.949951171875, -3.39111328125, -2.832275390625, -2.2734375, -1.714599609375, -1.15576171875, -0.596923828125, -0.0380859375, 0.520751953125, 1.07958984375, 1.638427734375, 2.197265625, 2.756103515625, 3.31494140625, 3.873779296875, 4.4326171875, 4.991455078125, 5.55029296875, 6.109130859375, 6.66796875, 7.226806640625, 7.78564453125, 8.344482421875, 8.9033203125, 9.462158203125, 10.02099609375, 10.579833984375, 11.138671875, 11.697509765625, 12.25634765625, 12.815185546875, 13.3740234375, 13.932861328125, 14.49169921875, 15.050537109375, 15.609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 9.0, 22.0, 17.0, 41.0, 59.0, 97.0, 129.0, 265.0, 425.0, 811.0, 1499.0, 3185.0, 7813.0, 26848.0, 152060.0, 641025.0, 169938.0, 29199.0, 8310.0, 3300.0, 1603.0, 783.0, 443.0, 247.0, 145.0, 98.0, 67.0, 33.0, 25.0, 19.0, 9.0, 8.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.7398681640625, -13.221923828125, -12.7039794921875, -12.18603515625, -11.6680908203125, -11.150146484375, -10.6322021484375, -10.1142578125, -9.5963134765625, -9.078369140625, -8.5604248046875, -8.04248046875, -7.5245361328125, -7.006591796875, -6.4886474609375, -5.970703125, -5.4527587890625, -4.934814453125, -4.4168701171875, -3.89892578125, -3.3809814453125, -2.863037109375, -2.3450927734375, -1.8271484375, -1.3092041015625, -0.791259765625, -0.2733154296875, 0.24462890625, 0.7625732421875, 1.280517578125, 1.7984619140625, 2.31640625, 2.8343505859375, 3.352294921875, 3.8702392578125, 4.38818359375, 4.9061279296875, 5.424072265625, 5.9420166015625, 6.4599609375, 6.9779052734375, 7.495849609375, 8.0137939453125, 8.53173828125, 9.0496826171875, 9.567626953125, 10.0855712890625, 10.603515625, 11.1214599609375, 11.639404296875, 12.1573486328125, 12.67529296875, 13.1932373046875, 13.711181640625, 14.2291259765625, 14.7470703125, 15.2650146484375, 15.782958984375, 16.3009033203125, 16.81884765625, 17.3367919921875, 17.854736328125, 18.3726806640625, 18.890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 10.0, 12.0, 29.0, 26.0, 40.0, 84.0, 94.0, 163.0, 165.0, 114.0, 74.0, 45.0, 31.0, 11.0, 21.0, 17.0, 7.0, 8.0, 4.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018243789672851562, -0.0017514973878860474, -0.0016786158084869385, -0.0016057342290878296, -0.0015328526496887207, -0.0014599710702896118, -0.001387089490890503, -0.001314207911491394, -0.0012413263320922852, -0.0011684447526931763, -0.0010955631732940674, -0.0010226815938949585, -0.0009498000144958496, -0.0008769184350967407, -0.0008040368556976318, -0.000731155276298523, -0.0006582736968994141, -0.0005853921175003052, -0.0005125105381011963, -0.0004396289587020874, -0.0003667473793029785, -0.00029386579990386963, -0.00022098422050476074, -0.00014810264110565186, -7.522106170654297e-05, -2.339482307434082e-06, 7.05420970916748e-05, 0.0001434236764907837, 0.00021630525588989258, 0.00028918683528900146, 0.00036206841468811035, 0.00043494999408721924, 0.0005078315734863281, 0.000580713152885437, 0.0006535947322845459, 0.0007264763116836548, 0.0007993578910827637, 0.0008722394704818726, 0.0009451210498809814, 0.0010180026292800903, 0.0010908842086791992, 0.001163765788078308, 0.001236647367477417, 0.0013095289468765259, 0.0013824105262756348, 0.0014552921056747437, 0.0015281736850738525, 0.0016010552644729614, 0.0016739368438720703, 0.0017468184232711792, 0.001819700002670288, 0.001892581582069397, 0.001965463161468506, 0.0020383447408676147, 0.0021112263202667236, 0.0021841078996658325, 0.0022569894790649414, 0.0023298710584640503, 0.002402752637863159, 0.002475634217262268, 0.002548515796661377, 0.002621397376060486, 0.0026942789554595947, 0.0027671605348587036, 0.0028400421142578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 9.0, 3.0, 10.0, 10.0, 22.0, 32.0, 39.0, 51.0, 86.0, 107.0, 173.0, 287.0, 410.0, 639.0, 1058.0, 1906.0, 3415.0, 6842.0, 15192.0, 41149.0, 156332.0, 500134.0, 228968.0, 54656.0, 18891.0, 8325.0, 4188.0, 2200.0, 1288.0, 728.0, 436.0, 325.0, 190.0, 144.0, 89.0, 56.0, 39.0, 33.0, 22.0, 11.0, 8.0, 8.0, 13.0, 9.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-11.65625, -11.275634765625, -10.89501953125, -10.514404296875, -10.1337890625, -9.753173828125, -9.37255859375, -8.991943359375, -8.611328125, -8.230712890625, -7.85009765625, -7.469482421875, -7.0888671875, -6.708251953125, -6.32763671875, -5.947021484375, -5.56640625, -5.185791015625, -4.80517578125, -4.424560546875, -4.0439453125, -3.663330078125, -3.28271484375, -2.902099609375, -2.521484375, -2.140869140625, -1.76025390625, -1.379638671875, -0.9990234375, -0.618408203125, -0.23779296875, 0.142822265625, 0.5234375, 0.904052734375, 1.28466796875, 1.665283203125, 2.0458984375, 2.426513671875, 2.80712890625, 3.187744140625, 3.568359375, 3.948974609375, 4.32958984375, 4.710205078125, 5.0908203125, 5.471435546875, 5.85205078125, 6.232666015625, 6.61328125, 6.993896484375, 7.37451171875, 7.755126953125, 8.1357421875, 8.516357421875, 8.89697265625, 9.277587890625, 9.658203125, 10.038818359375, 10.41943359375, 10.800048828125, 11.1806640625, 11.561279296875, 11.94189453125, 12.322509765625, 12.703125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 5.0, 4.0, 7.0, 3.0, 9.0, 11.0, 16.0, 17.0, 25.0, 30.0, 48.0, 62.0, 85.0, 85.0, 96.0, 103.0, 77.0, 76.0, 58.0, 49.0, 32.0, 26.0, 17.0, 7.0, 12.0, 10.0, 4.0, 5.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6875, -11.3697509765625, -11.052001953125, -10.7342529296875, -10.41650390625, -10.0987548828125, -9.781005859375, -9.4632568359375, -9.1455078125, -8.8277587890625, -8.510009765625, -8.1922607421875, -7.87451171875, -7.5567626953125, -7.239013671875, -6.9212646484375, -6.603515625, -6.2857666015625, -5.968017578125, -5.6502685546875, -5.33251953125, -5.0147705078125, -4.697021484375, -4.3792724609375, -4.0615234375, -3.7437744140625, -3.426025390625, -3.1082763671875, -2.79052734375, -2.4727783203125, -2.155029296875, -1.8372802734375, -1.51953125, -1.2017822265625, -0.884033203125, -0.5662841796875, -0.24853515625, 0.0692138671875, 0.386962890625, 0.7047119140625, 1.0224609375, 1.3402099609375, 1.657958984375, 1.9757080078125, 2.29345703125, 2.6112060546875, 2.928955078125, 3.2467041015625, 3.564453125, 3.8822021484375, 4.199951171875, 4.5177001953125, 4.83544921875, 5.1531982421875, 5.470947265625, 5.7886962890625, 6.1064453125, 6.4241943359375, 6.741943359375, 7.0596923828125, 7.37744140625, 7.6951904296875, 8.012939453125, 8.3306884765625, 8.6484375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 8.0, 9.0, 6.0, 10.0, 33.0, 45.0, 78.0, 94.0, 125.0, 153.0, 136.0, 123.0, 75.0, 45.0, 30.0, 18.0, 9.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-258.61578369140625, -253.43629455566406, -248.2567901611328, -243.07730102539062, -237.89781188964844, -232.71832275390625, -227.538818359375, -222.3593292236328, -217.17984008789062, -212.00035095214844, -206.8208465576172, -201.641357421875, -196.4618682861328, -191.28237915039062, -186.10287475585938, -180.9233856201172, -175.74388122558594, -170.56439208984375, -165.3848876953125, -160.2053985595703, -155.02590942382812, -149.84640502929688, -144.6669158935547, -139.4874267578125, -134.30792236328125, -129.12843322753906, -123.94893646240234, -118.76943969726562, -113.58995056152344, -108.41045379638672, -103.23095703125, -98.05146789550781, -92.87199401855469, -87.69249725341797, -82.51300811767578, -77.33351135253906, -72.15402221679688, -66.97452545166016, -61.79502868652344, -56.615535736083984, -51.43604278564453, -46.25654983520508, -41.077056884765625, -35.897560119628906, -30.718067169189453, -25.53857421875, -20.359079360961914, -15.179584503173828, -10.000091552734375, -4.8205976486206055, 0.35889625549316406, 5.538390159606934, 10.717884063720703, 15.897377014160156, 21.076871871948242, 26.256366729736328, 31.43585968017578, 36.615352630615234, 41.79484558105469, 46.974342346191406, 52.15383529663086, 57.33332824707031, 62.51282501220703, 67.69232177734375, 72.87181091308594]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 11.0, 6.0, 10.0, 15.0, 16.0, 20.0, 24.0, 17.0, 27.0, 23.0, 25.0, 28.0, 31.0, 29.0, 46.0, 52.0, 51.0, 37.0, 39.0, 53.0, 45.0, 64.0, 42.0, 33.0, 33.0, 35.0, 37.0, 23.0, 21.0, 22.0, 16.0, 17.0, 8.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.3358154296875, -87.82262420654297, -85.30943298339844, -82.79623413085938, -80.28304290771484, -77.76985168457031, -75.25666046142578, -72.74346923828125, -70.23027038574219, -67.71707916259766, -65.20388793945312, -62.69069290161133, -60.17749786376953, -57.664306640625, -55.15111541748047, -52.63792037963867, -50.12472915649414, -47.61153793334961, -45.09834289550781, -42.58515167236328, -40.071956634521484, -37.55876541137695, -35.045570373535156, -32.532379150390625, -30.01918601989746, -27.505992889404297, -24.992799758911133, -22.47960662841797, -19.966415405273438, -17.45322036743164, -14.94002914428711, -12.426836013793945, -9.913642883300781, -7.400449752807617, -4.887257099151611, -2.3740644454956055, 0.1391286849975586, 2.6523218154907227, 5.16551399230957, 7.678707122802734, 10.191900253295898, 12.705093383789062, 15.218286514282227, 17.73147964477539, 20.244670867919922, 22.75786590576172, 25.27105712890625, 27.784250259399414, 30.297443389892578, 32.81063461303711, 35.323829650878906, 37.83702087402344, 40.350215911865234, 42.863407135009766, 45.37660217285156, 47.889793395996094, 50.402984619140625, 52.916175842285156, 55.42937088012695, 57.942562103271484, 60.45575714111328, 62.96894836425781, 65.48213958740234, 67.99533081054688, 70.50852966308594]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 11.0, 10.0, 9.0, 19.0, 39.0, 54.0, 84.0, 151.0, 317.0, 616.0, 1587.0, 5467.0, 31768.0, 3581675.0, 544553.0, 21214.0, 4078.0, 1277.0, 550.0, 319.0, 162.0, 120.0, 70.0, 35.0, 24.0, 14.0, 16.0, 14.0, 11.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.75, -72.4072265625, -70.064453125, -67.7216796875, -65.37890625, -63.0361328125, -60.693359375, -58.3505859375, -56.0078125, -53.6650390625, -51.322265625, -48.9794921875, -46.63671875, -44.2939453125, -41.951171875, -39.6083984375, -37.265625, -34.9228515625, -32.580078125, -30.2373046875, -27.89453125, -25.5517578125, -23.208984375, -20.8662109375, -18.5234375, -16.1806640625, -13.837890625, -11.4951171875, -9.15234375, -6.8095703125, -4.466796875, -2.1240234375, 0.21875, 2.5615234375, 4.904296875, 7.2470703125, 9.58984375, 11.9326171875, 14.275390625, 16.6181640625, 18.9609375, 21.3037109375, 23.646484375, 25.9892578125, 28.33203125, 30.6748046875, 33.017578125, 35.3603515625, 37.703125, 40.0458984375, 42.388671875, 44.7314453125, 47.07421875, 49.4169921875, 51.759765625, 54.1025390625, 56.4453125, 58.7880859375, 61.130859375, 63.4736328125, 65.81640625, 68.1591796875, 70.501953125, 72.8447265625, 75.1875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 13.0, 18.0, 42.0, 62.0, 72.0, 79.0, 101.0, 99.0, 119.0, 91.0, 88.0, 84.0, 40.0, 24.0, 20.0, 16.0, 10.0, 6.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.4012451171875, -8.154052734375, -7.9068603515625, -7.65966796875, -7.4124755859375, -7.165283203125, -6.9180908203125, -6.6708984375, -6.4237060546875, -6.176513671875, -5.9293212890625, -5.68212890625, -5.4349365234375, -5.187744140625, -4.9405517578125, -4.693359375, -4.4461669921875, -4.198974609375, -3.9517822265625, -3.70458984375, -3.4573974609375, -3.210205078125, -2.9630126953125, -2.7158203125, -2.4686279296875, -2.221435546875, -1.9742431640625, -1.72705078125, -1.4798583984375, -1.232666015625, -0.9854736328125, -0.73828125, -0.4910888671875, -0.243896484375, 0.0032958984375, 0.25048828125, 0.4976806640625, 0.744873046875, 0.9920654296875, 1.2392578125, 1.4864501953125, 1.733642578125, 1.9808349609375, 2.22802734375, 2.4752197265625, 2.722412109375, 2.9696044921875, 3.216796875, 3.4639892578125, 3.711181640625, 3.9583740234375, 4.20556640625, 4.4527587890625, 4.699951171875, 4.9471435546875, 5.1943359375, 5.4415283203125, 5.688720703125, 5.9359130859375, 6.18310546875, 6.4302978515625, 6.677490234375, 6.9246826171875, 7.171875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 11.0, 16.0, 41.0, 57.0, 94.0, 204.0, 460.0, 1042.0, 2694.0, 7414.0, 25019.0, 121618.0, 2937773.0, 982376.0, 86625.0, 19214.0, 5863.0, 2122.0, 868.0, 360.0, 185.0, 93.0, 48.0, 34.0, 12.0, 13.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.96337890625, -28.9267578125, -27.89013671875, -26.853515625, -25.81689453125, -24.7802734375, -23.74365234375, -22.70703125, -21.67041015625, -20.6337890625, -19.59716796875, -18.560546875, -17.52392578125, -16.4873046875, -15.45068359375, -14.4140625, -13.37744140625, -12.3408203125, -11.30419921875, -10.267578125, -9.23095703125, -8.1943359375, -7.15771484375, -6.12109375, -5.08447265625, -4.0478515625, -3.01123046875, -1.974609375, -0.93798828125, 0.0986328125, 1.13525390625, 2.171875, 3.20849609375, 4.2451171875, 5.28173828125, 6.318359375, 7.35498046875, 8.3916015625, 9.42822265625, 10.46484375, 11.50146484375, 12.5380859375, 13.57470703125, 14.611328125, 15.64794921875, 16.6845703125, 17.72119140625, 18.7578125, 19.79443359375, 20.8310546875, 21.86767578125, 22.904296875, 23.94091796875, 24.9775390625, 26.01416015625, 27.05078125, 28.08740234375, 29.1240234375, 30.16064453125, 31.197265625, 32.23388671875, 33.2705078125, 34.30712890625, 35.34375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 2.0, 6.0, 4.0, 13.0, 12.0, 10.0, 24.0, 32.0, 34.0, 55.0, 69.0, 100.0, 145.0, 285.0, 502.0, 1554.0, 444.0, 254.0, 151.0, 108.0, 59.0, 61.0, 39.0, 18.0, 20.0, 11.0, 6.0, 7.0, 12.0, 4.0, 7.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.96514892578125, -7.7193603515625, -7.47357177734375, -7.227783203125, -6.98199462890625, -6.7362060546875, -6.49041748046875, -6.24462890625, -5.99884033203125, -5.7530517578125, -5.50726318359375, -5.261474609375, -5.01568603515625, -4.7698974609375, -4.52410888671875, -4.2783203125, -4.03253173828125, -3.7867431640625, -3.54095458984375, -3.295166015625, -3.04937744140625, -2.8035888671875, -2.55780029296875, -2.31201171875, -2.06622314453125, -1.8204345703125, -1.57464599609375, -1.328857421875, -1.08306884765625, -0.8372802734375, -0.59149169921875, -0.345703125, -0.09991455078125, 0.1458740234375, 0.39166259765625, 0.637451171875, 0.88323974609375, 1.1290283203125, 1.37481689453125, 1.62060546875, 1.86639404296875, 2.1121826171875, 2.35797119140625, 2.603759765625, 2.84954833984375, 3.0953369140625, 3.34112548828125, 3.5869140625, 3.83270263671875, 4.0784912109375, 4.32427978515625, 4.570068359375, 4.81585693359375, 5.0616455078125, 5.30743408203125, 5.55322265625, 5.79901123046875, 6.0447998046875, 6.29058837890625, 6.536376953125, 6.78216552734375, 7.0279541015625, 7.27374267578125, 7.51953125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 12.0, 12.0, 12.0, 16.0, 33.0, 40.0, 51.0, 72.0, 100.0, 92.0, 110.0, 93.0, 104.0, 87.0, 58.0, 32.0, 27.0, 13.0, 14.0, 5.0, 9.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.348411560058594, -57.58020782470703, -55.8120002746582, -54.04379653930664, -52.27558898925781, -50.50738525390625, -48.73918151855469, -46.97097396850586, -45.20276641845703, -43.43456268310547, -41.66635513305664, -39.89815139770508, -38.12994384765625, -36.36174011230469, -34.593536376953125, -32.8253288269043, -31.057125091552734, -29.28891944885254, -27.520713806152344, -25.75251007080078, -23.984302520751953, -22.21609878540039, -20.447893142700195, -18.6796875, -16.911481857299805, -15.14327621459961, -13.375070571899414, -11.606865882873535, -9.83866024017334, -8.070454597473145, -6.302249908447266, -4.53404426574707, -2.7658348083496094, -0.9976294040679932, 0.770576000213623, 2.53878116607666, 4.3069868087768555, 6.075192451477051, 7.84339714050293, 9.611602783203125, 11.37980842590332, 13.148014068603516, 14.916219711303711, 16.684425354003906, 18.45262908935547, 20.220836639404297, 21.98904037475586, 23.757246017456055, 25.52545166015625, 27.293657302856445, 29.06186294555664, 30.830066680908203, 32.59827423095703, 34.366477966308594, 36.134681701660156, 37.902889251708984, 39.67109680175781, 41.439300537109375, 43.2075080871582, 44.975711822509766, 46.743919372558594, 48.512123107910156, 50.28032684326172, 52.04853439331055, 53.81673812866211]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 7.0, 8.0, 7.0, 15.0, 14.0, 18.0, 18.0, 20.0, 25.0, 19.0, 26.0, 20.0, 24.0, 31.0, 34.0, 34.0, 42.0, 37.0, 42.0, 35.0, 43.0, 53.0, 32.0, 34.0, 36.0, 21.0, 32.0, 24.0, 24.0, 31.0, 28.0, 13.0, 15.0, 18.0, 15.0, 19.0, 10.0, 5.0, 11.0, 7.0, 7.0, 5.0, 5.0, 11.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-23.49685287475586, -22.735055923461914, -21.97325897216797, -21.211462020874023, -20.449665069580078, -19.6878662109375, -18.926069259643555, -18.16427230834961, -17.402475357055664, -16.64067840576172, -15.878881454467773, -15.117083549499512, -14.355286598205566, -13.593489646911621, -12.83169174194336, -12.069894790649414, -11.308097839355469, -10.546300888061523, -9.784503936767578, -9.022706031799316, -8.260909080505371, -7.499112129211426, -6.737314701080322, -5.975517272949219, -5.213720321655273, -4.451923370361328, -3.6901259422302246, -2.9283287525177, -2.166531562805176, -1.4047343730926514, -0.642937183380127, 0.11886024475097656, 0.8806591033935547, 1.642456293106079, 2.4042534828186035, 3.166050672531128, 3.9278478622436523, 4.689644813537598, 5.451442241668701, 6.213239669799805, 6.97503662109375, 7.736833572387695, 8.49863052368164, 9.260428428649902, 10.022225379943848, 10.784022331237793, 11.545820236206055, 12.3076171875, 13.069414138793945, 13.83121109008789, 14.593008041381836, 15.354805946350098, 16.11660385131836, 16.878400802612305, 17.64019775390625, 18.401994705200195, 19.16379165649414, 19.925588607788086, 20.68738555908203, 21.449182510375977, 22.210979461669922, 22.9727783203125, 23.734575271606445, 24.49637222290039, 25.258169174194336]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 5.0, 4.0, 9.0, 12.0, 11.0, 16.0, 34.0, 39.0, 67.0, 80.0, 145.0, 215.0, 340.0, 569.0, 1048.0, 2212.0, 5554.0, 19142.0, 91290.0, 526224.0, 325827.0, 54819.0, 12848.0, 4115.0, 1741.0, 851.0, 474.0, 279.0, 206.0, 114.0, 79.0, 55.0, 37.0, 26.0, 17.0, 16.0, 9.0, 6.0, 4.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-43.09375, -41.74072265625, -40.3876953125, -39.03466796875, -37.681640625, -36.32861328125, -34.9755859375, -33.62255859375, -32.26953125, -30.91650390625, -29.5634765625, -28.21044921875, -26.857421875, -25.50439453125, -24.1513671875, -22.79833984375, -21.4453125, -20.09228515625, -18.7392578125, -17.38623046875, -16.033203125, -14.68017578125, -13.3271484375, -11.97412109375, -10.62109375, -9.26806640625, -7.9150390625, -6.56201171875, -5.208984375, -3.85595703125, -2.5029296875, -1.14990234375, 0.203125, 1.55615234375, 2.9091796875, 4.26220703125, 5.615234375, 6.96826171875, 8.3212890625, 9.67431640625, 11.02734375, 12.38037109375, 13.7333984375, 15.08642578125, 16.439453125, 17.79248046875, 19.1455078125, 20.49853515625, 21.8515625, 23.20458984375, 24.5576171875, 25.91064453125, 27.263671875, 28.61669921875, 29.9697265625, 31.32275390625, 32.67578125, 34.02880859375, 35.3818359375, 36.73486328125, 38.087890625, 39.44091796875, 40.7939453125, 42.14697265625, 43.5]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 7.0, 12.0, 14.0, 30.0, 65.0, 64.0, 101.0, 106.0, 104.0, 88.0, 96.0, 99.0, 61.0, 57.0, 29.0, 19.0, 18.0, 12.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.56097412109375, -8.3094482421875, -8.05792236328125, -7.806396484375, -7.55487060546875, -7.3033447265625, -7.05181884765625, -6.80029296875, -6.54876708984375, -6.2972412109375, -6.04571533203125, -5.794189453125, -5.54266357421875, -5.2911376953125, -5.03961181640625, -4.7880859375, -4.53656005859375, -4.2850341796875, -4.03350830078125, -3.781982421875, -3.53045654296875, -3.2789306640625, -3.02740478515625, -2.77587890625, -2.52435302734375, -2.2728271484375, -2.02130126953125, -1.769775390625, -1.51824951171875, -1.2667236328125, -1.01519775390625, -0.763671875, -0.51214599609375, -0.2606201171875, -0.00909423828125, 0.242431640625, 0.49395751953125, 0.7454833984375, 0.99700927734375, 1.24853515625, 1.50006103515625, 1.7515869140625, 2.00311279296875, 2.254638671875, 2.50616455078125, 2.7576904296875, 3.00921630859375, 3.2607421875, 3.51226806640625, 3.7637939453125, 4.01531982421875, 4.266845703125, 4.51837158203125, 4.7698974609375, 5.02142333984375, 5.27294921875, 5.52447509765625, 5.7760009765625, 6.02752685546875, 6.279052734375, 6.53057861328125, 6.7821044921875, 7.03363037109375, 7.28515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 6.0, 12.0, 16.0, 30.0, 47.0, 52.0, 73.0, 103.0, 169.0, 252.0, 460.0, 837.0, 1605.0, 3725.0, 9857.0, 30276.0, 103072.0, 387839.0, 367200.0, 97359.0, 28865.0, 9535.0, 3696.0, 1604.0, 730.0, 406.0, 247.0, 163.0, 97.0, 70.0, 52.0, 38.0, 24.0, 11.0, 5.0, 3.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.8125, -22.14111328125, -21.4697265625, -20.79833984375, -20.126953125, -19.45556640625, -18.7841796875, -18.11279296875, -17.44140625, -16.77001953125, -16.0986328125, -15.42724609375, -14.755859375, -14.08447265625, -13.4130859375, -12.74169921875, -12.0703125, -11.39892578125, -10.7275390625, -10.05615234375, -9.384765625, -8.71337890625, -8.0419921875, -7.37060546875, -6.69921875, -6.02783203125, -5.3564453125, -4.68505859375, -4.013671875, -3.34228515625, -2.6708984375, -1.99951171875, -1.328125, -0.65673828125, 0.0146484375, 0.68603515625, 1.357421875, 2.02880859375, 2.7001953125, 3.37158203125, 4.04296875, 4.71435546875, 5.3857421875, 6.05712890625, 6.728515625, 7.39990234375, 8.0712890625, 8.74267578125, 9.4140625, 10.08544921875, 10.7568359375, 11.42822265625, 12.099609375, 12.77099609375, 13.4423828125, 14.11376953125, 14.78515625, 15.45654296875, 16.1279296875, 16.79931640625, 17.470703125, 18.14208984375, 18.8134765625, 19.48486328125, 20.15625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 0.0, 8.0, 5.0, 7.0, 7.0, 12.0, 14.0, 10.0, 10.0, 20.0, 22.0, 32.0, 21.0, 33.0, 22.0, 40.0, 33.0, 45.0, 43.0, 45.0, 34.0, 44.0, 44.0, 50.0, 44.0, 46.0, 43.0, 31.0, 35.0, 29.0, 19.0, 24.0, 27.0, 14.0, 13.0, 9.0, 18.0, 11.0, 10.0, 6.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.316650390625, -11.88330078125, -11.449951171875, -11.0166015625, -10.583251953125, -10.14990234375, -9.716552734375, -9.283203125, -8.849853515625, -8.41650390625, -7.983154296875, -7.5498046875, -7.116455078125, -6.68310546875, -6.249755859375, -5.81640625, -5.383056640625, -4.94970703125, -4.516357421875, -4.0830078125, -3.649658203125, -3.21630859375, -2.782958984375, -2.349609375, -1.916259765625, -1.48291015625, -1.049560546875, -0.6162109375, -0.182861328125, 0.25048828125, 0.683837890625, 1.1171875, 1.550537109375, 1.98388671875, 2.417236328125, 2.8505859375, 3.283935546875, 3.71728515625, 4.150634765625, 4.583984375, 5.017333984375, 5.45068359375, 5.884033203125, 6.3173828125, 6.750732421875, 7.18408203125, 7.617431640625, 8.05078125, 8.484130859375, 8.91748046875, 9.350830078125, 9.7841796875, 10.217529296875, 10.65087890625, 11.084228515625, 11.517578125, 11.950927734375, 12.38427734375, 12.817626953125, 13.2509765625, 13.684326171875, 14.11767578125, 14.551025390625, 14.984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 10.0, 3.0, 8.0, 9.0, 15.0, 17.0, 21.0, 39.0, 34.0, 73.0, 101.0, 141.0, 253.0, 368.0, 588.0, 928.0, 1662.0, 3097.0, 6418.0, 17790.0, 87146.0, 657879.0, 222345.0, 30985.0, 9262.0, 4080.0, 2095.0, 1207.0, 705.0, 446.0, 270.0, 194.0, 107.0, 80.0, 49.0, 27.0, 30.0, 31.0, 14.0, 12.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-21.765625, -21.156005859375, -20.54638671875, -19.936767578125, -19.3271484375, -18.717529296875, -18.10791015625, -17.498291015625, -16.888671875, -16.279052734375, -15.66943359375, -15.059814453125, -14.4501953125, -13.840576171875, -13.23095703125, -12.621337890625, -12.01171875, -11.402099609375, -10.79248046875, -10.182861328125, -9.5732421875, -8.963623046875, -8.35400390625, -7.744384765625, -7.134765625, -6.525146484375, -5.91552734375, -5.305908203125, -4.6962890625, -4.086669921875, -3.47705078125, -2.867431640625, -2.2578125, -1.648193359375, -1.03857421875, -0.428955078125, 0.1806640625, 0.790283203125, 1.39990234375, 2.009521484375, 2.619140625, 3.228759765625, 3.83837890625, 4.447998046875, 5.0576171875, 5.667236328125, 6.27685546875, 6.886474609375, 7.49609375, 8.105712890625, 8.71533203125, 9.324951171875, 9.9345703125, 10.544189453125, 11.15380859375, 11.763427734375, 12.373046875, 12.982666015625, 13.59228515625, 14.201904296875, 14.8115234375, 15.421142578125, 16.03076171875, 16.640380859375, 17.25]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 20.0, 21.0, 38.0, 61.0, 84.0, 207.0, 232.0, 114.0, 80.0, 38.0, 20.0, 17.0, 11.0, 10.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027179718017578125, -0.0026006996631622314, -0.0024834275245666504, -0.0023661553859710693, -0.0022488832473754883, -0.0021316111087799072, -0.002014338970184326, -0.0018970668315887451, -0.001779794692993164, -0.001662522554397583, -0.001545250415802002, -0.001427978277206421, -0.0013107061386108398, -0.0011934340000152588, -0.0010761618614196777, -0.0009588897228240967, -0.0008416175842285156, -0.0007243454456329346, -0.0006070733070373535, -0.0004898011684417725, -0.0003725290298461914, -0.00025525689125061035, -0.0001379847526550293, -2.0712614059448242e-05, 9.655952453613281e-05, 0.00021383166313171387, 0.0003311038017272949, 0.000448375940322876, 0.000565648078918457, 0.0006829202175140381, 0.0008001923561096191, 0.0009174644947052002, 0.0010347366333007812, 0.0011520087718963623, 0.0012692809104919434, 0.0013865530490875244, 0.0015038251876831055, 0.0016210973262786865, 0.0017383694648742676, 0.0018556416034698486, 0.0019729137420654297, 0.0020901858806610107, 0.002207458019256592, 0.002324730157852173, 0.002442002296447754, 0.002559274435043335, 0.002676546573638916, 0.002793818712234497, 0.002911090850830078, 0.003028362989425659, 0.0031456351280212402, 0.0032629072666168213, 0.0033801794052124023, 0.0034974515438079834, 0.0036147236824035645, 0.0037319958209991455, 0.0038492679595947266, 0.003966540098190308, 0.004083812236785889, 0.00420108437538147, 0.004318356513977051, 0.004435628652572632, 0.004552900791168213, 0.004670172929763794, 0.004787445068359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 5.0, 6.0, 11.0, 9.0, 20.0, 17.0, 25.0, 24.0, 50.0, 68.0, 80.0, 126.0, 221.0, 364.0, 622.0, 1189.0, 2419.0, 5486.0, 15530.0, 65190.0, 549790.0, 342135.0, 44544.0, 11655.0, 4416.0, 2059.0, 1041.0, 527.0, 345.0, 173.0, 127.0, 70.0, 64.0, 29.0, 33.0, 16.0, 23.0, 9.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.03125, -18.372314453125, -17.71337890625, -17.054443359375, -16.3955078125, -15.736572265625, -15.07763671875, -14.418701171875, -13.759765625, -13.100830078125, -12.44189453125, -11.782958984375, -11.1240234375, -10.465087890625, -9.80615234375, -9.147216796875, -8.48828125, -7.829345703125, -7.17041015625, -6.511474609375, -5.8525390625, -5.193603515625, -4.53466796875, -3.875732421875, -3.216796875, -2.557861328125, -1.89892578125, -1.239990234375, -0.5810546875, 0.077880859375, 0.73681640625, 1.395751953125, 2.0546875, 2.713623046875, 3.37255859375, 4.031494140625, 4.6904296875, 5.349365234375, 6.00830078125, 6.667236328125, 7.326171875, 7.985107421875, 8.64404296875, 9.302978515625, 9.9619140625, 10.620849609375, 11.27978515625, 11.938720703125, 12.59765625, 13.256591796875, 13.91552734375, 14.574462890625, 15.2333984375, 15.892333984375, 16.55126953125, 17.210205078125, 17.869140625, 18.528076171875, 19.18701171875, 19.845947265625, 20.5048828125, 21.163818359375, 21.82275390625, 22.481689453125, 23.140625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 4.0, 6.0, 11.0, 13.0, 21.0, 31.0, 51.0, 70.0, 136.0, 161.0, 159.0, 129.0, 61.0, 36.0, 26.0, 21.0, 11.0, 11.0, 13.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.015625, -17.4844970703125, -16.953369140625, -16.4222412109375, -15.89111328125, -15.3599853515625, -14.828857421875, -14.2977294921875, -13.7666015625, -13.2354736328125, -12.704345703125, -12.1732177734375, -11.64208984375, -11.1109619140625, -10.579833984375, -10.0487060546875, -9.517578125, -8.9864501953125, -8.455322265625, -7.9241943359375, -7.39306640625, -6.8619384765625, -6.330810546875, -5.7996826171875, -5.2685546875, -4.7374267578125, -4.206298828125, -3.6751708984375, -3.14404296875, -2.6129150390625, -2.081787109375, -1.5506591796875, -1.01953125, -0.4884033203125, 0.042724609375, 0.5738525390625, 1.10498046875, 1.6361083984375, 2.167236328125, 2.6983642578125, 3.2294921875, 3.7606201171875, 4.291748046875, 4.8228759765625, 5.35400390625, 5.8851318359375, 6.416259765625, 6.9473876953125, 7.478515625, 8.0096435546875, 8.540771484375, 9.0718994140625, 9.60302734375, 10.1341552734375, 10.665283203125, 11.1964111328125, 11.7275390625, 12.2586669921875, 12.789794921875, 13.3209228515625, 13.85205078125, 14.3831787109375, 14.914306640625, 15.4454345703125, 15.9765625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 13.0, 30.0, 57.0, 144.0, 209.0, 239.0, 163.0, 96.0, 31.0, 12.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-385.89764404296875, -376.5121765136719, -367.126708984375, -357.7412109375, -348.3557434082031, -338.97027587890625, -329.5848083496094, -320.1993408203125, -310.8138427734375, -301.4283752441406, -292.04290771484375, -282.65740966796875, -273.2719421386719, -263.886474609375, -254.50100708007812, -245.11553955078125, -235.73007202148438, -226.3446044921875, -216.95912170410156, -207.5736541748047, -198.18817138671875, -188.80270385742188, -179.417236328125, -170.03176879882812, -160.6462860107422, -151.2608184814453, -141.87533569335938, -132.4898681640625, -123.1043930053711, -113.71891784667969, -104.33345031738281, -94.9479751586914, -85.56248474121094, -76.17700958251953, -66.79153442382812, -57.40606689453125, -48.020591735839844, -38.63511657714844, -29.249645233154297, -19.864173889160156, -10.47869873046875, -1.0932254791259766, 8.292247772216797, 17.67772102355957, 27.063194274902344, 36.44866943359375, 45.83414077758789, 55.21961212158203, 64.60508728027344, 73.99056243896484, 83.37603759765625, 92.76150512695312, 102.14698028564453, 111.53245544433594, 120.91792297363281, 130.30340576171875, 139.68887329101562, 149.0743408203125, 158.45982360839844, 167.8452911376953, 177.23077392578125, 186.61624145507812, 196.001708984375, 205.38717651367188, 214.7726593017578]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 9.0, 8.0, 15.0, 16.0, 17.0, 21.0, 22.0, 33.0, 30.0, 34.0, 34.0, 44.0, 42.0, 55.0, 42.0, 52.0, 42.0, 50.0, 56.0, 38.0, 44.0, 39.0, 27.0, 32.0, 26.0, 22.0, 25.0, 20.0, 24.0, 13.0, 14.0, 11.0, 7.0, 12.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.11214447021484, -90.23584747314453, -87.35955047607422, -84.4832534790039, -81.60696411132812, -78.73066711425781, -75.8543701171875, -72.97807312011719, -70.10177612304688, -67.22547912597656, -64.34918212890625, -61.4728889465332, -58.59659194946289, -55.72029495239258, -52.84400177001953, -49.96770477294922, -47.091407775878906, -44.215110778808594, -41.33881378173828, -38.462520599365234, -35.58622360229492, -32.70992660522461, -29.83363151550293, -26.95733642578125, -24.081039428710938, -21.204742431640625, -18.328447341918945, -15.45215129852295, -12.575855255126953, -9.699559211730957, -6.823263168334961, -3.9469680786132812, -1.0706634521484375, 1.8056325912475586, 4.681928634643555, 7.558224678039551, 10.434520721435547, 13.310816764831543, 16.18711280822754, 19.06340789794922, 21.93970489501953, 24.816001892089844, 27.692296981811523, 30.568592071533203, 33.444889068603516, 36.32118606567383, 39.197479248046875, 42.07377624511719, 44.9500732421875, 47.82637023925781, 50.702667236328125, 53.57896041870117, 56.455257415771484, 59.3315544128418, 62.207847595214844, 65.08414459228516, 67.96044158935547, 70.83673858642578, 73.7130355834961, 76.5893325805664, 79.46562194824219, 82.3419189453125, 85.21821594238281, 88.09451293945312, 90.97080993652344]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 0.0, 5.0, 3.0, 4.0, 11.0, 11.0, 18.0, 29.0, 25.0, 18.0, 42.0, 54.0, 82.0, 118.0, 166.0, 292.0, 433.0, 771.0, 1602.0, 3775.0, 12105.0, 51836.0, 579497.0, 3409775.0, 103703.0, 19389.0, 5698.0, 2231.0, 1000.0, 582.0, 315.0, 223.0, 152.0, 99.0, 65.0, 53.0, 25.0, 25.0, 15.0, 11.0, 4.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.6875, -56.09326171875, -54.4990234375, -52.90478515625, -51.310546875, -49.71630859375, -48.1220703125, -46.52783203125, -44.93359375, -43.33935546875, -41.7451171875, -40.15087890625, -38.556640625, -36.96240234375, -35.3681640625, -33.77392578125, -32.1796875, -30.58544921875, -28.9912109375, -27.39697265625, -25.802734375, -24.20849609375, -22.6142578125, -21.02001953125, -19.42578125, -17.83154296875, -16.2373046875, -14.64306640625, -13.048828125, -11.45458984375, -9.8603515625, -8.26611328125, -6.671875, -5.07763671875, -3.4833984375, -1.88916015625, -0.294921875, 1.29931640625, 2.8935546875, 4.48779296875, 6.08203125, 7.67626953125, 9.2705078125, 10.86474609375, 12.458984375, 14.05322265625, 15.6474609375, 17.24169921875, 18.8359375, 20.43017578125, 22.0244140625, 23.61865234375, 25.212890625, 26.80712890625, 28.4013671875, 29.99560546875, 31.58984375, 33.18408203125, 34.7783203125, 36.37255859375, 37.966796875, 39.56103515625, 41.1552734375, 42.74951171875, 44.34375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 6.0, 18.0, 30.0, 49.0, 65.0, 84.0, 89.0, 94.0, 94.0, 100.0, 86.0, 71.0, 66.0, 47.0, 28.0, 23.0, 16.0, 9.0, 8.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.23895263671875, -7.9935302734375, -7.74810791015625, -7.502685546875, -7.25726318359375, -7.0118408203125, -6.76641845703125, -6.52099609375, -6.27557373046875, -6.0301513671875, -5.78472900390625, -5.539306640625, -5.29388427734375, -5.0484619140625, -4.80303955078125, -4.5576171875, -4.31219482421875, -4.0667724609375, -3.82135009765625, -3.575927734375, -3.33050537109375, -3.0850830078125, -2.83966064453125, -2.59423828125, -2.34881591796875, -2.1033935546875, -1.85797119140625, -1.612548828125, -1.36712646484375, -1.1217041015625, -0.87628173828125, -0.630859375, -0.38543701171875, -0.1400146484375, 0.10540771484375, 0.350830078125, 0.59625244140625, 0.8416748046875, 1.08709716796875, 1.33251953125, 1.57794189453125, 1.8233642578125, 2.06878662109375, 2.314208984375, 2.55963134765625, 2.8050537109375, 3.05047607421875, 3.2958984375, 3.54132080078125, 3.7867431640625, 4.03216552734375, 4.277587890625, 4.52301025390625, 4.7684326171875, 5.01385498046875, 5.25927734375, 5.50469970703125, 5.7501220703125, 5.99554443359375, 6.240966796875, 6.48638916015625, 6.7318115234375, 6.97723388671875, 7.22265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 2.0, 14.0, 19.0, 29.0, 48.0, 52.0, 98.0, 223.0, 391.0, 833.0, 1762.0, 4516.0, 13715.0, 48536.0, 242711.0, 3092431.0, 657969.0, 94691.0, 23589.0, 7471.0, 2705.0, 1193.0, 539.0, 307.0, 184.0, 115.0, 47.0, 33.0, 17.0, 15.0, 11.0, 4.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-36.625, -35.627685546875, -34.63037109375, -33.633056640625, -32.6357421875, -31.638427734375, -30.64111328125, -29.643798828125, -28.646484375, -27.649169921875, -26.65185546875, -25.654541015625, -24.6572265625, -23.659912109375, -22.66259765625, -21.665283203125, -20.66796875, -19.670654296875, -18.67333984375, -17.676025390625, -16.6787109375, -15.681396484375, -14.68408203125, -13.686767578125, -12.689453125, -11.692138671875, -10.69482421875, -9.697509765625, -8.7001953125, -7.702880859375, -6.70556640625, -5.708251953125, -4.7109375, -3.713623046875, -2.71630859375, -1.718994140625, -0.7216796875, 0.275634765625, 1.27294921875, 2.270263671875, 3.267578125, 4.264892578125, 5.26220703125, 6.259521484375, 7.2568359375, 8.254150390625, 9.25146484375, 10.248779296875, 11.24609375, 12.243408203125, 13.24072265625, 14.238037109375, 15.2353515625, 16.232666015625, 17.22998046875, 18.227294921875, 19.224609375, 20.221923828125, 21.21923828125, 22.216552734375, 23.2138671875, 24.211181640625, 25.20849609375, 26.205810546875, 27.203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 10.0, 11.0, 20.0, 20.0, 26.0, 46.0, 58.0, 85.0, 126.0, 215.0, 361.0, 897.0, 1071.0, 394.0, 241.0, 142.0, 89.0, 79.0, 50.0, 34.0, 28.0, 18.0, 14.0, 6.0, 8.0, 2.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1171875, -9.743408203125, -9.36962890625, -8.995849609375, -8.6220703125, -8.248291015625, -7.87451171875, -7.500732421875, -7.126953125, -6.753173828125, -6.37939453125, -6.005615234375, -5.6318359375, -5.258056640625, -4.88427734375, -4.510498046875, -4.13671875, -3.762939453125, -3.38916015625, -3.015380859375, -2.6416015625, -2.267822265625, -1.89404296875, -1.520263671875, -1.146484375, -0.772705078125, -0.39892578125, -0.025146484375, 0.3486328125, 0.722412109375, 1.09619140625, 1.469970703125, 1.84375, 2.217529296875, 2.59130859375, 2.965087890625, 3.3388671875, 3.712646484375, 4.08642578125, 4.460205078125, 4.833984375, 5.207763671875, 5.58154296875, 5.955322265625, 6.3291015625, 6.702880859375, 7.07666015625, 7.450439453125, 7.82421875, 8.197998046875, 8.57177734375, 8.945556640625, 9.3193359375, 9.693115234375, 10.06689453125, 10.440673828125, 10.814453125, 11.188232421875, 11.56201171875, 11.935791015625, 12.3095703125, 12.683349609375, 13.05712890625, 13.430908203125, 13.8046875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 11.0, 18.0, 16.0, 29.0, 41.0, 60.0, 90.0, 100.0, 97.0, 99.0, 105.0, 84.0, 65.0, 46.0, 35.0, 36.0, 18.0, 16.0, 8.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.03144836425781, -64.53826141357422, -62.04507827758789, -59.5518913269043, -57.05870819091797, -54.565521240234375, -52.07233428955078, -49.57915115356445, -47.085968017578125, -44.59278106689453, -42.0995979309082, -39.60641098022461, -37.11322784423828, -34.62004089355469, -32.126853942871094, -29.633670806884766, -27.140483856201172, -24.64729881286621, -22.15411376953125, -19.660926818847656, -17.167743682861328, -14.67455768585205, -12.181371688842773, -9.688186645507812, -7.195001602172852, -4.701816558837891, -2.2086310386657715, 0.28455448150634766, 2.7777395248413086, 5.2709245681762695, 7.764110565185547, 10.257295608520508, 12.750480651855469, 15.24366569519043, 17.73685073852539, 20.230037689208984, 22.723220825195312, 25.216407775878906, 27.709592819213867, 30.202777862548828, 32.695960998535156, 35.18914794921875, 37.68233108520508, 40.17551803588867, 42.668701171875, 45.161888122558594, 47.65507507324219, 50.148258209228516, 52.64144515991211, 55.1346321105957, 57.62781524658203, 60.121002197265625, 62.61418533325195, 65.10736846923828, 67.60055541992188, 70.09374237060547, 72.58692932128906, 75.08011627197266, 77.57330322265625, 80.06648254394531, 82.5596694946289, 85.0528564453125, 87.5460433959961, 90.03923034667969, 92.53240966796875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 12.0, 18.0, 17.0, 9.0, 18.0, 21.0, 26.0, 37.0, 29.0, 36.0, 39.0, 33.0, 44.0, 35.0, 36.0, 39.0, 35.0, 40.0, 46.0, 51.0, 43.0, 41.0, 35.0, 31.0, 21.0, 26.0, 15.0, 21.0, 25.0, 24.0, 11.0, 19.0, 19.0, 10.0, 8.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-51.178184509277344, -49.73715591430664, -48.29612731933594, -46.8551025390625, -45.4140739440918, -43.973045349121094, -42.532020568847656, -41.09099197387695, -39.64996337890625, -38.20893478393555, -36.767906188964844, -35.326881408691406, -33.8858528137207, -32.44482421875, -31.00379753112793, -29.56277084350586, -28.121742248535156, -26.680713653564453, -25.239686965942383, -23.798660278320312, -22.35763168334961, -20.916603088378906, -19.475576400756836, -18.034549713134766, -16.593521118164062, -15.152493476867676, -13.711465835571289, -12.270438194274902, -10.829410552978516, -9.388382911682129, -7.947355270385742, -6.5063276290893555, -5.065299987792969, -3.624272346496582, -2.1832447052001953, -0.7422170639038086, 0.6988105773925781, 2.139838218688965, 3.5808658599853516, 5.021893501281738, 6.462921142578125, 7.903948783874512, 9.344976425170898, 10.786004066467285, 12.227031707763672, 13.668059349060059, 15.109086990356445, 16.550113677978516, 17.99114227294922, 19.432170867919922, 20.873197555541992, 22.314224243164062, 23.755252838134766, 25.19628143310547, 26.63730812072754, 28.07833480834961, 29.519363403320312, 30.960391998291016, 32.40142059326172, 33.842445373535156, 35.28347396850586, 36.72450256347656, 38.16552734375, 39.6065559387207, 41.047584533691406]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 7.0, 19.0, 28.0, 26.0, 54.0, 81.0, 122.0, 205.0, 332.0, 571.0, 1203.0, 2812.0, 8558.0, 32531.0, 171510.0, 676842.0, 117682.0, 24541.0, 6738.0, 2328.0, 981.0, 517.0, 285.0, 188.0, 131.0, 75.0, 43.0, 25.0, 32.0, 13.0, 8.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-42.375, -41.025390625, -39.67578125, -38.326171875, -36.9765625, -35.626953125, -34.27734375, -32.927734375, -31.578125, -30.228515625, -28.87890625, -27.529296875, -26.1796875, -24.830078125, -23.48046875, -22.130859375, -20.78125, -19.431640625, -18.08203125, -16.732421875, -15.3828125, -14.033203125, -12.68359375, -11.333984375, -9.984375, -8.634765625, -7.28515625, -5.935546875, -4.5859375, -3.236328125, -1.88671875, -0.537109375, 0.8125, 2.162109375, 3.51171875, 4.861328125, 6.2109375, 7.560546875, 8.91015625, 10.259765625, 11.609375, 12.958984375, 14.30859375, 15.658203125, 17.0078125, 18.357421875, 19.70703125, 21.056640625, 22.40625, 23.755859375, 25.10546875, 26.455078125, 27.8046875, 29.154296875, 30.50390625, 31.853515625, 33.203125, 34.552734375, 35.90234375, 37.251953125, 38.6015625, 39.951171875, 41.30078125, 42.650390625, 44.0]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 5.0, 15.0, 18.0, 36.0, 43.0, 59.0, 67.0, 77.0, 114.0, 90.0, 92.0, 79.0, 66.0, 77.0, 44.0, 30.0, 27.0, 23.0, 12.0, 7.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -8.01318359375, -7.7685546875, -7.52392578125, -7.279296875, -7.03466796875, -6.7900390625, -6.54541015625, -6.30078125, -6.05615234375, -5.8115234375, -5.56689453125, -5.322265625, -5.07763671875, -4.8330078125, -4.58837890625, -4.34375, -4.09912109375, -3.8544921875, -3.60986328125, -3.365234375, -3.12060546875, -2.8759765625, -2.63134765625, -2.38671875, -2.14208984375, -1.8974609375, -1.65283203125, -1.408203125, -1.16357421875, -0.9189453125, -0.67431640625, -0.4296875, -0.18505859375, 0.0595703125, 0.30419921875, 0.548828125, 0.79345703125, 1.0380859375, 1.28271484375, 1.52734375, 1.77197265625, 2.0166015625, 2.26123046875, 2.505859375, 2.75048828125, 2.9951171875, 3.23974609375, 3.484375, 3.72900390625, 3.9736328125, 4.21826171875, 4.462890625, 4.70751953125, 4.9521484375, 5.19677734375, 5.44140625, 5.68603515625, 5.9306640625, 6.17529296875, 6.419921875, 6.66455078125, 6.9091796875, 7.15380859375, 7.3984375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 1.0, 18.0, 6.0, 19.0, 23.0, 34.0, 50.0, 66.0, 94.0, 126.0, 200.0, 315.0, 463.0, 783.0, 1577.0, 3669.0, 8698.0, 24456.0, 72787.0, 279463.0, 485428.0, 111993.0, 35941.0, 12896.0, 4759.0, 2025.0, 988.0, 550.0, 351.0, 244.0, 148.0, 108.0, 80.0, 54.0, 42.0, 28.0, 23.0, 14.0, 7.0, 12.0, 8.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -18.967529296875, -18.29443359375, -17.621337890625, -16.9482421875, -16.275146484375, -15.60205078125, -14.928955078125, -14.255859375, -13.582763671875, -12.90966796875, -12.236572265625, -11.5634765625, -10.890380859375, -10.21728515625, -9.544189453125, -8.87109375, -8.197998046875, -7.52490234375, -6.851806640625, -6.1787109375, -5.505615234375, -4.83251953125, -4.159423828125, -3.486328125, -2.813232421875, -2.14013671875, -1.467041015625, -0.7939453125, -0.120849609375, 0.55224609375, 1.225341796875, 1.8984375, 2.571533203125, 3.24462890625, 3.917724609375, 4.5908203125, 5.263916015625, 5.93701171875, 6.610107421875, 7.283203125, 7.956298828125, 8.62939453125, 9.302490234375, 9.9755859375, 10.648681640625, 11.32177734375, 11.994873046875, 12.66796875, 13.341064453125, 14.01416015625, 14.687255859375, 15.3603515625, 16.033447265625, 16.70654296875, 17.379638671875, 18.052734375, 18.725830078125, 19.39892578125, 20.072021484375, 20.7451171875, 21.418212890625, 22.09130859375, 22.764404296875, 23.4375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 7.0, 9.0, 7.0, 12.0, 9.0, 7.0, 20.0, 16.0, 21.0, 24.0, 25.0, 30.0, 35.0, 27.0, 40.0, 37.0, 40.0, 44.0, 49.0, 54.0, 38.0, 39.0, 39.0, 41.0, 39.0, 32.0, 42.0, 40.0, 29.0, 20.0, 29.0, 14.0, 17.0, 7.0, 15.0, 5.0, 9.0, 6.0, 3.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.234375, -15.7479248046875, -15.261474609375, -14.7750244140625, -14.28857421875, -13.8021240234375, -13.315673828125, -12.8292236328125, -12.3427734375, -11.8563232421875, -11.369873046875, -10.8834228515625, -10.39697265625, -9.9105224609375, -9.424072265625, -8.9376220703125, -8.451171875, -7.9647216796875, -7.478271484375, -6.9918212890625, -6.50537109375, -6.0189208984375, -5.532470703125, -5.0460205078125, -4.5595703125, -4.0731201171875, -3.586669921875, -3.1002197265625, -2.61376953125, -2.1273193359375, -1.640869140625, -1.1544189453125, -0.66796875, -0.1815185546875, 0.304931640625, 0.7913818359375, 1.27783203125, 1.7642822265625, 2.250732421875, 2.7371826171875, 3.2236328125, 3.7100830078125, 4.196533203125, 4.6829833984375, 5.16943359375, 5.6558837890625, 6.142333984375, 6.6287841796875, 7.115234375, 7.6016845703125, 8.088134765625, 8.5745849609375, 9.06103515625, 9.5474853515625, 10.033935546875, 10.5203857421875, 11.0068359375, 11.4932861328125, 11.979736328125, 12.4661865234375, 12.95263671875, 13.4390869140625, 13.925537109375, 14.4119873046875, 14.8984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 10.0, 11.0, 16.0, 19.0, 22.0, 20.0, 40.0, 49.0, 75.0, 113.0, 149.0, 216.0, 409.0, 698.0, 1211.0, 2459.0, 5584.0, 15012.0, 61619.0, 664549.0, 246342.0, 32006.0, 9514.0, 3950.0, 1971.0, 985.0, 528.0, 313.0, 175.0, 153.0, 88.0, 62.0, 40.0, 32.0, 29.0, 24.0, 9.0, 10.0, 5.0, 6.0, 5.0, 3.0, 8.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.671875, -18.119384765625, -17.56689453125, -17.014404296875, -16.4619140625, -15.909423828125, -15.35693359375, -14.804443359375, -14.251953125, -13.699462890625, -13.14697265625, -12.594482421875, -12.0419921875, -11.489501953125, -10.93701171875, -10.384521484375, -9.83203125, -9.279541015625, -8.72705078125, -8.174560546875, -7.6220703125, -7.069580078125, -6.51708984375, -5.964599609375, -5.412109375, -4.859619140625, -4.30712890625, -3.754638671875, -3.2021484375, -2.649658203125, -2.09716796875, -1.544677734375, -0.9921875, -0.439697265625, 0.11279296875, 0.665283203125, 1.2177734375, 1.770263671875, 2.32275390625, 2.875244140625, 3.427734375, 3.980224609375, 4.53271484375, 5.085205078125, 5.6376953125, 6.190185546875, 6.74267578125, 7.295166015625, 7.84765625, 8.400146484375, 8.95263671875, 9.505126953125, 10.0576171875, 10.610107421875, 11.16259765625, 11.715087890625, 12.267578125, 12.820068359375, 13.37255859375, 13.925048828125, 14.4775390625, 15.030029296875, 15.58251953125, 16.135009765625, 16.6875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 8.0, 7.0, 10.0, 15.0, 15.0, 20.0, 32.0, 49.0, 75.0, 185.0, 205.0, 143.0, 67.0, 25.0, 35.0, 21.0, 18.0, 8.0, 9.0, 8.0, 4.0, 5.0, 1.0, 5.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023212432861328125, -0.0022393763065338135, -0.0021575093269348145, -0.0020756423473358154, -0.0019937753677368164, -0.0019119083881378174, -0.0018300414085388184, -0.0017481744289398193, -0.0016663074493408203, -0.0015844404697418213, -0.0015025734901428223, -0.0014207065105438232, -0.0013388395309448242, -0.0012569725513458252, -0.0011751055717468262, -0.0010932385921478271, -0.0010113716125488281, -0.0009295046329498291, -0.0008476376533508301, -0.0007657706737518311, -0.000683903694152832, -0.000602036714553833, -0.000520169734954834, -0.00043830275535583496, -0.00035643577575683594, -0.0002745687961578369, -0.0001927018165588379, -0.00011083483695983887, -2.8967857360839844e-05, 5.289912223815918e-05, 0.0001347661018371582, 0.00021663308143615723, 0.00029850006103515625, 0.0003803670406341553, 0.0004622340202331543, 0.0005441009998321533, 0.0006259679794311523, 0.0007078349590301514, 0.0007897019386291504, 0.0008715689182281494, 0.0009534358978271484, 0.0010353028774261475, 0.0011171698570251465, 0.0011990368366241455, 0.0012809038162231445, 0.0013627707958221436, 0.0014446377754211426, 0.0015265047550201416, 0.0016083717346191406, 0.0016902387142181396, 0.0017721056938171387, 0.0018539726734161377, 0.0019358396530151367, 0.0020177066326141357, 0.0020995736122131348, 0.002181440591812134, 0.002263307571411133, 0.002345174551010132, 0.002427041530609131, 0.00250890851020813, 0.002590775489807129, 0.002672642469406128, 0.002754509449005127, 0.002836376428604126, 0.002918243408203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 20.0, 24.0, 31.0, 42.0, 75.0, 117.0, 217.0, 391.0, 768.0, 1859.0, 5424.0, 22067.0, 621258.0, 369634.0, 18495.0, 4807.0, 1679.0, 722.0, 383.0, 175.0, 98.0, 90.0, 54.0, 37.0, 18.0, 18.0, 10.0, 10.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.5, -33.38525390625, -32.2705078125, -31.15576171875, -30.041015625, -28.92626953125, -27.8115234375, -26.69677734375, -25.58203125, -24.46728515625, -23.3525390625, -22.23779296875, -21.123046875, -20.00830078125, -18.8935546875, -17.77880859375, -16.6640625, -15.54931640625, -14.4345703125, -13.31982421875, -12.205078125, -11.09033203125, -9.9755859375, -8.86083984375, -7.74609375, -6.63134765625, -5.5166015625, -4.40185546875, -3.287109375, -2.17236328125, -1.0576171875, 0.05712890625, 1.171875, 2.28662109375, 3.4013671875, 4.51611328125, 5.630859375, 6.74560546875, 7.8603515625, 8.97509765625, 10.08984375, 11.20458984375, 12.3193359375, 13.43408203125, 14.548828125, 15.66357421875, 16.7783203125, 17.89306640625, 19.0078125, 20.12255859375, 21.2373046875, 22.35205078125, 23.466796875, 24.58154296875, 25.6962890625, 26.81103515625, 27.92578125, 29.04052734375, 30.1552734375, 31.27001953125, 32.384765625, 33.49951171875, 34.6142578125, 35.72900390625, 36.84375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 3.0, 11.0, 8.0, 9.0, 20.0, 27.0, 59.0, 152.0, 310.0, 198.0, 86.0, 36.0, 25.0, 15.0, 5.0, 3.0, 9.0, 5.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.765625, -18.08447265625, -17.4033203125, -16.72216796875, -16.041015625, -15.35986328125, -14.6787109375, -13.99755859375, -13.31640625, -12.63525390625, -11.9541015625, -11.27294921875, -10.591796875, -9.91064453125, -9.2294921875, -8.54833984375, -7.8671875, -7.18603515625, -6.5048828125, -5.82373046875, -5.142578125, -4.46142578125, -3.7802734375, -3.09912109375, -2.41796875, -1.73681640625, -1.0556640625, -0.37451171875, 0.306640625, 0.98779296875, 1.6689453125, 2.35009765625, 3.03125, 3.71240234375, 4.3935546875, 5.07470703125, 5.755859375, 6.43701171875, 7.1181640625, 7.79931640625, 8.48046875, 9.16162109375, 9.8427734375, 10.52392578125, 11.205078125, 11.88623046875, 12.5673828125, 13.24853515625, 13.9296875, 14.61083984375, 15.2919921875, 15.97314453125, 16.654296875, 17.33544921875, 18.0166015625, 18.69775390625, 19.37890625, 20.06005859375, 20.7412109375, 21.42236328125, 22.103515625, 22.78466796875, 23.4658203125, 24.14697265625, 24.828125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 30.0, 120.0, 283.0, 380.0, 130.0, 35.0, 13.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-687.7215576171875, -672.133056640625, -656.5445556640625, -640.9560546875, -625.3675537109375, -609.779052734375, -594.1905517578125, -578.60205078125, -563.0135498046875, -547.425048828125, -531.8365478515625, -516.248046875, -500.6595458984375, -485.071044921875, -469.4825439453125, -453.89404296875, -438.3055725097656, -422.7170715332031, -407.1285705566406, -391.5400695800781, -375.9515686035156, -360.3630676269531, -344.77459716796875, -329.18609619140625, -313.59759521484375, -298.00909423828125, -282.42059326171875, -266.83209228515625, -251.24359130859375, -235.65509033203125, -220.0666046142578, -204.4781036376953, -188.88958740234375, -173.30108642578125, -157.71258544921875, -142.12408447265625, -126.53559112548828, -110.94709014892578, -95.35859680175781, -79.77009582519531, -64.18159484863281, -48.59309387207031, -33.00459671020508, -17.416099548339844, -1.8275985717773438, 13.760902404785156, 29.349395751953125, 44.937896728515625, 60.526397705078125, 76.11489868164062, 91.70339965820312, 107.2918930053711, 122.8803939819336, 138.46890258789062, 154.05738830566406, 169.64588928222656, 185.23439025878906, 200.82289123535156, 216.41139221191406, 231.9998779296875, 247.58837890625, 263.1768798828125, 278.765380859375, 294.3538818359375, 309.9423828125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 7.0, 8.0, 10.0, 12.0, 16.0, 13.0, 17.0, 19.0, 20.0, 18.0, 41.0, 34.0, 30.0, 45.0, 36.0, 57.0, 43.0, 40.0, 35.0, 44.0, 43.0, 30.0, 44.0, 40.0, 32.0, 34.0, 35.0, 31.0, 26.0, 20.0, 20.0, 16.0, 12.0, 16.0, 10.0, 12.0, 7.0, 4.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.71067810058594, -90.0806655883789, -87.45065307617188, -84.82064819335938, -82.19063568115234, -79.56062316894531, -76.93061065673828, -74.30059814453125, -71.67059326171875, -69.04058074951172, -66.41056823730469, -63.78055953979492, -61.150550842285156, -58.520538330078125, -55.890525817871094, -53.26051330566406, -50.63050079345703, -48.00048828125, -45.370479583740234, -42.7404670715332, -40.11045837402344, -37.480445861816406, -34.850433349609375, -32.220420837402344, -29.590412139892578, -26.96040153503418, -24.33039093017578, -21.70037841796875, -19.07036781311035, -16.440357208251953, -13.810345649719238, -11.180334091186523, -8.550331115722656, -5.9203200340271, -3.290308952331543, -0.6602978706359863, 1.9697132110595703, 4.599723815917969, 7.229735374450684, 9.859746932983398, 12.489757537841797, 15.119768142700195, 17.749778747558594, 20.379791259765625, 23.009801864624023, 25.639812469482422, 28.269824981689453, 30.89983558654785, 33.52984619140625, 36.15985870361328, 38.78986740112305, 41.41987991333008, 44.049888610839844, 46.679901123046875, 49.309913635253906, 51.93992614746094, 54.5699348449707, 57.199947357177734, 59.8299560546875, 62.45996856689453, 65.08998107910156, 67.71998596191406, 70.3499984741211, 72.98001098632812, 75.61002349853516]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 10.0, 6.0, 8.0, 11.0, 14.0, 19.0, 43.0, 46.0, 53.0, 84.0, 141.0, 221.0, 352.0, 671.0, 1344.0, 3196.0, 9718.0, 41597.0, 541936.0, 3494185.0, 77796.0, 14698.0, 4453.0, 1717.0, 818.0, 416.0, 258.0, 158.0, 97.0, 68.0, 39.0, 32.0, 26.0, 13.0, 12.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.0625, -51.30322265625, -49.5439453125, -47.78466796875, -46.025390625, -44.26611328125, -42.5068359375, -40.74755859375, -38.98828125, -37.22900390625, -35.4697265625, -33.71044921875, -31.951171875, -30.19189453125, -28.4326171875, -26.67333984375, -24.9140625, -23.15478515625, -21.3955078125, -19.63623046875, -17.876953125, -16.11767578125, -14.3583984375, -12.59912109375, -10.83984375, -9.08056640625, -7.3212890625, -5.56201171875, -3.802734375, -2.04345703125, -0.2841796875, 1.47509765625, 3.234375, 4.99365234375, 6.7529296875, 8.51220703125, 10.271484375, 12.03076171875, 13.7900390625, 15.54931640625, 17.30859375, 19.06787109375, 20.8271484375, 22.58642578125, 24.345703125, 26.10498046875, 27.8642578125, 29.62353515625, 31.3828125, 33.14208984375, 34.9013671875, 36.66064453125, 38.419921875, 40.17919921875, 41.9384765625, 43.69775390625, 45.45703125, 47.21630859375, 48.9755859375, 50.73486328125, 52.494140625, 54.25341796875, 56.0126953125, 57.77197265625, 59.53125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 17.0, 24.0, 37.0, 41.0, 59.0, 64.0, 74.0, 83.0, 86.0, 98.0, 67.0, 82.0, 63.0, 47.0, 41.0, 27.0, 23.0, 12.0, 16.0, 9.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.92333984375, -7.6826171875, -7.44189453125, -7.201171875, -6.96044921875, -6.7197265625, -6.47900390625, -6.23828125, -5.99755859375, -5.7568359375, -5.51611328125, -5.275390625, -5.03466796875, -4.7939453125, -4.55322265625, -4.3125, -4.07177734375, -3.8310546875, -3.59033203125, -3.349609375, -3.10888671875, -2.8681640625, -2.62744140625, -2.38671875, -2.14599609375, -1.9052734375, -1.66455078125, -1.423828125, -1.18310546875, -0.9423828125, -0.70166015625, -0.4609375, -0.22021484375, 0.0205078125, 0.26123046875, 0.501953125, 0.74267578125, 0.9833984375, 1.22412109375, 1.46484375, 1.70556640625, 1.9462890625, 2.18701171875, 2.427734375, 2.66845703125, 2.9091796875, 3.14990234375, 3.390625, 3.63134765625, 3.8720703125, 4.11279296875, 4.353515625, 4.59423828125, 4.8349609375, 5.07568359375, 5.31640625, 5.55712890625, 5.7978515625, 6.03857421875, 6.279296875, 6.52001953125, 6.7607421875, 7.00146484375, 7.2421875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 8.0, 11.0, 10.0, 24.0, 30.0, 38.0, 49.0, 79.0, 116.0, 209.0, 344.0, 625.0, 1123.0, 2382.0, 5011.0, 12235.0, 35010.0, 138693.0, 2363664.0, 1455838.0, 125210.0, 32279.0, 11618.0, 4760.0, 2257.0, 1134.0, 606.0, 311.0, 197.0, 121.0, 70.0, 51.0, 39.0, 33.0, 20.0, 13.0, 12.0, 12.0, 7.0, 3.0, 8.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-35.46875, -34.482666015625, -33.49658203125, -32.510498046875, -31.5244140625, -30.538330078125, -29.55224609375, -28.566162109375, -27.580078125, -26.593994140625, -25.60791015625, -24.621826171875, -23.6357421875, -22.649658203125, -21.66357421875, -20.677490234375, -19.69140625, -18.705322265625, -17.71923828125, -16.733154296875, -15.7470703125, -14.760986328125, -13.77490234375, -12.788818359375, -11.802734375, -10.816650390625, -9.83056640625, -8.844482421875, -7.8583984375, -6.872314453125, -5.88623046875, -4.900146484375, -3.9140625, -2.927978515625, -1.94189453125, -0.955810546875, 0.0302734375, 1.016357421875, 2.00244140625, 2.988525390625, 3.974609375, 4.960693359375, 5.94677734375, 6.932861328125, 7.9189453125, 8.905029296875, 9.89111328125, 10.877197265625, 11.86328125, 12.849365234375, 13.83544921875, 14.821533203125, 15.8076171875, 16.793701171875, 17.77978515625, 18.765869140625, 19.751953125, 20.738037109375, 21.72412109375, 22.710205078125, 23.6962890625, 24.682373046875, 25.66845703125, 26.654541015625, 27.640625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 4.0, 13.0, 4.0, 11.0, 13.0, 35.0, 47.0, 82.0, 109.0, 220.0, 472.0, 1842.0, 588.0, 269.0, 132.0, 76.0, 47.0, 26.0, 22.0, 17.0, 10.0, 5.0, 9.0, 7.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.1650390625, -12.705078125, -12.2451171875, -11.78515625, -11.3251953125, -10.865234375, -10.4052734375, -9.9453125, -9.4853515625, -9.025390625, -8.5654296875, -8.10546875, -7.6455078125, -7.185546875, -6.7255859375, -6.265625, -5.8056640625, -5.345703125, -4.8857421875, -4.42578125, -3.9658203125, -3.505859375, -3.0458984375, -2.5859375, -2.1259765625, -1.666015625, -1.2060546875, -0.74609375, -0.2861328125, 0.173828125, 0.6337890625, 1.09375, 1.5537109375, 2.013671875, 2.4736328125, 2.93359375, 3.3935546875, 3.853515625, 4.3134765625, 4.7734375, 5.2333984375, 5.693359375, 6.1533203125, 6.61328125, 7.0732421875, 7.533203125, 7.9931640625, 8.453125, 8.9130859375, 9.373046875, 9.8330078125, 10.29296875, 10.7529296875, 11.212890625, 11.6728515625, 12.1328125, 12.5927734375, 13.052734375, 13.5126953125, 13.97265625, 14.4326171875, 14.892578125, 15.3525390625, 15.8125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 11.0, 13.0, 37.0, 56.0, 76.0, 112.0, 143.0, 156.0, 131.0, 93.0, 66.0, 41.0, 21.0, 17.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.44892883300781, -102.56626892089844, -99.68360137939453, -96.80094146728516, -93.91827392578125, -91.03561401367188, -88.1529541015625, -85.2702865600586, -82.38761901855469, -79.50495910644531, -76.6222915649414, -73.73963165283203, -70.85696411132812, -67.97430419921875, -65.09164428710938, -62.20897674560547, -59.326316833496094, -56.44365310668945, -53.56098937988281, -50.67832946777344, -47.79566192626953, -44.913002014160156, -42.030338287353516, -39.147674560546875, -36.265010833740234, -33.382347106933594, -30.499683380126953, -27.617021560668945, -24.734357833862305, -21.851694107055664, -18.969032287597656, -16.086368560791016, -13.203704833984375, -10.321041107177734, -7.43837833404541, -4.555715560913086, -1.6730518341064453, 1.2096118927001953, 4.092273712158203, 6.974937438964844, 9.857601165771484, 12.740264892578125, 15.62292766571045, 18.505590438842773, 21.388254165649414, 24.270917892456055, 27.153579711914062, 30.036243438720703, 32.918907165527344, 35.801570892333984, 38.684234619140625, 41.56689453125, 44.449562072753906, 47.33222198486328, 50.21488571166992, 53.09754943847656, 55.9802131652832, 58.862876892089844, 61.745540618896484, 64.62820434570312, 67.5108642578125, 70.3935317993164, 73.27619171142578, 76.15885925292969, 79.04151916503906]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 6.0, 6.0, 10.0, 13.0, 13.0, 21.0, 16.0, 25.0, 25.0, 29.0, 28.0, 29.0, 46.0, 47.0, 51.0, 50.0, 44.0, 58.0, 55.0, 51.0, 49.0, 52.0, 39.0, 39.0, 38.0, 36.0, 17.0, 22.0, 19.0, 18.0, 11.0, 10.0, 6.0, 7.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.01183319091797, -39.669464111328125, -38.32709503173828, -36.98472213745117, -35.64235305786133, -34.299983978271484, -32.95761489868164, -31.615243911743164, -30.272872924804688, -28.930503845214844, -27.588132858276367, -26.245763778686523, -24.903392791748047, -23.561023712158203, -22.21865463256836, -20.876283645629883, -19.53391456604004, -18.191545486450195, -16.84917449951172, -15.506805419921875, -14.164434432983398, -12.822065353393555, -11.479695320129395, -10.137325286865234, -8.794955253601074, -7.452585220336914, -6.110215187072754, -4.767845630645752, -3.425475597381592, -2.0831055641174316, -0.7407360076904297, 0.6016340255737305, 1.9440040588378906, 3.286374092102051, 4.628744125366211, 5.971113681793213, 7.313483715057373, 8.655853271484375, 9.998223304748535, 11.340593338012695, 12.682963371276855, 14.025333404541016, 15.367703437805176, 16.710073471069336, 18.05244255065918, 19.394813537597656, 20.7371826171875, 22.079551696777344, 23.42192268371582, 24.764291763305664, 26.10666275024414, 27.449031829833984, 28.79140281677246, 30.133771896362305, 31.47614288330078, 32.818511962890625, 34.16088104248047, 35.50325012207031, 36.845619201660156, 38.187992095947266, 39.53036117553711, 40.87273025512695, 42.2150993347168, 43.557472229003906, 44.89984130859375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 12.0, 13.0, 19.0, 18.0, 45.0, 51.0, 77.0, 123.0, 231.0, 388.0, 731.0, 1613.0, 4305.0, 14736.0, 61184.0, 412706.0, 462922.0, 65612.0, 15775.0, 4443.0, 1724.0, 810.0, 408.0, 239.0, 125.0, 76.0, 60.0, 36.0, 18.0, 7.0, 12.0, 8.0, 3.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-49.6875, -48.446044921875, -47.20458984375, -45.963134765625, -44.7216796875, -43.480224609375, -42.23876953125, -40.997314453125, -39.755859375, -38.514404296875, -37.27294921875, -36.031494140625, -34.7900390625, -33.548583984375, -32.30712890625, -31.065673828125, -29.82421875, -28.582763671875, -27.34130859375, -26.099853515625, -24.8583984375, -23.616943359375, -22.37548828125, -21.134033203125, -19.892578125, -18.651123046875, -17.40966796875, -16.168212890625, -14.9267578125, -13.685302734375, -12.44384765625, -11.202392578125, -9.9609375, -8.719482421875, -7.47802734375, -6.236572265625, -4.9951171875, -3.753662109375, -2.51220703125, -1.270751953125, -0.029296875, 1.212158203125, 2.45361328125, 3.695068359375, 4.9365234375, 6.177978515625, 7.41943359375, 8.660888671875, 9.90234375, 11.143798828125, 12.38525390625, 13.626708984375, 14.8681640625, 16.109619140625, 17.35107421875, 18.592529296875, 19.833984375, 21.075439453125, 22.31689453125, 23.558349609375, 24.7998046875, 26.041259765625, 27.28271484375, 28.524169921875, 29.765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 12.0, 19.0, 31.0, 39.0, 50.0, 70.0, 70.0, 82.0, 93.0, 96.0, 80.0, 66.0, 81.0, 59.0, 38.0, 31.0, 20.0, 9.0, 16.0, 7.0, 5.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.75, -8.4942626953125, -8.238525390625, -7.9827880859375, -7.72705078125, -7.4713134765625, -7.215576171875, -6.9598388671875, -6.7041015625, -6.4483642578125, -6.192626953125, -5.9368896484375, -5.68115234375, -5.4254150390625, -5.169677734375, -4.9139404296875, -4.658203125, -4.4024658203125, -4.146728515625, -3.8909912109375, -3.63525390625, -3.3795166015625, -3.123779296875, -2.8680419921875, -2.6123046875, -2.3565673828125, -2.100830078125, -1.8450927734375, -1.58935546875, -1.3336181640625, -1.077880859375, -0.8221435546875, -0.56640625, -0.3106689453125, -0.054931640625, 0.2008056640625, 0.45654296875, 0.7122802734375, 0.968017578125, 1.2237548828125, 1.4794921875, 1.7352294921875, 1.990966796875, 2.2467041015625, 2.50244140625, 2.7581787109375, 3.013916015625, 3.2696533203125, 3.525390625, 3.7811279296875, 4.036865234375, 4.2926025390625, 4.54833984375, 4.8040771484375, 5.059814453125, 5.3155517578125, 5.5712890625, 5.8270263671875, 6.082763671875, 6.3385009765625, 6.59423828125, 6.8499755859375, 7.105712890625, 7.3614501953125, 7.6171875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 2.0, 6.0, 5.0, 9.0, 10.0, 11.0, 25.0, 32.0, 48.0, 60.0, 89.0, 161.0, 309.0, 596.0, 1283.0, 3222.0, 9058.0, 27549.0, 93078.0, 527697.0, 292420.0, 62444.0, 19331.0, 6467.0, 2536.0, 953.0, 530.0, 242.0, 126.0, 80.0, 57.0, 33.0, 27.0, 19.0, 15.0, 7.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.078125, -21.33837890625, -20.5986328125, -19.85888671875, -19.119140625, -18.37939453125, -17.6396484375, -16.89990234375, -16.16015625, -15.42041015625, -14.6806640625, -13.94091796875, -13.201171875, -12.46142578125, -11.7216796875, -10.98193359375, -10.2421875, -9.50244140625, -8.7626953125, -8.02294921875, -7.283203125, -6.54345703125, -5.8037109375, -5.06396484375, -4.32421875, -3.58447265625, -2.8447265625, -2.10498046875, -1.365234375, -0.62548828125, 0.1142578125, 0.85400390625, 1.59375, 2.33349609375, 3.0732421875, 3.81298828125, 4.552734375, 5.29248046875, 6.0322265625, 6.77197265625, 7.51171875, 8.25146484375, 8.9912109375, 9.73095703125, 10.470703125, 11.21044921875, 11.9501953125, 12.68994140625, 13.4296875, 14.16943359375, 14.9091796875, 15.64892578125, 16.388671875, 17.12841796875, 17.8681640625, 18.60791015625, 19.34765625, 20.08740234375, 20.8271484375, 21.56689453125, 22.306640625, 23.04638671875, 23.7861328125, 24.52587890625, 25.265625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 7.0, 12.0, 13.0, 15.0, 26.0, 28.0, 21.0, 23.0, 42.0, 35.0, 52.0, 52.0, 53.0, 59.0, 52.0, 62.0, 60.0, 72.0, 46.0, 33.0, 37.0, 37.0, 27.0, 24.0, 28.0, 18.0, 17.0, 5.0, 10.0, 9.0, 9.0, 2.0, 3.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0], "bins": [-26.140625, -25.466796875, -24.79296875, -24.119140625, -23.4453125, -22.771484375, -22.09765625, -21.423828125, -20.75, -20.076171875, -19.40234375, -18.728515625, -18.0546875, -17.380859375, -16.70703125, -16.033203125, -15.359375, -14.685546875, -14.01171875, -13.337890625, -12.6640625, -11.990234375, -11.31640625, -10.642578125, -9.96875, -9.294921875, -8.62109375, -7.947265625, -7.2734375, -6.599609375, -5.92578125, -5.251953125, -4.578125, -3.904296875, -3.23046875, -2.556640625, -1.8828125, -1.208984375, -0.53515625, 0.138671875, 0.8125, 1.486328125, 2.16015625, 2.833984375, 3.5078125, 4.181640625, 4.85546875, 5.529296875, 6.203125, 6.876953125, 7.55078125, 8.224609375, 8.8984375, 9.572265625, 10.24609375, 10.919921875, 11.59375, 12.267578125, 12.94140625, 13.615234375, 14.2890625, 14.962890625, 15.63671875, 16.310546875, 16.984375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 8.0, 11.0, 5.0, 9.0, 11.0, 21.0, 26.0, 41.0, 53.0, 68.0, 106.0, 148.0, 297.0, 464.0, 709.0, 1345.0, 2637.0, 5824.0, 16686.0, 102670.0, 782923.0, 105533.0, 17053.0, 5851.0, 2632.0, 1373.0, 763.0, 479.0, 255.0, 168.0, 117.0, 65.0, 43.0, 37.0, 29.0, 22.0, 13.0, 12.0, 10.0, 10.0, 6.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.421875, -15.883544921875, -15.34521484375, -14.806884765625, -14.2685546875, -13.730224609375, -13.19189453125, -12.653564453125, -12.115234375, -11.576904296875, -11.03857421875, -10.500244140625, -9.9619140625, -9.423583984375, -8.88525390625, -8.346923828125, -7.80859375, -7.270263671875, -6.73193359375, -6.193603515625, -5.6552734375, -5.116943359375, -4.57861328125, -4.040283203125, -3.501953125, -2.963623046875, -2.42529296875, -1.886962890625, -1.3486328125, -0.810302734375, -0.27197265625, 0.266357421875, 0.8046875, 1.343017578125, 1.88134765625, 2.419677734375, 2.9580078125, 3.496337890625, 4.03466796875, 4.572998046875, 5.111328125, 5.649658203125, 6.18798828125, 6.726318359375, 7.2646484375, 7.802978515625, 8.34130859375, 8.879638671875, 9.41796875, 9.956298828125, 10.49462890625, 11.032958984375, 11.5712890625, 12.109619140625, 12.64794921875, 13.186279296875, 13.724609375, 14.262939453125, 14.80126953125, 15.339599609375, 15.8779296875, 16.416259765625, 16.95458984375, 17.492919921875, 18.03125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 9.0, 17.0, 21.0, 26.0, 52.0, 121.0, 269.0, 229.0, 114.0, 35.0, 27.0, 17.0, 12.0, 11.0, 2.0, 1.0, 8.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031414031982421875, -0.0030396878719329834, -0.0029379725456237793, -0.002836257219314575, -0.002734541893005371, -0.002632826566696167, -0.002531111240386963, -0.002429395914077759, -0.0023276805877685547, -0.0022259652614593506, -0.0021242499351501465, -0.0020225346088409424, -0.0019208192825317383, -0.0018191039562225342, -0.00171738862991333, -0.001615673303604126, -0.0015139579772949219, -0.0014122426509857178, -0.0013105273246765137, -0.0012088119983673096, -0.0011070966720581055, -0.0010053813457489014, -0.0009036660194396973, -0.0008019506931304932, -0.0007002353668212891, -0.000598520040512085, -0.0004968047142028809, -0.00039508938789367676, -0.00029337406158447266, -0.00019165873527526855, -8.994340896606445e-05, 1.1771917343139648e-05, 0.00011348724365234375, 0.00021520256996154785, 0.00031691789627075195, 0.00041863322257995605, 0.0005203485488891602, 0.0006220638751983643, 0.0007237792015075684, 0.0008254945278167725, 0.0009272098541259766, 0.0010289251804351807, 0.0011306405067443848, 0.0012323558330535889, 0.001334071159362793, 0.001435786485671997, 0.0015375018119812012, 0.0016392171382904053, 0.0017409324645996094, 0.0018426477909088135, 0.0019443631172180176, 0.0020460784435272217, 0.0021477937698364258, 0.00224950909614563, 0.002351224422454834, 0.002452939748764038, 0.002554655075073242, 0.0026563704013824463, 0.0027580857276916504, 0.0028598010540008545, 0.0029615163803100586, 0.0030632317066192627, 0.003164947032928467, 0.003266662359237671, 0.003368377685546875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 12.0, 26.0, 18.0, 46.0, 59.0, 143.0, 228.0, 461.0, 1010.0, 2657.0, 10429.0, 661161.0, 358731.0, 9186.0, 2460.0, 969.0, 424.0, 226.0, 125.0, 67.0, 38.0, 28.0, 15.0, 10.0, 9.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.21875, -57.47509765625, -55.7314453125, -53.98779296875, -52.244140625, -50.50048828125, -48.7568359375, -47.01318359375, -45.26953125, -43.52587890625, -41.7822265625, -40.03857421875, -38.294921875, -36.55126953125, -34.8076171875, -33.06396484375, -31.3203125, -29.57666015625, -27.8330078125, -26.08935546875, -24.345703125, -22.60205078125, -20.8583984375, -19.11474609375, -17.37109375, -15.62744140625, -13.8837890625, -12.14013671875, -10.396484375, -8.65283203125, -6.9091796875, -5.16552734375, -3.421875, -1.67822265625, 0.0654296875, 1.80908203125, 3.552734375, 5.29638671875, 7.0400390625, 8.78369140625, 10.52734375, 12.27099609375, 14.0146484375, 15.75830078125, 17.501953125, 19.24560546875, 20.9892578125, 22.73291015625, 24.4765625, 26.22021484375, 27.9638671875, 29.70751953125, 31.451171875, 33.19482421875, 34.9384765625, 36.68212890625, 38.42578125, 40.16943359375, 41.9130859375, 43.65673828125, 45.400390625, 47.14404296875, 48.8876953125, 50.63134765625, 52.375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 9.0, 12.0, 15.0, 52.0, 143.0, 497.0, 161.0, 54.0, 14.0, 10.0, 10.0, 6.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.53125, -36.443359375, -35.35546875, -34.267578125, -33.1796875, -32.091796875, -31.00390625, -29.916015625, -28.828125, -27.740234375, -26.65234375, -25.564453125, -24.4765625, -23.388671875, -22.30078125, -21.212890625, -20.125, -19.037109375, -17.94921875, -16.861328125, -15.7734375, -14.685546875, -13.59765625, -12.509765625, -11.421875, -10.333984375, -9.24609375, -8.158203125, -7.0703125, -5.982421875, -4.89453125, -3.806640625, -2.71875, -1.630859375, -0.54296875, 0.544921875, 1.6328125, 2.720703125, 3.80859375, 4.896484375, 5.984375, 7.072265625, 8.16015625, 9.248046875, 10.3359375, 11.423828125, 12.51171875, 13.599609375, 14.6875, 15.775390625, 16.86328125, 17.951171875, 19.0390625, 20.126953125, 21.21484375, 22.302734375, 23.390625, 24.478515625, 25.56640625, 26.654296875, 27.7421875, 28.830078125, 29.91796875, 31.005859375, 32.09375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 8.0, 18.0, 60.0, 145.0, 254.0, 278.0, 157.0, 50.0, 24.0, 13.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-408.7998352050781, -395.65716552734375, -382.5145263671875, -369.37188720703125, -356.2292175292969, -343.0865478515625, -329.94390869140625, -316.80126953125, -303.6585998535156, -290.51593017578125, -277.373291015625, -264.23065185546875, -251.08798217773438, -237.94532775878906, -224.80267333984375, -211.66001892089844, -198.51736450195312, -185.3747100830078, -172.2320556640625, -159.0894012451172, -145.94674682617188, -132.80409240722656, -119.66143798828125, -106.51878356933594, -93.37612915039062, -80.23347473144531, -67.0908203125, -53.94816589355469, -40.805511474609375, -27.662857055664062, -14.52020263671875, -1.3775482177734375, 11.765106201171875, 24.907760620117188, 38.0504150390625, 51.19306945800781, 64.33572387695312, 77.47837829589844, 90.62103271484375, 103.76368713378906, 116.90634155273438, 130.0489959716797, 143.191650390625, 156.3343048095703, 169.47695922851562, 182.61961364746094, 195.76226806640625, 208.90492248535156, 222.04757690429688, 235.1902313232422, 248.3328857421875, 261.47552490234375, 274.6181945800781, 287.7608642578125, 300.90350341796875, 314.046142578125, 327.1888122558594, 340.33148193359375, 353.47412109375, 366.61676025390625, 379.7594299316406, 392.902099609375, 406.04473876953125, 419.1873779296875, 432.3300476074219]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 5.0, 5.0, 3.0, 12.0, 9.0, 8.0, 12.0, 16.0, 16.0, 21.0, 27.0, 19.0, 15.0, 34.0, 28.0, 35.0, 36.0, 36.0, 29.0, 36.0, 40.0, 49.0, 50.0, 39.0, 41.0, 37.0, 53.0, 39.0, 28.0, 37.0, 26.0, 29.0, 19.0, 21.0, 17.0, 17.0, 14.0, 6.0, 11.0, 10.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-107.05431365966797, -103.92790222167969, -100.80148315429688, -97.6750717163086, -94.54866027832031, -91.4222412109375, -88.29582977294922, -85.16941833496094, -82.04299926757812, -78.91658782958984, -75.79016876220703, -72.66375732421875, -69.53734588623047, -66.41093444824219, -63.284515380859375, -60.158103942871094, -57.03169250488281, -53.905277252197266, -50.778865814208984, -47.65245056152344, -44.526039123535156, -41.39962387084961, -38.27320861816406, -35.14679718017578, -32.020381927490234, -28.89396858215332, -25.767555236816406, -22.64113998413086, -19.514726638793945, -16.38831329345703, -13.261898040771484, -10.13548469543457, -7.009063720703125, -3.8826498985290527, -0.7562360763549805, 2.37017822265625, 5.496591567993164, 8.623004913330078, 11.749420166015625, 14.875833511352539, 18.002246856689453, 21.128660202026367, 24.25507354736328, 27.381488800048828, 30.507902145385742, 33.634315490722656, 36.7607307434082, 39.88714599609375, 43.01355743408203, 46.13997268676758, 49.26638412475586, 52.392799377441406, 55.51921081542969, 58.645626068115234, 61.77204132080078, 64.89845275878906, 68.02487182617188, 71.15128326416016, 74.27770233154297, 77.40411376953125, 80.53052520751953, 83.65693664550781, 86.78335571289062, 89.9097671508789, 93.03617858886719]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 4.0, 4.0, 13.0, 14.0, 18.0, 14.0, 41.0, 60.0, 80.0, 106.0, 203.0, 350.0, 595.0, 1158.0, 2346.0, 6224.0, 21169.0, 130928.0, 3822143.0, 171650.0, 25043.0, 6735.0, 2659.0, 1152.0, 628.0, 351.0, 219.0, 129.0, 82.0, 53.0, 41.0, 20.0, 15.0, 9.0, 4.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.4375, -64.189453125, -61.94140625, -59.693359375, -57.4453125, -55.197265625, -52.94921875, -50.701171875, -48.453125, -46.205078125, -43.95703125, -41.708984375, -39.4609375, -37.212890625, -34.96484375, -32.716796875, -30.46875, -28.220703125, -25.97265625, -23.724609375, -21.4765625, -19.228515625, -16.98046875, -14.732421875, -12.484375, -10.236328125, -7.98828125, -5.740234375, -3.4921875, -1.244140625, 1.00390625, 3.251953125, 5.5, 7.748046875, 9.99609375, 12.244140625, 14.4921875, 16.740234375, 18.98828125, 21.236328125, 23.484375, 25.732421875, 27.98046875, 30.228515625, 32.4765625, 34.724609375, 36.97265625, 39.220703125, 41.46875, 43.716796875, 45.96484375, 48.212890625, 50.4609375, 52.708984375, 54.95703125, 57.205078125, 59.453125, 61.701171875, 63.94921875, 66.197265625, 68.4453125, 70.693359375, 72.94140625, 75.189453125, 77.4375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 7.0, 10.0, 13.0, 25.0, 23.0, 47.0, 41.0, 53.0, 68.0, 82.0, 79.0, 83.0, 93.0, 70.0, 67.0, 63.0, 47.0, 34.0, 29.0, 18.0, 12.0, 18.0, 8.0, 4.0, 2.0, 0.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.90625, -8.6488037109375, -8.391357421875, -8.1339111328125, -7.87646484375, -7.6190185546875, -7.361572265625, -7.1041259765625, -6.8466796875, -6.5892333984375, -6.331787109375, -6.0743408203125, -5.81689453125, -5.5594482421875, -5.302001953125, -5.0445556640625, -4.787109375, -4.5296630859375, -4.272216796875, -4.0147705078125, -3.75732421875, -3.4998779296875, -3.242431640625, -2.9849853515625, -2.7275390625, -2.4700927734375, -2.212646484375, -1.9552001953125, -1.69775390625, -1.4403076171875, -1.182861328125, -0.9254150390625, -0.66796875, -0.4105224609375, -0.153076171875, 0.1043701171875, 0.36181640625, 0.6192626953125, 0.876708984375, 1.1341552734375, 1.3916015625, 1.6490478515625, 1.906494140625, 2.1639404296875, 2.42138671875, 2.6788330078125, 2.936279296875, 3.1937255859375, 3.451171875, 3.7086181640625, 3.966064453125, 4.2235107421875, 4.48095703125, 4.7384033203125, 4.995849609375, 5.2532958984375, 5.5107421875, 5.7681884765625, 6.025634765625, 6.2830810546875, 6.54052734375, 6.7979736328125, 7.055419921875, 7.3128662109375, 7.5703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 9.0, 21.0, 31.0, 59.0, 91.0, 152.0, 263.0, 590.0, 1180.0, 2379.0, 5224.0, 13927.0, 47488.0, 286974.0, 3563903.0, 210999.0, 39622.0, 12100.0, 4712.0, 2171.0, 1089.0, 540.0, 323.0, 158.0, 105.0, 65.0, 31.0, 29.0, 11.0, 8.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.09375, -41.578125, -40.0625, -38.546875, -37.03125, -35.515625, -34.0, -32.484375, -30.96875, -29.453125, -27.9375, -26.421875, -24.90625, -23.390625, -21.875, -20.359375, -18.84375, -17.328125, -15.8125, -14.296875, -12.78125, -11.265625, -9.75, -8.234375, -6.71875, -5.203125, -3.6875, -2.171875, -0.65625, 0.859375, 2.375, 3.890625, 5.40625, 6.921875, 8.4375, 9.953125, 11.46875, 12.984375, 14.5, 16.015625, 17.53125, 19.046875, 20.5625, 22.078125, 23.59375, 25.109375, 26.625, 28.140625, 29.65625, 31.171875, 32.6875, 34.203125, 35.71875, 37.234375, 38.75, 40.265625, 41.78125, 43.296875, 44.8125, 46.328125, 47.84375, 49.359375, 50.875, 52.390625, 53.90625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 5.0, 5.0, 3.0, 2.0, 11.0, 8.0, 11.0, 24.0, 34.0, 38.0, 60.0, 77.0, 139.0, 247.0, 593.0, 1873.0, 380.0, 192.0, 96.0, 66.0, 47.0, 35.0, 25.0, 16.0, 19.0, 8.0, 10.0, 11.0, 2.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.5859375, -12.140625, -11.6953125, -11.25, -10.8046875, -10.359375, -9.9140625, -9.46875, -9.0234375, -8.578125, -8.1328125, -7.6875, -7.2421875, -6.796875, -6.3515625, -5.90625, -5.4609375, -5.015625, -4.5703125, -4.125, -3.6796875, -3.234375, -2.7890625, -2.34375, -1.8984375, -1.453125, -1.0078125, -0.5625, -0.1171875, 0.328125, 0.7734375, 1.21875, 1.6640625, 2.109375, 2.5546875, 3.0, 3.4453125, 3.890625, 4.3359375, 4.78125, 5.2265625, 5.671875, 6.1171875, 6.5625, 7.0078125, 7.453125, 7.8984375, 8.34375, 8.7890625, 9.234375, 9.6796875, 10.125, 10.5703125, 11.015625, 11.4609375, 11.90625, 12.3515625, 12.796875, 13.2421875, 13.6875, 14.1328125, 14.578125, 15.0234375, 15.46875, 15.9140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 16.0, 68.0, 204.0, 317.0, 229.0, 97.0, 36.0, 23.0, 7.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.7562255859375, -106.1827163696289, -97.60920715332031, -89.03569030761719, -80.4621810913086, -71.888671875, -63.31515884399414, -54.74164581298828, -46.16813659667969, -37.594627380371094, -29.021114349365234, -20.447603225708008, -11.874092102050781, -3.3005828857421875, 5.272930145263672, 13.846443176269531, 22.419952392578125, 30.99346351623535, 39.56697463989258, 48.14048767089844, 56.71399688720703, 65.28750610351562, 73.86102294921875, 82.43453216552734, 91.00804138183594, 99.58155059814453, 108.15505981445312, 116.72857666015625, 125.30208587646484, 133.87559509277344, 142.44911193847656, 151.02261352539062, 159.59609985351562, 168.16961669921875, 176.7431182861328, 185.31663513183594, 193.89013671875, 202.46365356445312, 211.03717041015625, 219.61068725585938, 228.18418884277344, 236.75770568847656, 245.33120727539062, 253.90472412109375, 262.4782409667969, 271.0517578125, 279.625244140625, 288.1987609863281, 296.77227783203125, 305.3457946777344, 313.9193115234375, 322.4927978515625, 331.0663146972656, 339.63983154296875, 348.2133483886719, 356.786865234375, 365.3603515625, 373.9338684082031, 382.50738525390625, 391.08087158203125, 399.6543884277344, 408.2279052734375, 416.8014221191406, 425.37493896484375, 433.9484558105469]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 3.0, 7.0, 10.0, 10.0, 18.0, 14.0, 25.0, 19.0, 15.0, 19.0, 31.0, 30.0, 32.0, 33.0, 47.0, 45.0, 41.0, 34.0, 45.0, 49.0, 47.0, 46.0, 34.0, 46.0, 41.0, 42.0, 35.0, 29.0, 18.0, 24.0, 21.0, 12.0, 13.0, 12.0, 13.0, 9.0, 10.0, 4.0, 3.0, 6.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-66.1232681274414, -64.26688385009766, -62.410499572753906, -60.554115295410156, -58.697731018066406, -56.841346740722656, -54.98496627807617, -53.12858200073242, -51.27219772338867, -49.41581344604492, -47.55942916870117, -45.70304489135742, -43.84666442871094, -41.99028015136719, -40.13389587402344, -38.27751159667969, -36.42112731933594, -34.56474304199219, -32.70835876464844, -30.85197639465332, -28.99559211730957, -27.13920783996582, -25.282825469970703, -23.426441192626953, -21.570056915283203, -19.713672637939453, -17.857288360595703, -16.000905990600586, -14.144521713256836, -12.288137435913086, -10.431754112243652, -8.575370788574219, -6.718990325927734, -4.862606525421143, -3.006222724914551, -1.149838924407959, 0.7065448760986328, 2.562929153442383, 4.419312477111816, 6.27569580078125, 8.132080078125, 9.98846435546875, 11.844847679138184, 13.701231002807617, 15.557615280151367, 17.413999557495117, 19.270381927490234, 21.126766204833984, 22.983150482177734, 24.839534759521484, 26.695919036865234, 28.55230140686035, 30.4086856842041, 32.26506805419922, 34.12145233154297, 35.97783660888672, 37.83422088623047, 39.69060516357422, 41.54698944091797, 43.40337371826172, 45.25975799560547, 47.11614227294922, 48.9725227355957, 50.82890701293945, 52.6852912902832]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 6.0, 4.0, 15.0, 15.0, 24.0, 27.0, 53.0, 68.0, 100.0, 163.0, 307.0, 560.0, 1081.0, 2371.0, 5565.0, 15427.0, 49516.0, 173591.0, 494142.0, 215012.0, 59854.0, 18568.0, 6616.0, 2756.0, 1265.0, 600.0, 329.0, 189.0, 129.0, 72.0, 30.0, 24.0, 23.0, 17.0, 12.0, 10.0, 8.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.578125, -29.469482421875, -28.36083984375, -27.252197265625, -26.1435546875, -25.034912109375, -23.92626953125, -22.817626953125, -21.708984375, -20.600341796875, -19.49169921875, -18.383056640625, -17.2744140625, -16.165771484375, -15.05712890625, -13.948486328125, -12.83984375, -11.731201171875, -10.62255859375, -9.513916015625, -8.4052734375, -7.296630859375, -6.18798828125, -5.079345703125, -3.970703125, -2.862060546875, -1.75341796875, -0.644775390625, 0.4638671875, 1.572509765625, 2.68115234375, 3.789794921875, 4.8984375, 6.007080078125, 7.11572265625, 8.224365234375, 9.3330078125, 10.441650390625, 11.55029296875, 12.658935546875, 13.767578125, 14.876220703125, 15.98486328125, 17.093505859375, 18.2021484375, 19.310791015625, 20.41943359375, 21.528076171875, 22.63671875, 23.745361328125, 24.85400390625, 25.962646484375, 27.0712890625, 28.179931640625, 29.28857421875, 30.397216796875, 31.505859375, 32.614501953125, 33.72314453125, 34.831787109375, 35.9404296875, 37.049072265625, 38.15771484375, 39.266357421875, 40.375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 11.0, 17.0, 28.0, 28.0, 41.0, 44.0, 60.0, 52.0, 55.0, 61.0, 65.0, 67.0, 60.0, 53.0, 58.0, 56.0, 53.0, 32.0, 28.0, 32.0, 19.0, 14.0, 14.0, 9.0, 11.0, 3.0, 3.0, 2.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.484375, -8.23760986328125, -7.9908447265625, -7.74407958984375, -7.497314453125, -7.25054931640625, -7.0037841796875, -6.75701904296875, -6.51025390625, -6.26348876953125, -6.0167236328125, -5.76995849609375, -5.523193359375, -5.27642822265625, -5.0296630859375, -4.78289794921875, -4.5361328125, -4.28936767578125, -4.0426025390625, -3.79583740234375, -3.549072265625, -3.30230712890625, -3.0555419921875, -2.80877685546875, -2.56201171875, -2.31524658203125, -2.0684814453125, -1.82171630859375, -1.574951171875, -1.32818603515625, -1.0814208984375, -0.83465576171875, -0.587890625, -0.34112548828125, -0.0943603515625, 0.15240478515625, 0.399169921875, 0.64593505859375, 0.8927001953125, 1.13946533203125, 1.38623046875, 1.63299560546875, 1.8797607421875, 2.12652587890625, 2.373291015625, 2.62005615234375, 2.8668212890625, 3.11358642578125, 3.3603515625, 3.60711669921875, 3.8538818359375, 4.10064697265625, 4.347412109375, 4.59417724609375, 4.8409423828125, 5.08770751953125, 5.33447265625, 5.58123779296875, 5.8280029296875, 6.07476806640625, 6.321533203125, 6.56829833984375, 6.8150634765625, 7.06182861328125, 7.30859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 6.0, 11.0, 7.0, 14.0, 15.0, 22.0, 38.0, 48.0, 71.0, 114.0, 184.0, 269.0, 406.0, 620.0, 1295.0, 2847.0, 8200.0, 31941.0, 159111.0, 624255.0, 170469.0, 34006.0, 8609.0, 2875.0, 1283.0, 680.0, 385.0, 242.0, 160.0, 91.0, 79.0, 49.0, 29.0, 29.0, 28.0, 17.0, 13.0, 6.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -30.98779296875, -29.8193359375, -28.65087890625, -27.482421875, -26.31396484375, -25.1455078125, -23.97705078125, -22.80859375, -21.64013671875, -20.4716796875, -19.30322265625, -18.134765625, -16.96630859375, -15.7978515625, -14.62939453125, -13.4609375, -12.29248046875, -11.1240234375, -9.95556640625, -8.787109375, -7.61865234375, -6.4501953125, -5.28173828125, -4.11328125, -2.94482421875, -1.7763671875, -0.60791015625, 0.560546875, 1.72900390625, 2.8974609375, 4.06591796875, 5.234375, 6.40283203125, 7.5712890625, 8.73974609375, 9.908203125, 11.07666015625, 12.2451171875, 13.41357421875, 14.58203125, 15.75048828125, 16.9189453125, 18.08740234375, 19.255859375, 20.42431640625, 21.5927734375, 22.76123046875, 23.9296875, 25.09814453125, 26.2666015625, 27.43505859375, 28.603515625, 29.77197265625, 30.9404296875, 32.10888671875, 33.27734375, 34.44580078125, 35.6142578125, 36.78271484375, 37.951171875, 39.11962890625, 40.2880859375, 41.45654296875, 42.625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 18.0, 19.0, 10.0, 15.0, 24.0, 22.0, 33.0, 19.0, 29.0, 36.0, 36.0, 29.0, 45.0, 40.0, 43.0, 44.0, 44.0, 54.0, 35.0, 34.0, 38.0, 54.0, 34.0, 28.0, 25.0, 26.0, 24.0, 23.0, 16.0, 23.0, 10.0, 5.0, 7.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5, -24.715087890625, -23.93017578125, -23.145263671875, -22.3603515625, -21.575439453125, -20.79052734375, -20.005615234375, -19.220703125, -18.435791015625, -17.65087890625, -16.865966796875, -16.0810546875, -15.296142578125, -14.51123046875, -13.726318359375, -12.94140625, -12.156494140625, -11.37158203125, -10.586669921875, -9.8017578125, -9.016845703125, -8.23193359375, -7.447021484375, -6.662109375, -5.877197265625, -5.09228515625, -4.307373046875, -3.5224609375, -2.737548828125, -1.95263671875, -1.167724609375, -0.3828125, 0.402099609375, 1.18701171875, 1.971923828125, 2.7568359375, 3.541748046875, 4.32666015625, 5.111572265625, 5.896484375, 6.681396484375, 7.46630859375, 8.251220703125, 9.0361328125, 9.821044921875, 10.60595703125, 11.390869140625, 12.17578125, 12.960693359375, 13.74560546875, 14.530517578125, 15.3154296875, 16.100341796875, 16.88525390625, 17.670166015625, 18.455078125, 19.239990234375, 20.02490234375, 20.809814453125, 21.5947265625, 22.379638671875, 23.16455078125, 23.949462890625, 24.734375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 6.0, 13.0, 16.0, 14.0, 26.0, 28.0, 66.0, 82.0, 133.0, 230.0, 428.0, 929.0, 1857.0, 4280.0, 12472.0, 56295.0, 519265.0, 387779.0, 46253.0, 11022.0, 3874.0, 1706.0, 800.0, 410.0, 188.0, 138.0, 78.0, 51.0, 26.0, 23.0, 14.0, 15.0, 9.0, 10.0, 3.0, 8.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.452880859375, -18.78076171875, -18.108642578125, -17.4365234375, -16.764404296875, -16.09228515625, -15.420166015625, -14.748046875, -14.075927734375, -13.40380859375, -12.731689453125, -12.0595703125, -11.387451171875, -10.71533203125, -10.043212890625, -9.37109375, -8.698974609375, -8.02685546875, -7.354736328125, -6.6826171875, -6.010498046875, -5.33837890625, -4.666259765625, -3.994140625, -3.322021484375, -2.64990234375, -1.977783203125, -1.3056640625, -0.633544921875, 0.03857421875, 0.710693359375, 1.3828125, 2.054931640625, 2.72705078125, 3.399169921875, 4.0712890625, 4.743408203125, 5.41552734375, 6.087646484375, 6.759765625, 7.431884765625, 8.10400390625, 8.776123046875, 9.4482421875, 10.120361328125, 10.79248046875, 11.464599609375, 12.13671875, 12.808837890625, 13.48095703125, 14.153076171875, 14.8251953125, 15.497314453125, 16.16943359375, 16.841552734375, 17.513671875, 18.185791015625, 18.85791015625, 19.530029296875, 20.2021484375, 20.874267578125, 21.54638671875, 22.218505859375, 22.890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 8.0, 6.0, 12.0, 21.0, 32.0, 45.0, 71.0, 141.0, 245.0, 167.0, 77.0, 54.0, 39.0, 21.0, 17.0, 11.0, 5.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0052337646484375, -0.005094558000564575, -0.00495535135269165, -0.004816144704818726, -0.004676938056945801, -0.004537731409072876, -0.004398524761199951, -0.004259318113327026, -0.0041201114654541016, -0.003980904817581177, -0.003841698169708252, -0.003702491521835327, -0.0035632848739624023, -0.0034240782260894775, -0.0032848715782165527, -0.003145664930343628, -0.003006458282470703, -0.0028672516345977783, -0.0027280449867248535, -0.0025888383388519287, -0.002449631690979004, -0.002310425043106079, -0.0021712183952331543, -0.0020320117473602295, -0.0018928050994873047, -0.0017535984516143799, -0.001614391803741455, -0.0014751851558685303, -0.0013359785079956055, -0.0011967718601226807, -0.0010575652122497559, -0.0009183585643768311, -0.0007791519165039062, -0.0006399452686309814, -0.0005007386207580566, -0.00036153197288513184, -0.00022232532501220703, -8.311867713928223e-05, 5.608797073364258e-05, 0.00019529461860656738, 0.0003345012664794922, 0.000473707914352417, 0.0006129145622253418, 0.0007521212100982666, 0.0008913278579711914, 0.0010305345058441162, 0.001169741153717041, 0.0013089478015899658, 0.0014481544494628906, 0.0015873610973358154, 0.0017265677452087402, 0.001865774393081665, 0.00200498104095459, 0.0021441876888275146, 0.0022833943367004395, 0.0024226009845733643, 0.002561807632446289, 0.002701014280319214, 0.0028402209281921387, 0.0029794275760650635, 0.0031186342239379883, 0.003257840871810913, 0.003397047519683838, 0.0035362541675567627, 0.0036754608154296875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 13.0, 13.0, 15.0, 11.0, 20.0, 18.0, 53.0, 55.0, 91.0, 134.0, 207.0, 306.0, 530.0, 1026.0, 2079.0, 4348.0, 11545.0, 42186.0, 347430.0, 552125.0, 61033.0, 14597.0, 5410.0, 2421.0, 1162.0, 665.0, 384.0, 237.0, 140.0, 68.0, 66.0, 42.0, 25.0, 18.0, 14.0, 12.0, 13.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.890625, -22.15478515625, -21.4189453125, -20.68310546875, -19.947265625, -19.21142578125, -18.4755859375, -17.73974609375, -17.00390625, -16.26806640625, -15.5322265625, -14.79638671875, -14.060546875, -13.32470703125, -12.5888671875, -11.85302734375, -11.1171875, -10.38134765625, -9.6455078125, -8.90966796875, -8.173828125, -7.43798828125, -6.7021484375, -5.96630859375, -5.23046875, -4.49462890625, -3.7587890625, -3.02294921875, -2.287109375, -1.55126953125, -0.8154296875, -0.07958984375, 0.65625, 1.39208984375, 2.1279296875, 2.86376953125, 3.599609375, 4.33544921875, 5.0712890625, 5.80712890625, 6.54296875, 7.27880859375, 8.0146484375, 8.75048828125, 9.486328125, 10.22216796875, 10.9580078125, 11.69384765625, 12.4296875, 13.16552734375, 13.9013671875, 14.63720703125, 15.373046875, 16.10888671875, 16.8447265625, 17.58056640625, 18.31640625, 19.05224609375, 19.7880859375, 20.52392578125, 21.259765625, 21.99560546875, 22.7314453125, 23.46728515625, 24.203125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 6.0, 9.0, 9.0, 10.0, 16.0, 17.0, 27.0, 41.0, 44.0, 79.0, 109.0, 137.0, 107.0, 106.0, 65.0, 53.0, 31.0, 31.0, 27.0, 11.0, 15.0, 11.0, 5.0, 9.0, 3.0, 0.0, 4.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.5, -18.92529296875, -18.3505859375, -17.77587890625, -17.201171875, -16.62646484375, -16.0517578125, -15.47705078125, -14.90234375, -14.32763671875, -13.7529296875, -13.17822265625, -12.603515625, -12.02880859375, -11.4541015625, -10.87939453125, -10.3046875, -9.72998046875, -9.1552734375, -8.58056640625, -8.005859375, -7.43115234375, -6.8564453125, -6.28173828125, -5.70703125, -5.13232421875, -4.5576171875, -3.98291015625, -3.408203125, -2.83349609375, -2.2587890625, -1.68408203125, -1.109375, -0.53466796875, 0.0400390625, 0.61474609375, 1.189453125, 1.76416015625, 2.3388671875, 2.91357421875, 3.48828125, 4.06298828125, 4.6376953125, 5.21240234375, 5.787109375, 6.36181640625, 6.9365234375, 7.51123046875, 8.0859375, 8.66064453125, 9.2353515625, 9.81005859375, 10.384765625, 10.95947265625, 11.5341796875, 12.10888671875, 12.68359375, 13.25830078125, 13.8330078125, 14.40771484375, 14.982421875, 15.55712890625, 16.1318359375, 16.70654296875, 17.28125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 13.0, 45.0, 97.0, 208.0, 244.0, 191.0, 116.0, 52.0, 14.0, 13.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-414.6982421875, -399.5536804199219, -384.40911865234375, -369.2645568847656, -354.1199951171875, -338.97540283203125, -323.8308410644531, -308.686279296875, -293.5417175292969, -278.39715576171875, -263.2525939941406, -248.10801696777344, -232.9634552001953, -217.8188934326172, -202.67431640625, -187.52975463867188, -172.38519287109375, -157.24063110351562, -142.0960693359375, -126.95149230957031, -111.80693054199219, -96.66236877441406, -81.5177993774414, -66.37322998046875, -51.228668212890625, -36.084102630615234, -20.939537048339844, -5.794971466064453, 9.349594116210938, 24.494155883789062, 39.63872528076172, 54.783294677734375, 69.9278564453125, 85.07241821289062, 100.21698760986328, 115.36155700683594, 130.50611877441406, 145.6506805419922, 160.79525756835938, 175.9398193359375, 191.08438110351562, 206.22894287109375, 221.37350463867188, 236.51808166503906, 251.6626434326172, 266.80718994140625, 281.9517822265625, 297.0963439941406, 312.24090576171875, 327.3854675292969, 342.530029296875, 357.6745910644531, 372.81915283203125, 387.9637451171875, 403.1083068847656, 418.25286865234375, 433.3974304199219, 448.5419921875, 463.6865539550781, 478.83111572265625, 493.9757080078125, 509.1202392578125, 524.2648315429688, 539.409423828125, 554.553955078125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 2.0, 6.0, 9.0, 13.0, 8.0, 13.0, 10.0, 14.0, 20.0, 13.0, 21.0, 36.0, 31.0, 47.0, 36.0, 44.0, 43.0, 55.0, 51.0, 38.0, 39.0, 42.0, 47.0, 42.0, 40.0, 38.0, 26.0, 27.0, 30.0, 29.0, 18.0, 16.0, 14.0, 18.0, 12.0, 11.0, 3.0, 8.0, 6.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-152.98780822753906, -148.5850067138672, -144.1822052001953, -139.77940368652344, -135.37661743164062, -130.97381591796875, -126.57101440429688, -122.168212890625, -117.76541137695312, -113.36260986328125, -108.95980834960938, -104.55701446533203, -100.15421295166016, -95.75141143798828, -91.34861755371094, -86.94581604003906, -82.54301452636719, -78.14021301269531, -73.73741149902344, -69.3346176147461, -64.93181610107422, -60.529014587402344, -56.126216888427734, -51.723419189453125, -47.32061767578125, -42.917816162109375, -38.515018463134766, -34.112220764160156, -29.70941925048828, -25.30661964416504, -20.903820037841797, -16.501020431518555, -12.098236083984375, -7.695436477661133, -3.2926368713378906, 1.1101627349853516, 5.512962341308594, 9.915761947631836, 14.318561553955078, 18.72136116027832, 23.124160766601562, 27.526960372924805, 31.929759979248047, 36.332557678222656, 40.73535919189453, 45.138160705566406, 49.540958404541016, 53.943756103515625, 58.3465576171875, 62.749359130859375, 67.15216064453125, 71.5549545288086, 75.95775604248047, 80.36055755615234, 84.76335144042969, 89.16615295410156, 93.56895446777344, 97.97175598144531, 102.37455749511719, 106.77735137939453, 111.1801528930664, 115.58295440673828, 119.98574829101562, 124.3885498046875, 128.79135131835938]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 12.0, 25.0, 24.0, 36.0, 68.0, 67.0, 82.0, 140.0, 201.0, 284.0, 375.0, 594.0, 986.0, 1781.0, 3856.0, 9840.0, 33559.0, 206592.0, 3610289.0, 265172.0, 39915.0, 11244.0, 4198.0, 1928.0, 1054.0, 652.0, 409.0, 274.0, 177.0, 142.0, 86.0, 66.0, 46.0, 33.0, 26.0, 22.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.34375, -34.92138671875, -33.4990234375, -32.07666015625, -30.654296875, -29.23193359375, -27.8095703125, -26.38720703125, -24.96484375, -23.54248046875, -22.1201171875, -20.69775390625, -19.275390625, -17.85302734375, -16.4306640625, -15.00830078125, -13.5859375, -12.16357421875, -10.7412109375, -9.31884765625, -7.896484375, -6.47412109375, -5.0517578125, -3.62939453125, -2.20703125, -0.78466796875, 0.6376953125, 2.06005859375, 3.482421875, 4.90478515625, 6.3271484375, 7.74951171875, 9.171875, 10.59423828125, 12.0166015625, 13.43896484375, 14.861328125, 16.28369140625, 17.7060546875, 19.12841796875, 20.55078125, 21.97314453125, 23.3955078125, 24.81787109375, 26.240234375, 27.66259765625, 29.0849609375, 30.50732421875, 31.9296875, 33.35205078125, 34.7744140625, 36.19677734375, 37.619140625, 39.04150390625, 40.4638671875, 41.88623046875, 43.30859375, 44.73095703125, 46.1533203125, 47.57568359375, 48.998046875, 50.42041015625, 51.8427734375, 53.26513671875, 54.6875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 8.0, 11.0, 8.0, 17.0, 19.0, 23.0, 34.0, 42.0, 46.0, 51.0, 58.0, 60.0, 47.0, 61.0, 55.0, 64.0, 66.0, 52.0, 51.0, 36.0, 31.0, 33.0, 34.0, 19.0, 23.0, 11.0, 9.0, 5.0, 3.0, 6.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.171875, -7.9315185546875, -7.691162109375, -7.4508056640625, -7.21044921875, -6.9700927734375, -6.729736328125, -6.4893798828125, -6.2490234375, -6.0086669921875, -5.768310546875, -5.5279541015625, -5.28759765625, -5.0472412109375, -4.806884765625, -4.5665283203125, -4.326171875, -4.0858154296875, -3.845458984375, -3.6051025390625, -3.36474609375, -3.1243896484375, -2.884033203125, -2.6436767578125, -2.4033203125, -2.1629638671875, -1.922607421875, -1.6822509765625, -1.44189453125, -1.2015380859375, -0.961181640625, -0.7208251953125, -0.48046875, -0.2401123046875, 0.000244140625, 0.2406005859375, 0.48095703125, 0.7213134765625, 0.961669921875, 1.2020263671875, 1.4423828125, 1.6827392578125, 1.923095703125, 2.1634521484375, 2.40380859375, 2.6441650390625, 2.884521484375, 3.1248779296875, 3.365234375, 3.6055908203125, 3.845947265625, 4.0863037109375, 4.32666015625, 4.5670166015625, 4.807373046875, 5.0477294921875, 5.2880859375, 5.5284423828125, 5.768798828125, 6.0091552734375, 6.24951171875, 6.4898681640625, 6.730224609375, 6.9705810546875, 7.2109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 0.0, 4.0, 2.0, 6.0, 10.0, 11.0, 16.0, 29.0, 54.0, 88.0, 180.0, 226.0, 345.0, 634.0, 1021.0, 2077.0, 4211.0, 10500.0, 32807.0, 146166.0, 2740757.0, 1101585.0, 109699.0, 26939.0, 8978.0, 3737.0, 1838.0, 961.0, 539.0, 334.0, 220.0, 107.0, 82.0, 42.0, 30.0, 10.0, 10.0, 12.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.58837890625, -32.4267578125, -31.26513671875, -30.103515625, -28.94189453125, -27.7802734375, -26.61865234375, -25.45703125, -24.29541015625, -23.1337890625, -21.97216796875, -20.810546875, -19.64892578125, -18.4873046875, -17.32568359375, -16.1640625, -15.00244140625, -13.8408203125, -12.67919921875, -11.517578125, -10.35595703125, -9.1943359375, -8.03271484375, -6.87109375, -5.70947265625, -4.5478515625, -3.38623046875, -2.224609375, -1.06298828125, 0.0986328125, 1.26025390625, 2.421875, 3.58349609375, 4.7451171875, 5.90673828125, 7.068359375, 8.22998046875, 9.3916015625, 10.55322265625, 11.71484375, 12.87646484375, 14.0380859375, 15.19970703125, 16.361328125, 17.52294921875, 18.6845703125, 19.84619140625, 21.0078125, 22.16943359375, 23.3310546875, 24.49267578125, 25.654296875, 26.81591796875, 27.9775390625, 29.13916015625, 30.30078125, 31.46240234375, 32.6240234375, 33.78564453125, 34.947265625, 36.10888671875, 37.2705078125, 38.43212890625, 39.59375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 6.0, 15.0, 17.0, 24.0, 30.0, 43.0, 77.0, 134.0, 218.0, 524.0, 1898.0, 581.0, 217.0, 101.0, 73.0, 28.0, 21.0, 19.0, 12.0, 5.0, 7.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.961669921875, -20.25146484375, -19.541259765625, -18.8310546875, -18.120849609375, -17.41064453125, -16.700439453125, -15.990234375, -15.280029296875, -14.56982421875, -13.859619140625, -13.1494140625, -12.439208984375, -11.72900390625, -11.018798828125, -10.30859375, -9.598388671875, -8.88818359375, -8.177978515625, -7.4677734375, -6.757568359375, -6.04736328125, -5.337158203125, -4.626953125, -3.916748046875, -3.20654296875, -2.496337890625, -1.7861328125, -1.075927734375, -0.36572265625, 0.344482421875, 1.0546875, 1.764892578125, 2.47509765625, 3.185302734375, 3.8955078125, 4.605712890625, 5.31591796875, 6.026123046875, 6.736328125, 7.446533203125, 8.15673828125, 8.866943359375, 9.5771484375, 10.287353515625, 10.99755859375, 11.707763671875, 12.41796875, 13.128173828125, 13.83837890625, 14.548583984375, 15.2587890625, 15.968994140625, 16.67919921875, 17.389404296875, 18.099609375, 18.809814453125, 19.52001953125, 20.230224609375, 20.9404296875, 21.650634765625, 22.36083984375, 23.071044921875, 23.78125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 10.0, 16.0, 56.0, 160.0, 308.0, 280.0, 126.0, 32.0, 9.0, 7.0, 5.0], "bins": [-618.598876953125, -607.9883422851562, -597.3778686523438, -586.767333984375, -576.1568603515625, -565.5463256835938, -554.9358520507812, -544.3253173828125, -533.71484375, -523.1043090820312, -512.4938354492188, -501.8833312988281, -491.2728271484375, -480.66229248046875, -470.0517883300781, -459.4412841796875, -448.83074951171875, -438.2202453613281, -427.6097412109375, -416.9992370605469, -406.38873291015625, -395.7781982421875, -385.1676940917969, -374.55718994140625, -363.9466857910156, -353.336181640625, -342.7256774902344, -332.11517333984375, -321.504638671875, -310.8941345214844, -300.28363037109375, -289.6731262207031, -279.0625915527344, -268.45208740234375, -257.8415832519531, -247.23106384277344, -236.6205596923828, -226.0100555419922, -215.3995361328125, -204.78903198242188, -194.17852783203125, -183.56802368164062, -172.95751953125, -162.3470001220703, -151.7364959716797, -141.12599182128906, -130.51547241210938, -119.90496826171875, -109.29446411132812, -98.6839599609375, -88.07344818115234, -77.46293640136719, -66.85243225097656, -56.24192428588867, -45.63141632080078, -35.020904541015625, -24.410404205322266, -13.799896240234375, -3.1893882751464844, 7.421119689941406, 18.031627655029297, 28.642135620117188, 39.25264358520508, 49.863155364990234, 60.47365951538086]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 10.0, 3.0, 3.0, 8.0, 10.0, 10.0, 10.0, 10.0, 13.0, 24.0, 28.0, 25.0, 21.0, 27.0, 30.0, 35.0, 26.0, 44.0, 39.0, 35.0, 42.0, 28.0, 39.0, 35.0, 31.0, 36.0, 26.0, 32.0, 39.0, 34.0, 37.0, 24.0, 19.0, 29.0, 30.0, 20.0, 15.0, 14.0, 13.0, 8.0, 9.0, 8.0, 7.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0], "bins": [-72.7452163696289, -70.65095520019531, -68.55668640136719, -66.4624252319336, -64.36815643310547, -62.27389144897461, -60.17962646484375, -58.085365295410156, -55.99109649658203, -53.89683151245117, -51.80256652832031, -49.70830154418945, -47.614036560058594, -45.519771575927734, -43.425506591796875, -41.33124542236328, -39.23698043823242, -37.14271545410156, -35.0484504699707, -32.954185485839844, -30.859920501708984, -28.765655517578125, -26.6713924407959, -24.57712745666504, -22.48286247253418, -20.38859748840332, -18.29433250427246, -16.200069427490234, -14.105803489685059, -12.0115385055542, -9.917274475097656, -7.823009490966797, -5.728748321533203, -3.634483575820923, -1.5402188301086426, 0.5540456771850586, 2.648310661315918, 4.742575645446777, 6.83683967590332, 8.93110466003418, 11.025369644165039, 13.119634628295898, 15.213899612426758, 17.308162689208984, 19.402427673339844, 21.496692657470703, 23.590957641601562, 25.685222625732422, 27.77948760986328, 29.87375259399414, 31.968017578125, 34.06228256225586, 36.15654754638672, 38.25081253051758, 40.34507751464844, 42.43933868408203, 44.533607482910156, 46.627872467041016, 48.722137451171875, 50.816402435302734, 52.910667419433594, 55.00493240356445, 57.09919738769531, 59.193458557128906, 61.287723541259766]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 18.0, 23.0, 25.0, 37.0, 76.0, 126.0, 194.0, 321.0, 657.0, 1263.0, 3010.0, 7436.0, 21931.0, 78690.0, 325153.0, 440808.0, 119841.0, 31662.0, 10140.0, 3730.0, 1603.0, 770.0, 398.0, 225.0, 142.0, 88.0, 53.0, 35.0, 27.0, 18.0, 14.0, 8.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78125, -32.73046875, -31.6796875, -30.62890625, -29.578125, -28.52734375, -27.4765625, -26.42578125, -25.375, -24.32421875, -23.2734375, -22.22265625, -21.171875, -20.12109375, -19.0703125, -18.01953125, -16.96875, -15.91796875, -14.8671875, -13.81640625, -12.765625, -11.71484375, -10.6640625, -9.61328125, -8.5625, -7.51171875, -6.4609375, -5.41015625, -4.359375, -3.30859375, -2.2578125, -1.20703125, -0.15625, 0.89453125, 1.9453125, 2.99609375, 4.046875, 5.09765625, 6.1484375, 7.19921875, 8.25, 9.30078125, 10.3515625, 11.40234375, 12.453125, 13.50390625, 14.5546875, 15.60546875, 16.65625, 17.70703125, 18.7578125, 19.80859375, 20.859375, 21.91015625, 22.9609375, 24.01171875, 25.0625, 26.11328125, 27.1640625, 28.21484375, 29.265625, 30.31640625, 31.3671875, 32.41796875, 33.46875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 5.0, 2.0, 9.0, 7.0, 8.0, 14.0, 17.0, 24.0, 24.0, 25.0, 44.0, 32.0, 50.0, 59.0, 65.0, 64.0, 59.0, 49.0, 69.0, 60.0, 57.0, 53.0, 44.0, 36.0, 26.0, 29.0, 19.0, 13.0, 15.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.09375, -8.8250732421875, -8.556396484375, -8.2877197265625, -8.01904296875, -7.7503662109375, -7.481689453125, -7.2130126953125, -6.9443359375, -6.6756591796875, -6.406982421875, -6.1383056640625, -5.86962890625, -5.6009521484375, -5.332275390625, -5.0635986328125, -4.794921875, -4.5262451171875, -4.257568359375, -3.9888916015625, -3.72021484375, -3.4515380859375, -3.182861328125, -2.9141845703125, -2.6455078125, -2.3768310546875, -2.108154296875, -1.8394775390625, -1.57080078125, -1.3021240234375, -1.033447265625, -0.7647705078125, -0.49609375, -0.2274169921875, 0.041259765625, 0.3099365234375, 0.57861328125, 0.8472900390625, 1.115966796875, 1.3846435546875, 1.6533203125, 1.9219970703125, 2.190673828125, 2.4593505859375, 2.72802734375, 2.9967041015625, 3.265380859375, 3.5340576171875, 3.802734375, 4.0714111328125, 4.340087890625, 4.6087646484375, 4.87744140625, 5.1461181640625, 5.414794921875, 5.6834716796875, 5.9521484375, 6.2208251953125, 6.489501953125, 6.7581787109375, 7.02685546875, 7.2955322265625, 7.564208984375, 7.8328857421875, 8.1015625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 4.0, 9.0, 10.0, 15.0, 18.0, 16.0, 33.0, 38.0, 52.0, 90.0, 113.0, 188.0, 274.0, 427.0, 748.0, 1444.0, 3542.0, 10633.0, 41238.0, 199154.0, 576426.0, 163597.0, 34712.0, 9417.0, 3141.0, 1357.0, 654.0, 396.0, 240.0, 159.0, 109.0, 81.0, 67.0, 51.0, 24.0, 17.0, 19.0, 11.0, 8.0, 6.0, 9.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.96875, -33.923095703125, -32.87744140625, -31.831787109375, -30.7861328125, -29.740478515625, -28.69482421875, -27.649169921875, -26.603515625, -25.557861328125, -24.51220703125, -23.466552734375, -22.4208984375, -21.375244140625, -20.32958984375, -19.283935546875, -18.23828125, -17.192626953125, -16.14697265625, -15.101318359375, -14.0556640625, -13.010009765625, -11.96435546875, -10.918701171875, -9.873046875, -8.827392578125, -7.78173828125, -6.736083984375, -5.6904296875, -4.644775390625, -3.59912109375, -2.553466796875, -1.5078125, -0.462158203125, 0.58349609375, 1.629150390625, 2.6748046875, 3.720458984375, 4.76611328125, 5.811767578125, 6.857421875, 7.903076171875, 8.94873046875, 9.994384765625, 11.0400390625, 12.085693359375, 13.13134765625, 14.177001953125, 15.22265625, 16.268310546875, 17.31396484375, 18.359619140625, 19.4052734375, 20.450927734375, 21.49658203125, 22.542236328125, 23.587890625, 24.633544921875, 25.67919921875, 26.724853515625, 27.7705078125, 28.816162109375, 29.86181640625, 30.907470703125, 31.953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 8.0, 10.0, 14.0, 15.0, 13.0, 16.0, 11.0, 21.0, 36.0, 30.0, 33.0, 29.0, 37.0, 46.0, 44.0, 51.0, 36.0, 32.0, 49.0, 54.0, 44.0, 36.0, 43.0, 43.0, 36.0, 36.0, 31.0, 26.0, 20.0, 18.0, 23.0, 10.0, 6.0, 10.0, 9.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.40625, -29.46875, -28.53125, -27.59375, -26.65625, -25.71875, -24.78125, -23.84375, -22.90625, -21.96875, -21.03125, -20.09375, -19.15625, -18.21875, -17.28125, -16.34375, -15.40625, -14.46875, -13.53125, -12.59375, -11.65625, -10.71875, -9.78125, -8.84375, -7.90625, -6.96875, -6.03125, -5.09375, -4.15625, -3.21875, -2.28125, -1.34375, -0.40625, 0.53125, 1.46875, 2.40625, 3.34375, 4.28125, 5.21875, 6.15625, 7.09375, 8.03125, 8.96875, 9.90625, 10.84375, 11.78125, 12.71875, 13.65625, 14.59375, 15.53125, 16.46875, 17.40625, 18.34375, 19.28125, 20.21875, 21.15625, 22.09375, 23.03125, 23.96875, 24.90625, 25.84375, 26.78125, 27.71875, 28.65625, 29.59375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 10.0, 14.0, 24.0, 25.0, 37.0, 46.0, 101.0, 184.0, 318.0, 675.0, 1673.0, 5436.0, 22380.0, 117454.0, 467897.0, 340689.0, 71253.0, 14226.0, 3679.0, 1207.0, 532.0, 273.0, 147.0, 101.0, 67.0, 32.0, 15.0, 20.0, 9.0, 6.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.625, -11.2481689453125, -10.871337890625, -10.4945068359375, -10.11767578125, -9.7408447265625, -9.364013671875, -8.9871826171875, -8.6103515625, -8.2335205078125, -7.856689453125, -7.4798583984375, -7.10302734375, -6.7261962890625, -6.349365234375, -5.9725341796875, -5.595703125, -5.2188720703125, -4.842041015625, -4.4652099609375, -4.08837890625, -3.7115478515625, -3.334716796875, -2.9578857421875, -2.5810546875, -2.2042236328125, -1.827392578125, -1.4505615234375, -1.07373046875, -0.6968994140625, -0.320068359375, 0.0567626953125, 0.43359375, 0.8104248046875, 1.187255859375, 1.5640869140625, 1.94091796875, 2.3177490234375, 2.694580078125, 3.0714111328125, 3.4482421875, 3.8250732421875, 4.201904296875, 4.5787353515625, 4.95556640625, 5.3323974609375, 5.709228515625, 6.0860595703125, 6.462890625, 6.8397216796875, 7.216552734375, 7.5933837890625, 7.97021484375, 8.3470458984375, 8.723876953125, 9.1007080078125, 9.4775390625, 9.8543701171875, 10.231201171875, 10.6080322265625, 10.98486328125, 11.3616943359375, 11.738525390625, 12.1153564453125, 12.4921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 17.0, 7.0, 11.0, 12.0, 29.0, 42.0, 43.0, 65.0, 73.0, 116.0, 101.0, 94.0, 87.0, 77.0, 60.0, 41.0, 26.0, 27.0, 18.0, 17.0, 5.0, 5.0, 9.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020580291748046875, -0.001984149217605591, -0.0019102692604064941, -0.0018363893032073975, -0.0017625093460083008, -0.001688629388809204, -0.0016147494316101074, -0.0015408694744110107, -0.001466989517211914, -0.0013931095600128174, -0.0013192296028137207, -0.001245349645614624, -0.0011714696884155273, -0.0010975897312164307, -0.001023709774017334, -0.0009498298168182373, -0.0008759498596191406, -0.0008020699024200439, -0.0007281899452209473, -0.0006543099880218506, -0.0005804300308227539, -0.0005065500736236572, -0.00043267011642456055, -0.00035879015922546387, -0.0002849102020263672, -0.0002110302448272705, -0.00013715028762817383, -6.327033042907715e-05, 1.0609626770019531e-05, 8.448958396911621e-05, 0.0001583695411682129, 0.00023224949836730957, 0.00030612945556640625, 0.00038000941276550293, 0.0004538893699645996, 0.0005277693271636963, 0.000601649284362793, 0.0006755292415618896, 0.0007494091987609863, 0.000823289155960083, 0.0008971691131591797, 0.0009710490703582764, 0.001044929027557373, 0.0011188089847564697, 0.0011926889419555664, 0.001266568899154663, 0.0013404488563537598, 0.0014143288135528564, 0.0014882087707519531, 0.0015620887279510498, 0.0016359686851501465, 0.0017098486423492432, 0.0017837285995483398, 0.0018576085567474365, 0.0019314885139465332, 0.00200536847114563, 0.0020792484283447266, 0.0021531283855438232, 0.00222700834274292, 0.0023008882999420166, 0.0023747682571411133, 0.00244864821434021, 0.0025225281715393066, 0.0025964081287384033, 0.0026702880859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 3.0, 8.0, 10.0, 5.0, 24.0, 33.0, 42.0, 72.0, 151.0, 272.0, 556.0, 1499.0, 4754.0, 24267.0, 242288.0, 659321.0, 97915.0, 12301.0, 3078.0, 994.0, 427.0, 205.0, 112.0, 73.0, 48.0, 25.0, 17.0, 9.0, 7.0, 7.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.328125, -20.72412109375, -20.1201171875, -19.51611328125, -18.912109375, -18.30810546875, -17.7041015625, -17.10009765625, -16.49609375, -15.89208984375, -15.2880859375, -14.68408203125, -14.080078125, -13.47607421875, -12.8720703125, -12.26806640625, -11.6640625, -11.06005859375, -10.4560546875, -9.85205078125, -9.248046875, -8.64404296875, -8.0400390625, -7.43603515625, -6.83203125, -6.22802734375, -5.6240234375, -5.02001953125, -4.416015625, -3.81201171875, -3.2080078125, -2.60400390625, -2.0, -1.39599609375, -0.7919921875, -0.18798828125, 0.416015625, 1.02001953125, 1.6240234375, 2.22802734375, 2.83203125, 3.43603515625, 4.0400390625, 4.64404296875, 5.248046875, 5.85205078125, 6.4560546875, 7.06005859375, 7.6640625, 8.26806640625, 8.8720703125, 9.47607421875, 10.080078125, 10.68408203125, 11.2880859375, 11.89208984375, 12.49609375, 13.10009765625, 13.7041015625, 14.30810546875, 14.912109375, 15.51611328125, 16.1201171875, 16.72412109375, 17.328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 9.0, 19.0, 16.0, 14.0, 23.0, 37.0, 45.0, 56.0, 38.0, 65.0, 70.0, 79.0, 68.0, 76.0, 59.0, 70.0, 50.0, 39.0, 36.0, 25.0, 17.0, 16.0, 14.0, 14.0, 6.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.6328125, -10.34381103515625, -10.0548095703125, -9.76580810546875, -9.476806640625, -9.18780517578125, -8.8988037109375, -8.60980224609375, -8.32080078125, -8.03179931640625, -7.7427978515625, -7.45379638671875, -7.164794921875, -6.87579345703125, -6.5867919921875, -6.29779052734375, -6.0087890625, -5.71978759765625, -5.4307861328125, -5.14178466796875, -4.852783203125, -4.56378173828125, -4.2747802734375, -3.98577880859375, -3.69677734375, -3.40777587890625, -3.1187744140625, -2.82977294921875, -2.540771484375, -2.25177001953125, -1.9627685546875, -1.67376708984375, -1.384765625, -1.09576416015625, -0.8067626953125, -0.51776123046875, -0.228759765625, 0.06024169921875, 0.3492431640625, 0.63824462890625, 0.92724609375, 1.21624755859375, 1.5052490234375, 1.79425048828125, 2.083251953125, 2.37225341796875, 2.6612548828125, 2.95025634765625, 3.2392578125, 3.52825927734375, 3.8172607421875, 4.10626220703125, 4.395263671875, 4.68426513671875, 4.9732666015625, 5.26226806640625, 5.55126953125, 5.84027099609375, 6.1292724609375, 6.41827392578125, 6.707275390625, 6.99627685546875, 7.2852783203125, 7.57427978515625, 7.86328125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 9.0, 19.0, 19.0, 81.0, 172.0, 250.0, 211.0, 149.0, 61.0, 22.0, 14.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.75823974609375, -119.47874450683594, -107.1992416381836, -94.91973876953125, -82.64024353027344, -70.36074829101562, -58.08124542236328, -45.80174255371094, -33.522247314453125, -21.242748260498047, -8.963249206542969, 3.3162498474121094, 15.595748901367188, 27.875247955322266, 40.154747009277344, 52.43424987792969, 64.7137451171875, 76.99324035644531, 89.27274322509766, 101.55224609375, 113.83174133300781, 126.11123657226562, 138.3907470703125, 150.6702423095703, 162.94973754882812, 175.22923278808594, 187.50872802734375, 199.78823852539062, 212.06773376464844, 224.34722900390625, 236.62673950195312, 248.90623474121094, 261.18572998046875, 273.4652404785156, 285.7447204589844, 298.02423095703125, 310.3037109375, 322.5832214355469, 334.86273193359375, 347.1422119140625, 359.4217224121094, 371.70123291015625, 383.980712890625, 396.2602233886719, 408.53973388671875, 420.8192138671875, 433.0987243652344, 445.37823486328125, 457.65771484375, 469.9372253417969, 482.2167053222656, 494.4962158203125, 506.77569580078125, 519.0552368164062, 531.334716796875, 543.6141967773438, 555.8936767578125, 568.1731567382812, 580.4526977539062, 592.732177734375, 605.0116577148438, 617.2911987304688, 629.5706787109375, 641.8501586914062, 654.1296997070312]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 4.0, 8.0, 11.0, 10.0, 5.0, 12.0, 14.0, 25.0, 20.0, 25.0, 34.0, 37.0, 42.0, 50.0, 51.0, 49.0, 38.0, 49.0, 44.0, 42.0, 66.0, 50.0, 38.0, 36.0, 34.0, 36.0, 21.0, 23.0, 20.0, 15.0, 17.0, 19.0, 11.0, 12.0, 7.0, 1.0, 6.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.80227661132812, -142.89404296875, -137.98580932617188, -133.0775604248047, -128.16932678222656, -123.26109313964844, -118.35285949707031, -113.44462585449219, -108.53638458251953, -103.6281509399414, -98.71990966796875, -93.81167602539062, -88.9034423828125, -83.99520111083984, -79.08696746826172, -74.17872619628906, -69.27049255371094, -64.36225891113281, -59.454017639160156, -54.54578399658203, -49.63754653930664, -44.72930908203125, -39.821075439453125, -34.912837982177734, -30.004600524902344, -25.096363067626953, -20.188127517700195, -15.279891014099121, -10.371654510498047, -5.463417053222656, -0.5551815032958984, 4.353054046630859, 9.261276245117188, 14.169512748718262, 19.077749252319336, 23.985984802246094, 28.894222259521484, 33.802459716796875, 38.710693359375, 43.61893081665039, 48.52716827392578, 53.43540573120117, 58.34364318847656, 63.25187683105469, 68.16011047363281, 73.06835174560547, 77.9765853881836, 82.88482666015625, 87.79306030273438, 92.7012939453125, 97.60953521728516, 102.51776885986328, 107.42601013183594, 112.33424377441406, 117.24247741699219, 122.15071105957031, 127.05895233154297, 131.96719360351562, 136.87542724609375, 141.78366088867188, 146.69189453125, 151.60012817382812, 156.5083770751953, 161.41661071777344, 166.32484436035156]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 7.0, 14.0, 14.0, 17.0, 27.0, 26.0, 34.0, 51.0, 65.0, 89.0, 121.0, 171.0, 255.0, 403.0, 737.0, 1389.0, 2873.0, 7261.0, 25073.0, 3794483.0, 327325.0, 21368.0, 6558.0, 2616.0, 1300.0, 713.0, 423.0, 261.0, 160.0, 118.0, 93.0, 70.0, 46.0, 29.0, 24.0, 18.0, 10.0, 10.0, 15.0, 5.0, 3.0, 7.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.84375, -44.31298828125, -42.7822265625, -41.25146484375, -39.720703125, -38.18994140625, -36.6591796875, -35.12841796875, -33.59765625, -32.06689453125, -30.5361328125, -29.00537109375, -27.474609375, -25.94384765625, -24.4130859375, -22.88232421875, -21.3515625, -19.82080078125, -18.2900390625, -16.75927734375, -15.228515625, -13.69775390625, -12.1669921875, -10.63623046875, -9.10546875, -7.57470703125, -6.0439453125, -4.51318359375, -2.982421875, -1.45166015625, 0.0791015625, 1.60986328125, 3.140625, 4.67138671875, 6.2021484375, 7.73291015625, 9.263671875, 10.79443359375, 12.3251953125, 13.85595703125, 15.38671875, 16.91748046875, 18.4482421875, 19.97900390625, 21.509765625, 23.04052734375, 24.5712890625, 26.10205078125, 27.6328125, 29.16357421875, 30.6943359375, 32.22509765625, 33.755859375, 35.28662109375, 36.8173828125, 38.34814453125, 39.87890625, 41.40966796875, 42.9404296875, 44.47119140625, 46.001953125, 47.53271484375, 49.0634765625, 50.59423828125, 52.125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 0.0, 5.0, 9.0, 6.0, 5.0, 7.0, 14.0, 26.0, 30.0, 33.0, 37.0, 34.0, 54.0, 47.0, 51.0, 57.0, 45.0, 56.0, 52.0, 57.0, 62.0, 48.0, 41.0, 27.0, 36.0, 32.0, 26.0, 16.0, 19.0, 15.0, 15.0, 11.0, 7.0, 9.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.359375, -9.08990478515625, -8.8204345703125, -8.55096435546875, -8.281494140625, -8.01202392578125, -7.7425537109375, -7.47308349609375, -7.20361328125, -6.93414306640625, -6.6646728515625, -6.39520263671875, -6.125732421875, -5.85626220703125, -5.5867919921875, -5.31732177734375, -5.0478515625, -4.77838134765625, -4.5089111328125, -4.23944091796875, -3.969970703125, -3.70050048828125, -3.4310302734375, -3.16156005859375, -2.89208984375, -2.62261962890625, -2.3531494140625, -2.08367919921875, -1.814208984375, -1.54473876953125, -1.2752685546875, -1.00579833984375, -0.736328125, -0.46685791015625, -0.1973876953125, 0.07208251953125, 0.341552734375, 0.61102294921875, 0.8804931640625, 1.14996337890625, 1.41943359375, 1.68890380859375, 1.9583740234375, 2.22784423828125, 2.497314453125, 2.76678466796875, 3.0362548828125, 3.30572509765625, 3.5751953125, 3.84466552734375, 4.1141357421875, 4.38360595703125, 4.653076171875, 4.92254638671875, 5.1920166015625, 5.46148681640625, 5.73095703125, 6.00042724609375, 6.2698974609375, 6.53936767578125, 6.808837890625, 7.07830810546875, 7.3477783203125, 7.61724853515625, 7.88671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 20.0, 22.0, 40.0, 79.0, 137.0, 239.0, 426.0, 770.0, 1407.0, 2961.0, 7840.0, 35541.0, 3986952.0, 133873.0, 14976.0, 4558.0, 2039.0, 1063.0, 568.0, 317.0, 187.0, 99.0, 59.0, 46.0, 22.0, 13.0, 4.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.34375, -38.77685546875, -37.2099609375, -35.64306640625, -34.076171875, -32.50927734375, -30.9423828125, -29.37548828125, -27.80859375, -26.24169921875, -24.6748046875, -23.10791015625, -21.541015625, -19.97412109375, -18.4072265625, -16.84033203125, -15.2734375, -13.70654296875, -12.1396484375, -10.57275390625, -9.005859375, -7.43896484375, -5.8720703125, -4.30517578125, -2.73828125, -1.17138671875, 0.3955078125, 1.96240234375, 3.529296875, 5.09619140625, 6.6630859375, 8.22998046875, 9.796875, 11.36376953125, 12.9306640625, 14.49755859375, 16.064453125, 17.63134765625, 19.1982421875, 20.76513671875, 22.33203125, 23.89892578125, 25.4658203125, 27.03271484375, 28.599609375, 30.16650390625, 31.7333984375, 33.30029296875, 34.8671875, 36.43408203125, 38.0009765625, 39.56787109375, 41.134765625, 42.70166015625, 44.2685546875, 45.83544921875, 47.40234375, 48.96923828125, 50.5361328125, 52.10302734375, 53.669921875, 55.23681640625, 56.8037109375, 58.37060546875, 59.9375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 7.0, 8.0, 9.0, 17.0, 21.0, 53.0, 144.0, 3382.0, 241.0, 87.0, 41.0, 29.0, 9.0, 11.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.7421875, -10.46453857421875, -10.1868896484375, -9.90924072265625, -9.631591796875, -9.35394287109375, -9.0762939453125, -8.79864501953125, -8.52099609375, -8.24334716796875, -7.9656982421875, -7.68804931640625, -7.410400390625, -7.13275146484375, -6.8551025390625, -6.57745361328125, -6.2998046875, -6.02215576171875, -5.7445068359375, -5.46685791015625, -5.189208984375, -4.91156005859375, -4.6339111328125, -4.35626220703125, -4.07861328125, -3.80096435546875, -3.5233154296875, -3.24566650390625, -2.968017578125, -2.69036865234375, -2.4127197265625, -2.13507080078125, -1.857421875, -1.57977294921875, -1.3021240234375, -1.02447509765625, -0.746826171875, -0.46917724609375, -0.1915283203125, 0.08612060546875, 0.36376953125, 0.64141845703125, 0.9190673828125, 1.19671630859375, 1.474365234375, 1.75201416015625, 2.0296630859375, 2.30731201171875, 2.5849609375, 2.86260986328125, 3.1402587890625, 3.41790771484375, 3.695556640625, 3.97320556640625, 4.2508544921875, 4.52850341796875, 4.80615234375, 5.08380126953125, 5.3614501953125, 5.63909912109375, 5.916748046875, 6.19439697265625, 6.4720458984375, 6.74969482421875, 7.02734375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 12.0, 29.0, 49.0, 68.0, 126.0, 135.0, 165.0, 122.0, 92.0, 75.0, 40.0, 29.0, 20.0, 16.0, 7.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.60188865661621, -20.338390350341797, -19.074892044067383, -17.81139373779297, -16.547895431518555, -15.28439712524414, -14.020898818969727, -12.757400512695312, -11.493902206420898, -10.230403900146484, -8.96690559387207, -7.703407287597656, -6.439908981323242, -5.176410675048828, -3.912912368774414, -2.6494140625, -1.385915756225586, -0.12241744995117188, 1.1410808563232422, 2.4045791625976562, 3.6680774688720703, 4.931575775146484, 6.195074081420898, 7.4585723876953125, 8.722070693969727, 9.98556900024414, 11.249067306518555, 12.512565612792969, 13.776063919067383, 15.039562225341797, 16.30306053161621, 17.566558837890625, 18.830055236816406, 20.09355354309082, 21.357051849365234, 22.62055015563965, 23.884048461914062, 25.147546768188477, 26.41104507446289, 27.674543380737305, 28.93804168701172, 30.201539993286133, 31.465038299560547, 32.728538513183594, 33.992034912109375, 35.255531311035156, 36.5190315246582, 37.78253173828125, 39.04602813720703, 40.30952453613281, 41.57302474975586, 42.836524963378906, 44.10002136230469, 45.36351776123047, 46.627017974853516, 47.89051818847656, 49.154014587402344, 50.417510986328125, 51.68101119995117, 52.94451141357422, 54.2080078125, 55.47150421142578, 56.73500442504883, 57.998504638671875, 59.262001037597656]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 9.0, 3.0, 7.0, 12.0, 13.0, 16.0, 11.0, 12.0, 17.0, 16.0, 27.0, 28.0, 38.0, 33.0, 29.0, 22.0, 27.0, 34.0, 33.0, 29.0, 32.0, 48.0, 32.0, 44.0, 45.0, 40.0, 36.0, 38.0, 43.0, 35.0, 26.0, 30.0, 19.0, 17.0, 18.0, 21.0, 13.0, 11.0, 6.0, 13.0, 4.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.117809295654297, -13.632817268371582, -13.14782428741455, -12.662832260131836, -12.177839279174805, -11.69284725189209, -11.207855224609375, -10.722862243652344, -10.237870216369629, -9.752878189086914, -9.267885208129883, -8.782893180847168, -8.297901153564453, -7.812908172607422, -7.327916145324707, -6.842923641204834, -6.357931137084961, -5.872938632965088, -5.387946128845215, -4.9029541015625, -4.417961597442627, -3.932969093322754, -3.44797682762146, -2.962984561920166, -2.477992057800293, -1.9929996728897095, -1.508007287979126, -1.0230149030685425, -0.538022518157959, -0.05303001403808594, 0.431962251663208, 0.916954517364502, 1.401947021484375, 1.8869394063949585, 2.371931791305542, 2.856924057006836, 3.341916561126709, 3.826909065246582, 4.311901092529297, 4.79689359664917, 5.281886100769043, 5.766878604888916, 6.251871109008789, 6.736863136291504, 7.221855640411377, 7.70684814453125, 8.191840171813965, 8.67683219909668, 9.161825180053711, 9.646817207336426, 10.131810188293457, 10.616802215576172, 11.101795196533203, 11.586787223815918, 12.071779251098633, 12.556772232055664, 13.041764259338379, 13.526756286621094, 14.011749267578125, 14.49674129486084, 14.981733322143555, 15.466726303100586, 15.9517183303833, 16.436710357666016, 16.921703338623047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 11.0, 8.0, 17.0, 15.0, 30.0, 35.0, 52.0, 111.0, 141.0, 249.0, 434.0, 843.0, 1487.0, 2995.0, 6023.0, 13103.0, 29019.0, 67449.0, 170950.0, 354317.0, 236705.0, 92761.0, 38502.0, 17335.0, 7988.0, 3660.0, 1934.0, 1011.0, 540.0, 313.0, 175.0, 118.0, 73.0, 50.0, 25.0, 26.0, 18.0, 12.0, 4.0, 5.0, 6.0, 4.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.078125, -18.475830078125, -17.87353515625, -17.271240234375, -16.6689453125, -16.066650390625, -15.46435546875, -14.862060546875, -14.259765625, -13.657470703125, -13.05517578125, -12.452880859375, -11.8505859375, -11.248291015625, -10.64599609375, -10.043701171875, -9.44140625, -8.839111328125, -8.23681640625, -7.634521484375, -7.0322265625, -6.429931640625, -5.82763671875, -5.225341796875, -4.623046875, -4.020751953125, -3.41845703125, -2.816162109375, -2.2138671875, -1.611572265625, -1.00927734375, -0.406982421875, 0.1953125, 0.797607421875, 1.39990234375, 2.002197265625, 2.6044921875, 3.206787109375, 3.80908203125, 4.411376953125, 5.013671875, 5.615966796875, 6.21826171875, 6.820556640625, 7.4228515625, 8.025146484375, 8.62744140625, 9.229736328125, 9.83203125, 10.434326171875, 11.03662109375, 11.638916015625, 12.2412109375, 12.843505859375, 13.44580078125, 14.048095703125, 14.650390625, 15.252685546875, 15.85498046875, 16.457275390625, 17.0595703125, 17.661865234375, 18.26416015625, 18.866455078125, 19.46875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 6.0, 8.0, 12.0, 11.0, 27.0, 23.0, 30.0, 38.0, 40.0, 46.0, 44.0, 47.0, 51.0, 66.0, 47.0, 62.0, 54.0, 47.0, 46.0, 40.0, 32.0, 43.0, 26.0, 22.0, 24.0, 17.0, 13.0, 20.0, 10.0, 5.0, 13.0, 4.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.09375, -8.8251953125, -8.556640625, -8.2880859375, -8.01953125, -7.7509765625, -7.482421875, -7.2138671875, -6.9453125, -6.6767578125, -6.408203125, -6.1396484375, -5.87109375, -5.6025390625, -5.333984375, -5.0654296875, -4.796875, -4.5283203125, -4.259765625, -3.9912109375, -3.72265625, -3.4541015625, -3.185546875, -2.9169921875, -2.6484375, -2.3798828125, -2.111328125, -1.8427734375, -1.57421875, -1.3056640625, -1.037109375, -0.7685546875, -0.5, -0.2314453125, 0.037109375, 0.3056640625, 0.57421875, 0.8427734375, 1.111328125, 1.3798828125, 1.6484375, 1.9169921875, 2.185546875, 2.4541015625, 2.72265625, 2.9912109375, 3.259765625, 3.5283203125, 3.796875, 4.0654296875, 4.333984375, 4.6025390625, 4.87109375, 5.1396484375, 5.408203125, 5.6767578125, 5.9453125, 6.2138671875, 6.482421875, 6.7509765625, 7.01953125, 7.2880859375, 7.556640625, 7.8251953125, 8.09375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 8.0, 10.0, 16.0, 13.0, 14.0, 22.0, 38.0, 54.0, 60.0, 72.0, 105.0, 142.0, 204.0, 286.0, 456.0, 640.0, 1091.0, 2459.0, 7254.0, 26149.0, 112527.0, 604931.0, 228375.0, 44293.0, 11759.0, 3701.0, 1483.0, 769.0, 496.0, 286.0, 220.0, 146.0, 117.0, 84.0, 57.0, 60.0, 34.0, 29.0, 23.0, 16.0, 16.0, 4.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.765869140625, -27.82861328125, -26.891357421875, -25.9541015625, -25.016845703125, -24.07958984375, -23.142333984375, -22.205078125, -21.267822265625, -20.33056640625, -19.393310546875, -18.4560546875, -17.518798828125, -16.58154296875, -15.644287109375, -14.70703125, -13.769775390625, -12.83251953125, -11.895263671875, -10.9580078125, -10.020751953125, -9.08349609375, -8.146240234375, -7.208984375, -6.271728515625, -5.33447265625, -4.397216796875, -3.4599609375, -2.522705078125, -1.58544921875, -0.648193359375, 0.2890625, 1.226318359375, 2.16357421875, 3.100830078125, 4.0380859375, 4.975341796875, 5.91259765625, 6.849853515625, 7.787109375, 8.724365234375, 9.66162109375, 10.598876953125, 11.5361328125, 12.473388671875, 13.41064453125, 14.347900390625, 15.28515625, 16.222412109375, 17.15966796875, 18.096923828125, 19.0341796875, 19.971435546875, 20.90869140625, 21.845947265625, 22.783203125, 23.720458984375, 24.65771484375, 25.594970703125, 26.5322265625, 27.469482421875, 28.40673828125, 29.343994140625, 30.28125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 9.0, 5.0, 10.0, 4.0, 9.0, 17.0, 12.0, 12.0, 16.0, 15.0, 22.0, 32.0, 28.0, 31.0, 37.0, 34.0, 37.0, 26.0, 36.0, 40.0, 44.0, 38.0, 39.0, 46.0, 43.0, 46.0, 35.0, 36.0, 35.0, 26.0, 20.0, 29.0, 23.0, 15.0, 17.0, 11.0, 10.0, 12.0, 11.0, 3.0, 7.0, 6.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.87109375, -24.9609375, -24.05078125, -23.140625, -22.23046875, -21.3203125, -20.41015625, -19.5, -18.58984375, -17.6796875, -16.76953125, -15.859375, -14.94921875, -14.0390625, -13.12890625, -12.21875, -11.30859375, -10.3984375, -9.48828125, -8.578125, -7.66796875, -6.7578125, -5.84765625, -4.9375, -4.02734375, -3.1171875, -2.20703125, -1.296875, -0.38671875, 0.5234375, 1.43359375, 2.34375, 3.25390625, 4.1640625, 5.07421875, 5.984375, 6.89453125, 7.8046875, 8.71484375, 9.625, 10.53515625, 11.4453125, 12.35546875, 13.265625, 14.17578125, 15.0859375, 15.99609375, 16.90625, 17.81640625, 18.7265625, 19.63671875, 20.546875, 21.45703125, 22.3671875, 23.27734375, 24.1875, 25.09765625, 26.0078125, 26.91796875, 27.828125, 28.73828125, 29.6484375, 30.55859375, 31.46875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 10.0, 12.0, 18.0, 23.0, 32.0, 64.0, 76.0, 129.0, 227.0, 365.0, 670.0, 1345.0, 2857.0, 7664.0, 27087.0, 146372.0, 635943.0, 178835.0, 32021.0, 8602.0, 3194.0, 1386.0, 661.0, 350.0, 209.0, 115.0, 86.0, 60.0, 40.0, 27.0, 17.0, 14.0, 6.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.96875, -11.563720703125, -11.15869140625, -10.753662109375, -10.3486328125, -9.943603515625, -9.53857421875, -9.133544921875, -8.728515625, -8.323486328125, -7.91845703125, -7.513427734375, -7.1083984375, -6.703369140625, -6.29833984375, -5.893310546875, -5.48828125, -5.083251953125, -4.67822265625, -4.273193359375, -3.8681640625, -3.463134765625, -3.05810546875, -2.653076171875, -2.248046875, -1.843017578125, -1.43798828125, -1.032958984375, -0.6279296875, -0.222900390625, 0.18212890625, 0.587158203125, 0.9921875, 1.397216796875, 1.80224609375, 2.207275390625, 2.6123046875, 3.017333984375, 3.42236328125, 3.827392578125, 4.232421875, 4.637451171875, 5.04248046875, 5.447509765625, 5.8525390625, 6.257568359375, 6.66259765625, 7.067626953125, 7.47265625, 7.877685546875, 8.28271484375, 8.687744140625, 9.0927734375, 9.497802734375, 9.90283203125, 10.307861328125, 10.712890625, 11.117919921875, 11.52294921875, 11.927978515625, 12.3330078125, 12.738037109375, 13.14306640625, 13.548095703125, 13.953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 12.0, 11.0, 10.0, 22.0, 38.0, 32.0, 42.0, 56.0, 59.0, 110.0, 88.0, 85.0, 85.0, 71.0, 66.0, 51.0, 36.0, 27.0, 22.0, 17.0, 7.0, 10.0, 5.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017385482788085938, -0.001680418848991394, -0.0016222894191741943, -0.0015641599893569946, -0.001506030559539795, -0.0014479011297225952, -0.0013897716999053955, -0.0013316422700881958, -0.001273512840270996, -0.0012153834104537964, -0.0011572539806365967, -0.001099124550819397, -0.0010409951210021973, -0.0009828656911849976, -0.0009247362613677979, -0.0008666068315505981, -0.0008084774017333984, -0.0007503479719161987, -0.000692218542098999, -0.0006340891122817993, -0.0005759596824645996, -0.0005178302526473999, -0.0004597008228302002, -0.0004015713930130005, -0.0003434419631958008, -0.0002853125333786011, -0.00022718310356140137, -0.00016905367374420166, -0.00011092424392700195, -5.2794814109802246e-05, 5.334615707397461e-06, 6.346404552459717e-05, 0.00012159347534179688, 0.00017972290515899658, 0.0002378523349761963, 0.000295981764793396, 0.0003541111946105957, 0.0004122406244277954, 0.0004703700542449951, 0.0005284994840621948, 0.0005866289138793945, 0.0006447583436965942, 0.0007028877735137939, 0.0007610172033309937, 0.0008191466331481934, 0.0008772760629653931, 0.0009354054927825928, 0.0009935349225997925, 0.0010516643524169922, 0.001109793782234192, 0.0011679232120513916, 0.0012260526418685913, 0.001284182071685791, 0.0013423115015029907, 0.0014004409313201904, 0.0014585703611373901, 0.0015166997909545898, 0.0015748292207717896, 0.0016329586505889893, 0.001691088080406189, 0.0017492175102233887, 0.0018073469400405884, 0.001865476369857788, 0.0019236057996749878, 0.0019817352294921875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 8.0, 15.0, 16.0, 30.0, 45.0, 72.0, 140.0, 348.0, 786.0, 2244.0, 9250.0, 88147.0, 802580.0, 128874.0, 11732.0, 2620.0, 883.0, 386.0, 160.0, 93.0, 43.0, 36.0, 20.0, 10.0, 7.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.4375, -22.7177734375, -21.998046875, -21.2783203125, -20.55859375, -19.8388671875, -19.119140625, -18.3994140625, -17.6796875, -16.9599609375, -16.240234375, -15.5205078125, -14.80078125, -14.0810546875, -13.361328125, -12.6416015625, -11.921875, -11.2021484375, -10.482421875, -9.7626953125, -9.04296875, -8.3232421875, -7.603515625, -6.8837890625, -6.1640625, -5.4443359375, -4.724609375, -4.0048828125, -3.28515625, -2.5654296875, -1.845703125, -1.1259765625, -0.40625, 0.3134765625, 1.033203125, 1.7529296875, 2.47265625, 3.1923828125, 3.912109375, 4.6318359375, 5.3515625, 6.0712890625, 6.791015625, 7.5107421875, 8.23046875, 8.9501953125, 9.669921875, 10.3896484375, 11.109375, 11.8291015625, 12.548828125, 13.2685546875, 13.98828125, 14.7080078125, 15.427734375, 16.1474609375, 16.8671875, 17.5869140625, 18.306640625, 19.0263671875, 19.74609375, 20.4658203125, 21.185546875, 21.9052734375, 22.625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 7.0, 0.0, 10.0, 14.0, 15.0, 20.0, 17.0, 58.0, 77.0, 96.0, 122.0, 121.0, 122.0, 97.0, 74.0, 51.0, 38.0, 17.0, 17.0, 13.0, 10.0, 3.0, 0.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.703125, -17.142578125, -16.58203125, -16.021484375, -15.4609375, -14.900390625, -14.33984375, -13.779296875, -13.21875, -12.658203125, -12.09765625, -11.537109375, -10.9765625, -10.416015625, -9.85546875, -9.294921875, -8.734375, -8.173828125, -7.61328125, -7.052734375, -6.4921875, -5.931640625, -5.37109375, -4.810546875, -4.25, -3.689453125, -3.12890625, -2.568359375, -2.0078125, -1.447265625, -0.88671875, -0.326171875, 0.234375, 0.794921875, 1.35546875, 1.916015625, 2.4765625, 3.037109375, 3.59765625, 4.158203125, 4.71875, 5.279296875, 5.83984375, 6.400390625, 6.9609375, 7.521484375, 8.08203125, 8.642578125, 9.203125, 9.763671875, 10.32421875, 10.884765625, 11.4453125, 12.005859375, 12.56640625, 13.126953125, 13.6875, 14.248046875, 14.80859375, 15.369140625, 15.9296875, 16.490234375, 17.05078125, 17.611328125, 18.171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 24.0, 120.0, 343.0, 359.0, 120.0, 30.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1158.416015625, -1135.703369140625, -1112.9908447265625, -1090.2781982421875, -1067.565673828125, -1044.85302734375, -1022.1404418945312, -999.4278564453125, -976.7152709960938, -954.002685546875, -931.2901000976562, -908.5775146484375, -885.8648681640625, -863.1522827148438, -840.439697265625, -817.7271118164062, -795.0145263671875, -772.3019409179688, -749.58935546875, -726.876708984375, -704.1641235351562, -681.4515380859375, -658.7389526367188, -636.0263671875, -613.313720703125, -590.6011352539062, -567.8885498046875, -545.1759033203125, -522.4633178710938, -499.750732421875, -477.03814697265625, -454.3255615234375, -431.61297607421875, -408.900390625, -386.1877746582031, -363.4751892089844, -340.7626037597656, -318.04998779296875, -295.33740234375, -272.62481689453125, -249.91221618652344, -227.19961547851562, -204.48703002929688, -181.77442932128906, -159.06182861328125, -136.3492431640625, -113.63664245605469, -90.92405700683594, -68.21145629882812, -45.498863220214844, -22.786266326904297, -0.07366943359375, 22.63892364501953, 45.35151672363281, 68.06411743164062, 90.77670288085938, 113.48930358886719, 136.201904296875, 158.91448974609375, 181.62709045410156, 204.33969116210938, 227.05227661132812, 249.76487731933594, 272.47747802734375, 295.1900634765625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 4.0, 4.0, 7.0, 9.0, 6.0, 10.0, 14.0, 14.0, 22.0, 26.0, 20.0, 33.0, 28.0, 41.0, 41.0, 31.0, 47.0, 38.0, 33.0, 39.0, 42.0, 60.0, 43.0, 41.0, 42.0, 35.0, 27.0, 28.0, 31.0, 25.0, 15.0, 15.0, 16.0, 19.0, 16.0, 8.0, 10.0, 9.0, 8.0, 8.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-173.44593811035156, -168.6623992919922, -163.87884521484375, -159.09530639648438, -154.311767578125, -149.52821350097656, -144.7446746826172, -139.96112060546875, -135.17758178710938, -130.39404296875, -125.61048889160156, -120.82695007324219, -116.04340362548828, -111.25985717773438, -106.476318359375, -101.6927719116211, -96.90922546386719, -92.12567901611328, -87.34213256835938, -82.55859375, -77.7750473022461, -72.99150085449219, -68.20796203613281, -63.424415588378906, -58.640869140625, -53.857322692871094, -49.07378005981445, -44.29023742675781, -39.506690979003906, -34.72314453125, -29.93960189819336, -25.15605926513672, -20.37249755859375, -15.588953018188477, -10.805408477783203, -6.02186393737793, -1.2383193969726562, 3.545225143432617, 8.32876968383789, 13.112312316894531, 17.895858764648438, 22.67940330505371, 27.462947845458984, 32.246490478515625, 37.03003692626953, 41.81358337402344, 46.59712600708008, 51.38066864013672, 56.164215087890625, 60.94776153564453, 65.73130798339844, 70.51484680175781, 75.29839324951172, 80.08193969726562, 84.865478515625, 89.6490249633789, 94.43257141113281, 99.21611785888672, 103.99966430664062, 108.783203125, 113.5667495727539, 118.35029602050781, 123.13383483886719, 127.9173812866211, 132.700927734375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 10.0, 10.0, 14.0, 20.0, 23.0, 51.0, 63.0, 112.0, 202.0, 326.0, 524.0, 857.0, 1738.0, 4685.0, 20238.0, 635856.0, 3499471.0, 21315.0, 4890.0, 1718.0, 830.0, 517.0, 297.0, 182.0, 143.0, 71.0, 43.0, 32.0, 15.0, 9.0, 7.0, 8.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -50.86767578125, -49.1728515625, -47.47802734375, -45.783203125, -44.08837890625, -42.3935546875, -40.69873046875, -39.00390625, -37.30908203125, -35.6142578125, -33.91943359375, -32.224609375, -30.52978515625, -28.8349609375, -27.14013671875, -25.4453125, -23.75048828125, -22.0556640625, -20.36083984375, -18.666015625, -16.97119140625, -15.2763671875, -13.58154296875, -11.88671875, -10.19189453125, -8.4970703125, -6.80224609375, -5.107421875, -3.41259765625, -1.7177734375, -0.02294921875, 1.671875, 3.36669921875, 5.0615234375, 6.75634765625, 8.451171875, 10.14599609375, 11.8408203125, 13.53564453125, 15.23046875, 16.92529296875, 18.6201171875, 20.31494140625, 22.009765625, 23.70458984375, 25.3994140625, 27.09423828125, 28.7890625, 30.48388671875, 32.1787109375, 33.87353515625, 35.568359375, 37.26318359375, 38.9580078125, 40.65283203125, 42.34765625, 44.04248046875, 45.7373046875, 47.43212890625, 49.126953125, 50.82177734375, 52.5166015625, 54.21142578125, 55.90625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 8.0, 11.0, 12.0, 12.0, 26.0, 32.0, 30.0, 35.0, 35.0, 53.0, 56.0, 52.0, 59.0, 43.0, 45.0, 70.0, 54.0, 39.0, 52.0, 38.0, 39.0, 32.0, 26.0, 18.0, 26.0, 21.0, 11.0, 9.0, 12.0, 8.0, 8.0, 0.0, 4.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.96875, -8.70831298828125, -8.4478759765625, -8.18743896484375, -7.927001953125, -7.66656494140625, -7.4061279296875, -7.14569091796875, -6.88525390625, -6.62481689453125, -6.3643798828125, -6.10394287109375, -5.843505859375, -5.58306884765625, -5.3226318359375, -5.06219482421875, -4.8017578125, -4.54132080078125, -4.2808837890625, -4.02044677734375, -3.760009765625, -3.49957275390625, -3.2391357421875, -2.97869873046875, -2.71826171875, -2.45782470703125, -2.1973876953125, -1.93695068359375, -1.676513671875, -1.41607666015625, -1.1556396484375, -0.89520263671875, -0.634765625, -0.37432861328125, -0.1138916015625, 0.14654541015625, 0.406982421875, 0.66741943359375, 0.9278564453125, 1.18829345703125, 1.44873046875, 1.70916748046875, 1.9696044921875, 2.23004150390625, 2.490478515625, 2.75091552734375, 3.0113525390625, 3.27178955078125, 3.5322265625, 3.79266357421875, 4.0531005859375, 4.31353759765625, 4.573974609375, 4.83441162109375, 5.0948486328125, 5.35528564453125, 5.61572265625, 5.87615966796875, 6.1365966796875, 6.39703369140625, 6.657470703125, 6.91790771484375, 7.1783447265625, 7.43878173828125, 7.69921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 5.0, 14.0, 12.0, 18.0, 20.0, 40.0, 51.0, 55.0, 89.0, 139.0, 233.0, 307.0, 493.0, 819.0, 1199.0, 2143.0, 3784.0, 8293.0, 21800.0, 93944.0, 3830560.0, 177907.0, 30493.0, 10628.0, 4718.0, 2471.0, 1484.0, 883.0, 511.0, 389.0, 227.0, 144.0, 102.0, 83.0, 67.0, 31.0, 29.0, 20.0, 20.0, 13.0, 10.0, 6.0, 6.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.8125, -30.919921875, -30.02734375, -29.134765625, -28.2421875, -27.349609375, -26.45703125, -25.564453125, -24.671875, -23.779296875, -22.88671875, -21.994140625, -21.1015625, -20.208984375, -19.31640625, -18.423828125, -17.53125, -16.638671875, -15.74609375, -14.853515625, -13.9609375, -13.068359375, -12.17578125, -11.283203125, -10.390625, -9.498046875, -8.60546875, -7.712890625, -6.8203125, -5.927734375, -5.03515625, -4.142578125, -3.25, -2.357421875, -1.46484375, -0.572265625, 0.3203125, 1.212890625, 2.10546875, 2.998046875, 3.890625, 4.783203125, 5.67578125, 6.568359375, 7.4609375, 8.353515625, 9.24609375, 10.138671875, 11.03125, 11.923828125, 12.81640625, 13.708984375, 14.6015625, 15.494140625, 16.38671875, 17.279296875, 18.171875, 19.064453125, 19.95703125, 20.849609375, 21.7421875, 22.634765625, 23.52734375, 24.419921875, 25.3125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 5.0, 9.0, 7.0, 8.0, 21.0, 15.0, 27.0, 34.0, 76.0, 113.0, 331.0, 2887.0, 218.0, 120.0, 59.0, 29.0, 34.0, 21.0, 10.0, 5.0, 1.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.66796875, -6.494140625, -6.3203125, -6.146484375, -5.97265625, -5.798828125, -5.625, -5.451171875, -5.27734375, -5.103515625, -4.9296875, -4.755859375, -4.58203125, -4.408203125, -4.234375, -4.060546875, -3.88671875, -3.712890625, -3.5390625, -3.365234375, -3.19140625, -3.017578125, -2.84375, -2.669921875, -2.49609375, -2.322265625, -2.1484375, -1.974609375, -1.80078125, -1.626953125, -1.453125, -1.279296875, -1.10546875, -0.931640625, -0.7578125, -0.583984375, -0.41015625, -0.236328125, -0.0625, 0.111328125, 0.28515625, 0.458984375, 0.6328125, 0.806640625, 0.98046875, 1.154296875, 1.328125, 1.501953125, 1.67578125, 1.849609375, 2.0234375, 2.197265625, 2.37109375, 2.544921875, 2.71875, 2.892578125, 3.06640625, 3.240234375, 3.4140625, 3.587890625, 3.76171875, 3.935546875, 4.109375, 4.283203125, 4.45703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 8.0, 10.0, 25.0, 42.0, 58.0, 100.0, 133.0, 144.0, 153.0, 136.0, 88.0, 64.0, 18.0, 7.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-68.17774963378906, -66.56575775146484, -64.9537582397461, -63.341766357421875, -61.729774475097656, -60.11777877807617, -58.50578308105469, -56.89379119873047, -55.281795501708984, -53.6697998046875, -52.05780792236328, -50.4458122253418, -48.83381652832031, -47.221824645996094, -45.60982894897461, -43.997833251953125, -42.385841369628906, -40.77384567260742, -39.1618537902832, -37.54985809326172, -35.9378662109375, -34.325870513916016, -32.71387481689453, -31.10188102722168, -29.489887237548828, -27.877893447875977, -26.265899658203125, -24.65390396118164, -23.04191017150879, -21.429916381835938, -19.817920684814453, -18.2059268951416, -16.593929290771484, -14.981935501098633, -13.369940757751465, -11.757946014404297, -10.145952224731445, -8.533958435058594, -6.921963691711426, -5.309968948364258, -3.6979751586914062, -2.0859808921813965, -0.4739866256713867, 1.138007640838623, 2.750001907348633, 4.361995697021484, 5.973990440368652, 7.58598518371582, 9.197978973388672, 10.809972763061523, 12.421967506408691, 14.03396224975586, 15.645956039428711, 17.257949829101562, 18.869945526123047, 20.4819393157959, 22.09393310546875, 23.7059268951416, 25.317920684814453, 26.929916381835938, 28.54191017150879, 30.15390396118164, 31.765899658203125, 33.377891540527344, 34.98988723754883]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 3.0, 5.0, 8.0, 8.0, 13.0, 9.0, 13.0, 22.0, 16.0, 17.0, 21.0, 24.0, 33.0, 29.0, 26.0, 37.0, 34.0, 50.0, 36.0, 39.0, 43.0, 52.0, 43.0, 44.0, 40.0, 41.0, 28.0, 30.0, 31.0, 29.0, 24.0, 16.0, 30.0, 17.0, 16.0, 10.0, 11.0, 7.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.808642387390137, -14.319196701049805, -13.829750061035156, -13.340304374694824, -12.850858688354492, -12.36141300201416, -11.871967315673828, -11.38252067565918, -10.893074989318848, -10.403629302978516, -9.914182662963867, -9.424736976623535, -8.935291290283203, -8.445845603942871, -7.956399440765381, -7.466953277587891, -6.977507591247559, -6.488061904907227, -5.998615741729736, -5.509169578552246, -5.019723892211914, -4.530278205871582, -4.040832042694092, -3.5513861179351807, -3.0619401931762695, -2.5724942684173584, -2.0830483436584473, -1.5936024188995361, -1.104156494140625, -0.6147105693817139, -0.12526464462280273, 0.3641812801361084, 0.8536262512207031, 1.3430721759796143, 1.8325181007385254, 2.3219640254974365, 2.8114099502563477, 3.300855875015259, 3.79030179977417, 4.27974796295166, 4.769193649291992, 5.258639335632324, 5.7480854988098145, 6.237531661987305, 6.726977348327637, 7.216423034667969, 7.705869197845459, 8.19531536102295, 8.684761047363281, 9.174206733703613, 9.663652420043945, 10.153099060058594, 10.642544746398926, 11.131990432739258, 11.621437072753906, 12.110882759094238, 12.60032844543457, 13.089774131774902, 13.579219818115234, 14.068666458129883, 14.558112144470215, 15.047557830810547, 15.537004470825195, 16.02644920349121, 16.51589584350586]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 6.0, 13.0, 11.0, 13.0, 29.0, 53.0, 66.0, 116.0, 178.0, 317.0, 616.0, 1122.0, 2361.0, 5023.0, 12176.0, 31638.0, 92347.0, 260286.0, 371581.0, 174353.0, 59004.0, 21354.0, 8452.0, 3755.0, 1717.0, 870.0, 462.0, 251.0, 139.0, 73.0, 60.0, 41.0, 20.0, 14.0, 7.0, 9.0, 7.0, 5.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3515625, -13.8057861328125, -13.260009765625, -12.7142333984375, -12.16845703125, -11.6226806640625, -11.076904296875, -10.5311279296875, -9.9853515625, -9.4395751953125, -8.893798828125, -8.3480224609375, -7.80224609375, -7.2564697265625, -6.710693359375, -6.1649169921875, -5.619140625, -5.0733642578125, -4.527587890625, -3.9818115234375, -3.43603515625, -2.8902587890625, -2.344482421875, -1.7987060546875, -1.2529296875, -0.7071533203125, -0.161376953125, 0.3843994140625, 0.93017578125, 1.4759521484375, 2.021728515625, 2.5675048828125, 3.11328125, 3.6590576171875, 4.204833984375, 4.7506103515625, 5.29638671875, 5.8421630859375, 6.387939453125, 6.9337158203125, 7.4794921875, 8.0252685546875, 8.571044921875, 9.1168212890625, 9.66259765625, 10.2083740234375, 10.754150390625, 11.2999267578125, 11.845703125, 12.3914794921875, 12.937255859375, 13.4830322265625, 14.02880859375, 14.5745849609375, 15.120361328125, 15.6661376953125, 16.2119140625, 16.7576904296875, 17.303466796875, 17.8492431640625, 18.39501953125, 18.9407958984375, 19.486572265625, 20.0323486328125, 20.578125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 8.0, 1.0, 6.0, 8.0, 8.0, 10.0, 23.0, 22.0, 22.0, 28.0, 25.0, 42.0, 40.0, 55.0, 49.0, 65.0, 46.0, 56.0, 51.0, 37.0, 50.0, 47.0, 52.0, 27.0, 36.0, 28.0, 30.0, 20.0, 25.0, 21.0, 16.0, 11.0, 7.0, 6.0, 6.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.1484375, -8.88055419921875, -8.6126708984375, -8.34478759765625, -8.076904296875, -7.80902099609375, -7.5411376953125, -7.27325439453125, -7.00537109375, -6.73748779296875, -6.4696044921875, -6.20172119140625, -5.933837890625, -5.66595458984375, -5.3980712890625, -5.13018798828125, -4.8623046875, -4.59442138671875, -4.3265380859375, -4.05865478515625, -3.790771484375, -3.52288818359375, -3.2550048828125, -2.98712158203125, -2.71923828125, -2.45135498046875, -2.1834716796875, -1.91558837890625, -1.647705078125, -1.37982177734375, -1.1119384765625, -0.84405517578125, -0.576171875, -0.30828857421875, -0.0404052734375, 0.22747802734375, 0.495361328125, 0.76324462890625, 1.0311279296875, 1.29901123046875, 1.56689453125, 1.83477783203125, 2.1026611328125, 2.37054443359375, 2.638427734375, 2.90631103515625, 3.1741943359375, 3.44207763671875, 3.7099609375, 3.97784423828125, 4.2457275390625, 4.51361083984375, 4.781494140625, 5.04937744140625, 5.3172607421875, 5.58514404296875, 5.85302734375, 6.12091064453125, 6.3887939453125, 6.65667724609375, 6.924560546875, 7.19244384765625, 7.4603271484375, 7.72821044921875, 7.99609375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 10.0, 10.0, 8.0, 15.0, 17.0, 33.0, 43.0, 50.0, 80.0, 85.0, 123.0, 178.0, 258.0, 454.0, 649.0, 1048.0, 2004.0, 5086.0, 20642.0, 134873.0, 668993.0, 177468.0, 25107.0, 5997.0, 2168.0, 1104.0, 667.0, 420.0, 278.0, 212.0, 138.0, 80.0, 71.0, 37.0, 38.0, 27.0, 24.0, 11.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-29.015625, -28.12451171875, -27.2333984375, -26.34228515625, -25.451171875, -24.56005859375, -23.6689453125, -22.77783203125, -21.88671875, -20.99560546875, -20.1044921875, -19.21337890625, -18.322265625, -17.43115234375, -16.5400390625, -15.64892578125, -14.7578125, -13.86669921875, -12.9755859375, -12.08447265625, -11.193359375, -10.30224609375, -9.4111328125, -8.52001953125, -7.62890625, -6.73779296875, -5.8466796875, -4.95556640625, -4.064453125, -3.17333984375, -2.2822265625, -1.39111328125, -0.5, 0.39111328125, 1.2822265625, 2.17333984375, 3.064453125, 3.95556640625, 4.8466796875, 5.73779296875, 6.62890625, 7.52001953125, 8.4111328125, 9.30224609375, 10.193359375, 11.08447265625, 11.9755859375, 12.86669921875, 13.7578125, 14.64892578125, 15.5400390625, 16.43115234375, 17.322265625, 18.21337890625, 19.1044921875, 19.99560546875, 20.88671875, 21.77783203125, 22.6689453125, 23.56005859375, 24.451171875, 25.34228515625, 26.2333984375, 27.12451171875, 28.015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 6.0, 11.0, 7.0, 12.0, 19.0, 18.0, 27.0, 28.0, 21.0, 18.0, 38.0, 31.0, 31.0, 32.0, 35.0, 41.0, 43.0, 43.0, 57.0, 39.0, 41.0, 41.0, 44.0, 37.0, 28.0, 30.0, 35.0, 24.0, 22.0, 25.0, 20.0, 16.0, 11.0, 9.0, 11.0, 10.0, 4.0, 6.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.359375, -28.4501953125, -27.541015625, -26.6318359375, -25.72265625, -24.8134765625, -23.904296875, -22.9951171875, -22.0859375, -21.1767578125, -20.267578125, -19.3583984375, -18.44921875, -17.5400390625, -16.630859375, -15.7216796875, -14.8125, -13.9033203125, -12.994140625, -12.0849609375, -11.17578125, -10.2666015625, -9.357421875, -8.4482421875, -7.5390625, -6.6298828125, -5.720703125, -4.8115234375, -3.90234375, -2.9931640625, -2.083984375, -1.1748046875, -0.265625, 0.6435546875, 1.552734375, 2.4619140625, 3.37109375, 4.2802734375, 5.189453125, 6.0986328125, 7.0078125, 7.9169921875, 8.826171875, 9.7353515625, 10.64453125, 11.5537109375, 12.462890625, 13.3720703125, 14.28125, 15.1904296875, 16.099609375, 17.0087890625, 17.91796875, 18.8271484375, 19.736328125, 20.6455078125, 21.5546875, 22.4638671875, 23.373046875, 24.2822265625, 25.19140625, 26.1005859375, 27.009765625, 27.9189453125, 28.828125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 4.0, 11.0, 10.0, 13.0, 16.0, 23.0, 36.0, 55.0, 102.0, 192.0, 387.0, 1225.0, 6108.0, 117767.0, 883883.0, 34132.0, 3141.0, 783.0, 283.0, 131.0, 94.0, 55.0, 37.0, 15.0, 9.0, 16.0, 7.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.359130859375, -20.57763671875, -19.796142578125, -19.0146484375, -18.233154296875, -17.45166015625, -16.670166015625, -15.888671875, -15.107177734375, -14.32568359375, -13.544189453125, -12.7626953125, -11.981201171875, -11.19970703125, -10.418212890625, -9.63671875, -8.855224609375, -8.07373046875, -7.292236328125, -6.5107421875, -5.729248046875, -4.94775390625, -4.166259765625, -3.384765625, -2.603271484375, -1.82177734375, -1.040283203125, -0.2587890625, 0.522705078125, 1.30419921875, 2.085693359375, 2.8671875, 3.648681640625, 4.43017578125, 5.211669921875, 5.9931640625, 6.774658203125, 7.55615234375, 8.337646484375, 9.119140625, 9.900634765625, 10.68212890625, 11.463623046875, 12.2451171875, 13.026611328125, 13.80810546875, 14.589599609375, 15.37109375, 16.152587890625, 16.93408203125, 17.715576171875, 18.4970703125, 19.278564453125, 20.06005859375, 20.841552734375, 21.623046875, 22.404541015625, 23.18603515625, 23.967529296875, 24.7490234375, 25.530517578125, 26.31201171875, 27.093505859375, 27.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 7.0, 6.0, 3.0, 3.0, 6.0, 12.0, 23.0, 45.0, 59.0, 110.0, 204.0, 240.0, 134.0, 73.0, 46.0, 17.0, 9.0, 10.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005207061767578125, -0.0050890445709228516, -0.004971027374267578, -0.004853010177612305, -0.004734992980957031, -0.004616975784301758, -0.004498958587646484, -0.004380941390991211, -0.0042629241943359375, -0.004144906997680664, -0.004026889801025391, -0.003908872604370117, -0.0037908554077148438, -0.0036728382110595703, -0.003554821014404297, -0.0034368038177490234, -0.00331878662109375, -0.0032007694244384766, -0.003082752227783203, -0.0029647350311279297, -0.0028467178344726562, -0.002728700637817383, -0.0026106834411621094, -0.002492666244506836, -0.0023746490478515625, -0.002256631851196289, -0.0021386146545410156, -0.002020597457885742, -0.0019025802612304688, -0.0017845630645751953, -0.0016665458679199219, -0.0015485286712646484, -0.001430511474609375, -0.0013124942779541016, -0.0011944770812988281, -0.0010764598846435547, -0.0009584426879882812, -0.0008404254913330078, -0.0007224082946777344, -0.0006043910980224609, -0.0004863739013671875, -0.00036835670471191406, -0.0002503395080566406, -0.0001323223114013672, -1.430511474609375e-05, 0.00010371208190917969, 0.00022172927856445312, 0.00033974647521972656, 0.000457763671875, 0.0005757808685302734, 0.0006937980651855469, 0.0008118152618408203, 0.0009298324584960938, 0.0010478496551513672, 0.0011658668518066406, 0.001283884048461914, 0.0014019012451171875, 0.001519918441772461, 0.0016379356384277344, 0.0017559528350830078, 0.0018739700317382812, 0.0019919872283935547, 0.002110004425048828, 0.0022280216217041016, 0.002346038818359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 10.0, 18.0, 24.0, 43.0, 119.0, 308.0, 936.0, 4988.0, 323514.0, 709428.0, 7243.0, 1235.0, 401.0, 133.0, 65.0, 32.0, 20.0, 10.0, 6.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.21875, -37.99609375, -36.7734375, -35.55078125, -34.328125, -33.10546875, -31.8828125, -30.66015625, -29.4375, -28.21484375, -26.9921875, -25.76953125, -24.546875, -23.32421875, -22.1015625, -20.87890625, -19.65625, -18.43359375, -17.2109375, -15.98828125, -14.765625, -13.54296875, -12.3203125, -11.09765625, -9.875, -8.65234375, -7.4296875, -6.20703125, -4.984375, -3.76171875, -2.5390625, -1.31640625, -0.09375, 1.12890625, 2.3515625, 3.57421875, 4.796875, 6.01953125, 7.2421875, 8.46484375, 9.6875, 10.91015625, 12.1328125, 13.35546875, 14.578125, 15.80078125, 17.0234375, 18.24609375, 19.46875, 20.69140625, 21.9140625, 23.13671875, 24.359375, 25.58203125, 26.8046875, 28.02734375, 29.25, 30.47265625, 31.6953125, 32.91796875, 34.140625, 35.36328125, 36.5859375, 37.80859375, 39.03125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 14.0, 27.0, 39.0, 85.0, 145.0, 181.0, 193.0, 151.0, 79.0, 30.0, 26.0, 11.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.796875, -28.016845703125, -27.23681640625, -26.456787109375, -25.6767578125, -24.896728515625, -24.11669921875, -23.336669921875, -22.556640625, -21.776611328125, -20.99658203125, -20.216552734375, -19.4365234375, -18.656494140625, -17.87646484375, -17.096435546875, -16.31640625, -15.536376953125, -14.75634765625, -13.976318359375, -13.1962890625, -12.416259765625, -11.63623046875, -10.856201171875, -10.076171875, -9.296142578125, -8.51611328125, -7.736083984375, -6.9560546875, -6.176025390625, -5.39599609375, -4.615966796875, -3.8359375, -3.055908203125, -2.27587890625, -1.495849609375, -0.7158203125, 0.064208984375, 0.84423828125, 1.624267578125, 2.404296875, 3.184326171875, 3.96435546875, 4.744384765625, 5.5244140625, 6.304443359375, 7.08447265625, 7.864501953125, 8.64453125, 9.424560546875, 10.20458984375, 10.984619140625, 11.7646484375, 12.544677734375, 13.32470703125, 14.104736328125, 14.884765625, 15.664794921875, 16.44482421875, 17.224853515625, 18.0048828125, 18.784912109375, 19.56494140625, 20.344970703125, 21.125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 9.0, 19.0, 104.0, 289.0, 370.0, 156.0, 41.0, 8.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-451.2337646484375, -432.5804138183594, -413.92706298828125, -395.2737121582031, -376.620361328125, -357.967041015625, -339.3136901855469, -320.66033935546875, -302.0069885253906, -283.3536376953125, -264.7002868652344, -246.0469512939453, -227.3936004638672, -208.74024963378906, -190.0869140625, -171.43356323242188, -152.78021240234375, -134.12686157226562, -115.47351837158203, -96.82017517089844, -78.16682434082031, -59.51347351074219, -40.860130310058594, -22.206787109375, -3.553436279296875, 15.099910736083984, 33.753257751464844, 52.4066047668457, 71.05995178222656, 89.71330261230469, 108.36664581298828, 127.01998901367188, 145.67333984375, 164.32669067382812, 182.98004150390625, 201.6333770751953, 220.28672790527344, 238.94007873535156, 257.5934143066406, 276.24676513671875, 294.9001159667969, 313.553466796875, 332.2068176269531, 350.86016845703125, 369.51348876953125, 388.1668701171875, 406.8201904296875, 425.4735412597656, 444.12689208984375, 462.7802429199219, 481.43359375, 500.0869445800781, 518.7402954101562, 537.3936157226562, 556.0469970703125, 574.7003173828125, 593.3536376953125, 612.0069580078125, 630.6603393554688, 649.3136596679688, 667.967041015625, 686.620361328125, 705.2737426757812, 723.9270629882812, 742.5804443359375]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 4.0, 7.0, 4.0, 6.0, 14.0, 12.0, 24.0, 18.0, 15.0, 23.0, 30.0, 25.0, 37.0, 45.0, 38.0, 47.0, 50.0, 37.0, 46.0, 50.0, 42.0, 39.0, 46.0, 31.0, 40.0, 39.0, 40.0, 25.0, 32.0, 30.0, 22.0, 13.0, 6.0, 11.0, 5.0, 5.0, 12.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-141.65960693359375, -136.95567321777344, -132.2517547607422, -127.54782104492188, -122.84388732910156, -118.13996124267578, -113.43603515625, -108.73210144042969, -104.0281753540039, -99.32424926757812, -94.62031555175781, -89.91638946533203, -85.21246337890625, -80.50852966308594, -75.80460357666016, -71.10067749023438, -66.39674377441406, -61.692813873291016, -56.98888397216797, -52.28495788574219, -47.58102798461914, -42.877098083496094, -38.17317199707031, -33.469242095947266, -28.76531219482422, -24.061382293701172, -19.357454299926758, -14.653525352478027, -9.949596405029297, -5.24566650390625, -0.5417385101318359, 4.162189483642578, 8.866119384765625, 13.570048332214355, 18.273977279663086, 22.9779052734375, 27.681835174560547, 32.385765075683594, 37.089691162109375, 41.79362106323242, 46.49755096435547, 51.201480865478516, 55.90541076660156, 60.609336853027344, 65.31326293945312, 70.01719665527344, 74.72112274169922, 79.425048828125, 84.12898254394531, 88.8329086303711, 93.5368423461914, 98.24076843261719, 102.9447021484375, 107.64862823486328, 112.35255432128906, 117.05648803710938, 121.76041412353516, 126.46434020996094, 131.16827392578125, 135.87220764160156, 140.5761260986328, 145.28005981445312, 149.98399353027344, 154.6879119873047, 159.391845703125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 12.0, 18.0, 17.0, 30.0, 40.0, 65.0, 76.0, 123.0, 196.0, 308.0, 475.0, 785.0, 1412.0, 2894.0, 7077.0, 25976.0, 4085553.0, 51623.0, 9607.0, 3754.0, 1780.0, 912.0, 550.0, 338.0, 202.0, 156.0, 84.0, 60.0, 41.0, 31.0, 28.0, 12.0, 8.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.90625, -35.740234375, -34.57421875, -33.408203125, -32.2421875, -31.076171875, -29.91015625, -28.744140625, -27.578125, -26.412109375, -25.24609375, -24.080078125, -22.9140625, -21.748046875, -20.58203125, -19.416015625, -18.25, -17.083984375, -15.91796875, -14.751953125, -13.5859375, -12.419921875, -11.25390625, -10.087890625, -8.921875, -7.755859375, -6.58984375, -5.423828125, -4.2578125, -3.091796875, -1.92578125, -0.759765625, 0.40625, 1.572265625, 2.73828125, 3.904296875, 5.0703125, 6.236328125, 7.40234375, 8.568359375, 9.734375, 10.900390625, 12.06640625, 13.232421875, 14.3984375, 15.564453125, 16.73046875, 17.896484375, 19.0625, 20.228515625, 21.39453125, 22.560546875, 23.7265625, 24.892578125, 26.05859375, 27.224609375, 28.390625, 29.556640625, 30.72265625, 31.888671875, 33.0546875, 34.220703125, 35.38671875, 36.552734375, 37.71875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 11.0, 12.0, 23.0, 20.0, 29.0, 26.0, 34.0, 43.0, 46.0, 59.0, 73.0, 46.0, 59.0, 52.0, 54.0, 53.0, 44.0, 41.0, 48.0, 44.0, 35.0, 16.0, 18.0, 19.0, 24.0, 13.0, 13.0, 5.0, 5.0, 4.0, 9.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0078125, -8.7115478515625, -8.415283203125, -8.1190185546875, -7.82275390625, -7.5264892578125, -7.230224609375, -6.9339599609375, -6.6376953125, -6.3414306640625, -6.045166015625, -5.7489013671875, -5.45263671875, -5.1563720703125, -4.860107421875, -4.5638427734375, -4.267578125, -3.9713134765625, -3.675048828125, -3.3787841796875, -3.08251953125, -2.7862548828125, -2.489990234375, -2.1937255859375, -1.8974609375, -1.6011962890625, -1.304931640625, -1.0086669921875, -0.71240234375, -0.4161376953125, -0.119873046875, 0.1763916015625, 0.47265625, 0.7689208984375, 1.065185546875, 1.3614501953125, 1.65771484375, 1.9539794921875, 2.250244140625, 2.5465087890625, 2.8427734375, 3.1390380859375, 3.435302734375, 3.7315673828125, 4.02783203125, 4.3240966796875, 4.620361328125, 4.9166259765625, 5.212890625, 5.5091552734375, 5.805419921875, 6.1016845703125, 6.39794921875, 6.6942138671875, 6.990478515625, 7.2867431640625, 7.5830078125, 7.8792724609375, 8.175537109375, 8.4718017578125, 8.76806640625, 9.0643310546875, 9.360595703125, 9.6568603515625, 9.953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 13.0, 16.0, 17.0, 34.0, 35.0, 54.0, 78.0, 98.0, 161.0, 253.0, 398.0, 634.0, 1291.0, 2620.0, 6843.0, 31868.0, 4089768.0, 45885.0, 7922.0, 2942.0, 1378.0, 729.0, 426.0, 284.0, 177.0, 111.0, 57.0, 57.0, 45.0, 29.0, 16.0, 19.0, 12.0, 5.0, 6.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.78125, -34.52880859375, -33.2763671875, -32.02392578125, -30.771484375, -29.51904296875, -28.2666015625, -27.01416015625, -25.76171875, -24.50927734375, -23.2568359375, -22.00439453125, -20.751953125, -19.49951171875, -18.2470703125, -16.99462890625, -15.7421875, -14.48974609375, -13.2373046875, -11.98486328125, -10.732421875, -9.47998046875, -8.2275390625, -6.97509765625, -5.72265625, -4.47021484375, -3.2177734375, -1.96533203125, -0.712890625, 0.53955078125, 1.7919921875, 3.04443359375, 4.296875, 5.54931640625, 6.8017578125, 8.05419921875, 9.306640625, 10.55908203125, 11.8115234375, 13.06396484375, 14.31640625, 15.56884765625, 16.8212890625, 18.07373046875, 19.326171875, 20.57861328125, 21.8310546875, 23.08349609375, 24.3359375, 25.58837890625, 26.8408203125, 28.09326171875, 29.345703125, 30.59814453125, 31.8505859375, 33.10302734375, 34.35546875, 35.60791015625, 36.8603515625, 38.11279296875, 39.365234375, 40.61767578125, 41.8701171875, 43.12255859375, 44.375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 10.0, 7.0, 20.0, 30.0, 73.0, 3504.0, 281.0, 68.0, 31.0, 15.0, 9.0, 4.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8828125, -7.642822265625, -7.40283203125, -7.162841796875, -6.9228515625, -6.682861328125, -6.44287109375, -6.202880859375, -5.962890625, -5.722900390625, -5.48291015625, -5.242919921875, -5.0029296875, -4.762939453125, -4.52294921875, -4.282958984375, -4.04296875, -3.802978515625, -3.56298828125, -3.322998046875, -3.0830078125, -2.843017578125, -2.60302734375, -2.363037109375, -2.123046875, -1.883056640625, -1.64306640625, -1.403076171875, -1.1630859375, -0.923095703125, -0.68310546875, -0.443115234375, -0.203125, 0.036865234375, 0.27685546875, 0.516845703125, 0.7568359375, 0.996826171875, 1.23681640625, 1.476806640625, 1.716796875, 1.956787109375, 2.19677734375, 2.436767578125, 2.6767578125, 2.916748046875, 3.15673828125, 3.396728515625, 3.63671875, 3.876708984375, 4.11669921875, 4.356689453125, 4.5966796875, 4.836669921875, 5.07666015625, 5.316650390625, 5.556640625, 5.796630859375, 6.03662109375, 6.276611328125, 6.5166015625, 6.756591796875, 6.99658203125, 7.236572265625, 7.4765625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 12.0, 17.0, 30.0, 44.0, 57.0, 103.0, 140.0, 142.0, 125.0, 119.0, 73.0, 49.0, 29.0, 24.0, 8.0, 6.0, 10.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.08169174194336, -35.12140655517578, -34.1611213684082, -33.200836181640625, -32.24055099487305, -31.28026580810547, -30.31998062133789, -29.359697341918945, -28.399412155151367, -27.43912696838379, -26.47884178161621, -25.518556594848633, -24.558271408081055, -23.59798812866211, -22.63770294189453, -21.677417755126953, -20.717132568359375, -19.756847381591797, -18.79656219482422, -17.83627700805664, -16.875991821289062, -15.9157075881958, -14.955422401428223, -13.995138168334961, -13.03485107421875, -12.074565887451172, -11.114280700683594, -10.153995513916016, -9.193711280822754, -8.233426094055176, -7.273140907287598, -6.312856197357178, -5.352571487426758, -4.39228630065918, -3.4320015907287598, -2.4717164039611816, -1.5114314556121826, -0.5511465072631836, 0.40913867950439453, 1.3694233894348145, 2.3297085762023926, 3.2899935245513916, 4.250278472900391, 5.210563659667969, 6.170848846435547, 7.131133556365967, 8.091419219970703, 9.051703453063965, 10.011988639831543, 10.972273826599121, 11.9325590133667, 12.892843246459961, 13.853128433227539, 14.813413619995117, 15.773698806762695, 16.733983993530273, 17.69426918029785, 18.65455436706543, 19.614839553833008, 20.575124740600586, 21.535409927368164, 22.49569320678711, 23.455978393554688, 24.416263580322266, 25.376548767089844]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 11.0, 10.0, 19.0, 13.0, 10.0, 13.0, 20.0, 15.0, 19.0, 29.0, 35.0, 29.0, 44.0, 35.0, 43.0, 30.0, 33.0, 47.0, 59.0, 46.0, 41.0, 38.0, 39.0, 41.0, 35.0, 32.0, 26.0, 17.0, 29.0, 21.0, 24.0, 14.0, 16.0, 12.0, 13.0, 10.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.810247421264648, -11.466096878051758, -11.121946334838867, -10.777795791625977, -10.433645248413086, -10.089493751525879, -9.745343208312988, -9.401192665100098, -9.057042121887207, -8.712891578674316, -8.368741035461426, -8.024590492248535, -7.680439472198486, -7.336288928985596, -6.992137908935547, -6.647987365722656, -6.303836822509766, -5.959686279296875, -5.615535736083984, -5.2713847160339355, -4.927234172821045, -4.583083629608154, -4.2389326095581055, -3.894782066345215, -3.550631523132324, -3.2064809799194336, -2.862330198287964, -2.518179416656494, -2.1740288734436035, -1.8298782110214233, -1.4857275485992432, -1.1415767669677734, -0.7974262237548828, -0.45327556133270264, -0.10912489891052246, 0.23502576351165771, 0.5791764259338379, 0.9233270883560181, 1.2674777507781982, 1.611628532409668, 1.9557790756225586, 2.299929618835449, 2.644080400466919, 2.9882311820983887, 3.3323817253112793, 3.67653226852417, 4.020683288574219, 4.364833831787109, 4.708984375, 5.053134918212891, 5.397285461425781, 5.74143648147583, 6.085587024688721, 6.429737567901611, 6.77388858795166, 7.118039131164551, 7.462189674377441, 7.806340217590332, 8.150490760803223, 8.494641304016113, 8.83879280090332, 9.182943344116211, 9.527093887329102, 9.871244430541992, 10.215394973754883]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 6.0, 11.0, 16.0, 22.0, 22.0, 40.0, 57.0, 97.0, 133.0, 202.0, 323.0, 535.0, 966.0, 1679.0, 3256.0, 6022.0, 11914.0, 23626.0, 48173.0, 98052.0, 184844.0, 259787.0, 196305.0, 106227.0, 53019.0, 26002.0, 12729.0, 6527.0, 3367.0, 1921.0, 1033.0, 614.0, 371.0, 225.0, 161.0, 80.0, 63.0, 39.0, 25.0, 24.0, 10.0, 13.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.7578125, -11.4176025390625, -11.077392578125, -10.7371826171875, -10.39697265625, -10.0567626953125, -9.716552734375, -9.3763427734375, -9.0361328125, -8.6959228515625, -8.355712890625, -8.0155029296875, -7.67529296875, -7.3350830078125, -6.994873046875, -6.6546630859375, -6.314453125, -5.9742431640625, -5.634033203125, -5.2938232421875, -4.95361328125, -4.6134033203125, -4.273193359375, -3.9329833984375, -3.5927734375, -3.2525634765625, -2.912353515625, -2.5721435546875, -2.23193359375, -1.8917236328125, -1.551513671875, -1.2113037109375, -0.87109375, -0.5308837890625, -0.190673828125, 0.1495361328125, 0.48974609375, 0.8299560546875, 1.170166015625, 1.5103759765625, 1.8505859375, 2.1907958984375, 2.531005859375, 2.8712158203125, 3.21142578125, 3.5516357421875, 3.891845703125, 4.2320556640625, 4.572265625, 4.9124755859375, 5.252685546875, 5.5928955078125, 5.93310546875, 6.2733154296875, 6.613525390625, 6.9537353515625, 7.2939453125, 7.6341552734375, 7.974365234375, 8.3145751953125, 8.65478515625, 8.9949951171875, 9.335205078125, 9.6754150390625, 10.015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 6.0, 9.0, 12.0, 17.0, 29.0, 22.0, 28.0, 37.0, 37.0, 40.0, 61.0, 48.0, 67.0, 50.0, 45.0, 54.0, 53.0, 44.0, 47.0, 44.0, 41.0, 35.0, 30.0, 19.0, 22.0, 19.0, 20.0, 15.0, 11.0, 7.0, 6.0, 7.0, 3.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.556884765625, -8.26220703125, -7.967529296875, -7.6728515625, -7.378173828125, -7.08349609375, -6.788818359375, -6.494140625, -6.199462890625, -5.90478515625, -5.610107421875, -5.3154296875, -5.020751953125, -4.72607421875, -4.431396484375, -4.13671875, -3.842041015625, -3.54736328125, -3.252685546875, -2.9580078125, -2.663330078125, -2.36865234375, -2.073974609375, -1.779296875, -1.484619140625, -1.18994140625, -0.895263671875, -0.6005859375, -0.305908203125, -0.01123046875, 0.283447265625, 0.578125, 0.872802734375, 1.16748046875, 1.462158203125, 1.7568359375, 2.051513671875, 2.34619140625, 2.640869140625, 2.935546875, 3.230224609375, 3.52490234375, 3.819580078125, 4.1142578125, 4.408935546875, 4.70361328125, 4.998291015625, 5.29296875, 5.587646484375, 5.88232421875, 6.177001953125, 6.4716796875, 6.766357421875, 7.06103515625, 7.355712890625, 7.650390625, 7.945068359375, 8.23974609375, 8.534423828125, 8.8291015625, 9.123779296875, 9.41845703125, 9.713134765625, 10.0078125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 8.0, 9.0, 10.0, 17.0, 10.0, 24.0, 26.0, 33.0, 48.0, 55.0, 105.0, 134.0, 237.0, 336.0, 518.0, 818.0, 1583.0, 4695.0, 25586.0, 280993.0, 658637.0, 61123.0, 8342.0, 2307.0, 1062.0, 618.0, 358.0, 249.0, 181.0, 129.0, 85.0, 71.0, 46.0, 34.0, 18.0, 13.0, 11.0, 12.0, 7.0, 1.0, 8.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.25, -32.305419921875, -31.36083984375, -30.416259765625, -29.4716796875, -28.527099609375, -27.58251953125, -26.637939453125, -25.693359375, -24.748779296875, -23.80419921875, -22.859619140625, -21.9150390625, -20.970458984375, -20.02587890625, -19.081298828125, -18.13671875, -17.192138671875, -16.24755859375, -15.302978515625, -14.3583984375, -13.413818359375, -12.46923828125, -11.524658203125, -10.580078125, -9.635498046875, -8.69091796875, -7.746337890625, -6.8017578125, -5.857177734375, -4.91259765625, -3.968017578125, -3.0234375, -2.078857421875, -1.13427734375, -0.189697265625, 0.7548828125, 1.699462890625, 2.64404296875, 3.588623046875, 4.533203125, 5.477783203125, 6.42236328125, 7.366943359375, 8.3115234375, 9.256103515625, 10.20068359375, 11.145263671875, 12.08984375, 13.034423828125, 13.97900390625, 14.923583984375, 15.8681640625, 16.812744140625, 17.75732421875, 18.701904296875, 19.646484375, 20.591064453125, 21.53564453125, 22.480224609375, 23.4248046875, 24.369384765625, 25.31396484375, 26.258544921875, 27.203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 8.0, 2.0, 3.0, 5.0, 6.0, 8.0, 9.0, 13.0, 10.0, 9.0, 10.0, 23.0, 25.0, 17.0, 24.0, 23.0, 37.0, 27.0, 36.0, 44.0, 33.0, 42.0, 40.0, 43.0, 50.0, 32.0, 33.0, 37.0, 35.0, 27.0, 38.0, 36.0, 32.0, 36.0, 27.0, 22.0, 18.0, 11.0, 14.0, 12.0, 7.0, 6.0, 12.0, 3.0, 5.0, 8.0, 8.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.9375, -26.0185546875, -25.099609375, -24.1806640625, -23.26171875, -22.3427734375, -21.423828125, -20.5048828125, -19.5859375, -18.6669921875, -17.748046875, -16.8291015625, -15.91015625, -14.9912109375, -14.072265625, -13.1533203125, -12.234375, -11.3154296875, -10.396484375, -9.4775390625, -8.55859375, -7.6396484375, -6.720703125, -5.8017578125, -4.8828125, -3.9638671875, -3.044921875, -2.1259765625, -1.20703125, -0.2880859375, 0.630859375, 1.5498046875, 2.46875, 3.3876953125, 4.306640625, 5.2255859375, 6.14453125, 7.0634765625, 7.982421875, 8.9013671875, 9.8203125, 10.7392578125, 11.658203125, 12.5771484375, 13.49609375, 14.4150390625, 15.333984375, 16.2529296875, 17.171875, 18.0908203125, 19.009765625, 19.9287109375, 20.84765625, 21.7666015625, 22.685546875, 23.6044921875, 24.5234375, 25.4423828125, 26.361328125, 27.2802734375, 28.19921875, 29.1181640625, 30.037109375, 30.9560546875, 31.875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 12.0, 11.0, 14.0, 19.0, 28.0, 39.0, 51.0, 88.0, 141.0, 216.0, 348.0, 683.0, 1489.0, 4015.0, 14966.0, 109660.0, 776941.0, 117002.0, 15669.0, 4037.0, 1496.0, 643.0, 380.0, 193.0, 134.0, 82.0, 48.0, 35.0, 40.0, 17.0, 8.0, 18.0, 8.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.8046875, -11.3231201171875, -10.841552734375, -10.3599853515625, -9.87841796875, -9.3968505859375, -8.915283203125, -8.4337158203125, -7.9521484375, -7.4705810546875, -6.989013671875, -6.5074462890625, -6.02587890625, -5.5443115234375, -5.062744140625, -4.5811767578125, -4.099609375, -3.6180419921875, -3.136474609375, -2.6549072265625, -2.17333984375, -1.6917724609375, -1.210205078125, -0.7286376953125, -0.2470703125, 0.2344970703125, 0.716064453125, 1.1976318359375, 1.67919921875, 2.1607666015625, 2.642333984375, 3.1239013671875, 3.60546875, 4.0870361328125, 4.568603515625, 5.0501708984375, 5.53173828125, 6.0133056640625, 6.494873046875, 6.9764404296875, 7.4580078125, 7.9395751953125, 8.421142578125, 8.9027099609375, 9.38427734375, 9.8658447265625, 10.347412109375, 10.8289794921875, 11.310546875, 11.7921142578125, 12.273681640625, 12.7552490234375, 13.23681640625, 13.7183837890625, 14.199951171875, 14.6815185546875, 15.1630859375, 15.6446533203125, 16.126220703125, 16.6077880859375, 17.08935546875, 17.5709228515625, 18.052490234375, 18.5340576171875, 19.015625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 5.0, 5.0, 10.0, 9.0, 20.0, 22.0, 30.0, 42.0, 59.0, 95.0, 100.0, 126.0, 124.0, 113.0, 71.0, 44.0, 37.0, 31.0, 14.0, 13.0, 9.0, 6.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002185821533203125, -0.0021143555641174316, -0.0020428895950317383, -0.001971423625946045, -0.0018999576568603516, -0.0018284916877746582, -0.0017570257186889648, -0.0016855597496032715, -0.0016140937805175781, -0.0015426278114318848, -0.0014711618423461914, -0.001399695873260498, -0.0013282299041748047, -0.0012567639350891113, -0.001185297966003418, -0.0011138319969177246, -0.0010423660278320312, -0.0009709000587463379, -0.0008994340896606445, -0.0008279681205749512, -0.0007565021514892578, -0.0006850361824035645, -0.0006135702133178711, -0.0005421042442321777, -0.0004706382751464844, -0.000399172306060791, -0.00032770633697509766, -0.0002562403678894043, -0.00018477439880371094, -0.00011330842971801758, -4.184246063232422e-05, 2.962350845336914e-05, 0.0001010894775390625, 0.00017255544662475586, 0.00024402141571044922, 0.0003154873847961426, 0.00038695335388183594, 0.0004584193229675293, 0.0005298852920532227, 0.000601351261138916, 0.0006728172302246094, 0.0007442831993103027, 0.0008157491683959961, 0.0008872151374816895, 0.0009586811065673828, 0.0010301470756530762, 0.0011016130447387695, 0.0011730790138244629, 0.0012445449829101562, 0.0013160109519958496, 0.001387476921081543, 0.0014589428901672363, 0.0015304088592529297, 0.001601874828338623, 0.0016733407974243164, 0.0017448067665100098, 0.0018162727355957031, 0.0018877387046813965, 0.00195920467376709, 0.002030670642852783, 0.0021021366119384766, 0.00217360258102417, 0.0022450685501098633, 0.0023165345191955566, 0.00238800048828125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 10.0, 8.0, 17.0, 26.0, 43.0, 113.0, 184.0, 454.0, 1099.0, 3422.0, 19349.0, 346485.0, 640951.0, 29653.0, 4460.0, 1230.0, 534.0, 253.0, 118.0, 62.0, 28.0, 24.0, 17.0, 7.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.796875, -28.11279296875, -27.4287109375, -26.74462890625, -26.060546875, -25.37646484375, -24.6923828125, -24.00830078125, -23.32421875, -22.64013671875, -21.9560546875, -21.27197265625, -20.587890625, -19.90380859375, -19.2197265625, -18.53564453125, -17.8515625, -17.16748046875, -16.4833984375, -15.79931640625, -15.115234375, -14.43115234375, -13.7470703125, -13.06298828125, -12.37890625, -11.69482421875, -11.0107421875, -10.32666015625, -9.642578125, -8.95849609375, -8.2744140625, -7.59033203125, -6.90625, -6.22216796875, -5.5380859375, -4.85400390625, -4.169921875, -3.48583984375, -2.8017578125, -2.11767578125, -1.43359375, -0.74951171875, -0.0654296875, 0.61865234375, 1.302734375, 1.98681640625, 2.6708984375, 3.35498046875, 4.0390625, 4.72314453125, 5.4072265625, 6.09130859375, 6.775390625, 7.45947265625, 8.1435546875, 8.82763671875, 9.51171875, 10.19580078125, 10.8798828125, 11.56396484375, 12.248046875, 12.93212890625, 13.6162109375, 14.30029296875, 14.984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 4.0, 6.0, 13.0, 10.0, 10.0, 15.0, 24.0, 29.0, 46.0, 60.0, 59.0, 77.0, 84.0, 113.0, 85.0, 80.0, 67.0, 58.0, 42.0, 25.0, 17.0, 23.0, 9.0, 9.0, 6.0, 13.0, 8.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.96875, -13.58740234375, -13.2060546875, -12.82470703125, -12.443359375, -12.06201171875, -11.6806640625, -11.29931640625, -10.91796875, -10.53662109375, -10.1552734375, -9.77392578125, -9.392578125, -9.01123046875, -8.6298828125, -8.24853515625, -7.8671875, -7.48583984375, -7.1044921875, -6.72314453125, -6.341796875, -5.96044921875, -5.5791015625, -5.19775390625, -4.81640625, -4.43505859375, -4.0537109375, -3.67236328125, -3.291015625, -2.90966796875, -2.5283203125, -2.14697265625, -1.765625, -1.38427734375, -1.0029296875, -0.62158203125, -0.240234375, 0.14111328125, 0.5224609375, 0.90380859375, 1.28515625, 1.66650390625, 2.0478515625, 2.42919921875, 2.810546875, 3.19189453125, 3.5732421875, 3.95458984375, 4.3359375, 4.71728515625, 5.0986328125, 5.47998046875, 5.861328125, 6.24267578125, 6.6240234375, 7.00537109375, 7.38671875, 7.76806640625, 8.1494140625, 8.53076171875, 8.912109375, 9.29345703125, 9.6748046875, 10.05615234375, 10.4375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 11.0, 23.0, 57.0, 123.0, 193.0, 235.0, 169.0, 98.0, 37.0, 25.0, 10.0, 8.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-412.002197265625, -401.8043212890625, -391.6064453125, -381.4085693359375, -371.210693359375, -361.0128173828125, -350.81494140625, -340.6170959472656, -330.4192199707031, -320.2213439941406, -310.0234680175781, -299.8255920410156, -289.6277160644531, -279.42987060546875, -269.23199462890625, -259.03411865234375, -248.8362274169922, -238.6383514404297, -228.4404754638672, -218.24261474609375, -208.04473876953125, -197.84686279296875, -187.64898681640625, -177.45111083984375, -167.25323486328125, -157.05535888671875, -146.85748291015625, -136.65960693359375, -126.46174621582031, -116.26387023925781, -106.06599426269531, -95.86812591552734, -85.67027282714844, -75.47239685058594, -65.27452850341797, -55.07665252685547, -44.878780364990234, -34.680908203125, -24.4830322265625, -14.285163879394531, -4.087287902832031, 6.1105852127075195, 16.30845832824707, 26.506332397460938, 36.70420455932617, 46.902076721191406, 57.099952697753906, 67.29782104492188, 77.49569702148438, 87.69357299804688, 97.89144134521484, 108.08931732177734, 118.28718566894531, 128.4850616455078, 138.6829376220703, 148.88079833984375, 159.07867431640625, 169.27655029296875, 179.47442626953125, 189.67230224609375, 199.8701629638672, 210.0680389404297, 220.2659149169922, 230.46377563476562, 240.6616668701172]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 3.0, 3.0, 6.0, 7.0, 10.0, 11.0, 5.0, 11.0, 14.0, 14.0, 17.0, 18.0, 19.0, 21.0, 37.0, 31.0, 36.0, 35.0, 31.0, 44.0, 50.0, 52.0, 44.0, 50.0, 53.0, 45.0, 27.0, 29.0, 27.0, 33.0, 33.0, 26.0, 27.0, 21.0, 25.0, 13.0, 11.0, 9.0, 8.0, 5.0, 8.0, 6.0, 9.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-129.1451873779297, -124.88058471679688, -120.61598205566406, -116.35137176513672, -112.0867691040039, -107.8221664428711, -103.55755615234375, -99.29295349121094, -95.02835083007812, -90.76374816894531, -86.4991455078125, -82.23453521728516, -77.96993255615234, -73.70532989501953, -69.44071960449219, -65.17611694335938, -60.91151428222656, -56.64691162109375, -52.38230514526367, -48.117698669433594, -43.85309600830078, -39.58849334716797, -35.32388687133789, -31.059282302856445, -26.794677734375, -22.530073165893555, -18.26546859741211, -14.000864028930664, -9.736259460449219, -5.471654891967773, -1.2070503234863281, 3.057554244995117, 7.322174072265625, 11.58677864074707, 15.851383209228516, 20.11598777770996, 24.380592346191406, 28.64519691467285, 32.9098014831543, 37.174407958984375, 41.43901062011719, 45.70361328125, 49.96821975708008, 54.232826232910156, 58.49742889404297, 62.76203155517578, 67.02664184570312, 71.29124450683594, 75.55584716796875, 79.82044982910156, 84.08505249023438, 88.34966278076172, 92.61426544189453, 96.87886810302734, 101.14347839355469, 105.4080810546875, 109.67268371582031, 113.93728637695312, 118.20188903808594, 122.46649932861328, 126.7311019897461, 130.99571228027344, 135.26031494140625, 139.52491760253906, 143.78952026367188]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 10.0, 13.0, 40.0, 43.0, 62.0, 70.0, 92.0, 142.0, 250.0, 367.0, 547.0, 1114.0, 2461.0, 6130.0, 21557.0, 235625.0, 3880712.0, 30915.0, 7967.0, 2963.0, 1272.0, 710.0, 423.0, 231.0, 154.0, 125.0, 68.0, 57.0, 35.0, 35.0, 21.0, 16.0, 9.0, 14.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.84375, -29.8525390625, -28.861328125, -27.8701171875, -26.87890625, -25.8876953125, -24.896484375, -23.9052734375, -22.9140625, -21.9228515625, -20.931640625, -19.9404296875, -18.94921875, -17.9580078125, -16.966796875, -15.9755859375, -14.984375, -13.9931640625, -13.001953125, -12.0107421875, -11.01953125, -10.0283203125, -9.037109375, -8.0458984375, -7.0546875, -6.0634765625, -5.072265625, -4.0810546875, -3.08984375, -2.0986328125, -1.107421875, -0.1162109375, 0.875, 1.8662109375, 2.857421875, 3.8486328125, 4.83984375, 5.8310546875, 6.822265625, 7.8134765625, 8.8046875, 9.7958984375, 10.787109375, 11.7783203125, 12.76953125, 13.7607421875, 14.751953125, 15.7431640625, 16.734375, 17.7255859375, 18.716796875, 19.7080078125, 20.69921875, 21.6904296875, 22.681640625, 23.6728515625, 24.6640625, 25.6552734375, 26.646484375, 27.6376953125, 28.62890625, 29.6201171875, 30.611328125, 31.6025390625, 32.59375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 10.0, 6.0, 10.0, 13.0, 19.0, 11.0, 41.0, 53.0, 60.0, 67.0, 67.0, 75.0, 87.0, 81.0, 74.0, 48.0, 49.0, 58.0, 42.0, 27.0, 23.0, 23.0, 15.0, 8.0, 9.0, 11.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.584716796875, -9.20068359375, -8.816650390625, -8.4326171875, -8.048583984375, -7.66455078125, -7.280517578125, -6.896484375, -6.512451171875, -6.12841796875, -5.744384765625, -5.3603515625, -4.976318359375, -4.59228515625, -4.208251953125, -3.82421875, -3.440185546875, -3.05615234375, -2.672119140625, -2.2880859375, -1.904052734375, -1.52001953125, -1.135986328125, -0.751953125, -0.367919921875, 0.01611328125, 0.400146484375, 0.7841796875, 1.168212890625, 1.55224609375, 1.936279296875, 2.3203125, 2.704345703125, 3.08837890625, 3.472412109375, 3.8564453125, 4.240478515625, 4.62451171875, 5.008544921875, 5.392578125, 5.776611328125, 6.16064453125, 6.544677734375, 6.9287109375, 7.312744140625, 7.69677734375, 8.080810546875, 8.46484375, 8.848876953125, 9.23291015625, 9.616943359375, 10.0009765625, 10.385009765625, 10.76904296875, 11.153076171875, 11.537109375, 11.921142578125, 12.30517578125, 12.689208984375, 13.0732421875, 13.457275390625, 13.84130859375, 14.225341796875, 14.609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 11.0, 16.0, 16.0, 18.0, 41.0, 89.0, 156.0, 336.0, 697.0, 1724.0, 4607.0, 19055.0, 3005311.0, 1135415.0, 19231.0, 4470.0, 1628.0, 717.0, 324.0, 182.0, 89.0, 56.0, 31.0, 33.0, 14.0, 9.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.90625, -34.66796875, -33.4296875, -32.19140625, -30.953125, -29.71484375, -28.4765625, -27.23828125, -26.0, -24.76171875, -23.5234375, -22.28515625, -21.046875, -19.80859375, -18.5703125, -17.33203125, -16.09375, -14.85546875, -13.6171875, -12.37890625, -11.140625, -9.90234375, -8.6640625, -7.42578125, -6.1875, -4.94921875, -3.7109375, -2.47265625, -1.234375, 0.00390625, 1.2421875, 2.48046875, 3.71875, 4.95703125, 6.1953125, 7.43359375, 8.671875, 9.91015625, 11.1484375, 12.38671875, 13.625, 14.86328125, 16.1015625, 17.33984375, 18.578125, 19.81640625, 21.0546875, 22.29296875, 23.53125, 24.76953125, 26.0078125, 27.24609375, 28.484375, 29.72265625, 30.9609375, 32.19921875, 33.4375, 34.67578125, 35.9140625, 37.15234375, 38.390625, 39.62890625, 40.8671875, 42.10546875, 43.34375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 4.0, 7.0, 10.0, 13.0, 24.0, 40.0, 78.0, 214.0, 3137.0, 287.0, 108.0, 49.0, 24.0, 14.0, 14.0, 12.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.035400390625, -8.71923828125, -8.403076171875, -8.0869140625, -7.770751953125, -7.45458984375, -7.138427734375, -6.822265625, -6.506103515625, -6.18994140625, -5.873779296875, -5.5576171875, -5.241455078125, -4.92529296875, -4.609130859375, -4.29296875, -3.976806640625, -3.66064453125, -3.344482421875, -3.0283203125, -2.712158203125, -2.39599609375, -2.079833984375, -1.763671875, -1.447509765625, -1.13134765625, -0.815185546875, -0.4990234375, -0.182861328125, 0.13330078125, 0.449462890625, 0.765625, 1.081787109375, 1.39794921875, 1.714111328125, 2.0302734375, 2.346435546875, 2.66259765625, 2.978759765625, 3.294921875, 3.611083984375, 3.92724609375, 4.243408203125, 4.5595703125, 4.875732421875, 5.19189453125, 5.508056640625, 5.82421875, 6.140380859375, 6.45654296875, 6.772705078125, 7.0888671875, 7.405029296875, 7.72119140625, 8.037353515625, 8.353515625, 8.669677734375, 8.98583984375, 9.302001953125, 9.6181640625, 9.934326171875, 10.25048828125, 10.566650390625, 10.8828125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 29.0, 66.0, 142.0, 230.0, 240.0, 131.0, 86.0, 41.0, 14.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.39588928222656, -54.76677322387695, -52.13766098022461, -49.508544921875, -46.879432678222656, -44.25031661987305, -41.62120056152344, -38.992088317871094, -36.362972259521484, -33.733856201171875, -31.10474395751953, -28.475627899169922, -25.846513748168945, -23.21739959716797, -20.58828353881836, -17.959169387817383, -15.330055236816406, -12.70094108581543, -10.071825981140137, -7.442711353302002, -4.813596725463867, -2.1844825744628906, 0.44463253021240234, 3.0737476348876953, 5.702861785888672, 8.331975936889648, 10.961091041564941, 13.590206146240234, 16.21932029724121, 18.848434448242188, 21.477550506591797, 24.106664657592773, 26.73577880859375, 29.364892959594727, 31.994007110595703, 34.62312316894531, 37.252235412597656, 39.881351470947266, 42.510467529296875, 45.13957977294922, 47.76869583129883, 50.39781188964844, 53.02692413330078, 55.65604019165039, 58.28515625, 60.914268493652344, 63.54338455200195, 66.17250061035156, 68.8016128540039, 71.43072509765625, 74.05984497070312, 76.68895721435547, 79.31806945800781, 81.94718933105469, 84.57630157470703, 87.20541381835938, 89.83453369140625, 92.4636459350586, 95.09276580810547, 97.72187805175781, 100.35099029541016, 102.9801025390625, 105.60922241210938, 108.23833465576172, 110.86744689941406]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 8.0, 11.0, 11.0, 11.0, 10.0, 22.0, 23.0, 15.0, 27.0, 27.0, 31.0, 38.0, 37.0, 36.0, 48.0, 38.0, 34.0, 48.0, 49.0, 48.0, 38.0, 45.0, 41.0, 27.0, 37.0, 31.0, 28.0, 31.0, 23.0, 23.0, 13.0, 13.0, 8.0, 8.0, 11.0, 7.0, 7.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.982872009277344, -18.310510635375977, -17.63814926147461, -16.965789794921875, -16.293428421020508, -15.62106704711914, -14.948705673217773, -14.276344299316406, -13.603983879089355, -12.931622505187988, -12.259262084960938, -11.58690071105957, -10.914539337158203, -10.242178916931152, -9.569817543029785, -8.897457122802734, -8.225095748901367, -7.552734851837158, -6.880373954772949, -6.208012580871582, -5.535651683807373, -4.863290786743164, -4.190929412841797, -3.518568515777588, -2.846207618713379, -2.17384672164917, -1.5014855861663818, -0.8291244506835938, -0.15676355361938477, 0.5155973434448242, 1.1879587173461914, 1.8603196144104004, 2.5326805114746094, 3.2050414085388184, 3.8774025440216064, 4.5497636795043945, 5.2221245765686035, 5.8944854736328125, 6.56684684753418, 7.239207744598389, 7.911568641662598, 8.583930015563965, 9.256290435791016, 9.928651809692383, 10.60101318359375, 11.2733736038208, 11.945734977722168, 12.618095397949219, 13.290456771850586, 13.962818145751953, 14.635178565979004, 15.307539939880371, 15.979900360107422, 16.65226173400879, 17.324623107910156, 17.996984481811523, 18.66934585571289, 19.341707229614258, 20.014068603515625, 20.68642807006836, 21.358789443969727, 22.031150817871094, 22.70351219177246, 23.375873565673828, 24.048233032226562]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 12.0, 15.0, 19.0, 23.0, 43.0, 46.0, 64.0, 88.0, 174.0, 237.0, 380.0, 660.0, 1124.0, 2085.0, 3953.0, 7979.0, 17222.0, 38232.0, 85917.0, 189971.0, 332801.0, 200608.0, 90612.0, 40365.0, 18044.0, 8391.0, 4190.0, 2242.0, 1198.0, 673.0, 394.0, 237.0, 161.0, 123.0, 76.0, 58.0, 40.0, 26.0, 11.0, 16.0, 11.0, 7.0, 4.0, 6.0, 2.0, 7.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.90625, -17.31982421875, -16.7333984375, -16.14697265625, -15.560546875, -14.97412109375, -14.3876953125, -13.80126953125, -13.21484375, -12.62841796875, -12.0419921875, -11.45556640625, -10.869140625, -10.28271484375, -9.6962890625, -9.10986328125, -8.5234375, -7.93701171875, -7.3505859375, -6.76416015625, -6.177734375, -5.59130859375, -5.0048828125, -4.41845703125, -3.83203125, -3.24560546875, -2.6591796875, -2.07275390625, -1.486328125, -0.89990234375, -0.3134765625, 0.27294921875, 0.859375, 1.44580078125, 2.0322265625, 2.61865234375, 3.205078125, 3.79150390625, 4.3779296875, 4.96435546875, 5.55078125, 6.13720703125, 6.7236328125, 7.31005859375, 7.896484375, 8.48291015625, 9.0693359375, 9.65576171875, 10.2421875, 10.82861328125, 11.4150390625, 12.00146484375, 12.587890625, 13.17431640625, 13.7607421875, 14.34716796875, 14.93359375, 15.52001953125, 16.1064453125, 16.69287109375, 17.279296875, 17.86572265625, 18.4521484375, 19.03857421875, 19.625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 7.0, 6.0, 8.0, 12.0, 13.0, 12.0, 26.0, 37.0, 49.0, 64.0, 84.0, 57.0, 85.0, 86.0, 78.0, 78.0, 57.0, 47.0, 54.0, 35.0, 27.0, 24.0, 17.0, 13.0, 8.0, 11.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.640625, -10.2274169921875, -9.814208984375, -9.4010009765625, -8.98779296875, -8.5745849609375, -8.161376953125, -7.7481689453125, -7.3349609375, -6.9217529296875, -6.508544921875, -6.0953369140625, -5.68212890625, -5.2689208984375, -4.855712890625, -4.4425048828125, -4.029296875, -3.6160888671875, -3.202880859375, -2.7896728515625, -2.37646484375, -1.9632568359375, -1.550048828125, -1.1368408203125, -0.7236328125, -0.3104248046875, 0.102783203125, 0.5159912109375, 0.92919921875, 1.3424072265625, 1.755615234375, 2.1688232421875, 2.58203125, 2.9952392578125, 3.408447265625, 3.8216552734375, 4.23486328125, 4.6480712890625, 5.061279296875, 5.4744873046875, 5.8876953125, 6.3009033203125, 6.714111328125, 7.1273193359375, 7.54052734375, 7.9537353515625, 8.366943359375, 8.7801513671875, 9.193359375, 9.6065673828125, 10.019775390625, 10.4329833984375, 10.84619140625, 11.2593994140625, 11.672607421875, 12.0858154296875, 12.4990234375, 12.9122314453125, 13.325439453125, 13.7386474609375, 14.15185546875, 14.5650634765625, 14.978271484375, 15.3914794921875, 15.8046875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 11.0, 5.0, 10.0, 14.0, 19.0, 32.0, 58.0, 86.0, 132.0, 184.0, 271.0, 494.0, 950.0, 2101.0, 6928.0, 41130.0, 525026.0, 425251.0, 35409.0, 6247.0, 1914.0, 935.0, 510.0, 279.0, 165.0, 103.0, 78.0, 57.0, 35.0, 33.0, 23.0, 15.0, 13.0, 10.0, 4.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.26123046875, -35.9287109375, -34.59619140625, -33.263671875, -31.93115234375, -30.5986328125, -29.26611328125, -27.93359375, -26.60107421875, -25.2685546875, -23.93603515625, -22.603515625, -21.27099609375, -19.9384765625, -18.60595703125, -17.2734375, -15.94091796875, -14.6083984375, -13.27587890625, -11.943359375, -10.61083984375, -9.2783203125, -7.94580078125, -6.61328125, -5.28076171875, -3.9482421875, -2.61572265625, -1.283203125, 0.04931640625, 1.3818359375, 2.71435546875, 4.046875, 5.37939453125, 6.7119140625, 8.04443359375, 9.376953125, 10.70947265625, 12.0419921875, 13.37451171875, 14.70703125, 16.03955078125, 17.3720703125, 18.70458984375, 20.037109375, 21.36962890625, 22.7021484375, 24.03466796875, 25.3671875, 26.69970703125, 28.0322265625, 29.36474609375, 30.697265625, 32.02978515625, 33.3623046875, 34.69482421875, 36.02734375, 37.35986328125, 38.6923828125, 40.02490234375, 41.357421875, 42.68994140625, 44.0224609375, 45.35498046875, 46.6875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 12.0, 12.0, 17.0, 17.0, 20.0, 20.0, 25.0, 40.0, 38.0, 28.0, 37.0, 50.0, 52.0, 45.0, 45.0, 47.0, 52.0, 42.0, 52.0, 54.0, 48.0, 25.0, 34.0, 31.0, 28.0, 22.0, 12.0, 17.0, 9.0, 6.0, 9.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.65625, -32.59326171875, -31.5302734375, -30.46728515625, -29.404296875, -28.34130859375, -27.2783203125, -26.21533203125, -25.15234375, -24.08935546875, -23.0263671875, -21.96337890625, -20.900390625, -19.83740234375, -18.7744140625, -17.71142578125, -16.6484375, -15.58544921875, -14.5224609375, -13.45947265625, -12.396484375, -11.33349609375, -10.2705078125, -9.20751953125, -8.14453125, -7.08154296875, -6.0185546875, -4.95556640625, -3.892578125, -2.82958984375, -1.7666015625, -0.70361328125, 0.359375, 1.42236328125, 2.4853515625, 3.54833984375, 4.611328125, 5.67431640625, 6.7373046875, 7.80029296875, 8.86328125, 9.92626953125, 10.9892578125, 12.05224609375, 13.115234375, 14.17822265625, 15.2412109375, 16.30419921875, 17.3671875, 18.43017578125, 19.4931640625, 20.55615234375, 21.619140625, 22.68212890625, 23.7451171875, 24.80810546875, 25.87109375, 26.93408203125, 27.9970703125, 29.06005859375, 30.123046875, 31.18603515625, 32.2490234375, 33.31201171875, 34.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 6.0, 3.0, 10.0, 10.0, 12.0, 24.0, 30.0, 54.0, 66.0, 107.0, 179.0, 239.0, 473.0, 835.0, 1825.0, 4250.0, 12211.0, 42918.0, 179146.0, 566067.0, 177707.0, 42329.0, 12192.0, 4147.0, 1674.0, 839.0, 422.0, 250.0, 149.0, 105.0, 73.0, 49.0, 39.0, 21.0, 20.0, 16.0, 11.0, 13.0, 6.0, 7.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.56640625, -7.31829833984375, -7.0701904296875, -6.82208251953125, -6.573974609375, -6.32586669921875, -6.0777587890625, -5.82965087890625, -5.58154296875, -5.33343505859375, -5.0853271484375, -4.83721923828125, -4.589111328125, -4.34100341796875, -4.0928955078125, -3.84478759765625, -3.5966796875, -3.34857177734375, -3.1004638671875, -2.85235595703125, -2.604248046875, -2.35614013671875, -2.1080322265625, -1.85992431640625, -1.61181640625, -1.36370849609375, -1.1156005859375, -0.86749267578125, -0.619384765625, -0.37127685546875, -0.1231689453125, 0.12493896484375, 0.373046875, 0.62115478515625, 0.8692626953125, 1.11737060546875, 1.365478515625, 1.61358642578125, 1.8616943359375, 2.10980224609375, 2.35791015625, 2.60601806640625, 2.8541259765625, 3.10223388671875, 3.350341796875, 3.59844970703125, 3.8465576171875, 4.09466552734375, 4.3427734375, 4.59088134765625, 4.8389892578125, 5.08709716796875, 5.335205078125, 5.58331298828125, 5.8314208984375, 6.07952880859375, 6.32763671875, 6.57574462890625, 6.8238525390625, 7.07196044921875, 7.320068359375, 7.56817626953125, 7.8162841796875, 8.06439208984375, 8.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 7.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 12.0, 22.0, 13.0, 19.0, 25.0, 32.0, 34.0, 33.0, 41.0, 45.0, 97.0, 87.0, 83.0, 73.0, 64.0, 44.0, 40.0, 28.0, 14.0, 24.0, 18.0, 16.0, 14.0, 16.0, 11.0, 12.0, 3.0, 4.0, 5.0, 4.0, 1.0, 5.0, 7.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0015697479248046875, -0.001520305871963501, -0.0014708638191223145, -0.001421421766281128, -0.0013719797134399414, -0.0013225376605987549, -0.0012730956077575684, -0.0012236535549163818, -0.0011742115020751953, -0.0011247694492340088, -0.0010753273963928223, -0.0010258853435516357, -0.0009764432907104492, -0.0009270012378692627, -0.0008775591850280762, -0.0008281171321868896, -0.0007786750793457031, -0.0007292330265045166, -0.0006797909736633301, -0.0006303489208221436, -0.000580906867980957, -0.0005314648151397705, -0.000482022762298584, -0.00043258070945739746, -0.00038313865661621094, -0.0003336966037750244, -0.0002842545509338379, -0.00023481249809265137, -0.00018537044525146484, -0.00013592839241027832, -8.64863395690918e-05, -3.7044286727905273e-05, 1.239776611328125e-05, 6.183981895446777e-05, 0.0001112818717956543, 0.00016072392463684082, 0.00021016597747802734, 0.00025960803031921387, 0.0003090500831604004, 0.0003584921360015869, 0.00040793418884277344, 0.00045737624168395996, 0.0005068182945251465, 0.000556260347366333, 0.0006057024002075195, 0.0006551444530487061, 0.0007045865058898926, 0.0007540285587310791, 0.0008034706115722656, 0.0008529126644134521, 0.0009023547172546387, 0.0009517967700958252, 0.0010012388229370117, 0.0010506808757781982, 0.0011001229286193848, 0.0011495649814605713, 0.0011990070343017578, 0.0012484490871429443, 0.0012978911399841309, 0.0013473331928253174, 0.001396775245666504, 0.0014462172985076904, 0.001495659351348877, 0.0015451014041900635, 0.00159454345703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 8.0, 9.0, 14.0, 28.0, 31.0, 64.0, 117.0, 235.0, 457.0, 1095.0, 3201.0, 16257.0, 202389.0, 747214.0, 66361.0, 7619.0, 1937.0, 772.0, 328.0, 178.0, 108.0, 58.0, 25.0, 16.0, 11.0, 8.0, 10.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.0703125, -13.5731201171875, -13.075927734375, -12.5787353515625, -12.08154296875, -11.5843505859375, -11.087158203125, -10.5899658203125, -10.0927734375, -9.5955810546875, -9.098388671875, -8.6011962890625, -8.10400390625, -7.6068115234375, -7.109619140625, -6.6124267578125, -6.115234375, -5.6180419921875, -5.120849609375, -4.6236572265625, -4.12646484375, -3.6292724609375, -3.132080078125, -2.6348876953125, -2.1376953125, -1.6405029296875, -1.143310546875, -0.6461181640625, -0.14892578125, 0.3482666015625, 0.845458984375, 1.3426513671875, 1.83984375, 2.3370361328125, 2.834228515625, 3.3314208984375, 3.82861328125, 4.3258056640625, 4.822998046875, 5.3201904296875, 5.8173828125, 6.3145751953125, 6.811767578125, 7.3089599609375, 7.80615234375, 8.3033447265625, 8.800537109375, 9.2977294921875, 9.794921875, 10.2921142578125, 10.789306640625, 11.2864990234375, 11.78369140625, 12.2808837890625, 12.778076171875, 13.2752685546875, 13.7724609375, 14.2696533203125, 14.766845703125, 15.2640380859375, 15.76123046875, 16.2584228515625, 16.755615234375, 17.2528076171875, 17.75]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 1.0, 2.0, 2.0, 10.0, 9.0, 5.0, 9.0, 12.0, 25.0, 19.0, 26.0, 26.0, 34.0, 51.0, 45.0, 62.0, 56.0, 83.0, 75.0, 68.0, 67.0, 55.0, 38.0, 31.0, 30.0, 20.0, 27.0, 26.0, 12.0, 9.0, 10.0, 11.0, 9.0, 8.0, 8.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-8.671875, -8.4390869140625, -8.206298828125, -7.9735107421875, -7.74072265625, -7.5079345703125, -7.275146484375, -7.0423583984375, -6.8095703125, -6.5767822265625, -6.343994140625, -6.1112060546875, -5.87841796875, -5.6456298828125, -5.412841796875, -5.1800537109375, -4.947265625, -4.7144775390625, -4.481689453125, -4.2489013671875, -4.01611328125, -3.7833251953125, -3.550537109375, -3.3177490234375, -3.0849609375, -2.8521728515625, -2.619384765625, -2.3865966796875, -2.15380859375, -1.9210205078125, -1.688232421875, -1.4554443359375, -1.22265625, -0.9898681640625, -0.757080078125, -0.5242919921875, -0.29150390625, -0.0587158203125, 0.174072265625, 0.4068603515625, 0.6396484375, 0.8724365234375, 1.105224609375, 1.3380126953125, 1.57080078125, 1.8035888671875, 2.036376953125, 2.2691650390625, 2.501953125, 2.7347412109375, 2.967529296875, 3.2003173828125, 3.43310546875, 3.6658935546875, 3.898681640625, 4.1314697265625, 4.3642578125, 4.5970458984375, 4.829833984375, 5.0626220703125, 5.29541015625, 5.5281982421875, 5.760986328125, 5.9937744140625, 6.2265625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 6.0, 16.0, 16.0, 36.0, 51.0, 81.0, 115.0, 171.0, 160.0, 112.0, 82.0, 58.0, 41.0, 12.0, 17.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.3588562011719, -272.6461181640625, -264.93341064453125, -257.2206726074219, -249.5079345703125, -241.7952117919922, -234.0824737548828, -226.3697509765625, -218.65701293945312, -210.9442901611328, -203.23155212402344, -195.51882934570312, -187.80609130859375, -180.09336853027344, -172.38063049316406, -164.66790771484375, -156.95516967773438, -149.24244689941406, -141.5297088623047, -133.81698608398438, -126.104248046875, -118.39152526855469, -110.67878723144531, -102.966064453125, -95.25334167480469, -87.54061126708984, -79.827880859375, -72.11515045166016, -64.40242004394531, -56.689693450927734, -48.97696304321289, -41.26423263549805, -33.55149841308594, -25.838768005371094, -18.12603759765625, -10.413309097290039, -2.7005786895751953, 5.012149810791016, 12.72488021850586, 20.437610626220703, 28.150341033935547, 35.86307144165039, 43.575801849365234, 51.28852844238281, 59.001258850097656, 66.7139892578125, 74.42671966552734, 82.13945007324219, 89.85218048095703, 97.56491088867188, 105.27764129638672, 112.99037170410156, 120.7031021118164, 128.41583251953125, 136.12855529785156, 143.84129333496094, 151.55401611328125, 159.26673889160156, 166.97947692871094, 174.69219970703125, 182.40493774414062, 190.11766052246094, 197.8303985595703, 205.54312133789062, 213.255859375]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 12.0, 7.0, 9.0, 12.0, 16.0, 21.0, 23.0, 27.0, 41.0, 33.0, 42.0, 47.0, 52.0, 49.0, 61.0, 60.0, 55.0, 56.0, 47.0, 47.0, 38.0, 34.0, 43.0, 26.0, 24.0, 19.0, 17.0, 23.0, 10.0, 5.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.3222198486328, -148.1531982421875, -142.98419189453125, -137.81517028808594, -132.6461639404297, -127.47714233398438, -122.3081283569336, -117.13911437988281, -111.97010040283203, -106.80108642578125, -101.63207244873047, -96.46305847167969, -91.29403686523438, -86.12503051757812, -80.95600891113281, -75.78699493408203, -70.61798095703125, -65.44896697998047, -60.27995300292969, -55.11093521118164, -49.94192123413086, -44.77290725708008, -39.60388946533203, -34.43487548828125, -29.26586151123047, -24.096847534179688, -18.927831649780273, -13.758816719055176, -8.589801788330078, -3.420787811279297, 1.7482280731201172, 6.917243957519531, 12.08624267578125, 17.25525665283203, 22.424272537231445, 27.59328842163086, 32.76230239868164, 37.93131637573242, 43.10033416748047, 48.26934814453125, 53.43836212158203, 58.60737609863281, 63.776390075683594, 68.94540405273438, 74.11442565917969, 79.28343200683594, 84.45245361328125, 89.62146759033203, 94.79048156738281, 99.9594955444336, 105.12850952148438, 110.29752349853516, 115.46653747558594, 120.63555908203125, 125.80457305908203, 130.9735870361328, 136.14260864257812, 141.31163024902344, 146.4806365966797, 151.649658203125, 156.81866455078125, 161.98768615722656, 167.1566925048828, 172.32571411132812, 177.49472045898438]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 2.0, 1.0, 5.0, 7.0, 12.0, 8.0, 20.0, 25.0, 47.0, 65.0, 78.0, 107.0, 176.0, 257.0, 384.0, 589.0, 937.0, 1598.0, 2726.0, 4856.0, 9444.0, 20445.0, 52049.0, 196381.0, 2520412.0, 1181906.0, 127138.0, 39450.0, 16281.0, 8061.0, 4290.0, 2384.0, 1441.0, 925.0, 586.0, 344.0, 249.0, 185.0, 108.0, 77.0, 74.0, 37.0, 28.0, 23.0, 12.0, 13.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0], "bins": [-14.578125, -14.090087890625, -13.60205078125, -13.114013671875, -12.6259765625, -12.137939453125, -11.64990234375, -11.161865234375, -10.673828125, -10.185791015625, -9.69775390625, -9.209716796875, -8.7216796875, -8.233642578125, -7.74560546875, -7.257568359375, -6.76953125, -6.281494140625, -5.79345703125, -5.305419921875, -4.8173828125, -4.329345703125, -3.84130859375, -3.353271484375, -2.865234375, -2.377197265625, -1.88916015625, -1.401123046875, -0.9130859375, -0.425048828125, 0.06298828125, 0.551025390625, 1.0390625, 1.527099609375, 2.01513671875, 2.503173828125, 2.9912109375, 3.479248046875, 3.96728515625, 4.455322265625, 4.943359375, 5.431396484375, 5.91943359375, 6.407470703125, 6.8955078125, 7.383544921875, 7.87158203125, 8.359619140625, 8.84765625, 9.335693359375, 9.82373046875, 10.311767578125, 10.7998046875, 11.287841796875, 11.77587890625, 12.263916015625, 12.751953125, 13.239990234375, 13.72802734375, 14.216064453125, 14.7041015625, 15.192138671875, 15.68017578125, 16.168212890625, 16.65625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 9.0, 15.0, 17.0, 19.0, 22.0, 34.0, 41.0, 43.0, 42.0, 63.0, 54.0, 59.0, 63.0, 61.0, 56.0, 80.0, 47.0, 40.0, 39.0, 32.0, 30.0, 18.0, 20.0, 22.0, 16.0, 7.0, 11.0, 8.0, 7.0, 11.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.54345703125, -8.2431640625, -7.94287109375, -7.642578125, -7.34228515625, -7.0419921875, -6.74169921875, -6.44140625, -6.14111328125, -5.8408203125, -5.54052734375, -5.240234375, -4.93994140625, -4.6396484375, -4.33935546875, -4.0390625, -3.73876953125, -3.4384765625, -3.13818359375, -2.837890625, -2.53759765625, -2.2373046875, -1.93701171875, -1.63671875, -1.33642578125, -1.0361328125, -0.73583984375, -0.435546875, -0.13525390625, 0.1650390625, 0.46533203125, 0.765625, 1.06591796875, 1.3662109375, 1.66650390625, 1.966796875, 2.26708984375, 2.5673828125, 2.86767578125, 3.16796875, 3.46826171875, 3.7685546875, 4.06884765625, 4.369140625, 4.66943359375, 4.9697265625, 5.27001953125, 5.5703125, 5.87060546875, 6.1708984375, 6.47119140625, 6.771484375, 7.07177734375, 7.3720703125, 7.67236328125, 7.97265625, 8.27294921875, 8.5732421875, 8.87353515625, 9.173828125, 9.47412109375, 9.7744140625, 10.07470703125, 10.375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 11.0, 7.0, 2.0, 9.0, 10.0, 15.0, 18.0, 28.0, 37.0, 69.0, 105.0, 230.0, 531.0, 1354.0, 4354.0, 16588.0, 90127.0, 3301631.0, 715300.0, 48815.0, 10239.0, 2953.0, 1005.0, 408.0, 179.0, 93.0, 61.0, 40.0, 23.0, 8.0, 8.0, 8.0, 6.0, 1.0, 3.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.90625, -36.8486328125, -35.791015625, -34.7333984375, -33.67578125, -32.6181640625, -31.560546875, -30.5029296875, -29.4453125, -28.3876953125, -27.330078125, -26.2724609375, -25.21484375, -24.1572265625, -23.099609375, -22.0419921875, -20.984375, -19.9267578125, -18.869140625, -17.8115234375, -16.75390625, -15.6962890625, -14.638671875, -13.5810546875, -12.5234375, -11.4658203125, -10.408203125, -9.3505859375, -8.29296875, -7.2353515625, -6.177734375, -5.1201171875, -4.0625, -3.0048828125, -1.947265625, -0.8896484375, 0.16796875, 1.2255859375, 2.283203125, 3.3408203125, 4.3984375, 5.4560546875, 6.513671875, 7.5712890625, 8.62890625, 9.6865234375, 10.744140625, 11.8017578125, 12.859375, 13.9169921875, 14.974609375, 16.0322265625, 17.08984375, 18.1474609375, 19.205078125, 20.2626953125, 21.3203125, 22.3779296875, 23.435546875, 24.4931640625, 25.55078125, 26.6083984375, 27.666015625, 28.7236328125, 29.78125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 15.0, 13.0, 27.0, 16.0, 30.0, 46.0, 53.0, 91.0, 139.0, 242.0, 466.0, 1067.0, 939.0, 370.0, 186.0, 89.0, 67.0, 58.0, 31.0, 22.0, 17.0, 15.0, 7.0, 4.0, 7.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.421875, -20.67822265625, -19.9345703125, -19.19091796875, -18.447265625, -17.70361328125, -16.9599609375, -16.21630859375, -15.47265625, -14.72900390625, -13.9853515625, -13.24169921875, -12.498046875, -11.75439453125, -11.0107421875, -10.26708984375, -9.5234375, -8.77978515625, -8.0361328125, -7.29248046875, -6.548828125, -5.80517578125, -5.0615234375, -4.31787109375, -3.57421875, -2.83056640625, -2.0869140625, -1.34326171875, -0.599609375, 0.14404296875, 0.8876953125, 1.63134765625, 2.375, 3.11865234375, 3.8623046875, 4.60595703125, 5.349609375, 6.09326171875, 6.8369140625, 7.58056640625, 8.32421875, 9.06787109375, 9.8115234375, 10.55517578125, 11.298828125, 12.04248046875, 12.7861328125, 13.52978515625, 14.2734375, 15.01708984375, 15.7607421875, 16.50439453125, 17.248046875, 17.99169921875, 18.7353515625, 19.47900390625, 20.22265625, 20.96630859375, 21.7099609375, 22.45361328125, 23.197265625, 23.94091796875, 24.6845703125, 25.42822265625, 26.171875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 13.0, 12.0, 16.0, 31.0, 57.0, 85.0, 133.0, 158.0, 141.0, 111.0, 86.0, 65.0, 33.0, 15.0, 13.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-219.05348205566406, -213.0821075439453, -207.11073303222656, -201.1393585205078, -195.16798400878906, -189.1966094970703, -183.22525024414062, -177.25387573242188, -171.28250122070312, -165.31112670898438, -159.33975219726562, -153.36837768554688, -147.39700317382812, -141.42562866210938, -135.45425415039062, -129.48287963867188, -123.51150512695312, -117.54013061523438, -111.56875610351562, -105.59738159179688, -99.62600708007812, -93.65463256835938, -87.68326568603516, -81.7118911743164, -75.74051666259766, -69.7691421508789, -63.797767639160156, -57.82639694213867, -51.85502243041992, -45.88364791870117, -39.91227722167969, -33.94090270996094, -27.96954345703125, -21.9981689453125, -16.026796340942383, -10.055423736572266, -4.084049224853516, 1.8873252868652344, 7.858695983886719, 13.830070495605469, 19.80144500732422, 25.77281951904297, 31.744192123413086, 37.7155647277832, 43.68693923950195, 49.6583137512207, 55.62968444824219, 61.60105895996094, 67.57243347167969, 73.54380798339844, 79.51518249511719, 85.48655700683594, 91.45793151855469, 97.42930603027344, 103.40067291259766, 109.3720474243164, 115.34342193603516, 121.3147964477539, 127.28617095947266, 133.25753784179688, 139.22891235351562, 145.20028686523438, 151.17166137695312, 157.14303588867188, 163.11441040039062]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 1.0, 7.0, 6.0, 12.0, 12.0, 7.0, 10.0, 8.0, 13.0, 20.0, 22.0, 22.0, 19.0, 26.0, 26.0, 37.0, 29.0, 27.0, 37.0, 45.0, 39.0, 34.0, 59.0, 36.0, 43.0, 50.0, 37.0, 27.0, 34.0, 33.0, 30.0, 41.0, 23.0, 19.0, 14.0, 22.0, 17.0, 7.0, 11.0, 8.0, 9.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-108.81504821777344, -105.65342712402344, -102.49180603027344, -99.33018493652344, -96.16856384277344, -93.00694274902344, -89.84532165527344, -86.68370056152344, -83.52207946777344, -80.36045837402344, -77.19883728027344, -74.03721618652344, -70.87559509277344, -67.71397399902344, -64.55235290527344, -61.3907356262207, -58.22911834716797, -55.06749725341797, -51.90587615966797, -48.74425506591797, -45.58263397216797, -42.42101287841797, -39.259395599365234, -36.097774505615234, -32.936153411865234, -29.774532318115234, -26.612911224365234, -23.451292037963867, -20.289670944213867, -17.128049850463867, -13.9664306640625, -10.8048095703125, -7.6431884765625, -4.481567859649658, -1.3199472427368164, 1.8416728973388672, 5.003293991088867, 8.164915084838867, 11.326534271240234, 14.488155364990234, 17.649776458740234, 20.811397552490234, 23.973018646240234, 27.1346378326416, 30.2962589263916, 33.45787811279297, 36.61949920654297, 39.78112030029297, 42.94274139404297, 46.10436248779297, 49.26598358154297, 52.42760467529297, 55.58922576904297, 58.75084686279297, 61.9124641418457, 65.07408142089844, 68.23570251464844, 71.39732360839844, 74.55894470214844, 77.72056579589844, 80.88218688964844, 84.04380798339844, 87.20542907714844, 90.36705017089844, 93.52867126464844]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 4.0, 4.0, 11.0, 16.0, 18.0, 26.0, 32.0, 67.0, 86.0, 150.0, 165.0, 301.0, 445.0, 751.0, 1314.0, 2146.0, 4021.0, 7452.0, 15138.0, 32380.0, 73710.0, 184594.0, 367034.0, 206987.0, 81564.0, 35539.0, 16564.0, 7943.0, 4299.0, 2284.0, 1366.0, 723.0, 482.0, 293.0, 209.0, 160.0, 89.0, 55.0, 39.0, 25.0, 23.0, 15.0, 10.0, 10.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-16.203125, -15.7054443359375, -15.207763671875, -14.7100830078125, -14.21240234375, -13.7147216796875, -13.217041015625, -12.7193603515625, -12.2216796875, -11.7239990234375, -11.226318359375, -10.7286376953125, -10.23095703125, -9.7332763671875, -9.235595703125, -8.7379150390625, -8.240234375, -7.7425537109375, -7.244873046875, -6.7471923828125, -6.24951171875, -5.7518310546875, -5.254150390625, -4.7564697265625, -4.2587890625, -3.7611083984375, -3.263427734375, -2.7657470703125, -2.26806640625, -1.7703857421875, -1.272705078125, -0.7750244140625, -0.27734375, 0.2203369140625, 0.718017578125, 1.2156982421875, 1.71337890625, 2.2110595703125, 2.708740234375, 3.2064208984375, 3.7041015625, 4.2017822265625, 4.699462890625, 5.1971435546875, 5.69482421875, 6.1925048828125, 6.690185546875, 7.1878662109375, 7.685546875, 8.1832275390625, 8.680908203125, 9.1785888671875, 9.67626953125, 10.1739501953125, 10.671630859375, 11.1693115234375, 11.6669921875, 12.1646728515625, 12.662353515625, 13.1600341796875, 13.65771484375, 14.1553955078125, 14.653076171875, 15.1507568359375, 15.6484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 8.0, 12.0, 12.0, 16.0, 14.0, 23.0, 24.0, 28.0, 40.0, 40.0, 41.0, 49.0, 47.0, 51.0, 66.0, 53.0, 51.0, 56.0, 50.0, 51.0, 39.0, 35.0, 27.0, 28.0, 19.0, 25.0, 20.0, 16.0, 12.0, 6.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-9.109375, -8.8382568359375, -8.567138671875, -8.2960205078125, -8.02490234375, -7.7537841796875, -7.482666015625, -7.2115478515625, -6.9404296875, -6.6693115234375, -6.398193359375, -6.1270751953125, -5.85595703125, -5.5848388671875, -5.313720703125, -5.0426025390625, -4.771484375, -4.5003662109375, -4.229248046875, -3.9581298828125, -3.68701171875, -3.4158935546875, -3.144775390625, -2.8736572265625, -2.6025390625, -2.3314208984375, -2.060302734375, -1.7891845703125, -1.51806640625, -1.2469482421875, -0.975830078125, -0.7047119140625, -0.43359375, -0.1624755859375, 0.108642578125, 0.3797607421875, 0.65087890625, 0.9219970703125, 1.193115234375, 1.4642333984375, 1.7353515625, 2.0064697265625, 2.277587890625, 2.5487060546875, 2.81982421875, 3.0909423828125, 3.362060546875, 3.6331787109375, 3.904296875, 4.1754150390625, 4.446533203125, 4.7176513671875, 4.98876953125, 5.2598876953125, 5.531005859375, 5.8021240234375, 6.0732421875, 6.3443603515625, 6.615478515625, 6.8865966796875, 7.15771484375, 7.4288330078125, 7.699951171875, 7.9710693359375, 8.2421875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 11.0, 14.0, 15.0, 23.0, 35.0, 30.0, 53.0, 83.0, 140.0, 172.0, 333.0, 598.0, 1194.0, 2932.0, 10921.0, 96354.0, 802552.0, 114608.0, 12558.0, 3100.0, 1266.0, 598.0, 321.0, 206.0, 131.0, 77.0, 65.0, 43.0, 26.0, 20.0, 12.0, 14.0, 9.0, 5.0, 7.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.71875, -41.44482421875, -40.1708984375, -38.89697265625, -37.623046875, -36.34912109375, -35.0751953125, -33.80126953125, -32.52734375, -31.25341796875, -29.9794921875, -28.70556640625, -27.431640625, -26.15771484375, -24.8837890625, -23.60986328125, -22.3359375, -21.06201171875, -19.7880859375, -18.51416015625, -17.240234375, -15.96630859375, -14.6923828125, -13.41845703125, -12.14453125, -10.87060546875, -9.5966796875, -8.32275390625, -7.048828125, -5.77490234375, -4.5009765625, -3.22705078125, -1.953125, -0.67919921875, 0.5947265625, 1.86865234375, 3.142578125, 4.41650390625, 5.6904296875, 6.96435546875, 8.23828125, 9.51220703125, 10.7861328125, 12.06005859375, 13.333984375, 14.60791015625, 15.8818359375, 17.15576171875, 18.4296875, 19.70361328125, 20.9775390625, 22.25146484375, 23.525390625, 24.79931640625, 26.0732421875, 27.34716796875, 28.62109375, 29.89501953125, 31.1689453125, 32.44287109375, 33.716796875, 34.99072265625, 36.2646484375, 37.53857421875, 38.8125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 4.0, 5.0, 12.0, 10.0, 10.0, 6.0, 17.0, 17.0, 16.0, 12.0, 20.0, 18.0, 33.0, 36.0, 25.0, 42.0, 34.0, 42.0, 41.0, 47.0, 46.0, 39.0, 46.0, 40.0, 32.0, 45.0, 35.0, 32.0, 33.0, 35.0, 34.0, 24.0, 20.0, 12.0, 12.0, 12.0, 15.0, 12.0, 8.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.301025390625, -25.36767578125, -24.434326171875, -23.5009765625, -22.567626953125, -21.63427734375, -20.700927734375, -19.767578125, -18.834228515625, -17.90087890625, -16.967529296875, -16.0341796875, -15.100830078125, -14.16748046875, -13.234130859375, -12.30078125, -11.367431640625, -10.43408203125, -9.500732421875, -8.5673828125, -7.634033203125, -6.70068359375, -5.767333984375, -4.833984375, -3.900634765625, -2.96728515625, -2.033935546875, -1.1005859375, -0.167236328125, 0.76611328125, 1.699462890625, 2.6328125, 3.566162109375, 4.49951171875, 5.432861328125, 6.3662109375, 7.299560546875, 8.23291015625, 9.166259765625, 10.099609375, 11.032958984375, 11.96630859375, 12.899658203125, 13.8330078125, 14.766357421875, 15.69970703125, 16.633056640625, 17.56640625, 18.499755859375, 19.43310546875, 20.366455078125, 21.2998046875, 22.233154296875, 23.16650390625, 24.099853515625, 25.033203125, 25.966552734375, 26.89990234375, 27.833251953125, 28.7666015625, 29.699951171875, 30.63330078125, 31.566650390625, 32.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 1.0, 2.0, 10.0, 4.0, 6.0, 8.0, 18.0, 12.0, 19.0, 29.0, 41.0, 52.0, 80.0, 118.0, 204.0, 364.0, 631.0, 1549.0, 5417.0, 31933.0, 479482.0, 487629.0, 32271.0, 5562.0, 1541.0, 637.0, 330.0, 198.0, 105.0, 78.0, 53.0, 46.0, 25.0, 27.0, 29.0, 10.0, 12.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.148193359375, -12.69482421875, -12.241455078125, -11.7880859375, -11.334716796875, -10.88134765625, -10.427978515625, -9.974609375, -9.521240234375, -9.06787109375, -8.614501953125, -8.1611328125, -7.707763671875, -7.25439453125, -6.801025390625, -6.34765625, -5.894287109375, -5.44091796875, -4.987548828125, -4.5341796875, -4.080810546875, -3.62744140625, -3.174072265625, -2.720703125, -2.267333984375, -1.81396484375, -1.360595703125, -0.9072265625, -0.453857421875, -0.00048828125, 0.452880859375, 0.90625, 1.359619140625, 1.81298828125, 2.266357421875, 2.7197265625, 3.173095703125, 3.62646484375, 4.079833984375, 4.533203125, 4.986572265625, 5.43994140625, 5.893310546875, 6.3466796875, 6.800048828125, 7.25341796875, 7.706787109375, 8.16015625, 8.613525390625, 9.06689453125, 9.520263671875, 9.9736328125, 10.427001953125, 10.88037109375, 11.333740234375, 11.787109375, 12.240478515625, 12.69384765625, 13.147216796875, 13.6005859375, 14.053955078125, 14.50732421875, 14.960693359375, 15.4140625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 8.0, 10.0, 11.0, 10.0, 18.0, 28.0, 33.0, 35.0, 53.0, 57.0, 82.0, 98.0, 100.0, 100.0, 77.0, 60.0, 45.0, 34.0, 24.0, 24.0, 13.0, 9.0, 10.0, 11.0, 3.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016164779663085938, -0.0015556365251541138, -0.0014947950839996338, -0.0014339536428451538, -0.0013731122016906738, -0.0013122707605361938, -0.0012514293193817139, -0.0011905878782272339, -0.001129746437072754, -0.001068904995918274, -0.001008063554763794, -0.000947222113609314, -0.000886380672454834, -0.000825539231300354, -0.000764697790145874, -0.000703856348991394, -0.0006430149078369141, -0.0005821734666824341, -0.0005213320255279541, -0.0004604905843734741, -0.00039964914321899414, -0.00033880770206451416, -0.0002779662609100342, -0.0002171248197555542, -0.00015628337860107422, -9.544193744659424e-05, -3.460049629211426e-05, 2.6240944862365723e-05, 8.70823860168457e-05, 0.00014792382717132568, 0.00020876526832580566, 0.00026960670948028564, 0.0003304481506347656, 0.0003912895917892456, 0.0004521310329437256, 0.0005129724740982056, 0.0005738139152526855, 0.0006346553564071655, 0.0006954967975616455, 0.0007563382387161255, 0.0008171796798706055, 0.0008780211210250854, 0.0009388625621795654, 0.0009997040033340454, 0.0010605454444885254, 0.0011213868856430054, 0.0011822283267974854, 0.0012430697679519653, 0.0013039112091064453, 0.0013647526502609253, 0.0014255940914154053, 0.0014864355325698853, 0.0015472769737243652, 0.0016081184148788452, 0.0016689598560333252, 0.0017298012971878052, 0.0017906427383422852, 0.0018514841794967651, 0.0019123256206512451, 0.001973167061805725, 0.002034008502960205, 0.002094849944114685, 0.002155691385269165, 0.002216532826423645, 0.002277374267578125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 13.0, 23.0, 33.0, 55.0, 111.0, 184.0, 392.0, 916.0, 2591.0, 13173.0, 231167.0, 761926.0, 31165.0, 4480.0, 1275.0, 482.0, 252.0, 124.0, 71.0, 42.0, 27.0, 19.0, 8.0, 9.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.828125, -21.17041015625, -20.5126953125, -19.85498046875, -19.197265625, -18.53955078125, -17.8818359375, -17.22412109375, -16.56640625, -15.90869140625, -15.2509765625, -14.59326171875, -13.935546875, -13.27783203125, -12.6201171875, -11.96240234375, -11.3046875, -10.64697265625, -9.9892578125, -9.33154296875, -8.673828125, -8.01611328125, -7.3583984375, -6.70068359375, -6.04296875, -5.38525390625, -4.7275390625, -4.06982421875, -3.412109375, -2.75439453125, -2.0966796875, -1.43896484375, -0.78125, -0.12353515625, 0.5341796875, 1.19189453125, 1.849609375, 2.50732421875, 3.1650390625, 3.82275390625, 4.48046875, 5.13818359375, 5.7958984375, 6.45361328125, 7.111328125, 7.76904296875, 8.4267578125, 9.08447265625, 9.7421875, 10.39990234375, 11.0576171875, 11.71533203125, 12.373046875, 13.03076171875, 13.6884765625, 14.34619140625, 15.00390625, 15.66162109375, 16.3193359375, 16.97705078125, 17.634765625, 18.29248046875, 18.9501953125, 19.60791015625, 20.265625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 3.0, 9.0, 13.0, 13.0, 24.0, 28.0, 27.0, 39.0, 58.0, 78.0, 59.0, 65.0, 82.0, 90.0, 78.0, 72.0, 56.0, 51.0, 26.0, 26.0, 25.0, 9.0, 10.0, 6.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.3770751953125, -11.027587890625, -10.6781005859375, -10.32861328125, -9.9791259765625, -9.629638671875, -9.2801513671875, -8.9306640625, -8.5811767578125, -8.231689453125, -7.8822021484375, -7.53271484375, -7.1832275390625, -6.833740234375, -6.4842529296875, -6.134765625, -5.7852783203125, -5.435791015625, -5.0863037109375, -4.73681640625, -4.3873291015625, -4.037841796875, -3.6883544921875, -3.3388671875, -2.9893798828125, -2.639892578125, -2.2904052734375, -1.94091796875, -1.5914306640625, -1.241943359375, -0.8924560546875, -0.54296875, -0.1934814453125, 0.156005859375, 0.5054931640625, 0.85498046875, 1.2044677734375, 1.553955078125, 1.9034423828125, 2.2529296875, 2.6024169921875, 2.951904296875, 3.3013916015625, 3.65087890625, 4.0003662109375, 4.349853515625, 4.6993408203125, 5.048828125, 5.3983154296875, 5.747802734375, 6.0972900390625, 6.44677734375, 6.7962646484375, 7.145751953125, 7.4952392578125, 7.8447265625, 8.1942138671875, 8.543701171875, 8.8931884765625, 9.24267578125, 9.5921630859375, 9.941650390625, 10.2911376953125, 10.640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 10.0, 6.0, 36.0, 131.0, 400.0, 291.0, 103.0, 23.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-543.4518432617188, -527.4437255859375, -511.43560791015625, -495.427490234375, -479.41937255859375, -463.4112548828125, -447.40313720703125, -431.39501953125, -415.38690185546875, -399.3787841796875, -383.37066650390625, -367.362548828125, -351.35443115234375, -335.3463134765625, -319.33819580078125, -303.330078125, -287.3219909667969, -271.3138732910156, -255.30575561523438, -239.29763793945312, -223.28952026367188, -207.28140258789062, -191.27330017089844, -175.2651824951172, -159.25706481933594, -143.2489471435547, -127.24082946777344, -111.23271942138672, -95.22460174560547, -79.21648406982422, -63.2083740234375, -47.20025634765625, -31.192169189453125, -15.184053421020508, 0.8240623474121094, 16.832176208496094, 32.840293884277344, 48.848411560058594, 64.85652160644531, 80.86463928222656, 96.87275695800781, 112.88087463378906, 128.8889923095703, 144.8970947265625, 160.90521240234375, 176.913330078125, 192.92144775390625, 208.9295654296875, 224.93768310546875, 240.94580078125, 256.95391845703125, 272.9620361328125, 288.97015380859375, 304.978271484375, 320.98638916015625, 336.9945068359375, 353.00262451171875, 369.0107421875, 385.01885986328125, 401.0269775390625, 417.03509521484375, 433.043212890625, 449.05133056640625, 465.0594482421875, 481.0675354003906]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 5.0, 9.0, 8.0, 10.0, 14.0, 12.0, 21.0, 24.0, 31.0, 34.0, 34.0, 37.0, 61.0, 66.0, 73.0, 43.0, 62.0, 76.0, 60.0, 48.0, 39.0, 37.0, 28.0, 28.0, 34.0, 15.0, 14.0, 19.0, 9.0, 10.0, 5.0, 5.0, 6.0, 7.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0], "bins": [-161.8929443359375, -157.3733367919922, -152.8537139892578, -148.3341064453125, -143.8144989013672, -139.29489135742188, -134.7752685546875, -130.2556610107422, -125.73605346679688, -121.21643829345703, -116.69683074951172, -112.17721557617188, -107.65760803222656, -103.13799285888672, -98.61837768554688, -94.09877014160156, -89.57915496826172, -85.05953979492188, -80.53993225097656, -76.02031707763672, -71.5007095336914, -66.98109436035156, -62.461483001708984, -57.941871643066406, -53.42226028442383, -48.90264892578125, -44.38303756713867, -39.863426208496094, -35.34381103515625, -30.824201583862305, -26.304588317871094, -21.784976959228516, -17.265357971191406, -12.745746612548828, -8.226134300231934, -3.706521987915039, 0.8130893707275391, 5.332700729370117, 9.852313995361328, 14.371925354003906, 18.891536712646484, 23.411148071289062, 27.93075942993164, 32.45037078857422, 36.96998596191406, 41.489593505859375, 46.00920867919922, 50.5288200378418, 55.048431396484375, 59.56804275512695, 64.08765411376953, 68.60726928710938, 73.12687683105469, 77.64649200439453, 82.16610717773438, 86.68571472167969, 91.205322265625, 95.72493743896484, 100.24454498291016, 104.76416015625, 109.28376770019531, 113.80338287353516, 118.322998046875, 122.84260559082031, 127.36222076416016]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 3.0, 4.0, 17.0, 12.0, 17.0, 18.0, 19.0, 33.0, 52.0, 62.0, 55.0, 113.0, 145.0, 267.0, 1021.0, 12554.0, 4068233.0, 107501.0, 2971.0, 497.0, 208.0, 135.0, 101.0, 56.0, 45.0, 45.0, 26.0, 24.0, 10.0, 14.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.875, -51.6064453125, -49.337890625, -47.0693359375, -44.80078125, -42.5322265625, -40.263671875, -37.9951171875, -35.7265625, -33.4580078125, -31.189453125, -28.9208984375, -26.65234375, -24.3837890625, -22.115234375, -19.8466796875, -17.578125, -15.3095703125, -13.041015625, -10.7724609375, -8.50390625, -6.2353515625, -3.966796875, -1.6982421875, 0.5703125, 2.8388671875, 5.107421875, 7.3759765625, 9.64453125, 11.9130859375, 14.181640625, 16.4501953125, 18.71875, 20.9873046875, 23.255859375, 25.5244140625, 27.79296875, 30.0615234375, 32.330078125, 34.5986328125, 36.8671875, 39.1357421875, 41.404296875, 43.6728515625, 45.94140625, 48.2099609375, 50.478515625, 52.7470703125, 55.015625, 57.2841796875, 59.552734375, 61.8212890625, 64.08984375, 66.3583984375, 68.626953125, 70.8955078125, 73.1640625, 75.4326171875, 77.701171875, 79.9697265625, 82.23828125, 84.5068359375, 86.775390625, 89.0439453125, 91.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 8.0, 12.0, 13.0, 9.0, 26.0, 20.0, 25.0, 30.0, 27.0, 44.0, 45.0, 50.0, 52.0, 56.0, 58.0, 60.0, 71.0, 58.0, 43.0, 45.0, 37.0, 31.0, 36.0, 24.0, 22.0, 20.0, 17.0, 12.0, 9.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.3515625, -9.077392578125, -8.80322265625, -8.529052734375, -8.2548828125, -7.980712890625, -7.70654296875, -7.432373046875, -7.158203125, -6.884033203125, -6.60986328125, -6.335693359375, -6.0615234375, -5.787353515625, -5.51318359375, -5.239013671875, -4.96484375, -4.690673828125, -4.41650390625, -4.142333984375, -3.8681640625, -3.593994140625, -3.31982421875, -3.045654296875, -2.771484375, -2.497314453125, -2.22314453125, -1.948974609375, -1.6748046875, -1.400634765625, -1.12646484375, -0.852294921875, -0.578125, -0.303955078125, -0.02978515625, 0.244384765625, 0.5185546875, 0.792724609375, 1.06689453125, 1.341064453125, 1.615234375, 1.889404296875, 2.16357421875, 2.437744140625, 2.7119140625, 2.986083984375, 3.26025390625, 3.534423828125, 3.80859375, 4.082763671875, 4.35693359375, 4.631103515625, 4.9052734375, 5.179443359375, 5.45361328125, 5.727783203125, 6.001953125, 6.276123046875, 6.55029296875, 6.824462890625, 7.0986328125, 7.372802734375, 7.64697265625, 7.921142578125, 8.1953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 13.0, 13.0, 14.0, 30.0, 51.0, 81.0, 141.0, 263.0, 490.0, 978.0, 2053.0, 4481.0, 11799.0, 35620.0, 195551.0, 3413345.0, 448455.0, 53433.0, 16169.0, 6138.0, 2687.0, 1220.0, 563.0, 282.0, 169.0, 81.0, 60.0, 30.0, 10.0, 20.0, 13.0, 9.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.28125, -19.640380859375, -18.99951171875, -18.358642578125, -17.7177734375, -17.076904296875, -16.43603515625, -15.795166015625, -15.154296875, -14.513427734375, -13.87255859375, -13.231689453125, -12.5908203125, -11.949951171875, -11.30908203125, -10.668212890625, -10.02734375, -9.386474609375, -8.74560546875, -8.104736328125, -7.4638671875, -6.822998046875, -6.18212890625, -5.541259765625, -4.900390625, -4.259521484375, -3.61865234375, -2.977783203125, -2.3369140625, -1.696044921875, -1.05517578125, -0.414306640625, 0.2265625, 0.867431640625, 1.50830078125, 2.149169921875, 2.7900390625, 3.430908203125, 4.07177734375, 4.712646484375, 5.353515625, 5.994384765625, 6.63525390625, 7.276123046875, 7.9169921875, 8.557861328125, 9.19873046875, 9.839599609375, 10.48046875, 11.121337890625, 11.76220703125, 12.403076171875, 13.0439453125, 13.684814453125, 14.32568359375, 14.966552734375, 15.607421875, 16.248291015625, 16.88916015625, 17.530029296875, 18.1708984375, 18.811767578125, 19.45263671875, 20.093505859375, 20.734375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 9.0, 10.0, 11.0, 14.0, 17.0, 28.0, 40.0, 82.0, 100.0, 256.0, 633.0, 1358.0, 822.0, 319.0, 135.0, 79.0, 47.0, 25.0, 21.0, 13.0, 11.0, 16.0, 4.0, 5.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.09375, -20.358154296875, -19.62255859375, -18.886962890625, -18.1513671875, -17.415771484375, -16.68017578125, -15.944580078125, -15.208984375, -14.473388671875, -13.73779296875, -13.002197265625, -12.2666015625, -11.531005859375, -10.79541015625, -10.059814453125, -9.32421875, -8.588623046875, -7.85302734375, -7.117431640625, -6.3818359375, -5.646240234375, -4.91064453125, -4.175048828125, -3.439453125, -2.703857421875, -1.96826171875, -1.232666015625, -0.4970703125, 0.238525390625, 0.97412109375, 1.709716796875, 2.4453125, 3.180908203125, 3.91650390625, 4.652099609375, 5.3876953125, 6.123291015625, 6.85888671875, 7.594482421875, 8.330078125, 9.065673828125, 9.80126953125, 10.536865234375, 11.2724609375, 12.008056640625, 12.74365234375, 13.479248046875, 14.21484375, 14.950439453125, 15.68603515625, 16.421630859375, 17.1572265625, 17.892822265625, 18.62841796875, 19.364013671875, 20.099609375, 20.835205078125, 21.57080078125, 22.306396484375, 23.0419921875, 23.777587890625, 24.51318359375, 25.248779296875, 25.984375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 12.0, 34.0, 86.0, 207.0, 289.0, 229.0, 97.0, 26.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-227.63230895996094, -218.76780700683594, -209.90330505371094, -201.03878784179688, -192.17428588867188, -183.30978393554688, -174.44528198242188, -165.58078002929688, -156.71627807617188, -147.85177612304688, -138.98727416992188, -130.12277221679688, -121.25825500488281, -112.39375305175781, -103.52925109863281, -94.66474914550781, -85.80023193359375, -76.93572998046875, -68.07122039794922, -59.20671844482422, -50.34221267700195, -41.47770690917969, -32.61320495605469, -23.748699188232422, -14.884193420410156, -6.019688606262207, 2.844816207885742, 11.709320068359375, 20.57382583618164, 29.438331604003906, 38.302833557128906, 47.16733932495117, 56.031829833984375, 64.89633178710938, 73.7608413696289, 82.6253433227539, 91.48985290527344, 100.35435485839844, 109.21885681152344, 118.08335876464844, 126.94786834716797, 135.8123779296875, 144.6768798828125, 153.5413818359375, 162.4058837890625, 171.2703857421875, 180.1348876953125, 188.99940490722656, 197.86390686035156, 206.72840881347656, 215.59291076660156, 224.45742797851562, 233.32192993164062, 242.18643188476562, 251.05093383789062, 259.9154357910156, 268.7799377441406, 277.6444396972656, 286.5089416503906, 295.3734436035156, 304.2379455566406, 313.10247802734375, 321.96697998046875, 330.83148193359375, 339.69598388671875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 10.0, 19.0, 11.0, 17.0, 27.0, 28.0, 42.0, 31.0, 39.0, 45.0, 52.0, 48.0, 59.0, 64.0, 54.0, 57.0, 51.0, 51.0, 51.0, 37.0, 39.0, 18.0, 32.0, 25.0, 11.0, 17.0, 9.0, 16.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-96.53462219238281, -93.73416137695312, -90.9336929321289, -88.13323211669922, -85.332763671875, -82.53230285644531, -79.73184204101562, -76.9313735961914, -74.13090515136719, -71.3304443359375, -68.52997589111328, -65.7295150756836, -62.929046630859375, -60.12858581542969, -57.328121185302734, -54.52765655517578, -51.727195739746094, -48.92673110961914, -46.12626647949219, -43.3258056640625, -40.52533721923828, -37.724876403808594, -34.92441177368164, -32.12394714355469, -29.323482513427734, -26.52301788330078, -23.722553253173828, -20.922090530395508, -18.121625900268555, -15.321161270141602, -12.520698547363281, -9.720233917236328, -6.919769287109375, -4.11930513381958, -1.3188409805297852, 1.4816226959228516, 4.282087326049805, 7.082551956176758, 9.883014678955078, 12.683479309082031, 15.483943939208984, 18.284408569335938, 21.08487319946289, 23.88533592224121, 26.685800552368164, 29.486265182495117, 32.28672790527344, 35.08719253540039, 37.887657165527344, 40.6881217956543, 43.48858642578125, 46.28904724121094, 49.089515686035156, 51.889976501464844, 54.6904411315918, 57.49090576171875, 60.2913703918457, 63.091835021972656, 65.89229583740234, 68.69276428222656, 71.49322509765625, 74.29369354248047, 77.09415435791016, 79.89462280273438, 82.69508361816406]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 5.0, 5.0, 11.0, 9.0, 16.0, 27.0, 37.0, 55.0, 98.0, 99.0, 186.0, 283.0, 436.0, 716.0, 1238.0, 2174.0, 3774.0, 6970.0, 12770.0, 25306.0, 51249.0, 110601.0, 250870.0, 304961.0, 144579.0, 65053.0, 31509.0, 15984.0, 8414.0, 4647.0, 2641.0, 1449.0, 859.0, 521.0, 334.0, 239.0, 136.0, 85.0, 56.0, 52.0, 37.0, 20.0, 10.0, 9.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-14.796875, -14.3876953125, -13.978515625, -13.5693359375, -13.16015625, -12.7509765625, -12.341796875, -11.9326171875, -11.5234375, -11.1142578125, -10.705078125, -10.2958984375, -9.88671875, -9.4775390625, -9.068359375, -8.6591796875, -8.25, -7.8408203125, -7.431640625, -7.0224609375, -6.61328125, -6.2041015625, -5.794921875, -5.3857421875, -4.9765625, -4.5673828125, -4.158203125, -3.7490234375, -3.33984375, -2.9306640625, -2.521484375, -2.1123046875, -1.703125, -1.2939453125, -0.884765625, -0.4755859375, -0.06640625, 0.3427734375, 0.751953125, 1.1611328125, 1.5703125, 1.9794921875, 2.388671875, 2.7978515625, 3.20703125, 3.6162109375, 4.025390625, 4.4345703125, 4.84375, 5.2529296875, 5.662109375, 6.0712890625, 6.48046875, 6.8896484375, 7.298828125, 7.7080078125, 8.1171875, 8.5263671875, 8.935546875, 9.3447265625, 9.75390625, 10.1630859375, 10.572265625, 10.9814453125, 11.390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 6.0, 12.0, 9.0, 10.0, 17.0, 27.0, 24.0, 21.0, 38.0, 39.0, 31.0, 48.0, 50.0, 58.0, 61.0, 56.0, 57.0, 56.0, 47.0, 49.0, 49.0, 40.0, 25.0, 30.0, 24.0, 17.0, 17.0, 14.0, 12.0, 7.0, 9.0, 13.0, 3.0, 2.0, 4.0, 4.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.296875, -9.0201416015625, -8.743408203125, -8.4666748046875, -8.18994140625, -7.9132080078125, -7.636474609375, -7.3597412109375, -7.0830078125, -6.8062744140625, -6.529541015625, -6.2528076171875, -5.97607421875, -5.6993408203125, -5.422607421875, -5.1458740234375, -4.869140625, -4.5924072265625, -4.315673828125, -4.0389404296875, -3.76220703125, -3.4854736328125, -3.208740234375, -2.9320068359375, -2.6552734375, -2.3785400390625, -2.101806640625, -1.8250732421875, -1.54833984375, -1.2716064453125, -0.994873046875, -0.7181396484375, -0.44140625, -0.1646728515625, 0.112060546875, 0.3887939453125, 0.66552734375, 0.9422607421875, 1.218994140625, 1.4957275390625, 1.7724609375, 2.0491943359375, 2.325927734375, 2.6026611328125, 2.87939453125, 3.1561279296875, 3.432861328125, 3.7095947265625, 3.986328125, 4.2630615234375, 4.539794921875, 4.8165283203125, 5.09326171875, 5.3699951171875, 5.646728515625, 5.9234619140625, 6.2001953125, 6.4769287109375, 6.753662109375, 7.0303955078125, 7.30712890625, 7.5838623046875, 7.860595703125, 8.1373291015625, 8.4140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 10.0, 3.0, 4.0, 10.0, 13.0, 19.0, 26.0, 37.0, 62.0, 70.0, 112.0, 178.0, 269.0, 436.0, 820.0, 1670.0, 4147.0, 13465.0, 57637.0, 344731.0, 523689.0, 75139.0, 17012.0, 4870.0, 1938.0, 878.0, 458.0, 279.0, 187.0, 126.0, 64.0, 51.0, 51.0, 27.0, 25.0, 13.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.46533203125, -19.6494140625, -18.83349609375, -18.017578125, -17.20166015625, -16.3857421875, -15.56982421875, -14.75390625, -13.93798828125, -13.1220703125, -12.30615234375, -11.490234375, -10.67431640625, -9.8583984375, -9.04248046875, -8.2265625, -7.41064453125, -6.5947265625, -5.77880859375, -4.962890625, -4.14697265625, -3.3310546875, -2.51513671875, -1.69921875, -0.88330078125, -0.0673828125, 0.74853515625, 1.564453125, 2.38037109375, 3.1962890625, 4.01220703125, 4.828125, 5.64404296875, 6.4599609375, 7.27587890625, 8.091796875, 8.90771484375, 9.7236328125, 10.53955078125, 11.35546875, 12.17138671875, 12.9873046875, 13.80322265625, 14.619140625, 15.43505859375, 16.2509765625, 17.06689453125, 17.8828125, 18.69873046875, 19.5146484375, 20.33056640625, 21.146484375, 21.96240234375, 22.7783203125, 23.59423828125, 24.41015625, 25.22607421875, 26.0419921875, 26.85791015625, 27.673828125, 28.48974609375, 29.3056640625, 30.12158203125, 30.9375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 4.0, 3.0, 2.0, 5.0, 2.0, 11.0, 16.0, 12.0, 18.0, 18.0, 30.0, 23.0, 40.0, 34.0, 41.0, 42.0, 58.0, 53.0, 56.0, 46.0, 59.0, 48.0, 55.0, 51.0, 48.0, 43.0, 32.0, 26.0, 27.0, 14.0, 24.0, 12.0, 11.0, 7.0, 10.0, 8.0, 3.0, 2.0, 2.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.21875, -31.11669921875, -30.0146484375, -28.91259765625, -27.810546875, -26.70849609375, -25.6064453125, -24.50439453125, -23.40234375, -22.30029296875, -21.1982421875, -20.09619140625, -18.994140625, -17.89208984375, -16.7900390625, -15.68798828125, -14.5859375, -13.48388671875, -12.3818359375, -11.27978515625, -10.177734375, -9.07568359375, -7.9736328125, -6.87158203125, -5.76953125, -4.66748046875, -3.5654296875, -2.46337890625, -1.361328125, -0.25927734375, 0.8427734375, 1.94482421875, 3.046875, 4.14892578125, 5.2509765625, 6.35302734375, 7.455078125, 8.55712890625, 9.6591796875, 10.76123046875, 11.86328125, 12.96533203125, 14.0673828125, 15.16943359375, 16.271484375, 17.37353515625, 18.4755859375, 19.57763671875, 20.6796875, 21.78173828125, 22.8837890625, 23.98583984375, 25.087890625, 26.18994140625, 27.2919921875, 28.39404296875, 29.49609375, 30.59814453125, 31.7001953125, 32.80224609375, 33.904296875, 35.00634765625, 36.1083984375, 37.21044921875, 38.3125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 8.0, 10.0, 18.0, 19.0, 30.0, 42.0, 73.0, 140.0, 270.0, 598.0, 2033.0, 12132.0, 231929.0, 766416.0, 29572.0, 3605.0, 935.0, 318.0, 140.0, 76.0, 44.0, 38.0, 38.0, 12.0, 11.0, 8.0, 5.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.609375, -20.9951171875, -20.380859375, -19.7666015625, -19.15234375, -18.5380859375, -17.923828125, -17.3095703125, -16.6953125, -16.0810546875, -15.466796875, -14.8525390625, -14.23828125, -13.6240234375, -13.009765625, -12.3955078125, -11.78125, -11.1669921875, -10.552734375, -9.9384765625, -9.32421875, -8.7099609375, -8.095703125, -7.4814453125, -6.8671875, -6.2529296875, -5.638671875, -5.0244140625, -4.41015625, -3.7958984375, -3.181640625, -2.5673828125, -1.953125, -1.3388671875, -0.724609375, -0.1103515625, 0.50390625, 1.1181640625, 1.732421875, 2.3466796875, 2.9609375, 3.5751953125, 4.189453125, 4.8037109375, 5.41796875, 6.0322265625, 6.646484375, 7.2607421875, 7.875, 8.4892578125, 9.103515625, 9.7177734375, 10.33203125, 10.9462890625, 11.560546875, 12.1748046875, 12.7890625, 13.4033203125, 14.017578125, 14.6318359375, 15.24609375, 15.8603515625, 16.474609375, 17.0888671875, 17.703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 9.0, 10.0, 12.0, 8.0, 15.0, 35.0, 37.0, 44.0, 53.0, 81.0, 93.0, 119.0, 125.0, 74.0, 62.0, 42.0, 35.0, 17.0, 28.0, 9.0, 12.0, 17.0, 6.0, 5.0, 4.0, 4.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00200653076171875, -0.0019413530826568604, -0.0018761754035949707, -0.001810997724533081, -0.0017458200454711914, -0.0016806423664093018, -0.0016154646873474121, -0.0015502870082855225, -0.0014851093292236328, -0.0014199316501617432, -0.0013547539710998535, -0.0012895762920379639, -0.0012243986129760742, -0.0011592209339141846, -0.001094043254852295, -0.0010288655757904053, -0.0009636878967285156, -0.000898510217666626, -0.0008333325386047363, -0.0007681548595428467, -0.000702977180480957, -0.0006377995014190674, -0.0005726218223571777, -0.0005074441432952881, -0.00044226646423339844, -0.0003770887851715088, -0.00031191110610961914, -0.0002467334270477295, -0.00018155574798583984, -0.0001163780689239502, -5.120038986206055e-05, 1.3977289199829102e-05, 7.915496826171875e-05, 0.0001443326473236084, 0.00020951032638549805, 0.0002746880054473877, 0.00033986568450927734, 0.000405043363571167, 0.00047022104263305664, 0.0005353987216949463, 0.0006005764007568359, 0.0006657540798187256, 0.0007309317588806152, 0.0007961094379425049, 0.0008612871170043945, 0.0009264647960662842, 0.0009916424751281738, 0.0010568201541900635, 0.0011219978332519531, 0.0011871755123138428, 0.0012523531913757324, 0.001317530870437622, 0.0013827085494995117, 0.0014478862285614014, 0.001513063907623291, 0.0015782415866851807, 0.0016434192657470703, 0.00170859694480896, 0.0017737746238708496, 0.0018389523029327393, 0.001904129981994629, 0.0019693076610565186, 0.002034485340118408, 0.002099663019180298, 0.0021648406982421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 9.0, 8.0, 27.0, 40.0, 83.0, 148.0, 297.0, 647.0, 1810.0, 5744.0, 42279.0, 732097.0, 243018.0, 16765.0, 3447.0, 1143.0, 473.0, 248.0, 115.0, 51.0, 30.0, 25.0, 12.0, 9.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.625, -14.1171875, -13.609375, -13.1015625, -12.59375, -12.0859375, -11.578125, -11.0703125, -10.5625, -10.0546875, -9.546875, -9.0390625, -8.53125, -8.0234375, -7.515625, -7.0078125, -6.5, -5.9921875, -5.484375, -4.9765625, -4.46875, -3.9609375, -3.453125, -2.9453125, -2.4375, -1.9296875, -1.421875, -0.9140625, -0.40625, 0.1015625, 0.609375, 1.1171875, 1.625, 2.1328125, 2.640625, 3.1484375, 3.65625, 4.1640625, 4.671875, 5.1796875, 5.6875, 6.1953125, 6.703125, 7.2109375, 7.71875, 8.2265625, 8.734375, 9.2421875, 9.75, 10.2578125, 10.765625, 11.2734375, 11.78125, 12.2890625, 12.796875, 13.3046875, 13.8125, 14.3203125, 14.828125, 15.3359375, 15.84375, 16.3515625, 16.859375, 17.3671875, 17.875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 3.0, 2.0, 13.0, 9.0, 18.0, 14.0, 16.0, 20.0, 26.0, 47.0, 36.0, 53.0, 48.0, 56.0, 76.0, 78.0, 73.0, 68.0, 66.0, 55.0, 32.0, 31.0, 34.0, 22.0, 25.0, 12.0, 18.0, 8.0, 7.0, 5.0, 5.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.6580810546875, -7.421630859375, -7.1851806640625, -6.94873046875, -6.7122802734375, -6.475830078125, -6.2393798828125, -6.0029296875, -5.7664794921875, -5.530029296875, -5.2935791015625, -5.05712890625, -4.8206787109375, -4.584228515625, -4.3477783203125, -4.111328125, -3.8748779296875, -3.638427734375, -3.4019775390625, -3.16552734375, -2.9290771484375, -2.692626953125, -2.4561767578125, -2.2197265625, -1.9832763671875, -1.746826171875, -1.5103759765625, -1.27392578125, -1.0374755859375, -0.801025390625, -0.5645751953125, -0.328125, -0.0916748046875, 0.144775390625, 0.3812255859375, 0.61767578125, 0.8541259765625, 1.090576171875, 1.3270263671875, 1.5634765625, 1.7999267578125, 2.036376953125, 2.2728271484375, 2.50927734375, 2.7457275390625, 2.982177734375, 3.2186279296875, 3.455078125, 3.6915283203125, 3.927978515625, 4.1644287109375, 4.40087890625, 4.6373291015625, 4.873779296875, 5.1102294921875, 5.3466796875, 5.5831298828125, 5.819580078125, 6.0560302734375, 6.29248046875, 6.5289306640625, 6.765380859375, 7.0018310546875, 7.23828125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 9.0, 14.0, 20.0, 29.0, 41.0, 92.0, 93.0, 147.0, 155.0, 143.0, 91.0, 62.0, 39.0, 19.0, 16.0, 10.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-237.98324584960938, -232.77313232421875, -227.5630340576172, -222.35292053222656, -217.14280700683594, -211.93270874023438, -206.72259521484375, -201.51248168945312, -196.3023681640625, -191.09225463867188, -185.8821563720703, -180.6720428466797, -175.46192932128906, -170.2518310546875, -165.04171752929688, -159.83160400390625, -154.6215057373047, -149.41139221191406, -144.2012939453125, -138.99118041992188, -133.78106689453125, -128.57095336914062, -123.36085510253906, -118.15074157714844, -112.94063568115234, -107.73052978515625, -102.52041625976562, -97.31031036376953, -92.10020446777344, -86.89009094238281, -81.67998504638672, -76.46987915039062, -71.25975036621094, -66.04964447021484, -60.83953094482422, -55.629425048828125, -50.419315338134766, -45.209205627441406, -39.99909973144531, -34.78899002075195, -29.578880310058594, -24.368770599365234, -19.158662796020508, -13.948554039001465, -8.738445281982422, -3.5283355712890625, 1.681772232055664, 6.891880035400391, 12.10198974609375, 17.31209945678711, 22.522207260131836, 27.732315063476562, 32.94242477416992, 38.15253448486328, 43.362640380859375, 48.572750091552734, 53.782859802246094, 58.99296951293945, 64.20307922363281, 69.4131851196289, 74.623291015625, 79.83340454101562, 85.04351043701172, 90.25361633300781, 95.46372985839844]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 14.0, 13.0, 17.0, 15.0, 25.0, 37.0, 34.0, 50.0, 59.0, 61.0, 70.0, 102.0, 96.0, 53.0, 63.0, 52.0, 45.0, 29.0, 44.0, 24.0, 23.0, 19.0, 22.0, 7.0, 8.0, 1.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.56808471679688, -139.45872497558594, -133.349365234375, -127.2400131225586, -121.13065338134766, -115.02129364013672, -108.91194152832031, -102.80258178710938, -96.69322204589844, -90.5838623046875, -84.47450256347656, -78.36515045166016, -72.25579071044922, -66.14643096923828, -60.03707504272461, -53.92771911621094, -47.818359375, -41.70899963378906, -35.59964370727539, -29.490285873413086, -23.38092803955078, -17.271570205688477, -11.162212371826172, -5.0528564453125, 1.0565032958984375, 7.165861129760742, 13.275218963623047, 19.38457679748535, 25.493934631347656, 31.60329246520996, 37.712650299072266, 43.82200622558594, 49.93138122558594, 56.040740966796875, 62.15009689331055, 68.25945281982422, 74.36881256103516, 80.4781723022461, 86.5875244140625, 92.69688415527344, 98.80624389648438, 104.91560363769531, 111.02496337890625, 117.13431549072266, 123.2436752319336, 129.35302734375, 135.46238708496094, 141.57174682617188, 147.6811065673828, 153.79046630859375, 159.8998260498047, 166.00918579101562, 172.1185302734375, 178.22789001464844, 184.33724975585938, 190.4466094970703, 196.55596923828125, 202.6653289794922, 208.77468872070312, 214.88404846191406, 220.993408203125, 227.10275268554688, 233.2121124267578, 239.32147216796875, 245.4308319091797]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 16.0, 25.0, 31.0, 59.0, 92.0, 124.0, 169.0, 379.0, 657.0, 1376.0, 2914.0, 6937.0, 18754.0, 75751.0, 796619.0, 2960958.0, 269440.0, 39960.0, 11370.0, 4353.0, 1911.0, 958.0, 503.0, 287.0, 174.0, 140.0, 83.0, 61.0, 36.0, 23.0, 22.0, 14.0, 16.0, 12.0, 9.0, 5.0, 7.0, 4.0, 0.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.53125, -12.99658203125, -12.4619140625, -11.92724609375, -11.392578125, -10.85791015625, -10.3232421875, -9.78857421875, -9.25390625, -8.71923828125, -8.1845703125, -7.64990234375, -7.115234375, -6.58056640625, -6.0458984375, -5.51123046875, -4.9765625, -4.44189453125, -3.9072265625, -3.37255859375, -2.837890625, -2.30322265625, -1.7685546875, -1.23388671875, -0.69921875, -0.16455078125, 0.3701171875, 0.90478515625, 1.439453125, 1.97412109375, 2.5087890625, 3.04345703125, 3.578125, 4.11279296875, 4.6474609375, 5.18212890625, 5.716796875, 6.25146484375, 6.7861328125, 7.32080078125, 7.85546875, 8.39013671875, 8.9248046875, 9.45947265625, 9.994140625, 10.52880859375, 11.0634765625, 11.59814453125, 12.1328125, 12.66748046875, 13.2021484375, 13.73681640625, 14.271484375, 14.80615234375, 15.3408203125, 15.87548828125, 16.41015625, 16.94482421875, 17.4794921875, 18.01416015625, 18.548828125, 19.08349609375, 19.6181640625, 20.15283203125, 20.6875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 21.0, 34.0, 70.0, 81.0, 113.0, 112.0, 139.0, 114.0, 98.0, 90.0, 53.0, 27.0, 24.0, 13.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -8.8812255859375, -8.270263671875, -7.6593017578125, -7.04833984375, -6.4373779296875, -5.826416015625, -5.2154541015625, -4.6044921875, -3.9935302734375, -3.382568359375, -2.7716064453125, -2.16064453125, -1.5496826171875, -0.938720703125, -0.3277587890625, 0.283203125, 0.8941650390625, 1.505126953125, 2.1160888671875, 2.72705078125, 3.3380126953125, 3.948974609375, 4.5599365234375, 5.1708984375, 5.7818603515625, 6.392822265625, 7.0037841796875, 7.61474609375, 8.2257080078125, 8.836669921875, 9.4476318359375, 10.05859375, 10.6695556640625, 11.280517578125, 11.8914794921875, 12.50244140625, 13.1134033203125, 13.724365234375, 14.3353271484375, 14.9462890625, 15.5572509765625, 16.168212890625, 16.7791748046875, 17.39013671875, 18.0010986328125, 18.612060546875, 19.2230224609375, 19.833984375, 20.4449462890625, 21.055908203125, 21.6668701171875, 22.27783203125, 22.8887939453125, 23.499755859375, 24.1107177734375, 24.7216796875, 25.3326416015625, 25.943603515625, 26.5545654296875, 27.16552734375, 27.7764892578125, 28.387451171875, 28.9984130859375, 29.609375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 9.0, 4.0, 7.0, 16.0, 19.0, 39.0, 58.0, 87.0, 146.0, 295.0, 601.0, 1453.0, 3857.0, 12232.0, 55707.0, 576816.0, 3290800.0, 207118.0, 31955.0, 8117.0, 2693.0, 1136.0, 488.0, 252.0, 142.0, 60.0, 46.0, 26.0, 21.0, 19.0, 9.0, 16.0, 12.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.203125, -19.48974609375, -18.7763671875, -18.06298828125, -17.349609375, -16.63623046875, -15.9228515625, -15.20947265625, -14.49609375, -13.78271484375, -13.0693359375, -12.35595703125, -11.642578125, -10.92919921875, -10.2158203125, -9.50244140625, -8.7890625, -8.07568359375, -7.3623046875, -6.64892578125, -5.935546875, -5.22216796875, -4.5087890625, -3.79541015625, -3.08203125, -2.36865234375, -1.6552734375, -0.94189453125, -0.228515625, 0.48486328125, 1.1982421875, 1.91162109375, 2.625, 3.33837890625, 4.0517578125, 4.76513671875, 5.478515625, 6.19189453125, 6.9052734375, 7.61865234375, 8.33203125, 9.04541015625, 9.7587890625, 10.47216796875, 11.185546875, 11.89892578125, 12.6123046875, 13.32568359375, 14.0390625, 14.75244140625, 15.4658203125, 16.17919921875, 16.892578125, 17.60595703125, 18.3193359375, 19.03271484375, 19.74609375, 20.45947265625, 21.1728515625, 21.88623046875, 22.599609375, 23.31298828125, 24.0263671875, 24.73974609375, 25.453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 6.0, 5.0, 1.0, 5.0, 6.0, 2.0, 2.0, 7.0, 17.0, 21.0, 21.0, 36.0, 36.0, 58.0, 96.0, 135.0, 182.0, 348.0, 527.0, 702.0, 665.0, 423.0, 233.0, 151.0, 99.0, 75.0, 58.0, 35.0, 20.0, 16.0, 22.0, 18.0, 7.0, 11.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.26904296875, -16.6474609375, -16.02587890625, -15.404296875, -14.78271484375, -14.1611328125, -13.53955078125, -12.91796875, -12.29638671875, -11.6748046875, -11.05322265625, -10.431640625, -9.81005859375, -9.1884765625, -8.56689453125, -7.9453125, -7.32373046875, -6.7021484375, -6.08056640625, -5.458984375, -4.83740234375, -4.2158203125, -3.59423828125, -2.97265625, -2.35107421875, -1.7294921875, -1.10791015625, -0.486328125, 0.13525390625, 0.7568359375, 1.37841796875, 2.0, 2.62158203125, 3.2431640625, 3.86474609375, 4.486328125, 5.10791015625, 5.7294921875, 6.35107421875, 6.97265625, 7.59423828125, 8.2158203125, 8.83740234375, 9.458984375, 10.08056640625, 10.7021484375, 11.32373046875, 11.9453125, 12.56689453125, 13.1884765625, 13.81005859375, 14.431640625, 15.05322265625, 15.6748046875, 16.29638671875, 16.91796875, 17.53955078125, 18.1611328125, 18.78271484375, 19.404296875, 20.02587890625, 20.6474609375, 21.26904296875, 21.890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 7.0, 23.0, 94.0, 194.0, 283.0, 204.0, 115.0, 38.0, 14.0, 7.0, 8.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-252.84799194335938, -242.0911865234375, -231.33436584472656, -220.5775604248047, -209.8207550048828, -199.06393432617188, -188.30712890625, -177.55032348632812, -166.79351806640625, -156.03671264648438, -145.27989196777344, -134.52308654785156, -123.76628112792969, -113.00946807861328, -102.25265502929688, -91.495849609375, -80.73902893066406, -69.98221588134766, -59.22541046142578, -48.468597412109375, -37.711788177490234, -26.954978942871094, -16.198165893554688, -5.4413604736328125, 5.315452575683594, 16.072261810302734, 26.829072952270508, 37.58588409423828, 48.34269332885742, 59.09950256347656, 69.85631561279297, 80.61312103271484, 91.36993408203125, 102.12674713134766, 112.88355255126953, 123.64036560058594, 134.3971710205078, 145.15399169921875, 155.91079711914062, 166.6676025390625, 177.42440795898438, 188.18121337890625, 198.9380340576172, 209.69483947753906, 220.45164489746094, 231.20846557617188, 241.96527099609375, 252.72207641601562, 263.4788818359375, 274.2356872558594, 284.99249267578125, 295.74932861328125, 306.5061340332031, 317.262939453125, 328.0197448730469, 338.77655029296875, 349.53338623046875, 360.2901916503906, 371.0469970703125, 381.8038330078125, 392.5606384277344, 403.31744384765625, 414.0742492675781, 424.8310546875, 435.5878601074219]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 10.0, 11.0, 13.0, 19.0, 27.0, 25.0, 28.0, 40.0, 51.0, 48.0, 50.0, 54.0, 60.0, 49.0, 77.0, 69.0, 58.0, 57.0, 48.0, 46.0, 38.0, 27.0, 19.0, 22.0, 21.0, 5.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-183.96829223632812, -179.79054260253906, -175.61279296875, -171.43505859375, -167.25730895996094, -163.07955932617188, -158.90182495117188, -154.7240753173828, -150.54632568359375, -146.3685760498047, -142.19082641601562, -138.01309204101562, -133.83534240722656, -129.6575927734375, -125.47985076904297, -121.30210876464844, -117.12435913085938, -112.94660949707031, -108.76886749267578, -104.59112548828125, -100.41337585449219, -96.23562622070312, -92.0578842163086, -87.88014221191406, -83.702392578125, -79.52464294433594, -75.3469009399414, -71.16915893554688, -66.99140930175781, -62.813663482666016, -58.63591766357422, -54.45817184448242, -50.280418395996094, -46.1026725769043, -41.9249267578125, -37.7471809387207, -33.569435119628906, -29.39168930053711, -25.213943481445312, -21.036197662353516, -16.85845184326172, -12.680706024169922, -8.502960205078125, -4.325214385986328, -0.14746856689453125, 4.030277252197266, 8.208023071289062, 12.38576889038086, 16.563514709472656, 20.741260528564453, 24.91900634765625, 29.096752166748047, 33.274497985839844, 37.45224380493164, 41.62998962402344, 45.807735443115234, 49.98548126220703, 54.16322708129883, 58.340972900390625, 62.51871871948242, 66.69646453857422, 70.87420654296875, 75.05195617675781, 79.22970581054688, 83.4074478149414]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 10.0, 6.0, 14.0, 21.0, 34.0, 62.0, 89.0, 169.0, 248.0, 556.0, 1089.0, 2222.0, 4903.0, 12564.0, 32640.0, 89590.0, 244226.0, 395620.0, 165106.0, 61360.0, 22469.0, 8639.0, 3501.0, 1642.0, 759.0, 408.0, 268.0, 128.0, 75.0, 46.0, 26.0, 21.0, 16.0, 1.0, 10.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.78125, -20.23876953125, -19.6962890625, -19.15380859375, -18.611328125, -18.06884765625, -17.5263671875, -16.98388671875, -16.44140625, -15.89892578125, -15.3564453125, -14.81396484375, -14.271484375, -13.72900390625, -13.1865234375, -12.64404296875, -12.1015625, -11.55908203125, -11.0166015625, -10.47412109375, -9.931640625, -9.38916015625, -8.8466796875, -8.30419921875, -7.76171875, -7.21923828125, -6.6767578125, -6.13427734375, -5.591796875, -5.04931640625, -4.5068359375, -3.96435546875, -3.421875, -2.87939453125, -2.3369140625, -1.79443359375, -1.251953125, -0.70947265625, -0.1669921875, 0.37548828125, 0.91796875, 1.46044921875, 2.0029296875, 2.54541015625, 3.087890625, 3.63037109375, 4.1728515625, 4.71533203125, 5.2578125, 5.80029296875, 6.3427734375, 6.88525390625, 7.427734375, 7.97021484375, 8.5126953125, 9.05517578125, 9.59765625, 10.14013671875, 10.6826171875, 11.22509765625, 11.767578125, 12.31005859375, 12.8525390625, 13.39501953125, 13.9375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 16.0, 18.0, 21.0, 17.0, 39.0, 44.0, 47.0, 45.0, 55.0, 62.0, 65.0, 50.0, 64.0, 53.0, 62.0, 57.0, 49.0, 26.0, 32.0, 36.0, 27.0, 20.0, 18.0, 12.0, 11.0, 12.0, 8.0, 8.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.390625, -9.08935546875, -8.7880859375, -8.48681640625, -8.185546875, -7.88427734375, -7.5830078125, -7.28173828125, -6.98046875, -6.67919921875, -6.3779296875, -6.07666015625, -5.775390625, -5.47412109375, -5.1728515625, -4.87158203125, -4.5703125, -4.26904296875, -3.9677734375, -3.66650390625, -3.365234375, -3.06396484375, -2.7626953125, -2.46142578125, -2.16015625, -1.85888671875, -1.5576171875, -1.25634765625, -0.955078125, -0.65380859375, -0.3525390625, -0.05126953125, 0.25, 0.55126953125, 0.8525390625, 1.15380859375, 1.455078125, 1.75634765625, 2.0576171875, 2.35888671875, 2.66015625, 2.96142578125, 3.2626953125, 3.56396484375, 3.865234375, 4.16650390625, 4.4677734375, 4.76904296875, 5.0703125, 5.37158203125, 5.6728515625, 5.97412109375, 6.275390625, 6.57666015625, 6.8779296875, 7.17919921875, 7.48046875, 7.78173828125, 8.0830078125, 8.38427734375, 8.685546875, 8.98681640625, 9.2880859375, 9.58935546875, 9.890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 6.0, 9.0, 8.0, 8.0, 15.0, 28.0, 31.0, 42.0, 66.0, 104.0, 132.0, 182.0, 264.0, 369.0, 534.0, 896.0, 1516.0, 2994.0, 7796.0, 33010.0, 230458.0, 664242.0, 81063.0, 14843.0, 4437.0, 2131.0, 1145.0, 699.0, 442.0, 326.0, 211.0, 158.0, 111.0, 73.0, 62.0, 45.0, 27.0, 14.0, 22.0, 11.0, 8.0, 8.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-27.875, -26.953369140625, -26.03173828125, -25.110107421875, -24.1884765625, -23.266845703125, -22.34521484375, -21.423583984375, -20.501953125, -19.580322265625, -18.65869140625, -17.737060546875, -16.8154296875, -15.893798828125, -14.97216796875, -14.050537109375, -13.12890625, -12.207275390625, -11.28564453125, -10.364013671875, -9.4423828125, -8.520751953125, -7.59912109375, -6.677490234375, -5.755859375, -4.834228515625, -3.91259765625, -2.990966796875, -2.0693359375, -1.147705078125, -0.22607421875, 0.695556640625, 1.6171875, 2.538818359375, 3.46044921875, 4.382080078125, 5.3037109375, 6.225341796875, 7.14697265625, 8.068603515625, 8.990234375, 9.911865234375, 10.83349609375, 11.755126953125, 12.6767578125, 13.598388671875, 14.52001953125, 15.441650390625, 16.36328125, 17.284912109375, 18.20654296875, 19.128173828125, 20.0498046875, 20.971435546875, 21.89306640625, 22.814697265625, 23.736328125, 24.657958984375, 25.57958984375, 26.501220703125, 27.4228515625, 28.344482421875, 29.26611328125, 30.187744140625, 31.109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 0.0, 4.0, 4.0, 3.0, 7.0, 3.0, 3.0, 10.0, 6.0, 9.0, 10.0, 10.0, 16.0, 13.0, 33.0, 22.0, 27.0, 37.0, 36.0, 52.0, 37.0, 29.0, 34.0, 45.0, 48.0, 49.0, 38.0, 33.0, 41.0, 41.0, 47.0, 35.0, 32.0, 25.0, 26.0, 29.0, 17.0, 11.0, 13.0, 9.0, 13.0, 4.0, 6.0, 4.0, 5.0, 6.0, 4.0, 4.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-31.03125, -30.093017578125, -29.15478515625, -28.216552734375, -27.2783203125, -26.340087890625, -25.40185546875, -24.463623046875, -23.525390625, -22.587158203125, -21.64892578125, -20.710693359375, -19.7724609375, -18.834228515625, -17.89599609375, -16.957763671875, -16.01953125, -15.081298828125, -14.14306640625, -13.204833984375, -12.2666015625, -11.328369140625, -10.39013671875, -9.451904296875, -8.513671875, -7.575439453125, -6.63720703125, -5.698974609375, -4.7607421875, -3.822509765625, -2.88427734375, -1.946044921875, -1.0078125, -0.069580078125, 0.86865234375, 1.806884765625, 2.7451171875, 3.683349609375, 4.62158203125, 5.559814453125, 6.498046875, 7.436279296875, 8.37451171875, 9.312744140625, 10.2509765625, 11.189208984375, 12.12744140625, 13.065673828125, 14.00390625, 14.942138671875, 15.88037109375, 16.818603515625, 17.7568359375, 18.695068359375, 19.63330078125, 20.571533203125, 21.509765625, 22.447998046875, 23.38623046875, 24.324462890625, 25.2626953125, 26.200927734375, 27.13916015625, 28.077392578125, 29.015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 10.0, 11.0, 13.0, 17.0, 30.0, 30.0, 59.0, 112.0, 156.0, 322.0, 775.0, 2376.0, 12090.0, 121322.0, 790463.0, 106349.0, 10760.0, 2159.0, 750.0, 320.0, 144.0, 109.0, 50.0, 35.0, 24.0, 19.0, 9.0, 13.0, 5.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.381103515625, -10.05126953125, -9.721435546875, -9.3916015625, -9.061767578125, -8.73193359375, -8.402099609375, -8.072265625, -7.742431640625, -7.41259765625, -7.082763671875, -6.7529296875, -6.423095703125, -6.09326171875, -5.763427734375, -5.43359375, -5.103759765625, -4.77392578125, -4.444091796875, -4.1142578125, -3.784423828125, -3.45458984375, -3.124755859375, -2.794921875, -2.465087890625, -2.13525390625, -1.805419921875, -1.4755859375, -1.145751953125, -0.81591796875, -0.486083984375, -0.15625, 0.173583984375, 0.50341796875, 0.833251953125, 1.1630859375, 1.492919921875, 1.82275390625, 2.152587890625, 2.482421875, 2.812255859375, 3.14208984375, 3.471923828125, 3.8017578125, 4.131591796875, 4.46142578125, 4.791259765625, 5.12109375, 5.450927734375, 5.78076171875, 6.110595703125, 6.4404296875, 6.770263671875, 7.10009765625, 7.429931640625, 7.759765625, 8.089599609375, 8.41943359375, 8.749267578125, 9.0791015625, 9.408935546875, 9.73876953125, 10.068603515625, 10.3984375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 14.0, 5.0, 14.0, 17.0, 15.0, 22.0, 21.0, 31.0, 41.0, 55.0, 78.0, 79.0, 98.0, 106.0, 70.0, 56.0, 63.0, 39.0, 25.0, 26.0, 20.0, 21.0, 14.0, 9.0, 7.0, 8.0, 4.0, 3.0, 9.0, 1.0, 3.0, 4.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.001720428466796875, -0.0016647577285766602, -0.0016090869903564453, -0.0015534162521362305, -0.0014977455139160156, -0.0014420747756958008, -0.001386404037475586, -0.001330733299255371, -0.0012750625610351562, -0.0012193918228149414, -0.0011637210845947266, -0.0011080503463745117, -0.0010523796081542969, -0.000996708869934082, -0.0009410381317138672, -0.0008853673934936523, -0.0008296966552734375, -0.0007740259170532227, -0.0007183551788330078, -0.000662684440612793, -0.0006070137023925781, -0.0005513429641723633, -0.0004956722259521484, -0.0004400014877319336, -0.00038433074951171875, -0.0003286600112915039, -0.00027298927307128906, -0.00021731853485107422, -0.00016164779663085938, -0.00010597705841064453, -5.030632019042969e-05, 5.364418029785156e-06, 6.103515625e-05, 0.00011670589447021484, 0.0001723766326904297, 0.00022804737091064453, 0.0002837181091308594, 0.0003393888473510742, 0.00039505958557128906, 0.0004507303237915039, 0.0005064010620117188, 0.0005620718002319336, 0.0006177425384521484, 0.0006734132766723633, 0.0007290840148925781, 0.000784754753112793, 0.0008404254913330078, 0.0008960962295532227, 0.0009517669677734375, 0.0010074377059936523, 0.0010631084442138672, 0.001118779182434082, 0.0011744499206542969, 0.0012301206588745117, 0.0012857913970947266, 0.0013414621353149414, 0.0013971328735351562, 0.001452803611755371, 0.001508474349975586, 0.0015641450881958008, 0.0016198158264160156, 0.0016754865646362305, 0.0017311573028564453, 0.0017868280410766602, 0.001842498779296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 17.0, 23.0, 25.0, 41.0, 63.0, 90.0, 142.0, 198.0, 353.0, 610.0, 1243.0, 2783.0, 7989.0, 34742.0, 270588.0, 639759.0, 69381.0, 12740.0, 4042.0, 1727.0, 800.0, 459.0, 254.0, 162.0, 95.0, 72.0, 43.0, 34.0, 18.0, 16.0, 8.0, 2.0, 4.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.9185791015625, -6.673095703125, -6.4276123046875, -6.18212890625, -5.9366455078125, -5.691162109375, -5.4456787109375, -5.2001953125, -4.9547119140625, -4.709228515625, -4.4637451171875, -4.21826171875, -3.9727783203125, -3.727294921875, -3.4818115234375, -3.236328125, -2.9908447265625, -2.745361328125, -2.4998779296875, -2.25439453125, -2.0089111328125, -1.763427734375, -1.5179443359375, -1.2724609375, -1.0269775390625, -0.781494140625, -0.5360107421875, -0.29052734375, -0.0450439453125, 0.200439453125, 0.4459228515625, 0.69140625, 0.9368896484375, 1.182373046875, 1.4278564453125, 1.67333984375, 1.9188232421875, 2.164306640625, 2.4097900390625, 2.6552734375, 2.9007568359375, 3.146240234375, 3.3917236328125, 3.63720703125, 3.8826904296875, 4.128173828125, 4.3736572265625, 4.619140625, 4.8646240234375, 5.110107421875, 5.3555908203125, 5.60107421875, 5.8465576171875, 6.092041015625, 6.3375244140625, 6.5830078125, 6.8284912109375, 7.073974609375, 7.3194580078125, 7.56494140625, 7.8104248046875, 8.055908203125, 8.3013916015625, 8.546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 7.0, 7.0, 11.0, 13.0, 12.0, 21.0, 19.0, 26.0, 25.0, 26.0, 29.0, 38.0, 33.0, 46.0, 30.0, 62.0, 41.0, 56.0, 50.0, 55.0, 59.0, 41.0, 40.0, 38.0, 29.0, 23.0, 24.0, 23.0, 16.0, 16.0, 17.0, 6.0, 6.0, 8.0, 6.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.61328125, -4.470703125, -4.328125, -4.185546875, -4.04296875, -3.900390625, -3.7578125, -3.615234375, -3.47265625, -3.330078125, -3.1875, -3.044921875, -2.90234375, -2.759765625, -2.6171875, -2.474609375, -2.33203125, -2.189453125, -2.046875, -1.904296875, -1.76171875, -1.619140625, -1.4765625, -1.333984375, -1.19140625, -1.048828125, -0.90625, -0.763671875, -0.62109375, -0.478515625, -0.3359375, -0.193359375, -0.05078125, 0.091796875, 0.234375, 0.376953125, 0.51953125, 0.662109375, 0.8046875, 0.947265625, 1.08984375, 1.232421875, 1.375, 1.517578125, 1.66015625, 1.802734375, 1.9453125, 2.087890625, 2.23046875, 2.373046875, 2.515625, 2.658203125, 2.80078125, 2.943359375, 3.0859375, 3.228515625, 3.37109375, 3.513671875, 3.65625, 3.798828125, 3.94140625, 4.083984375, 4.2265625, 4.369140625, 4.51171875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 14.0, 11.0, 27.0, 53.0, 88.0, 156.0, 233.0, 142.0, 115.0, 77.0, 27.0, 19.0, 14.0, 8.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-147.45614624023438, -141.1963653564453, -134.9365997314453, -128.67681884765625, -122.41703796386719, -116.15726470947266, -109.89749145507812, -103.63771057128906, -97.3779296875, -91.11815643310547, -84.8583755493164, -78.59860229492188, -72.33882141113281, -66.07904815673828, -59.819271087646484, -53.55949401855469, -47.299720764160156, -41.03994369506836, -34.78016662597656, -28.5203914642334, -22.2606143951416, -16.000837326049805, -9.74106216430664, -3.4812850952148438, 2.778491973876953, 9.03826904296875, 15.29804515838623, 21.55782127380371, 27.817598342895508, 34.07737731933594, 40.33715057373047, 46.596927642822266, 52.85670471191406, 59.11648178100586, 65.37625885009766, 71.63603210449219, 77.89581298828125, 84.15558624267578, 90.41535949707031, 96.67514038085938, 102.93492126464844, 109.19469451904297, 115.45447540283203, 121.71424865722656, 127.97402954101562, 134.2338104248047, 140.4935760498047, 146.75335693359375, 153.01312255859375, 159.2729034423828, 165.5326690673828, 171.79244995117188, 178.05223083496094, 184.31201171875, 190.57177734375, 196.83155822753906, 203.09133911132812, 209.3511199951172, 215.6108856201172, 221.87066650390625, 228.1304473876953, 234.39022827148438, 240.64999389648438, 246.90977478027344, 253.1695556640625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 4.0, 1.0, 11.0, 7.0, 12.0, 8.0, 9.0, 10.0, 9.0, 19.0, 16.0, 23.0, 21.0, 27.0, 37.0, 32.0, 25.0, 45.0, 56.0, 58.0, 74.0, 70.0, 55.0, 40.0, 32.0, 33.0, 26.0, 33.0, 27.0, 23.0, 15.0, 28.0, 25.0, 19.0, 13.0, 10.0, 14.0, 5.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-132.94903564453125, -129.16490173339844, -125.38077545166016, -121.59664154052734, -117.81251525878906, -114.02838134765625, -110.24424743652344, -106.46012115478516, -102.67599487304688, -98.89186096191406, -95.10773468017578, -91.32360076904297, -87.53947448730469, -83.75534057617188, -79.97120666503906, -76.18708038330078, -72.40294647216797, -68.61881256103516, -64.83468627929688, -61.05055236816406, -57.26642608642578, -53.48229217529297, -49.69816207885742, -45.914031982421875, -42.12990188598633, -38.34577178955078, -34.561641693115234, -30.777509689331055, -26.993379592895508, -23.20924949645996, -19.42511749267578, -15.640987396240234, -11.856857299804688, -8.07272720336914, -4.288596153259277, -0.5044651031494141, 3.279664993286133, 7.06379508972168, 10.84792709350586, 14.632057189941406, 18.416187286376953, 22.2003173828125, 25.984447479248047, 29.768579483032227, 33.552711486816406, 37.33683776855469, 41.1209716796875, 44.90510177612305, 48.689231872558594, 52.47336196899414, 56.25749206542969, 60.0416259765625, 63.82575225830078, 67.6098861694336, 71.39401245117188, 75.17814636230469, 78.9622802734375, 82.74641418457031, 86.5305404663086, 90.3146743774414, 94.09880065917969, 97.8829345703125, 101.66706848144531, 105.4511947631836, 109.23532104492188]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 16.0, 12.0, 22.0, 37.0, 71.0, 101.0, 177.0, 292.0, 519.0, 928.0, 1994.0, 4198.0, 9782.0, 26380.0, 93560.0, 582416.0, 2577436.0, 739325.0, 108526.0, 28618.0, 10530.0, 4649.0, 2160.0, 1061.0, 608.0, 323.0, 188.0, 119.0, 70.0, 51.0, 32.0, 19.0, 19.0, 8.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-12.1640625, -11.831298828125, -11.49853515625, -11.165771484375, -10.8330078125, -10.500244140625, -10.16748046875, -9.834716796875, -9.501953125, -9.169189453125, -8.83642578125, -8.503662109375, -8.1708984375, -7.838134765625, -7.50537109375, -7.172607421875, -6.83984375, -6.507080078125, -6.17431640625, -5.841552734375, -5.5087890625, -5.176025390625, -4.84326171875, -4.510498046875, -4.177734375, -3.844970703125, -3.51220703125, -3.179443359375, -2.8466796875, -2.513916015625, -2.18115234375, -1.848388671875, -1.515625, -1.182861328125, -0.85009765625, -0.517333984375, -0.1845703125, 0.148193359375, 0.48095703125, 0.813720703125, 1.146484375, 1.479248046875, 1.81201171875, 2.144775390625, 2.4775390625, 2.810302734375, 3.14306640625, 3.475830078125, 3.80859375, 4.141357421875, 4.47412109375, 4.806884765625, 5.1396484375, 5.472412109375, 5.80517578125, 6.137939453125, 6.470703125, 6.803466796875, 7.13623046875, 7.468994140625, 7.8017578125, 8.134521484375, 8.46728515625, 8.800048828125, 9.1328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 6.0, 2.0, 5.0, 10.0, 19.0, 26.0, 20.0, 14.0, 24.0, 33.0, 34.0, 34.0, 47.0, 50.0, 52.0, 65.0, 66.0, 49.0, 54.0, 55.0, 50.0, 43.0, 37.0, 39.0, 29.0, 29.0, 20.0, 22.0, 20.0, 15.0, 9.0, 4.0, 10.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.9320068359375, -8.653076171875, -8.3741455078125, -8.09521484375, -7.8162841796875, -7.537353515625, -7.2584228515625, -6.9794921875, -6.7005615234375, -6.421630859375, -6.1427001953125, -5.86376953125, -5.5848388671875, -5.305908203125, -5.0269775390625, -4.748046875, -4.4691162109375, -4.190185546875, -3.9112548828125, -3.63232421875, -3.3533935546875, -3.074462890625, -2.7955322265625, -2.5166015625, -2.2376708984375, -1.958740234375, -1.6798095703125, -1.40087890625, -1.1219482421875, -0.843017578125, -0.5640869140625, -0.28515625, -0.0062255859375, 0.272705078125, 0.5516357421875, 0.83056640625, 1.1094970703125, 1.388427734375, 1.6673583984375, 1.9462890625, 2.2252197265625, 2.504150390625, 2.7830810546875, 3.06201171875, 3.3409423828125, 3.619873046875, 3.8988037109375, 4.177734375, 4.4566650390625, 4.735595703125, 5.0145263671875, 5.29345703125, 5.5723876953125, 5.851318359375, 6.1302490234375, 6.4091796875, 6.6881103515625, 6.967041015625, 7.2459716796875, 7.52490234375, 7.8038330078125, 8.082763671875, 8.3616943359375, 8.640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 10.0, 20.0, 32.0, 50.0, 71.0, 95.0, 158.0, 282.0, 524.0, 1056.0, 2448.0, 6224.0, 18085.0, 66453.0, 486761.0, 3161403.0, 363379.0, 59230.0, 16937.0, 6051.0, 2479.0, 1139.0, 569.0, 322.0, 176.0, 108.0, 75.0, 41.0, 21.0, 19.0, 10.0, 8.0, 3.0, 10.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-18.671875, -18.1732177734375, -17.674560546875, -17.1759033203125, -16.67724609375, -16.1785888671875, -15.679931640625, -15.1812744140625, -14.6826171875, -14.1839599609375, -13.685302734375, -13.1866455078125, -12.68798828125, -12.1893310546875, -11.690673828125, -11.1920166015625, -10.693359375, -10.1947021484375, -9.696044921875, -9.1973876953125, -8.69873046875, -8.2000732421875, -7.701416015625, -7.2027587890625, -6.7041015625, -6.2054443359375, -5.706787109375, -5.2081298828125, -4.70947265625, -4.2108154296875, -3.712158203125, -3.2135009765625, -2.71484375, -2.2161865234375, -1.717529296875, -1.2188720703125, -0.72021484375, -0.2215576171875, 0.277099609375, 0.7757568359375, 1.2744140625, 1.7730712890625, 2.271728515625, 2.7703857421875, 3.26904296875, 3.7677001953125, 4.266357421875, 4.7650146484375, 5.263671875, 5.7623291015625, 6.260986328125, 6.7596435546875, 7.25830078125, 7.7569580078125, 8.255615234375, 8.7542724609375, 9.2529296875, 9.7515869140625, 10.250244140625, 10.7489013671875, 11.24755859375, 11.7462158203125, 12.244873046875, 12.7435302734375, 13.2421875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 8.0, 11.0, 5.0, 15.0, 12.0, 12.0, 14.0, 29.0, 42.0, 52.0, 87.0, 156.0, 230.0, 474.0, 662.0, 785.0, 573.0, 330.0, 173.0, 94.0, 86.0, 63.0, 52.0, 29.0, 15.0, 21.0, 10.0, 9.0, 6.0, 4.0, 4.0, 7.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.953125, -20.359375, -19.765625, -19.171875, -18.578125, -17.984375, -17.390625, -16.796875, -16.203125, -15.609375, -15.015625, -14.421875, -13.828125, -13.234375, -12.640625, -12.046875, -11.453125, -10.859375, -10.265625, -9.671875, -9.078125, -8.484375, -7.890625, -7.296875, -6.703125, -6.109375, -5.515625, -4.921875, -4.328125, -3.734375, -3.140625, -2.546875, -1.953125, -1.359375, -0.765625, -0.171875, 0.421875, 1.015625, 1.609375, 2.203125, 2.796875, 3.390625, 3.984375, 4.578125, 5.171875, 5.765625, 6.359375, 6.953125, 7.546875, 8.140625, 8.734375, 9.328125, 9.921875, 10.515625, 11.109375, 11.703125, 12.296875, 12.890625, 13.484375, 14.078125, 14.671875, 15.265625, 15.859375, 16.453125, 17.046875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 13.0, 45.0, 152.0, 305.0, 274.0, 120.0, 50.0, 16.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-346.2875671386719, -336.6203918457031, -326.9532165527344, -317.2860412597656, -307.6188659667969, -297.9516906738281, -288.2845153808594, -278.6173400878906, -268.9501647949219, -259.2829895019531, -249.61581420898438, -239.94863891601562, -230.28146362304688, -220.61428833007812, -210.94711303710938, -201.27993774414062, -191.61277770996094, -181.9456024169922, -172.27842712402344, -162.6112518310547, -152.94407653808594, -143.2769012451172, -133.6097412109375, -123.94255828857422, -114.27538299560547, -104.60820770263672, -94.94103240966797, -85.27386474609375, -75.606689453125, -65.93951416015625, -56.2723388671875, -46.60516357421875, -36.93798828125, -27.27081298828125, -17.603639602661133, -7.936466217041016, 1.7307090759277344, 11.397884368896484, 21.06505584716797, 30.73223114013672, 40.39940643310547, 50.06658172607422, 59.73375701904297, 69.40092468261719, 79.06809997558594, 88.73527526855469, 98.40245056152344, 108.06962585449219, 117.73680114746094, 127.40397644042969, 137.07115173339844, 146.7383270263672, 156.40550231933594, 166.0726776123047, 175.73983764648438, 185.40701293945312, 195.07418823242188, 204.74136352539062, 214.40853881835938, 224.07571411132812, 233.74288940429688, 243.41006469726562, 253.07723999023438, 262.7444152832031, 272.4115905761719]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 2.0, 8.0, 3.0, 7.0, 9.0, 7.0, 10.0, 17.0, 19.0, 26.0, 23.0, 29.0, 30.0, 33.0, 42.0, 40.0, 36.0, 48.0, 48.0, 65.0, 47.0, 50.0, 52.0, 48.0, 52.0, 41.0, 32.0, 34.0, 25.0, 15.0, 23.0, 20.0, 12.0, 15.0, 11.0, 9.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.00346374511719, -78.33860778808594, -75.67374420166016, -73.0088882446289, -70.34402465820312, -67.67916870117188, -65.0143051147461, -62.349449157714844, -59.68458938598633, -57.01972961425781, -54.3548698425293, -51.69001007080078, -49.02515411376953, -46.36029052734375, -43.6954345703125, -41.030574798583984, -38.36571502685547, -35.70085525512695, -33.03599548339844, -30.371137619018555, -27.70627784729004, -25.041418075561523, -22.37656021118164, -19.711700439453125, -17.04684066772461, -14.381980895996094, -11.717122077941895, -9.052263259887695, -6.38740348815918, -3.722543716430664, -1.0576848983764648, 1.6071739196777344, 4.27203369140625, 6.936892986297607, 9.601752281188965, 12.266611099243164, 14.93147087097168, 17.596330642700195, 20.261188507080078, 22.926048278808594, 25.59090805053711, 28.255767822265625, 30.92062759399414, 33.585487365722656, 36.250343322753906, 38.91520690917969, 41.58006286621094, 44.24492263793945, 46.90978240966797, 49.574642181396484, 52.239501953125, 54.904361724853516, 57.56922149658203, 60.23407745361328, 62.8989372253418, 65.56379699707031, 68.22865295410156, 70.89350891113281, 73.5583724975586, 76.22322845458984, 78.88809204101562, 81.55294799804688, 84.21781158447266, 86.8826675415039, 89.54753112792969]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 12.0, 18.0, 35.0, 43.0, 80.0, 82.0, 157.0, 227.0, 341.0, 614.0, 977.0, 1667.0, 2882.0, 5210.0, 9757.0, 18537.0, 37535.0, 79118.0, 190094.0, 346687.0, 194200.0, 80409.0, 38135.0, 19251.0, 10119.0, 5294.0, 2878.0, 1635.0, 954.0, 591.0, 358.0, 225.0, 133.0, 83.0, 73.0, 33.0, 31.0, 25.0, 13.0, 9.0, 4.0, 1.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.53125, -11.1533203125, -10.775390625, -10.3974609375, -10.01953125, -9.6416015625, -9.263671875, -8.8857421875, -8.5078125, -8.1298828125, -7.751953125, -7.3740234375, -6.99609375, -6.6181640625, -6.240234375, -5.8623046875, -5.484375, -5.1064453125, -4.728515625, -4.3505859375, -3.97265625, -3.5947265625, -3.216796875, -2.8388671875, -2.4609375, -2.0830078125, -1.705078125, -1.3271484375, -0.94921875, -0.5712890625, -0.193359375, 0.1845703125, 0.5625, 0.9404296875, 1.318359375, 1.6962890625, 2.07421875, 2.4521484375, 2.830078125, 3.2080078125, 3.5859375, 3.9638671875, 4.341796875, 4.7197265625, 5.09765625, 5.4755859375, 5.853515625, 6.2314453125, 6.609375, 6.9873046875, 7.365234375, 7.7431640625, 8.12109375, 8.4990234375, 8.876953125, 9.2548828125, 9.6328125, 10.0107421875, 10.388671875, 10.7666015625, 11.14453125, 11.5224609375, 11.900390625, 12.2783203125, 12.65625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 7.0, 11.0, 15.0, 16.0, 11.0, 18.0, 15.0, 23.0, 22.0, 33.0, 35.0, 40.0, 57.0, 55.0, 58.0, 47.0, 57.0, 60.0, 62.0, 49.0, 47.0, 31.0, 35.0, 38.0, 28.0, 23.0, 26.0, 21.0, 15.0, 15.0, 6.0, 8.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.8294677734375, -8.549560546875, -8.2696533203125, -7.98974609375, -7.7098388671875, -7.429931640625, -7.1500244140625, -6.8701171875, -6.5902099609375, -6.310302734375, -6.0303955078125, -5.75048828125, -5.4705810546875, -5.190673828125, -4.9107666015625, -4.630859375, -4.3509521484375, -4.071044921875, -3.7911376953125, -3.51123046875, -3.2313232421875, -2.951416015625, -2.6715087890625, -2.3916015625, -2.1116943359375, -1.831787109375, -1.5518798828125, -1.27197265625, -0.9920654296875, -0.712158203125, -0.4322509765625, -0.15234375, 0.1275634765625, 0.407470703125, 0.6873779296875, 0.96728515625, 1.2471923828125, 1.527099609375, 1.8070068359375, 2.0869140625, 2.3668212890625, 2.646728515625, 2.9266357421875, 3.20654296875, 3.4864501953125, 3.766357421875, 4.0462646484375, 4.326171875, 4.6060791015625, 4.885986328125, 5.1658935546875, 5.44580078125, 5.7257080078125, 6.005615234375, 6.2855224609375, 6.5654296875, 6.8453369140625, 7.125244140625, 7.4051513671875, 7.68505859375, 7.9649658203125, 8.244873046875, 8.5247802734375, 8.8046875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 10.0, 18.0, 29.0, 37.0, 57.0, 100.0, 142.0, 228.0, 327.0, 561.0, 967.0, 1808.0, 4855.0, 21483.0, 202383.0, 742483.0, 57788.0, 9215.0, 2822.0, 1257.0, 737.0, 434.0, 272.0, 169.0, 113.0, 87.0, 56.0, 25.0, 32.0, 13.0, 14.0, 5.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.875, -36.76904296875, -35.6630859375, -34.55712890625, -33.451171875, -32.34521484375, -31.2392578125, -30.13330078125, -29.02734375, -27.92138671875, -26.8154296875, -25.70947265625, -24.603515625, -23.49755859375, -22.3916015625, -21.28564453125, -20.1796875, -19.07373046875, -17.9677734375, -16.86181640625, -15.755859375, -14.64990234375, -13.5439453125, -12.43798828125, -11.33203125, -10.22607421875, -9.1201171875, -8.01416015625, -6.908203125, -5.80224609375, -4.6962890625, -3.59033203125, -2.484375, -1.37841796875, -0.2724609375, 0.83349609375, 1.939453125, 3.04541015625, 4.1513671875, 5.25732421875, 6.36328125, 7.46923828125, 8.5751953125, 9.68115234375, 10.787109375, 11.89306640625, 12.9990234375, 14.10498046875, 15.2109375, 16.31689453125, 17.4228515625, 18.52880859375, 19.634765625, 20.74072265625, 21.8466796875, 22.95263671875, 24.05859375, 25.16455078125, 26.2705078125, 27.37646484375, 28.482421875, 29.58837890625, 30.6943359375, 31.80029296875, 32.90625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 11.0, 13.0, 7.0, 19.0, 14.0, 21.0, 32.0, 37.0, 30.0, 29.0, 41.0, 45.0, 56.0, 62.0, 58.0, 49.0, 61.0, 45.0, 43.0, 30.0, 42.0, 32.0, 28.0, 33.0, 27.0, 16.0, 19.0, 18.0, 16.0, 4.0, 13.0, 13.0, 4.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-35.03125, -34.014404296875, -32.99755859375, -31.980712890625, -30.9638671875, -29.947021484375, -28.93017578125, -27.913330078125, -26.896484375, -25.879638671875, -24.86279296875, -23.845947265625, -22.8291015625, -21.812255859375, -20.79541015625, -19.778564453125, -18.76171875, -17.744873046875, -16.72802734375, -15.711181640625, -14.6943359375, -13.677490234375, -12.66064453125, -11.643798828125, -10.626953125, -9.610107421875, -8.59326171875, -7.576416015625, -6.5595703125, -5.542724609375, -4.52587890625, -3.509033203125, -2.4921875, -1.475341796875, -0.45849609375, 0.558349609375, 1.5751953125, 2.592041015625, 3.60888671875, 4.625732421875, 5.642578125, 6.659423828125, 7.67626953125, 8.693115234375, 9.7099609375, 10.726806640625, 11.74365234375, 12.760498046875, 13.77734375, 14.794189453125, 15.81103515625, 16.827880859375, 17.8447265625, 18.861572265625, 19.87841796875, 20.895263671875, 21.912109375, 22.928955078125, 23.94580078125, 24.962646484375, 25.9794921875, 26.996337890625, 28.01318359375, 29.030029296875, 30.046875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 3.0, 8.0, 9.0, 17.0, 17.0, 23.0, 43.0, 54.0, 117.0, 217.0, 545.0, 1699.0, 8102.0, 76002.0, 835122.0, 112766.0, 10532.0, 2098.0, 631.0, 236.0, 127.0, 54.0, 49.0, 24.0, 24.0, 10.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.614990234375, -10.22998046875, -9.844970703125, -9.4599609375, -9.074951171875, -8.68994140625, -8.304931640625, -7.919921875, -7.534912109375, -7.14990234375, -6.764892578125, -6.3798828125, -5.994873046875, -5.60986328125, -5.224853515625, -4.83984375, -4.454833984375, -4.06982421875, -3.684814453125, -3.2998046875, -2.914794921875, -2.52978515625, -2.144775390625, -1.759765625, -1.374755859375, -0.98974609375, -0.604736328125, -0.2197265625, 0.165283203125, 0.55029296875, 0.935302734375, 1.3203125, 1.705322265625, 2.09033203125, 2.475341796875, 2.8603515625, 3.245361328125, 3.63037109375, 4.015380859375, 4.400390625, 4.785400390625, 5.17041015625, 5.555419921875, 5.9404296875, 6.325439453125, 6.71044921875, 7.095458984375, 7.48046875, 7.865478515625, 8.25048828125, 8.635498046875, 9.0205078125, 9.405517578125, 9.79052734375, 10.175537109375, 10.560546875, 10.945556640625, 11.33056640625, 11.715576171875, 12.1005859375, 12.485595703125, 12.87060546875, 13.255615234375, 13.640625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 4.0, 8.0, 10.0, 6.0, 10.0, 11.0, 24.0, 29.0, 36.0, 50.0, 63.0, 96.0, 127.0, 151.0, 105.0, 81.0, 49.0, 27.0, 26.0, 11.0, 15.0, 12.0, 8.0, 5.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020961761474609375, -0.0020237863063812256, -0.0019513964653015137, -0.0018790066242218018, -0.0018066167831420898, -0.001734226942062378, -0.001661837100982666, -0.001589447259902954, -0.0015170574188232422, -0.0014446675777435303, -0.0013722777366638184, -0.0012998878955841064, -0.0012274980545043945, -0.0011551082134246826, -0.0010827183723449707, -0.0010103285312652588, -0.0009379386901855469, -0.000865548849105835, -0.000793159008026123, -0.0007207691669464111, -0.0006483793258666992, -0.0005759894847869873, -0.0005035996437072754, -0.0004312098026275635, -0.00035881996154785156, -0.00028643012046813965, -0.00021404027938842773, -0.00014165043830871582, -6.92605972290039e-05, 3.129243850708008e-06, 7.551908493041992e-05, 0.00014790892601013184, 0.00022029876708984375, 0.00029268860816955566, 0.0003650784492492676, 0.0004374682903289795, 0.0005098581314086914, 0.0005822479724884033, 0.0006546378135681152, 0.0007270276546478271, 0.0007994174957275391, 0.000871807336807251, 0.0009441971778869629, 0.0010165870189666748, 0.0010889768600463867, 0.0011613667011260986, 0.0012337565422058105, 0.0013061463832855225, 0.0013785362243652344, 0.0014509260654449463, 0.0015233159065246582, 0.0015957057476043701, 0.001668095588684082, 0.001740485429763794, 0.0018128752708435059, 0.0018852651119232178, 0.0019576549530029297, 0.0020300447940826416, 0.0021024346351623535, 0.0021748244762420654, 0.0022472143173217773, 0.0023196041584014893, 0.002391993999481201, 0.002464383840560913, 0.002536773681640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 0.0, 9.0, 14.0, 27.0, 18.0, 47.0, 67.0, 136.0, 230.0, 446.0, 1161.0, 3077.0, 12616.0, 118930.0, 818246.0, 79287.0, 9830.0, 2593.0, 949.0, 425.0, 197.0, 93.0, 68.0, 32.0, 20.0, 16.0, 5.0, 9.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.56640625, -6.24493408203125, -5.9234619140625, -5.60198974609375, -5.280517578125, -4.95904541015625, -4.6375732421875, -4.31610107421875, -3.99462890625, -3.67315673828125, -3.3516845703125, -3.03021240234375, -2.708740234375, -2.38726806640625, -2.0657958984375, -1.74432373046875, -1.4228515625, -1.10137939453125, -0.7799072265625, -0.45843505859375, -0.136962890625, 0.18450927734375, 0.5059814453125, 0.82745361328125, 1.14892578125, 1.47039794921875, 1.7918701171875, 2.11334228515625, 2.434814453125, 2.75628662109375, 3.0777587890625, 3.39923095703125, 3.720703125, 4.04217529296875, 4.3636474609375, 4.68511962890625, 5.006591796875, 5.32806396484375, 5.6495361328125, 5.97100830078125, 6.29248046875, 6.61395263671875, 6.9354248046875, 7.25689697265625, 7.578369140625, 7.89984130859375, 8.2213134765625, 8.54278564453125, 8.8642578125, 9.18572998046875, 9.5072021484375, 9.82867431640625, 10.150146484375, 10.47161865234375, 10.7930908203125, 11.11456298828125, 11.43603515625, 11.75750732421875, 12.0789794921875, 12.40045166015625, 12.721923828125, 13.04339599609375, 13.3648681640625, 13.68634033203125, 14.0078125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 6.0, 4.0, 5.0, 6.0, 15.0, 13.0, 19.0, 25.0, 26.0, 42.0, 46.0, 32.0, 63.0, 63.0, 90.0, 83.0, 76.0, 71.0, 66.0, 49.0, 43.0, 42.0, 39.0, 20.0, 15.0, 8.0, 11.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.65716552734375, -6.4588623046875, -6.26055908203125, -6.062255859375, -5.86395263671875, -5.6656494140625, -5.46734619140625, -5.26904296875, -5.07073974609375, -4.8724365234375, -4.67413330078125, -4.475830078125, -4.27752685546875, -4.0792236328125, -3.88092041015625, -3.6826171875, -3.48431396484375, -3.2860107421875, -3.08770751953125, -2.889404296875, -2.69110107421875, -2.4927978515625, -2.29449462890625, -2.09619140625, -1.89788818359375, -1.6995849609375, -1.50128173828125, -1.302978515625, -1.10467529296875, -0.9063720703125, -0.70806884765625, -0.509765625, -0.31146240234375, -0.1131591796875, 0.08514404296875, 0.283447265625, 0.48175048828125, 0.6800537109375, 0.87835693359375, 1.07666015625, 1.27496337890625, 1.4732666015625, 1.67156982421875, 1.869873046875, 2.06817626953125, 2.2664794921875, 2.46478271484375, 2.6630859375, 2.86138916015625, 3.0596923828125, 3.25799560546875, 3.456298828125, 3.65460205078125, 3.8529052734375, 4.05120849609375, 4.24951171875, 4.44781494140625, 4.6461181640625, 4.84442138671875, 5.042724609375, 5.24102783203125, 5.4393310546875, 5.63763427734375, 5.8359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 14.0, 25.0, 39.0, 72.0, 129.0, 243.0, 228.0, 109.0, 72.0, 29.0, 9.0, 5.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-258.89837646484375, -252.25265502929688, -245.60691833496094, -238.96119689941406, -232.31546020507812, -225.66973876953125, -219.02401733398438, -212.37828063964844, -205.7325439453125, -199.08682250976562, -192.4410858154297, -185.7953643798828, -179.14962768554688, -172.50390625, -165.85818481445312, -159.2124481201172, -152.5667266845703, -145.92100524902344, -139.2752685546875, -132.62954711914062, -125.98381042480469, -119.33808898925781, -112.6923599243164, -106.046630859375, -99.4009017944336, -92.75517272949219, -86.10944366455078, -79.46371459960938, -72.8179931640625, -66.17225646972656, -59.52653503417969, -52.88080596923828, -46.23509216308594, -39.58936309814453, -32.943634033203125, -26.297908782958984, -19.652179718017578, -13.006450653076172, -6.360725402832031, 0.285003662109375, 6.930732727050781, 13.576460838317871, 20.22218894958496, 26.867916107177734, 33.51364517211914, 40.15937423706055, 46.80509948730469, 53.450828552246094, 60.0965576171875, 66.7422866821289, 73.38801574707031, 80.03373718261719, 86.67947387695312, 93.3251953125, 99.9709243774414, 106.61665344238281, 113.26238250732422, 119.90811157226562, 126.55384063720703, 133.19956970214844, 139.8452911376953, 146.49102783203125, 153.13674926757812, 159.782470703125, 166.42820739746094]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 7.0, 7.0, 10.0, 8.0, 14.0, 17.0, 11.0, 14.0, 19.0, 13.0, 16.0, 26.0, 38.0, 33.0, 27.0, 36.0, 45.0, 71.0, 78.0, 58.0, 49.0, 62.0, 67.0, 33.0, 23.0, 26.0, 18.0, 29.0, 24.0, 18.0, 15.0, 15.0, 16.0, 11.0, 14.0, 6.0, 6.0, 6.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-117.03082275390625, -113.3010025024414, -109.5711898803711, -105.84136962890625, -102.11155700683594, -98.3817367553711, -94.65192413330078, -90.92210388183594, -87.19229125976562, -83.46247100830078, -79.73265838623047, -76.00283813476562, -72.27302551269531, -68.54320526123047, -64.81339263916016, -61.08357238769531, -57.353755950927734, -53.623939514160156, -49.89412307739258, -46.164306640625, -42.43449020385742, -38.704673767089844, -34.974853515625, -31.245038986206055, -27.515222549438477, -23.7854061126709, -20.05558967590332, -16.32577133178711, -12.595955848693848, -8.866138458251953, -5.136322021484375, -1.4065055847167969, 2.3233108520507812, 6.053127288818359, 9.782943725585938, 13.512761116027832, 17.242576599121094, 20.972394943237305, 24.702211380004883, 28.43202781677246, 32.161842346191406, 35.891658782958984, 39.62147521972656, 43.35129165649414, 47.08110809326172, 50.81092834472656, 54.540740966796875, 58.27056121826172, 62.0003776550293, 65.73019409179688, 69.46001434326172, 73.18982696533203, 76.91964721679688, 80.64945983886719, 84.37928009033203, 88.10909271240234, 91.83891296386719, 95.56873321533203, 99.29854583740234, 103.02836608886719, 106.7581787109375, 110.48799896240234, 114.21781158447266, 117.9476318359375, 121.67744445800781]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 6.0, 13.0, 13.0, 17.0, 25.0, 41.0, 52.0, 87.0, 134.0, 209.0, 342.0, 596.0, 838.0, 1606.0, 2914.0, 5839.0, 14725.0, 51398.0, 356489.0, 2506174.0, 1092607.0, 117750.0, 24605.0, 8588.0, 3909.0, 2059.0, 1182.0, 727.0, 427.0, 293.0, 182.0, 138.0, 86.0, 65.0, 37.0, 28.0, 19.0, 6.0, 13.0, 11.0, 5.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.3515625, -11.0048828125, -10.658203125, -10.3115234375, -9.96484375, -9.6181640625, -9.271484375, -8.9248046875, -8.578125, -8.2314453125, -7.884765625, -7.5380859375, -7.19140625, -6.8447265625, -6.498046875, -6.1513671875, -5.8046875, -5.4580078125, -5.111328125, -4.7646484375, -4.41796875, -4.0712890625, -3.724609375, -3.3779296875, -3.03125, -2.6845703125, -2.337890625, -1.9912109375, -1.64453125, -1.2978515625, -0.951171875, -0.6044921875, -0.2578125, 0.0888671875, 0.435546875, 0.7822265625, 1.12890625, 1.4755859375, 1.822265625, 2.1689453125, 2.515625, 2.8623046875, 3.208984375, 3.5556640625, 3.90234375, 4.2490234375, 4.595703125, 4.9423828125, 5.2890625, 5.6357421875, 5.982421875, 6.3291015625, 6.67578125, 7.0224609375, 7.369140625, 7.7158203125, 8.0625, 8.4091796875, 8.755859375, 9.1025390625, 9.44921875, 9.7958984375, 10.142578125, 10.4892578125, 10.8359375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 11.0, 15.0, 19.0, 20.0, 17.0, 33.0, 30.0, 44.0, 36.0, 47.0, 53.0, 39.0, 42.0, 67.0, 67.0, 53.0, 71.0, 49.0, 40.0, 34.0, 34.0, 36.0, 39.0, 24.0, 16.0, 12.0, 15.0, 6.0, 7.0, 10.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0689697265625, -8.786376953125, -8.5037841796875, -8.22119140625, -7.9385986328125, -7.656005859375, -7.3734130859375, -7.0908203125, -6.8082275390625, -6.525634765625, -6.2430419921875, -5.96044921875, -5.6778564453125, -5.395263671875, -5.1126708984375, -4.830078125, -4.5474853515625, -4.264892578125, -3.9822998046875, -3.69970703125, -3.4171142578125, -3.134521484375, -2.8519287109375, -2.5693359375, -2.2867431640625, -2.004150390625, -1.7215576171875, -1.43896484375, -1.1563720703125, -0.873779296875, -0.5911865234375, -0.30859375, -0.0260009765625, 0.256591796875, 0.5391845703125, 0.82177734375, 1.1043701171875, 1.386962890625, 1.6695556640625, 1.9521484375, 2.2347412109375, 2.517333984375, 2.7999267578125, 3.08251953125, 3.3651123046875, 3.647705078125, 3.9302978515625, 4.212890625, 4.4954833984375, 4.778076171875, 5.0606689453125, 5.34326171875, 5.6258544921875, 5.908447265625, 6.1910400390625, 6.4736328125, 6.7562255859375, 7.038818359375, 7.3214111328125, 7.60400390625, 7.8865966796875, 8.169189453125, 8.4517822265625, 8.734375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 5.0, 4.0, 3.0, 11.0, 6.0, 13.0, 19.0, 40.0, 40.0, 72.0, 143.0, 288.0, 610.0, 1606.0, 5166.0, 22748.0, 294840.0, 3725461.0, 121905.0, 15209.0, 3710.0, 1313.0, 547.0, 228.0, 124.0, 79.0, 34.0, 19.0, 10.0, 9.0, 3.0, 7.0, 6.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.625, -30.82177734375, -30.0185546875, -29.21533203125, -28.412109375, -27.60888671875, -26.8056640625, -26.00244140625, -25.19921875, -24.39599609375, -23.5927734375, -22.78955078125, -21.986328125, -21.18310546875, -20.3798828125, -19.57666015625, -18.7734375, -17.97021484375, -17.1669921875, -16.36376953125, -15.560546875, -14.75732421875, -13.9541015625, -13.15087890625, -12.34765625, -11.54443359375, -10.7412109375, -9.93798828125, -9.134765625, -8.33154296875, -7.5283203125, -6.72509765625, -5.921875, -5.11865234375, -4.3154296875, -3.51220703125, -2.708984375, -1.90576171875, -1.1025390625, -0.29931640625, 0.50390625, 1.30712890625, 2.1103515625, 2.91357421875, 3.716796875, 4.52001953125, 5.3232421875, 6.12646484375, 6.9296875, 7.73291015625, 8.5361328125, 9.33935546875, 10.142578125, 10.94580078125, 11.7490234375, 12.55224609375, 13.35546875, 14.15869140625, 14.9619140625, 15.76513671875, 16.568359375, 17.37158203125, 18.1748046875, 18.97802734375, 19.78125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 7.0, 12.0, 15.0, 25.0, 60.0, 76.0, 158.0, 317.0, 725.0, 1170.0, 789.0, 339.0, 163.0, 77.0, 41.0, 23.0, 21.0, 10.0, 7.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.28125, -30.4892578125, -29.697265625, -28.9052734375, -28.11328125, -27.3212890625, -26.529296875, -25.7373046875, -24.9453125, -24.1533203125, -23.361328125, -22.5693359375, -21.77734375, -20.9853515625, -20.193359375, -19.4013671875, -18.609375, -17.8173828125, -17.025390625, -16.2333984375, -15.44140625, -14.6494140625, -13.857421875, -13.0654296875, -12.2734375, -11.4814453125, -10.689453125, -9.8974609375, -9.10546875, -8.3134765625, -7.521484375, -6.7294921875, -5.9375, -5.1455078125, -4.353515625, -3.5615234375, -2.76953125, -1.9775390625, -1.185546875, -0.3935546875, 0.3984375, 1.1904296875, 1.982421875, 2.7744140625, 3.56640625, 4.3583984375, 5.150390625, 5.9423828125, 6.734375, 7.5263671875, 8.318359375, 9.1103515625, 9.90234375, 10.6943359375, 11.486328125, 12.2783203125, 13.0703125, 13.8623046875, 14.654296875, 15.4462890625, 16.23828125, 17.0302734375, 17.822265625, 18.6142578125, 19.40625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 13.0, 35.0, 95.0, 210.0, 283.0, 219.0, 81.0, 32.0, 8.0, 4.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.28248596191406, -126.15614318847656, -118.02980041503906, -109.90345764160156, -101.77711486816406, -93.65077209472656, -85.5244369506836, -77.3980941772461, -69.2717514038086, -61.145408630371094, -53.019065856933594, -44.89272689819336, -36.76638412475586, -28.64004135131836, -20.513702392578125, -12.387359619140625, -4.261016845703125, 3.8653249740600586, 11.991666793823242, 20.11800765991211, 28.24435043334961, 36.37069320678711, 44.497032165527344, 52.623374938964844, 60.749717712402344, 68.87606048583984, 77.00240325927734, 85.12873840332031, 93.25508117675781, 101.38142395019531, 109.50776672363281, 117.63410949707031, 125.76046752929688, 133.88681030273438, 142.01315307617188, 150.13949584960938, 158.26583862304688, 166.39218139648438, 174.51852416992188, 182.64486694335938, 190.77120971679688, 198.89755249023438, 207.02389526367188, 215.15023803710938, 223.27658081054688, 231.40292358398438, 239.52926635742188, 247.65560913085938, 255.7819366455078, 263.90826416015625, 272.03460693359375, 280.16094970703125, 288.28729248046875, 296.41363525390625, 304.53997802734375, 312.66632080078125, 320.79266357421875, 328.91900634765625, 337.04534912109375, 345.17169189453125, 353.29803466796875, 361.42437744140625, 369.55072021484375, 377.67706298828125, 385.80340576171875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 4.0, 13.0, 19.0, 21.0, 25.0, 26.0, 26.0, 36.0, 32.0, 39.0, 38.0, 41.0, 46.0, 50.0, 44.0, 48.0, 58.0, 52.0, 41.0, 40.0, 46.0, 40.0, 28.0, 20.0, 24.0, 26.0, 13.0, 12.0, 17.0, 14.0, 11.0, 3.0, 6.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-81.655029296875, -79.3887710571289, -77.12251281738281, -74.85626220703125, -72.59000396728516, -70.32374572753906, -68.05748748779297, -65.79122924804688, -63.52497482299805, -61.25871658325195, -58.992462158203125, -56.72620391845703, -54.45994567871094, -52.19369125366211, -49.927433013916016, -47.66117858886719, -45.394920349121094, -43.128662109375, -40.86240768432617, -38.59614944458008, -36.32989501953125, -34.063636779785156, -31.797378540039062, -29.5311222076416, -27.26486587524414, -24.99860954284668, -22.73235321044922, -20.466094970703125, -18.199838638305664, -15.933582305908203, -13.667325019836426, -11.401067733764648, -9.134807586669922, -6.868550777435303, -4.602293968200684, -2.3360371589660645, -0.06978034973144531, 2.1964759826660156, 4.462733268737793, 6.72899055480957, 8.995246887207031, 11.261503219604492, 13.52776050567627, 15.794017791748047, 18.060274124145508, 20.32653045654297, 22.592788696289062, 24.859045028686523, 27.125301361083984, 29.391557693481445, 31.657814025878906, 33.924072265625, 36.190330505371094, 38.45658493041992, 40.722843170166016, 42.989097595214844, 45.25535583496094, 47.52161407470703, 49.78786849975586, 52.05412673950195, 54.32038116455078, 56.586639404296875, 58.85289764404297, 61.11915588378906, 63.38541030883789]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 11.0, 10.0, 27.0, 48.0, 66.0, 97.0, 176.0, 285.0, 523.0, 909.0, 1756.0, 3431.0, 7393.0, 16771.0, 42912.0, 120397.0, 305338.0, 327572.0, 137274.0, 48565.0, 18891.0, 8021.0, 3801.0, 1911.0, 1051.0, 538.0, 336.0, 169.0, 106.0, 60.0, 37.0, 20.0, 16.0, 10.0, 4.0, 8.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0703125, -10.7354736328125, -10.400634765625, -10.0657958984375, -9.73095703125, -9.3961181640625, -9.061279296875, -8.7264404296875, -8.3916015625, -8.0567626953125, -7.721923828125, -7.3870849609375, -7.05224609375, -6.7174072265625, -6.382568359375, -6.0477294921875, -5.712890625, -5.3780517578125, -5.043212890625, -4.7083740234375, -4.37353515625, -4.0386962890625, -3.703857421875, -3.3690185546875, -3.0341796875, -2.6993408203125, -2.364501953125, -2.0296630859375, -1.69482421875, -1.3599853515625, -1.025146484375, -0.6903076171875, -0.35546875, -0.0206298828125, 0.314208984375, 0.6490478515625, 0.98388671875, 1.3187255859375, 1.653564453125, 1.9884033203125, 2.3232421875, 2.6580810546875, 2.992919921875, 3.3277587890625, 3.66259765625, 3.9974365234375, 4.332275390625, 4.6671142578125, 5.001953125, 5.3367919921875, 5.671630859375, 6.0064697265625, 6.34130859375, 6.6761474609375, 7.010986328125, 7.3458251953125, 7.6806640625, 8.0155029296875, 8.350341796875, 8.6851806640625, 9.02001953125, 9.3548583984375, 9.689697265625, 10.0245361328125, 10.359375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 10.0, 15.0, 9.0, 13.0, 19.0, 17.0, 24.0, 25.0, 36.0, 38.0, 38.0, 46.0, 65.0, 54.0, 58.0, 51.0, 63.0, 50.0, 56.0, 64.0, 46.0, 25.0, 35.0, 21.0, 24.0, 16.0, 14.0, 16.0, 12.0, 9.0, 10.0, 10.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3984375, -9.117919921875, -8.83740234375, -8.556884765625, -8.2763671875, -7.995849609375, -7.71533203125, -7.434814453125, -7.154296875, -6.873779296875, -6.59326171875, -6.312744140625, -6.0322265625, -5.751708984375, -5.47119140625, -5.190673828125, -4.91015625, -4.629638671875, -4.34912109375, -4.068603515625, -3.7880859375, -3.507568359375, -3.22705078125, -2.946533203125, -2.666015625, -2.385498046875, -2.10498046875, -1.824462890625, -1.5439453125, -1.263427734375, -0.98291015625, -0.702392578125, -0.421875, -0.141357421875, 0.13916015625, 0.419677734375, 0.7001953125, 0.980712890625, 1.26123046875, 1.541748046875, 1.822265625, 2.102783203125, 2.38330078125, 2.663818359375, 2.9443359375, 3.224853515625, 3.50537109375, 3.785888671875, 4.06640625, 4.346923828125, 4.62744140625, 4.907958984375, 5.1884765625, 5.468994140625, 5.74951171875, 6.030029296875, 6.310546875, 6.591064453125, 6.87158203125, 7.152099609375, 7.4326171875, 7.713134765625, 7.99365234375, 8.274169921875, 8.5546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 8.0, 15.0, 21.0, 36.0, 37.0, 67.0, 108.0, 192.0, 445.0, 1062.0, 2841.0, 10910.0, 64164.0, 674427.0, 254628.0, 29921.0, 6290.0, 1859.0, 716.0, 326.0, 189.0, 90.0, 64.0, 39.0, 33.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.738525390625, -19.99267578125, -19.246826171875, -18.5009765625, -17.755126953125, -17.00927734375, -16.263427734375, -15.517578125, -14.771728515625, -14.02587890625, -13.280029296875, -12.5341796875, -11.788330078125, -11.04248046875, -10.296630859375, -9.55078125, -8.804931640625, -8.05908203125, -7.313232421875, -6.5673828125, -5.821533203125, -5.07568359375, -4.329833984375, -3.583984375, -2.838134765625, -2.09228515625, -1.346435546875, -0.6005859375, 0.145263671875, 0.89111328125, 1.636962890625, 2.3828125, 3.128662109375, 3.87451171875, 4.620361328125, 5.3662109375, 6.112060546875, 6.85791015625, 7.603759765625, 8.349609375, 9.095458984375, 9.84130859375, 10.587158203125, 11.3330078125, 12.078857421875, 12.82470703125, 13.570556640625, 14.31640625, 15.062255859375, 15.80810546875, 16.553955078125, 17.2998046875, 18.045654296875, 18.79150390625, 19.537353515625, 20.283203125, 21.029052734375, 21.77490234375, 22.520751953125, 23.2666015625, 24.012451171875, 24.75830078125, 25.504150390625, 26.25]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 6.0, 8.0, 14.0, 20.0, 15.0, 40.0, 35.0, 37.0, 55.0, 45.0, 64.0, 57.0, 61.0, 70.0, 56.0, 61.0, 52.0, 51.0, 46.0, 27.0, 45.0, 26.0, 23.0, 20.0, 17.0, 12.0, 7.0, 5.0, 5.0, 9.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.546875, -30.484619140625, -29.42236328125, -28.360107421875, -27.2978515625, -26.235595703125, -25.17333984375, -24.111083984375, -23.048828125, -21.986572265625, -20.92431640625, -19.862060546875, -18.7998046875, -17.737548828125, -16.67529296875, -15.613037109375, -14.55078125, -13.488525390625, -12.42626953125, -11.364013671875, -10.3017578125, -9.239501953125, -8.17724609375, -7.114990234375, -6.052734375, -4.990478515625, -3.92822265625, -2.865966796875, -1.8037109375, -0.741455078125, 0.32080078125, 1.383056640625, 2.4453125, 3.507568359375, 4.56982421875, 5.632080078125, 6.6943359375, 7.756591796875, 8.81884765625, 9.881103515625, 10.943359375, 12.005615234375, 13.06787109375, 14.130126953125, 15.1923828125, 16.254638671875, 17.31689453125, 18.379150390625, 19.44140625, 20.503662109375, 21.56591796875, 22.628173828125, 23.6904296875, 24.752685546875, 25.81494140625, 26.877197265625, 27.939453125, 29.001708984375, 30.06396484375, 31.126220703125, 32.1884765625, 33.250732421875, 34.31298828125, 35.375244140625, 36.4375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 10.0, 5.0, 11.0, 21.0, 27.0, 44.0, 71.0, 91.0, 194.0, 356.0, 792.0, 1686.0, 4264.0, 11410.0, 37192.0, 150402.0, 618754.0, 163025.0, 39941.0, 12299.0, 4352.0, 1836.0, 809.0, 418.0, 195.0, 102.0, 81.0, 36.0, 21.0, 21.0, 14.0, 12.0, 6.0, 9.0, 7.0, 9.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.95703125, -4.8175048828125, -4.677978515625, -4.5384521484375, -4.39892578125, -4.2593994140625, -4.119873046875, -3.9803466796875, -3.8408203125, -3.7012939453125, -3.561767578125, -3.4222412109375, -3.28271484375, -3.1431884765625, -3.003662109375, -2.8641357421875, -2.724609375, -2.5850830078125, -2.445556640625, -2.3060302734375, -2.16650390625, -2.0269775390625, -1.887451171875, -1.7479248046875, -1.6083984375, -1.4688720703125, -1.329345703125, -1.1898193359375, -1.05029296875, -0.9107666015625, -0.771240234375, -0.6317138671875, -0.4921875, -0.3526611328125, -0.213134765625, -0.0736083984375, 0.06591796875, 0.2054443359375, 0.344970703125, 0.4844970703125, 0.6240234375, 0.7635498046875, 0.903076171875, 1.0426025390625, 1.18212890625, 1.3216552734375, 1.461181640625, 1.6007080078125, 1.740234375, 1.8797607421875, 2.019287109375, 2.1588134765625, 2.29833984375, 2.4378662109375, 2.577392578125, 2.7169189453125, 2.8564453125, 2.9959716796875, 3.135498046875, 3.2750244140625, 3.41455078125, 3.5540771484375, 3.693603515625, 3.8331298828125, 3.97265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 15.0, 40.0, 40.0, 72.0, 121.0, 182.0, 158.0, 129.0, 84.0, 42.0, 31.0, 13.0, 10.0, 7.0, 3.0, 7.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020465850830078125, -0.0019785165786743164, -0.0019104480743408203, -0.0018423795700073242, -0.0017743110656738281, -0.001706242561340332, -0.001638174057006836, -0.0015701055526733398, -0.0015020370483398438, -0.0014339685440063477, -0.0013659000396728516, -0.0012978315353393555, -0.0012297630310058594, -0.0011616945266723633, -0.0010936260223388672, -0.001025557518005371, -0.000957489013671875, -0.0008894205093383789, -0.0008213520050048828, -0.0007532835006713867, -0.0006852149963378906, -0.0006171464920043945, -0.0005490779876708984, -0.00048100948333740234, -0.00041294097900390625, -0.00034487247467041016, -0.00027680397033691406, -0.00020873546600341797, -0.00014066696166992188, -7.259845733642578e-05, -4.5299530029296875e-06, 6.35385513305664e-05, 0.0001316070556640625, 0.0001996755599975586, 0.0002677440643310547, 0.0003358125686645508, 0.0004038810729980469, 0.00047194957733154297, 0.0005400180816650391, 0.0006080865859985352, 0.0006761550903320312, 0.0007442235946655273, 0.0008122920989990234, 0.0008803606033325195, 0.0009484291076660156, 0.0010164976119995117, 0.0010845661163330078, 0.001152634620666504, 0.001220703125, 0.001288771629333496, 0.0013568401336669922, 0.0014249086380004883, 0.0014929771423339844, 0.0015610456466674805, 0.0016291141510009766, 0.0016971826553344727, 0.0017652511596679688, 0.0018333196640014648, 0.001901388168334961, 0.001969456672668457, 0.002037525177001953, 0.0021055936813354492, 0.0021736621856689453, 0.0022417306900024414, 0.0023097991943359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 10.0, 17.0, 19.0, 19.0, 21.0, 43.0, 86.0, 125.0, 210.0, 387.0, 680.0, 1472.0, 3288.0, 8444.0, 25513.0, 89178.0, 477685.0, 321155.0, 82327.0, 23733.0, 7965.0, 3135.0, 1472.0, 685.0, 322.0, 198.0, 123.0, 89.0, 42.0, 33.0, 23.0, 12.0, 14.0, 5.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3046875, -4.1700439453125, -4.035400390625, -3.9007568359375, -3.76611328125, -3.6314697265625, -3.496826171875, -3.3621826171875, -3.2275390625, -3.0928955078125, -2.958251953125, -2.8236083984375, -2.68896484375, -2.5543212890625, -2.419677734375, -2.2850341796875, -2.150390625, -2.0157470703125, -1.881103515625, -1.7464599609375, -1.61181640625, -1.4771728515625, -1.342529296875, -1.2078857421875, -1.0732421875, -0.9385986328125, -0.803955078125, -0.6693115234375, -0.53466796875, -0.4000244140625, -0.265380859375, -0.1307373046875, 0.00390625, 0.1385498046875, 0.273193359375, 0.4078369140625, 0.54248046875, 0.6771240234375, 0.811767578125, 0.9464111328125, 1.0810546875, 1.2156982421875, 1.350341796875, 1.4849853515625, 1.61962890625, 1.7542724609375, 1.888916015625, 2.0235595703125, 2.158203125, 2.2928466796875, 2.427490234375, 2.5621337890625, 2.69677734375, 2.8314208984375, 2.966064453125, 3.1007080078125, 3.2353515625, 3.3699951171875, 3.504638671875, 3.6392822265625, 3.77392578125, 3.9085693359375, 4.043212890625, 4.1778564453125, 4.3125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 5.0, 7.0, 9.0, 14.0, 16.0, 20.0, 20.0, 46.0, 55.0, 76.0, 84.0, 97.0, 102.0, 116.0, 80.0, 63.0, 52.0, 43.0, 25.0, 20.0, 18.0, 11.0, 8.0, 8.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.97308349609375, -5.7821044921875, -5.59112548828125, -5.400146484375, -5.20916748046875, -5.0181884765625, -4.82720947265625, -4.63623046875, -4.44525146484375, -4.2542724609375, -4.06329345703125, -3.872314453125, -3.68133544921875, -3.4903564453125, -3.29937744140625, -3.1083984375, -2.91741943359375, -2.7264404296875, -2.53546142578125, -2.344482421875, -2.15350341796875, -1.9625244140625, -1.77154541015625, -1.58056640625, -1.38958740234375, -1.1986083984375, -1.00762939453125, -0.816650390625, -0.62567138671875, -0.4346923828125, -0.24371337890625, -0.052734375, 0.13824462890625, 0.3292236328125, 0.52020263671875, 0.711181640625, 0.90216064453125, 1.0931396484375, 1.28411865234375, 1.47509765625, 1.66607666015625, 1.8570556640625, 2.04803466796875, 2.239013671875, 2.42999267578125, 2.6209716796875, 2.81195068359375, 3.0029296875, 3.19390869140625, 3.3848876953125, 3.57586669921875, 3.766845703125, 3.95782470703125, 4.1488037109375, 4.33978271484375, 4.53076171875, 4.72174072265625, 4.9127197265625, 5.10369873046875, 5.294677734375, 5.48565673828125, 5.6766357421875, 5.86761474609375, 6.05859375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 7.0, 8.0, 17.0, 39.0, 54.0, 94.0, 162.0, 245.0, 149.0, 92.0, 54.0, 33.0, 22.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-186.63433837890625, -182.4351043701172, -178.23587036132812, -174.03663635253906, -169.83740234375, -165.63818359375, -161.43894958496094, -157.23971557617188, -153.0404815673828, -148.84124755859375, -144.6420135498047, -140.44277954101562, -136.24356079101562, -132.04432678222656, -127.8450927734375, -123.64585876464844, -119.44662475585938, -115.24739074707031, -111.04815673828125, -106.84893035888672, -102.64969635009766, -98.4504623413086, -94.25123596191406, -90.052001953125, -85.85276794433594, -81.65353393554688, -77.45429992675781, -73.25507354736328, -69.05583953857422, -64.85660552978516, -60.65737533569336, -56.45814514160156, -52.25889587402344, -48.059661865234375, -43.86043167114258, -39.66120147705078, -35.46196746826172, -31.26273536682129, -27.06350326538086, -22.86427116394043, -18.6650390625, -14.46580696105957, -10.26657485961914, -6.067342758178711, -1.8681106567382812, 2.3311214447021484, 6.530353546142578, 10.729585647583008, 14.928817749023438, 19.128049850463867, 23.327281951904297, 27.526514053344727, 31.725746154785156, 35.92498016357422, 40.124210357666016, 44.32344055175781, 48.522674560546875, 52.72190856933594, 56.921138763427734, 61.12036895751953, 65.3196029663086, 69.51883697509766, 73.71806335449219, 77.91729736328125, 82.11653137207031]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 7.0, 3.0, 5.0, 4.0, 5.0, 10.0, 8.0, 13.0, 16.0, 17.0, 13.0, 28.0, 32.0, 36.0, 23.0, 36.0, 48.0, 59.0, 78.0, 82.0, 80.0, 60.0, 40.0, 36.0, 36.0, 34.0, 34.0, 28.0, 28.0, 14.0, 16.0, 17.0, 13.0, 10.0, 10.0, 4.0, 7.0, 6.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.71212005615234, -97.30599975585938, -93.8998794555664, -90.49375915527344, -87.08763122558594, -83.6815185546875, -80.275390625, -76.86927032470703, -73.46315002441406, -70.0570297241211, -66.65090942382812, -63.24478530883789, -59.83866500854492, -56.43254470825195, -53.02642059326172, -49.62030029296875, -46.21417999267578, -42.80805969238281, -39.401939392089844, -35.99581527709961, -32.58969497680664, -29.183574676513672, -25.77745246887207, -22.37133026123047, -18.9652099609375, -15.559088706970215, -12.15296745300293, -8.746846199035645, -5.340724945068359, -1.9346046447753906, 1.471517562866211, 4.8776397705078125, 8.283767700195312, 11.689888954162598, 15.096010208129883, 18.502132415771484, 21.908252716064453, 25.314373016357422, 28.720495223999023, 32.126617431640625, 35.532737731933594, 38.93885803222656, 42.34497833251953, 45.751102447509766, 49.157222747802734, 52.5633430480957, 55.96946716308594, 59.375587463378906, 62.781707763671875, 66.18782806396484, 69.59394836425781, 73.00006866455078, 76.40618896484375, 79.81231689453125, 83.21843719482422, 86.62455749511719, 90.03067779541016, 93.43679809570312, 96.8429183959961, 100.24903869628906, 103.65516662597656, 107.061279296875, 110.4674072265625, 113.87352752685547, 117.27964782714844]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 6.0, 8.0, 16.0, 21.0, 24.0, 31.0, 64.0, 71.0, 100.0, 154.0, 241.0, 369.0, 580.0, 933.0, 1605.0, 3020.0, 6119.0, 13948.0, 40644.0, 158466.0, 719975.0, 2028410.0, 939753.0, 200943.0, 48460.0, 15652.0, 6740.0, 3284.0, 1796.0, 916.0, 651.0, 399.0, 273.0, 146.0, 128.0, 90.0, 57.0, 43.0, 37.0, 24.0, 21.0, 15.0, 12.0, 7.0, 1.0, 5.0, 7.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.9375, -6.7030029296875, -6.468505859375, -6.2340087890625, -5.99951171875, -5.7650146484375, -5.530517578125, -5.2960205078125, -5.0615234375, -4.8270263671875, -4.592529296875, -4.3580322265625, -4.12353515625, -3.8890380859375, -3.654541015625, -3.4200439453125, -3.185546875, -2.9510498046875, -2.716552734375, -2.4820556640625, -2.24755859375, -2.0130615234375, -1.778564453125, -1.5440673828125, -1.3095703125, -1.0750732421875, -0.840576171875, -0.6060791015625, -0.37158203125, -0.1370849609375, 0.097412109375, 0.3319091796875, 0.56640625, 0.8009033203125, 1.035400390625, 1.2698974609375, 1.50439453125, 1.7388916015625, 1.973388671875, 2.2078857421875, 2.4423828125, 2.6768798828125, 2.911376953125, 3.1458740234375, 3.38037109375, 3.6148681640625, 3.849365234375, 4.0838623046875, 4.318359375, 4.5528564453125, 4.787353515625, 5.0218505859375, 5.25634765625, 5.4908447265625, 5.725341796875, 5.9598388671875, 6.1943359375, 6.4288330078125, 6.663330078125, 6.8978271484375, 7.13232421875, 7.3668212890625, 7.601318359375, 7.8358154296875, 8.0703125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 14.0, 10.0, 15.0, 26.0, 32.0, 20.0, 41.0, 45.0, 37.0, 55.0, 49.0, 59.0, 66.0, 65.0, 62.0, 42.0, 39.0, 47.0, 56.0, 34.0, 35.0, 28.0, 28.0, 26.0, 7.0, 14.0, 11.0, 5.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.46875, -9.1864013671875, -8.904052734375, -8.6217041015625, -8.33935546875, -8.0570068359375, -7.774658203125, -7.4923095703125, -7.2099609375, -6.9276123046875, -6.645263671875, -6.3629150390625, -6.08056640625, -5.7982177734375, -5.515869140625, -5.2335205078125, -4.951171875, -4.6688232421875, -4.386474609375, -4.1041259765625, -3.82177734375, -3.5394287109375, -3.257080078125, -2.9747314453125, -2.6923828125, -2.4100341796875, -2.127685546875, -1.8453369140625, -1.56298828125, -1.2806396484375, -0.998291015625, -0.7159423828125, -0.43359375, -0.1512451171875, 0.131103515625, 0.4134521484375, 0.69580078125, 0.9781494140625, 1.260498046875, 1.5428466796875, 1.8251953125, 2.1075439453125, 2.389892578125, 2.6722412109375, 2.95458984375, 3.2369384765625, 3.519287109375, 3.8016357421875, 4.083984375, 4.3663330078125, 4.648681640625, 4.9310302734375, 5.21337890625, 5.4957275390625, 5.778076171875, 6.0604248046875, 6.3427734375, 6.6251220703125, 6.907470703125, 7.1898193359375, 7.47216796875, 7.7545166015625, 8.036865234375, 8.3192138671875, 8.6015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 4.0, 7.0, 2.0, 9.0, 7.0, 15.0, 21.0, 29.0, 36.0, 66.0, 85.0, 179.0, 389.0, 987.0, 3573.0, 19038.0, 269286.0, 3714934.0, 166110.0, 14939.0, 3001.0, 784.0, 342.0, 175.0, 99.0, 41.0, 39.0, 20.0, 21.0, 10.0, 8.0, 7.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.515625, -23.82373046875, -23.1318359375, -22.43994140625, -21.748046875, -21.05615234375, -20.3642578125, -19.67236328125, -18.98046875, -18.28857421875, -17.5966796875, -16.90478515625, -16.212890625, -15.52099609375, -14.8291015625, -14.13720703125, -13.4453125, -12.75341796875, -12.0615234375, -11.36962890625, -10.677734375, -9.98583984375, -9.2939453125, -8.60205078125, -7.91015625, -7.21826171875, -6.5263671875, -5.83447265625, -5.142578125, -4.45068359375, -3.7587890625, -3.06689453125, -2.375, -1.68310546875, -0.9912109375, -0.29931640625, 0.392578125, 1.08447265625, 1.7763671875, 2.46826171875, 3.16015625, 3.85205078125, 4.5439453125, 5.23583984375, 5.927734375, 6.61962890625, 7.3115234375, 8.00341796875, 8.6953125, 9.38720703125, 10.0791015625, 10.77099609375, 11.462890625, 12.15478515625, 12.8466796875, 13.53857421875, 14.23046875, 14.92236328125, 15.6142578125, 16.30615234375, 16.998046875, 17.68994140625, 18.3818359375, 19.07373046875, 19.765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 3.0, 6.0, 9.0, 6.0, 12.0, 21.0, 20.0, 22.0, 51.0, 62.0, 104.0, 176.0, 262.0, 437.0, 608.0, 737.0, 549.0, 328.0, 217.0, 133.0, 110.0, 63.0, 37.0, 26.0, 17.0, 10.0, 12.0, 7.0, 8.0, 7.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.125, -12.642578125, -12.16015625, -11.677734375, -11.1953125, -10.712890625, -10.23046875, -9.748046875, -9.265625, -8.783203125, -8.30078125, -7.818359375, -7.3359375, -6.853515625, -6.37109375, -5.888671875, -5.40625, -4.923828125, -4.44140625, -3.958984375, -3.4765625, -2.994140625, -2.51171875, -2.029296875, -1.546875, -1.064453125, -0.58203125, -0.099609375, 0.3828125, 0.865234375, 1.34765625, 1.830078125, 2.3125, 2.794921875, 3.27734375, 3.759765625, 4.2421875, 4.724609375, 5.20703125, 5.689453125, 6.171875, 6.654296875, 7.13671875, 7.619140625, 8.1015625, 8.583984375, 9.06640625, 9.548828125, 10.03125, 10.513671875, 10.99609375, 11.478515625, 11.9609375, 12.443359375, 12.92578125, 13.408203125, 13.890625, 14.373046875, 14.85546875, 15.337890625, 15.8203125, 16.302734375, 16.78515625, 17.267578125, 17.75]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 28.0, 48.0, 118.0, 198.0, 211.0, 168.0, 117.0, 52.0, 18.0, 15.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-202.45848083496094, -197.18507385253906, -191.9116668701172, -186.6382598876953, -181.36485290527344, -176.09144592285156, -170.8180389404297, -165.54464721679688, -160.271240234375, -154.99783325195312, -149.72442626953125, -144.45101928710938, -139.1776123046875, -133.90420532226562, -128.63079833984375, -123.3573989868164, -118.083984375, -112.81057739257812, -107.53717041015625, -102.26376342773438, -96.9903564453125, -91.71694946289062, -86.44355010986328, -81.1701431274414, -75.89673614501953, -70.62332916259766, -65.34992218017578, -60.07651901245117, -54.8031120300293, -49.52970504760742, -44.25630187988281, -38.98289489746094, -33.70948791503906, -28.436080932617188, -23.162675857543945, -17.889270782470703, -12.615863800048828, -7.342456817626953, -2.069051742553711, 3.2043533325195312, 8.477760314941406, 13.751166343688965, 19.024572372436523, 24.297977447509766, 29.57138442993164, 34.844791412353516, 40.118194580078125, 45.3916015625, 50.665008544921875, 55.93841552734375, 61.211822509765625, 66.4852294921875, 71.75863647460938, 77.03204345703125, 82.3054428100586, 87.57884979248047, 92.85225677490234, 98.12566375732422, 103.3990707397461, 108.67247772216797, 113.94587707519531, 119.21928405761719, 124.49269104003906, 129.76609802246094, 135.0395050048828]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 9.0, 14.0, 12.0, 13.0, 5.0, 10.0, 15.0, 19.0, 19.0, 22.0, 32.0, 37.0, 25.0, 38.0, 38.0, 45.0, 46.0, 37.0, 35.0, 47.0, 46.0, 46.0, 49.0, 36.0, 35.0, 43.0, 36.0, 27.0, 25.0, 20.0, 23.0, 10.0, 16.0, 12.0, 7.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.35954284667969, -58.442535400390625, -56.5255241394043, -54.608516693115234, -52.691505432128906, -50.774497985839844, -48.85749053955078, -46.94047927856445, -45.02347183227539, -43.10646438598633, -41.189453125, -39.27244567871094, -37.35543441772461, -35.43842697143555, -33.52141571044922, -31.604408264160156, -29.68739891052246, -27.770389556884766, -25.85338020324707, -23.936370849609375, -22.019363403320312, -20.102354049682617, -18.185344696044922, -16.26833724975586, -14.351326942443848, -12.434317588806152, -10.517309188842773, -8.600299835205078, -6.683290958404541, -4.766282081604004, -2.8492727279663086, -0.9322643280029297, 0.9847450256347656, 2.9017539024353027, 4.81876277923584, 6.735772132873535, 8.652780532836914, 10.56978988647461, 12.486799240112305, 14.403807640075684, 16.320816040039062, 18.237825393676758, 20.154834747314453, 22.071842193603516, 23.98885154724121, 25.905860900878906, 27.8228702545166, 29.739879608154297, 31.656888961791992, 33.57389831542969, 35.49090576171875, 37.40791702270508, 39.32492446899414, 41.24193572998047, 43.15894317626953, 45.075950622558594, 46.99296188354492, 48.909969329833984, 50.82698059082031, 52.743988037109375, 54.6609992980957, 56.578006744384766, 58.495018005371094, 60.412025451660156, 62.32903289794922]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 12.0, 9.0, 11.0, 24.0, 33.0, 51.0, 73.0, 120.0, 196.0, 304.0, 538.0, 959.0, 1805.0, 3726.0, 8510.0, 20422.0, 53131.0, 147753.0, 355475.0, 284496.0, 104991.0, 38155.0, 15028.0, 6465.0, 2908.0, 1465.0, 745.0, 396.0, 257.0, 156.0, 115.0, 71.0, 46.0, 28.0, 23.0, 13.0, 12.0, 7.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7265625, -9.4210205078125, -9.115478515625, -8.8099365234375, -8.50439453125, -8.1988525390625, -7.893310546875, -7.5877685546875, -7.2822265625, -6.9766845703125, -6.671142578125, -6.3656005859375, -6.06005859375, -5.7545166015625, -5.448974609375, -5.1434326171875, -4.837890625, -4.5323486328125, -4.226806640625, -3.9212646484375, -3.61572265625, -3.3101806640625, -3.004638671875, -2.6990966796875, -2.3935546875, -2.0880126953125, -1.782470703125, -1.4769287109375, -1.17138671875, -0.8658447265625, -0.560302734375, -0.2547607421875, 0.05078125, 0.3563232421875, 0.661865234375, 0.9674072265625, 1.27294921875, 1.5784912109375, 1.884033203125, 2.1895751953125, 2.4951171875, 2.8006591796875, 3.106201171875, 3.4117431640625, 3.71728515625, 4.0228271484375, 4.328369140625, 4.6339111328125, 4.939453125, 5.2449951171875, 5.550537109375, 5.8560791015625, 6.16162109375, 6.4671630859375, 6.772705078125, 7.0782470703125, 7.3837890625, 7.6893310546875, 7.994873046875, 8.3004150390625, 8.60595703125, 8.9114990234375, 9.217041015625, 9.5225830078125, 9.828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 3.0, 2.0, 10.0, 5.0, 9.0, 12.0, 21.0, 28.0, 26.0, 32.0, 47.0, 38.0, 44.0, 44.0, 44.0, 59.0, 61.0, 62.0, 59.0, 49.0, 42.0, 50.0, 44.0, 43.0, 28.0, 22.0, 26.0, 18.0, 17.0, 16.0, 13.0, 10.0, 2.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.34375, -9.0635986328125, -8.783447265625, -8.5032958984375, -8.22314453125, -7.9429931640625, -7.662841796875, -7.3826904296875, -7.1025390625, -6.8223876953125, -6.542236328125, -6.2620849609375, -5.98193359375, -5.7017822265625, -5.421630859375, -5.1414794921875, -4.861328125, -4.5811767578125, -4.301025390625, -4.0208740234375, -3.74072265625, -3.4605712890625, -3.180419921875, -2.9002685546875, -2.6201171875, -2.3399658203125, -2.059814453125, -1.7796630859375, -1.49951171875, -1.2193603515625, -0.939208984375, -0.6590576171875, -0.37890625, -0.0987548828125, 0.181396484375, 0.4615478515625, 0.74169921875, 1.0218505859375, 1.302001953125, 1.5821533203125, 1.8623046875, 2.1424560546875, 2.422607421875, 2.7027587890625, 2.98291015625, 3.2630615234375, 3.543212890625, 3.8233642578125, 4.103515625, 4.3836669921875, 4.663818359375, 4.9439697265625, 5.22412109375, 5.5042724609375, 5.784423828125, 6.0645751953125, 6.3447265625, 6.6248779296875, 6.905029296875, 7.1851806640625, 7.46533203125, 7.7454833984375, 8.025634765625, 8.3057861328125, 8.5859375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 7.0, 7.0, 12.0, 13.0, 24.0, 27.0, 26.0, 54.0, 62.0, 95.0, 115.0, 157.0, 255.0, 393.0, 648.0, 1249.0, 2850.0, 8355.0, 32536.0, 190092.0, 693059.0, 89739.0, 18566.0, 5460.0, 2080.0, 989.0, 562.0, 306.0, 234.0, 146.0, 125.0, 79.0, 59.0, 44.0, 37.0, 22.0, 17.0, 13.0, 9.0, 10.0, 9.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.640625, -16.091552734375, -15.54248046875, -14.993408203125, -14.4443359375, -13.895263671875, -13.34619140625, -12.797119140625, -12.248046875, -11.698974609375, -11.14990234375, -10.600830078125, -10.0517578125, -9.502685546875, -8.95361328125, -8.404541015625, -7.85546875, -7.306396484375, -6.75732421875, -6.208251953125, -5.6591796875, -5.110107421875, -4.56103515625, -4.011962890625, -3.462890625, -2.913818359375, -2.36474609375, -1.815673828125, -1.2666015625, -0.717529296875, -0.16845703125, 0.380615234375, 0.9296875, 1.478759765625, 2.02783203125, 2.576904296875, 3.1259765625, 3.675048828125, 4.22412109375, 4.773193359375, 5.322265625, 5.871337890625, 6.42041015625, 6.969482421875, 7.5185546875, 8.067626953125, 8.61669921875, 9.165771484375, 9.71484375, 10.263916015625, 10.81298828125, 11.362060546875, 11.9111328125, 12.460205078125, 13.00927734375, 13.558349609375, 14.107421875, 14.656494140625, 15.20556640625, 15.754638671875, 16.3037109375, 16.852783203125, 17.40185546875, 17.950927734375, 18.5]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 3.0, 8.0, 8.0, 10.0, 10.0, 12.0, 26.0, 14.0, 29.0, 34.0, 27.0, 35.0, 32.0, 50.0, 42.0, 46.0, 51.0, 60.0, 42.0, 51.0, 57.0, 49.0, 41.0, 39.0, 40.0, 19.0, 20.0, 28.0, 19.0, 14.0, 11.0, 10.0, 8.0, 11.0, 9.0, 6.0, 2.0, 2.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-27.453125, -26.60791015625, -25.7626953125, -24.91748046875, -24.072265625, -23.22705078125, -22.3818359375, -21.53662109375, -20.69140625, -19.84619140625, -19.0009765625, -18.15576171875, -17.310546875, -16.46533203125, -15.6201171875, -14.77490234375, -13.9296875, -13.08447265625, -12.2392578125, -11.39404296875, -10.548828125, -9.70361328125, -8.8583984375, -8.01318359375, -7.16796875, -6.32275390625, -5.4775390625, -4.63232421875, -3.787109375, -2.94189453125, -2.0966796875, -1.25146484375, -0.40625, 0.43896484375, 1.2841796875, 2.12939453125, 2.974609375, 3.81982421875, 4.6650390625, 5.51025390625, 6.35546875, 7.20068359375, 8.0458984375, 8.89111328125, 9.736328125, 10.58154296875, 11.4267578125, 12.27197265625, 13.1171875, 13.96240234375, 14.8076171875, 15.65283203125, 16.498046875, 17.34326171875, 18.1884765625, 19.03369140625, 19.87890625, 20.72412109375, 21.5693359375, 22.41455078125, 23.259765625, 24.10498046875, 24.9501953125, 25.79541015625, 26.640625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 9.0, 14.0, 13.0, 24.0, 34.0, 40.0, 55.0, 102.0, 173.0, 309.0, 515.0, 994.0, 2159.0, 5141.0, 14299.0, 47284.0, 274060.0, 611300.0, 63014.0, 17587.0, 6234.0, 2643.0, 1169.0, 578.0, 302.0, 169.0, 96.0, 70.0, 51.0, 27.0, 18.0, 15.0, 5.0, 5.0, 8.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.11328125, -3.971923828125, -3.83056640625, -3.689208984375, -3.5478515625, -3.406494140625, -3.26513671875, -3.123779296875, -2.982421875, -2.841064453125, -2.69970703125, -2.558349609375, -2.4169921875, -2.275634765625, -2.13427734375, -1.992919921875, -1.8515625, -1.710205078125, -1.56884765625, -1.427490234375, -1.2861328125, -1.144775390625, -1.00341796875, -0.862060546875, -0.720703125, -0.579345703125, -0.43798828125, -0.296630859375, -0.1552734375, -0.013916015625, 0.12744140625, 0.268798828125, 0.41015625, 0.551513671875, 0.69287109375, 0.834228515625, 0.9755859375, 1.116943359375, 1.25830078125, 1.399658203125, 1.541015625, 1.682373046875, 1.82373046875, 1.965087890625, 2.1064453125, 2.247802734375, 2.38916015625, 2.530517578125, 2.671875, 2.813232421875, 2.95458984375, 3.095947265625, 3.2373046875, 3.378662109375, 3.52001953125, 3.661376953125, 3.802734375, 3.944091796875, 4.08544921875, 4.226806640625, 4.3681640625, 4.509521484375, 4.65087890625, 4.792236328125, 4.93359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 8.0, 7.0, 7.0, 6.0, 13.0, 18.0, 24.0, 35.0, 66.0, 62.0, 117.0, 141.0, 154.0, 87.0, 65.0, 43.0, 28.0, 21.0, 19.0, 16.0, 10.0, 9.0, 5.0, 7.0, 6.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015840530395507812, -0.0015386193990707397, -0.0014931857585906982, -0.0014477521181106567, -0.0014023184776306152, -0.0013568848371505737, -0.0013114511966705322, -0.0012660175561904907, -0.0012205839157104492, -0.0011751502752304077, -0.0011297166347503662, -0.0010842829942703247, -0.0010388493537902832, -0.0009934157133102417, -0.0009479820728302002, -0.0009025484323501587, -0.0008571147918701172, -0.0008116811513900757, -0.0007662475109100342, -0.0007208138704299927, -0.0006753802299499512, -0.0006299465894699097, -0.0005845129489898682, -0.0005390793085098267, -0.0004936456680297852, -0.00044821202754974365, -0.00040277838706970215, -0.00035734474658966064, -0.00031191110610961914, -0.00026647746562957764, -0.00022104382514953613, -0.00017561018466949463, -0.00013017654418945312, -8.474290370941162e-05, -3.930926322937012e-05, 6.124377250671387e-06, 5.155801773071289e-05, 9.69916582107544e-05, 0.0001424252986907959, 0.0001878589391708374, 0.0002332925796508789, 0.0002787262201309204, 0.0003241598606109619, 0.0003695935010910034, 0.0004150271415710449, 0.0004604607820510864, 0.0005058944225311279, 0.0005513280630111694, 0.0005967617034912109, 0.0006421953439712524, 0.0006876289844512939, 0.0007330626249313354, 0.000778496265411377, 0.0008239299058914185, 0.00086936354637146, 0.0009147971868515015, 0.000960230827331543, 0.0010056644678115845, 0.001051098108291626, 0.0010965317487716675, 0.001141965389251709, 0.0011873990297317505, 0.001232832670211792, 0.0012782663106918335, 0.001323699951171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 5.0, 9.0, 13.0, 14.0, 23.0, 36.0, 49.0, 57.0, 103.0, 158.0, 266.0, 396.0, 760.0, 1556.0, 3337.0, 8129.0, 23589.0, 86725.0, 648448.0, 206486.0, 44417.0, 13965.0, 5256.0, 2260.0, 991.0, 589.0, 344.0, 193.0, 111.0, 72.0, 50.0, 36.0, 25.0, 18.0, 12.0, 14.0, 8.0, 3.0, 10.0, 5.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.10546875, -3.97198486328125, -3.8385009765625, -3.70501708984375, -3.571533203125, -3.43804931640625, -3.3045654296875, -3.17108154296875, -3.03759765625, -2.90411376953125, -2.7706298828125, -2.63714599609375, -2.503662109375, -2.37017822265625, -2.2366943359375, -2.10321044921875, -1.9697265625, -1.83624267578125, -1.7027587890625, -1.56927490234375, -1.435791015625, -1.30230712890625, -1.1688232421875, -1.03533935546875, -0.90185546875, -0.76837158203125, -0.6348876953125, -0.50140380859375, -0.367919921875, -0.23443603515625, -0.1009521484375, 0.03253173828125, 0.166015625, 0.29949951171875, 0.4329833984375, 0.56646728515625, 0.699951171875, 0.83343505859375, 0.9669189453125, 1.10040283203125, 1.23388671875, 1.36737060546875, 1.5008544921875, 1.63433837890625, 1.767822265625, 1.90130615234375, 2.0347900390625, 2.16827392578125, 2.3017578125, 2.43524169921875, 2.5687255859375, 2.70220947265625, 2.835693359375, 2.96917724609375, 3.1026611328125, 3.23614501953125, 3.36962890625, 3.50311279296875, 3.6365966796875, 3.77008056640625, 3.903564453125, 4.03704833984375, 4.1705322265625, 4.30401611328125, 4.4375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 10.0, 6.0, 15.0, 10.0, 21.0, 12.0, 23.0, 39.0, 40.0, 59.0, 86.0, 114.0, 112.0, 98.0, 99.0, 65.0, 42.0, 35.0, 22.0, 19.0, 12.0, 10.0, 12.0, 10.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.89453125, -5.71942138671875, -5.5443115234375, -5.36920166015625, -5.194091796875, -5.01898193359375, -4.8438720703125, -4.66876220703125, -4.49365234375, -4.31854248046875, -4.1434326171875, -3.96832275390625, -3.793212890625, -3.61810302734375, -3.4429931640625, -3.26788330078125, -3.0927734375, -2.91766357421875, -2.7425537109375, -2.56744384765625, -2.392333984375, -2.21722412109375, -2.0421142578125, -1.86700439453125, -1.69189453125, -1.51678466796875, -1.3416748046875, -1.16656494140625, -0.991455078125, -0.81634521484375, -0.6412353515625, -0.46612548828125, -0.291015625, -0.11590576171875, 0.0592041015625, 0.23431396484375, 0.409423828125, 0.58453369140625, 0.7596435546875, 0.93475341796875, 1.10986328125, 1.28497314453125, 1.4600830078125, 1.63519287109375, 1.810302734375, 1.98541259765625, 2.1605224609375, 2.33563232421875, 2.5107421875, 2.68585205078125, 2.8609619140625, 3.03607177734375, 3.211181640625, 3.38629150390625, 3.5614013671875, 3.73651123046875, 3.91162109375, 4.08673095703125, 4.2618408203125, 4.43695068359375, 4.612060546875, 4.78717041015625, 4.9622802734375, 5.13739013671875, 5.3125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 17.0, 36.0, 75.0, 138.0, 327.0, 182.0, 91.0, 52.0, 22.0, 16.0, 7.0, 2.0, 0.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-226.6300506591797, -221.7748565673828, -216.91964721679688, -212.064453125, -207.20925903320312, -202.35406494140625, -197.49887084960938, -192.64366149902344, -187.78846740722656, -182.9332733154297, -178.07806396484375, -173.22286987304688, -168.36767578125, -163.51248168945312, -158.65728759765625, -153.8020782470703, -148.94688415527344, -144.09169006347656, -139.23648071289062, -134.38128662109375, -129.52609252929688, -124.6708984375, -119.8156967163086, -114.96049499511719, -110.10530090332031, -105.25010681152344, -100.39490509033203, -95.53970336914062, -90.68450927734375, -85.82931518554688, -80.97411346435547, -76.11891174316406, -71.26371002197266, -66.40850830078125, -61.553314208984375, -56.698116302490234, -51.842918395996094, -46.98772048950195, -42.13252258300781, -37.27732467651367, -32.42212677001953, -27.56692886352539, -22.71173095703125, -17.85653305053711, -13.001335144042969, -8.146137237548828, -3.2909393310546875, 1.5642585754394531, 6.419456481933594, 11.274654388427734, 16.129852294921875, 20.985050201416016, 25.840248107910156, 30.695446014404297, 35.55064392089844, 40.40584182739258, 45.26103973388672, 50.11623764038086, 54.971435546875, 59.82663345336914, 64.68183135986328, 69.53703308105469, 74.39222717285156, 79.24742126464844, 84.10262298583984]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 11.0, 12.0, 5.0, 15.0, 16.0, 17.0, 21.0, 22.0, 27.0, 35.0, 41.0, 50.0, 45.0, 82.0, 100.0, 103.0, 72.0, 42.0, 47.0, 32.0, 31.0, 29.0, 17.0, 15.0, 20.0, 13.0, 11.0, 7.0, 14.0, 10.0, 8.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-136.49073791503906, -132.78094482421875, -129.07113647460938, -125.36134338378906, -121.65154266357422, -117.94174194335938, -114.23194885253906, -110.52214813232422, -106.81234741210938, -103.10254669189453, -99.39275360107422, -95.68295288085938, -91.97315216064453, -88.26335144042969, -84.55355834960938, -80.84375762939453, -77.13395690917969, -73.42415618896484, -69.71436309814453, -66.00456237792969, -62.294761657714844, -58.584964752197266, -54.87516784667969, -51.165367126464844, -47.45557403564453, -43.74577713012695, -40.03597640991211, -36.32617950439453, -32.61637878417969, -28.90658187866211, -25.1967830657959, -21.486984252929688, -17.777183532714844, -14.067384719848633, -10.357585906982422, -6.647788047790527, -2.9379892349243164, 0.7718086242675781, 4.481607437133789, 8.19140625, 11.901205062866211, 15.611003875732422, 19.320802688598633, 23.030601501464844, 26.740398406982422, 30.450197219848633, 34.159996032714844, 37.86979675292969, 41.579593658447266, 45.289390563964844, 48.99919128417969, 52.708988189697266, 56.41878890991211, 60.12858581542969, 63.83838653564453, 67.54818725585938, 71.25798034667969, 74.96778106689453, 78.67757415771484, 82.38737487792969, 86.09717559814453, 89.80697631835938, 93.51676940917969, 97.22657012939453, 100.93637084960938]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 2.0, 6.0, 8.0, 12.0, 17.0, 18.0, 28.0, 51.0, 60.0, 95.0, 147.0, 198.0, 284.0, 503.0, 777.0, 1271.0, 2440.0, 5682.0, 14637.0, 50989.0, 245215.0, 1301696.0, 1999037.0, 451983.0, 82330.0, 21774.0, 7607.0, 3237.0, 1589.0, 966.0, 523.0, 366.0, 241.0, 148.0, 98.0, 79.0, 42.0, 24.0, 30.0, 20.0, 10.0, 11.0, 9.0, 9.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-8.1171875, -7.8389892578125, -7.560791015625, -7.2825927734375, -7.00439453125, -6.7261962890625, -6.447998046875, -6.1697998046875, -5.8916015625, -5.6134033203125, -5.335205078125, -5.0570068359375, -4.77880859375, -4.5006103515625, -4.222412109375, -3.9442138671875, -3.666015625, -3.3878173828125, -3.109619140625, -2.8314208984375, -2.55322265625, -2.2750244140625, -1.996826171875, -1.7186279296875, -1.4404296875, -1.1622314453125, -0.884033203125, -0.6058349609375, -0.32763671875, -0.0494384765625, 0.228759765625, 0.5069580078125, 0.78515625, 1.0633544921875, 1.341552734375, 1.6197509765625, 1.89794921875, 2.1761474609375, 2.454345703125, 2.7325439453125, 3.0107421875, 3.2889404296875, 3.567138671875, 3.8453369140625, 4.12353515625, 4.4017333984375, 4.679931640625, 4.9581298828125, 5.236328125, 5.5145263671875, 5.792724609375, 6.0709228515625, 6.34912109375, 6.6273193359375, 6.905517578125, 7.1837158203125, 7.4619140625, 7.7401123046875, 8.018310546875, 8.2965087890625, 8.57470703125, 8.8529052734375, 9.131103515625, 9.4093017578125, 9.6875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 8.0, 25.0, 23.0, 29.0, 31.0, 41.0, 45.0, 47.0, 54.0, 48.0, 45.0, 50.0, 60.0, 70.0, 53.0, 51.0, 45.0, 46.0, 44.0, 29.0, 20.0, 25.0, 20.0, 17.0, 19.0, 10.0, 7.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3515625, -9.0726318359375, -8.793701171875, -8.5147705078125, -8.23583984375, -7.9569091796875, -7.677978515625, -7.3990478515625, -7.1201171875, -6.8411865234375, -6.562255859375, -6.2833251953125, -6.00439453125, -5.7254638671875, -5.446533203125, -5.1676025390625, -4.888671875, -4.6097412109375, -4.330810546875, -4.0518798828125, -3.77294921875, -3.4940185546875, -3.215087890625, -2.9361572265625, -2.6572265625, -2.3782958984375, -2.099365234375, -1.8204345703125, -1.54150390625, -1.2625732421875, -0.983642578125, -0.7047119140625, -0.42578125, -0.1468505859375, 0.132080078125, 0.4110107421875, 0.68994140625, 0.9688720703125, 1.247802734375, 1.5267333984375, 1.8056640625, 2.0845947265625, 2.363525390625, 2.6424560546875, 2.92138671875, 3.2003173828125, 3.479248046875, 3.7581787109375, 4.037109375, 4.3160400390625, 4.594970703125, 4.8739013671875, 5.15283203125, 5.4317626953125, 5.710693359375, 5.9896240234375, 6.2685546875, 6.5474853515625, 6.826416015625, 7.1053466796875, 7.38427734375, 7.6632080078125, 7.942138671875, 8.2210693359375, 8.5]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 11.0, 10.0, 13.0, 16.0, 28.0, 37.0, 48.0, 97.0, 163.0, 361.0, 807.0, 2546.0, 13247.0, 197194.0, 3823638.0, 141040.0, 11211.0, 2298.0, 714.0, 376.0, 172.0, 96.0, 54.0, 37.0, 22.0, 17.0, 14.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.953125, -21.181640625, -20.41015625, -19.638671875, -18.8671875, -18.095703125, -17.32421875, -16.552734375, -15.78125, -15.009765625, -14.23828125, -13.466796875, -12.6953125, -11.923828125, -11.15234375, -10.380859375, -9.609375, -8.837890625, -8.06640625, -7.294921875, -6.5234375, -5.751953125, -4.98046875, -4.208984375, -3.4375, -2.666015625, -1.89453125, -1.123046875, -0.3515625, 0.419921875, 1.19140625, 1.962890625, 2.734375, 3.505859375, 4.27734375, 5.048828125, 5.8203125, 6.591796875, 7.36328125, 8.134765625, 8.90625, 9.677734375, 10.44921875, 11.220703125, 11.9921875, 12.763671875, 13.53515625, 14.306640625, 15.078125, 15.849609375, 16.62109375, 17.392578125, 18.1640625, 18.935546875, 19.70703125, 20.478515625, 21.25, 22.021484375, 22.79296875, 23.564453125, 24.3359375, 25.107421875, 25.87890625, 26.650390625, 27.421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 15.0, 14.0, 31.0, 38.0, 85.0, 132.0, 242.0, 416.0, 704.0, 863.0, 659.0, 372.0, 185.0, 100.0, 58.0, 51.0, 23.0, 21.0, 19.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.074462890625, -23.43017578125, -22.785888671875, -22.1416015625, -21.497314453125, -20.85302734375, -20.208740234375, -19.564453125, -18.920166015625, -18.27587890625, -17.631591796875, -16.9873046875, -16.343017578125, -15.69873046875, -15.054443359375, -14.41015625, -13.765869140625, -13.12158203125, -12.477294921875, -11.8330078125, -11.188720703125, -10.54443359375, -9.900146484375, -9.255859375, -8.611572265625, -7.96728515625, -7.322998046875, -6.6787109375, -6.034423828125, -5.39013671875, -4.745849609375, -4.1015625, -3.457275390625, -2.81298828125, -2.168701171875, -1.5244140625, -0.880126953125, -0.23583984375, 0.408447265625, 1.052734375, 1.697021484375, 2.34130859375, 2.985595703125, 3.6298828125, 4.274169921875, 4.91845703125, 5.562744140625, 6.20703125, 6.851318359375, 7.49560546875, 8.139892578125, 8.7841796875, 9.428466796875, 10.07275390625, 10.717041015625, 11.361328125, 12.005615234375, 12.64990234375, 13.294189453125, 13.9384765625, 14.582763671875, 15.22705078125, 15.871337890625, 16.515625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 9.0, 7.0, 10.0, 34.0, 53.0, 139.0, 249.0, 226.0, 144.0, 76.0, 29.0, 10.0, 10.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.17324829101562, -157.8883056640625, -151.60337829589844, -145.3184356689453, -139.03350830078125, -132.74856567382812, -126.463623046875, -120.1786880493164, -113.89375305175781, -107.60881805419922, -101.32388305664062, -95.0389404296875, -88.7540054321289, -82.46907043457031, -76.18412780761719, -69.8991928100586, -63.6142578125, -57.329322814941406, -51.04438400268555, -44.75944519042969, -38.474510192871094, -32.1895751953125, -25.90463638305664, -19.61969757080078, -13.334762573242188, -7.049825668334961, -0.7648887634277344, 5.520048141479492, 11.804985046386719, 18.089921951293945, 24.374858856201172, 30.65979766845703, 36.94474792480469, 43.22968292236328, 49.51462173461914, 55.799560546875, 62.084495544433594, 68.36943054199219, 74.65437316894531, 80.9393081665039, 87.2242431640625, 93.5091781616211, 99.79411315917969, 106.07905578613281, 112.3639907836914, 118.64892578125, 124.93386840820312, 131.21881103515625, 137.5037384033203, 143.78868103027344, 150.0736083984375, 156.35855102539062, 162.64349365234375, 168.9284210205078, 175.21336364746094, 181.498291015625, 187.78323364257812, 194.06817626953125, 200.3531036376953, 206.63804626464844, 212.9229736328125, 219.20791625976562, 225.49285888671875, 231.77780151367188, 238.06272888183594]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 6.0, 7.0, 13.0, 8.0, 14.0, 12.0, 11.0, 13.0, 18.0, 24.0, 25.0, 39.0, 16.0, 29.0, 40.0, 40.0, 44.0, 70.0, 69.0, 59.0, 66.0, 44.0, 35.0, 45.0, 34.0, 28.0, 26.0, 23.0, 19.0, 19.0, 16.0, 24.0, 12.0, 14.0, 13.0, 7.0, 6.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-62.90861892700195, -60.680538177490234, -58.45246124267578, -56.22438049316406, -53.996299743652344, -51.768218994140625, -49.540138244628906, -47.31206130981445, -45.083980560302734, -42.855899810791016, -40.62782287597656, -38.399742126464844, -36.171661376953125, -33.943580627441406, -31.71550178527832, -29.487422943115234, -27.259342193603516, -25.031261444091797, -22.80318260192871, -20.575103759765625, -18.347023010253906, -16.118942260742188, -13.890863418579102, -11.6627836227417, -9.434703826904297, -7.2066240310668945, -4.978544235229492, -2.75046443939209, -0.5223846435546875, 1.7056951522827148, 3.933774948120117, 6.1618547439575195, 8.389930725097656, 10.618010520935059, 12.846090316772461, 15.074170112609863, 17.302249908447266, 19.530330657958984, 21.75840950012207, 23.986488342285156, 26.214569091796875, 28.442649841308594, 30.67072868347168, 32.898807525634766, 35.126888275146484, 37.3549690246582, 39.583045959472656, 41.811126708984375, 44.039207458496094, 46.26728820800781, 48.49536895751953, 50.723445892333984, 52.9515266418457, 55.17960739135742, 57.407684326171875, 59.635765075683594, 61.86384582519531, 64.09192657470703, 66.32000732421875, 68.54808807373047, 70.77616882324219, 73.00424194335938, 75.2323226928711, 77.46040344238281, 79.68848419189453]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 1.0, 9.0, 9.0, 13.0, 25.0, 28.0, 48.0, 64.0, 117.0, 175.0, 263.0, 460.0, 773.0, 1595.0, 2848.0, 5855.0, 12275.0, 27993.0, 67971.0, 182314.0, 380960.0, 221138.0, 82149.0, 33008.0, 14371.0, 6691.0, 3455.0, 1706.0, 930.0, 509.0, 326.0, 173.0, 102.0, 61.0, 46.0, 34.0, 19.0, 11.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.51708984375, -9.2060546875, -8.89501953125, -8.583984375, -8.27294921875, -7.9619140625, -7.65087890625, -7.33984375, -7.02880859375, -6.7177734375, -6.40673828125, -6.095703125, -5.78466796875, -5.4736328125, -5.16259765625, -4.8515625, -4.54052734375, -4.2294921875, -3.91845703125, -3.607421875, -3.29638671875, -2.9853515625, -2.67431640625, -2.36328125, -2.05224609375, -1.7412109375, -1.43017578125, -1.119140625, -0.80810546875, -0.4970703125, -0.18603515625, 0.125, 0.43603515625, 0.7470703125, 1.05810546875, 1.369140625, 1.68017578125, 1.9912109375, 2.30224609375, 2.61328125, 2.92431640625, 3.2353515625, 3.54638671875, 3.857421875, 4.16845703125, 4.4794921875, 4.79052734375, 5.1015625, 5.41259765625, 5.7236328125, 6.03466796875, 6.345703125, 6.65673828125, 6.9677734375, 7.27880859375, 7.58984375, 7.90087890625, 8.2119140625, 8.52294921875, 8.833984375, 9.14501953125, 9.4560546875, 9.76708984375, 10.078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 9.0, 17.0, 14.0, 22.0, 33.0, 41.0, 37.0, 40.0, 46.0, 48.0, 39.0, 44.0, 63.0, 54.0, 49.0, 65.0, 54.0, 43.0, 47.0, 36.0, 30.0, 24.0, 25.0, 18.0, 15.0, 13.0, 12.0, 12.0, 9.0, 10.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375, -9.09716796875, -8.8193359375, -8.54150390625, -8.263671875, -7.98583984375, -7.7080078125, -7.43017578125, -7.15234375, -6.87451171875, -6.5966796875, -6.31884765625, -6.041015625, -5.76318359375, -5.4853515625, -5.20751953125, -4.9296875, -4.65185546875, -4.3740234375, -4.09619140625, -3.818359375, -3.54052734375, -3.2626953125, -2.98486328125, -2.70703125, -2.42919921875, -2.1513671875, -1.87353515625, -1.595703125, -1.31787109375, -1.0400390625, -0.76220703125, -0.484375, -0.20654296875, 0.0712890625, 0.34912109375, 0.626953125, 0.90478515625, 1.1826171875, 1.46044921875, 1.73828125, 2.01611328125, 2.2939453125, 2.57177734375, 2.849609375, 3.12744140625, 3.4052734375, 3.68310546875, 3.9609375, 4.23876953125, 4.5166015625, 4.79443359375, 5.072265625, 5.35009765625, 5.6279296875, 5.90576171875, 6.18359375, 6.46142578125, 6.7392578125, 7.01708984375, 7.294921875, 7.57275390625, 7.8505859375, 8.12841796875, 8.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 7.0, 3.0, 9.0, 18.0, 28.0, 45.0, 47.0, 62.0, 64.0, 150.0, 187.0, 272.0, 450.0, 675.0, 1218.0, 2337.0, 5994.0, 23962.0, 168678.0, 757221.0, 66455.0, 12537.0, 3890.0, 1687.0, 935.0, 568.0, 332.0, 232.0, 134.0, 112.0, 65.0, 44.0, 42.0, 24.0, 20.0, 11.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.65234375, -19.9921875, -19.33203125, -18.671875, -18.01171875, -17.3515625, -16.69140625, -16.03125, -15.37109375, -14.7109375, -14.05078125, -13.390625, -12.73046875, -12.0703125, -11.41015625, -10.75, -10.08984375, -9.4296875, -8.76953125, -8.109375, -7.44921875, -6.7890625, -6.12890625, -5.46875, -4.80859375, -4.1484375, -3.48828125, -2.828125, -2.16796875, -1.5078125, -0.84765625, -0.1875, 0.47265625, 1.1328125, 1.79296875, 2.453125, 3.11328125, 3.7734375, 4.43359375, 5.09375, 5.75390625, 6.4140625, 7.07421875, 7.734375, 8.39453125, 9.0546875, 9.71484375, 10.375, 11.03515625, 11.6953125, 12.35546875, 13.015625, 13.67578125, 14.3359375, 14.99609375, 15.65625, 16.31640625, 16.9765625, 17.63671875, 18.296875, 18.95703125, 19.6171875, 20.27734375, 20.9375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 2.0, 1.0, 6.0, 5.0, 10.0, 17.0, 16.0, 20.0, 24.0, 28.0, 25.0, 28.0, 51.0, 47.0, 53.0, 63.0, 82.0, 71.0, 50.0, 67.0, 60.0, 40.0, 44.0, 40.0, 34.0, 26.0, 20.0, 17.0, 11.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -36.35205078125, -35.2353515625, -34.11865234375, -33.001953125, -31.88525390625, -30.7685546875, -29.65185546875, -28.53515625, -27.41845703125, -26.3017578125, -25.18505859375, -24.068359375, -22.95166015625, -21.8349609375, -20.71826171875, -19.6015625, -18.48486328125, -17.3681640625, -16.25146484375, -15.134765625, -14.01806640625, -12.9013671875, -11.78466796875, -10.66796875, -9.55126953125, -8.4345703125, -7.31787109375, -6.201171875, -5.08447265625, -3.9677734375, -2.85107421875, -1.734375, -0.61767578125, 0.4990234375, 1.61572265625, 2.732421875, 3.84912109375, 4.9658203125, 6.08251953125, 7.19921875, 8.31591796875, 9.4326171875, 10.54931640625, 11.666015625, 12.78271484375, 13.8994140625, 15.01611328125, 16.1328125, 17.24951171875, 18.3662109375, 19.48291015625, 20.599609375, 21.71630859375, 22.8330078125, 23.94970703125, 25.06640625, 26.18310546875, 27.2998046875, 28.41650390625, 29.533203125, 30.64990234375, 31.7666015625, 32.88330078125, 34.0]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 12.0, 6.0, 12.0, 25.0, 18.0, 45.0, 93.0, 162.0, 347.0, 780.0, 2268.0, 9506.0, 79436.0, 878019.0, 65720.0, 8550.0, 2085.0, 716.0, 330.0, 165.0, 85.0, 56.0, 31.0, 16.0, 10.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 7.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.7578125, -7.53271484375, -7.3076171875, -7.08251953125, -6.857421875, -6.63232421875, -6.4072265625, -6.18212890625, -5.95703125, -5.73193359375, -5.5068359375, -5.28173828125, -5.056640625, -4.83154296875, -4.6064453125, -4.38134765625, -4.15625, -3.93115234375, -3.7060546875, -3.48095703125, -3.255859375, -3.03076171875, -2.8056640625, -2.58056640625, -2.35546875, -2.13037109375, -1.9052734375, -1.68017578125, -1.455078125, -1.22998046875, -1.0048828125, -0.77978515625, -0.5546875, -0.32958984375, -0.1044921875, 0.12060546875, 0.345703125, 0.57080078125, 0.7958984375, 1.02099609375, 1.24609375, 1.47119140625, 1.6962890625, 1.92138671875, 2.146484375, 2.37158203125, 2.5966796875, 2.82177734375, 3.046875, 3.27197265625, 3.4970703125, 3.72216796875, 3.947265625, 4.17236328125, 4.3974609375, 4.62255859375, 4.84765625, 5.07275390625, 5.2978515625, 5.52294921875, 5.748046875, 5.97314453125, 6.1982421875, 6.42333984375, 6.6484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 11.0, 13.0, 23.0, 39.0, 31.0, 53.0, 96.0, 175.0, 185.0, 111.0, 63.0, 44.0, 25.0, 21.0, 17.0, 9.0, 7.0, 13.0, 11.0, 6.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001689910888671875, -0.001631706953048706, -0.0015735030174255371, -0.0015152990818023682, -0.0014570951461791992, -0.0013988912105560303, -0.0013406872749328613, -0.0012824833393096924, -0.0012242794036865234, -0.0011660754680633545, -0.0011078715324401855, -0.0010496675968170166, -0.0009914636611938477, -0.0009332597255706787, -0.0008750557899475098, -0.0008168518543243408, -0.0007586479187011719, -0.0007004439830780029, -0.000642240047454834, -0.000584036111831665, -0.0005258321762084961, -0.00046762824058532715, -0.0004094243049621582, -0.00035122036933898926, -0.0002930164337158203, -0.00023481249809265137, -0.00017660856246948242, -0.00011840462684631348, -6.020069122314453e-05, -1.996755599975586e-06, 5.620718002319336e-05, 0.0001144111156463623, 0.00017261505126953125, 0.0002308189868927002, 0.00028902292251586914, 0.0003472268581390381, 0.00040543079376220703, 0.000463634729385376, 0.0005218386650085449, 0.0005800426006317139, 0.0006382465362548828, 0.0006964504718780518, 0.0007546544075012207, 0.0008128583431243896, 0.0008710622787475586, 0.0009292662143707275, 0.0009874701499938965, 0.0010456740856170654, 0.0011038780212402344, 0.0011620819568634033, 0.0012202858924865723, 0.0012784898281097412, 0.0013366937637329102, 0.001394897699356079, 0.001453101634979248, 0.001511305570602417, 0.001569509506225586, 0.0016277134418487549, 0.0016859173774719238, 0.0017441213130950928, 0.0018023252487182617, 0.0018605291843414307, 0.0019187331199645996, 0.0019769370555877686, 0.0020351409912109375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 16.0, 10.0, 16.0, 22.0, 40.0, 55.0, 103.0, 151.0, 272.0, 490.0, 1077.0, 2327.0, 6338.0, 23367.0, 147471.0, 766412.0, 77313.0, 14931.0, 4484.0, 1734.0, 810.0, 455.0, 228.0, 153.0, 69.0, 67.0, 40.0, 19.0, 14.0, 17.0, 10.0, 3.0, 9.0, 4.0, 1.0, 9.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.882080078125, -4.72119140625, -4.560302734375, -4.3994140625, -4.238525390625, -4.07763671875, -3.916748046875, -3.755859375, -3.594970703125, -3.43408203125, -3.273193359375, -3.1123046875, -2.951416015625, -2.79052734375, -2.629638671875, -2.46875, -2.307861328125, -2.14697265625, -1.986083984375, -1.8251953125, -1.664306640625, -1.50341796875, -1.342529296875, -1.181640625, -1.020751953125, -0.85986328125, -0.698974609375, -0.5380859375, -0.377197265625, -0.21630859375, -0.055419921875, 0.10546875, 0.266357421875, 0.42724609375, 0.588134765625, 0.7490234375, 0.909912109375, 1.07080078125, 1.231689453125, 1.392578125, 1.553466796875, 1.71435546875, 1.875244140625, 2.0361328125, 2.197021484375, 2.35791015625, 2.518798828125, 2.6796875, 2.840576171875, 3.00146484375, 3.162353515625, 3.3232421875, 3.484130859375, 3.64501953125, 3.805908203125, 3.966796875, 4.127685546875, 4.28857421875, 4.449462890625, 4.6103515625, 4.771240234375, 4.93212890625, 5.093017578125, 5.25390625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 9.0, 16.0, 18.0, 30.0, 41.0, 51.0, 65.0, 122.0, 148.0, 131.0, 83.0, 73.0, 56.0, 45.0, 30.0, 17.0, 11.0, 10.0, 6.0, 4.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.66796875, -6.4825439453125, -6.297119140625, -6.1116943359375, -5.92626953125, -5.7408447265625, -5.555419921875, -5.3699951171875, -5.1845703125, -4.9991455078125, -4.813720703125, -4.6282958984375, -4.44287109375, -4.2574462890625, -4.072021484375, -3.8865966796875, -3.701171875, -3.5157470703125, -3.330322265625, -3.1448974609375, -2.95947265625, -2.7740478515625, -2.588623046875, -2.4031982421875, -2.2177734375, -2.0323486328125, -1.846923828125, -1.6614990234375, -1.47607421875, -1.2906494140625, -1.105224609375, -0.9197998046875, -0.734375, -0.5489501953125, -0.363525390625, -0.1781005859375, 0.00732421875, 0.1927490234375, 0.378173828125, 0.5635986328125, 0.7490234375, 0.9344482421875, 1.119873046875, 1.3052978515625, 1.49072265625, 1.6761474609375, 1.861572265625, 2.0469970703125, 2.232421875, 2.4178466796875, 2.603271484375, 2.7886962890625, 2.97412109375, 3.1595458984375, 3.344970703125, 3.5303955078125, 3.7158203125, 3.9012451171875, 4.086669921875, 4.2720947265625, 4.45751953125, 4.6429443359375, 4.828369140625, 5.0137939453125, 5.19921875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 7.0, 15.0, 55.0, 171.0, 480.0, 172.0, 62.0, 23.0, 6.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-420.51397705078125, -411.8282165527344, -403.1424865722656, -394.45672607421875, -385.77099609375, -377.0852355957031, -368.3995056152344, -359.7137451171875, -351.02801513671875, -342.3422546386719, -333.6565246582031, -324.97076416015625, -316.2850341796875, -307.5992736816406, -298.9135437011719, -290.227783203125, -281.5420227050781, -272.85626220703125, -264.1705322265625, -255.4847869873047, -246.79904174804688, -238.11328125, -229.4275360107422, -220.74179077148438, -212.05604553222656, -203.37030029296875, -194.68455505371094, -185.99880981445312, -177.31304931640625, -168.6273193359375, -159.94155883789062, -151.2558135986328, -142.57008361816406, -133.88433837890625, -125.19859313964844, -116.5128402709961, -107.82709503173828, -99.14134979248047, -90.45559692382812, -81.76985168457031, -73.0841064453125, -64.39836120605469, -55.71261215209961, -47.02686309814453, -38.34111785888672, -29.655372619628906, -20.969623565673828, -12.28387451171875, -3.5981292724609375, 5.087617874145508, 13.773365020751953, 22.4591121673584, 31.144859313964844, 39.830604553222656, 48.516353607177734, 57.20210266113281, 65.88784790039062, 74.57359313964844, 83.25933837890625, 91.9450912475586, 100.6308364868164, 109.31658172607422, 118.00233459472656, 126.68807983398438, 135.3738250732422]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 11.0, 13.0, 10.0, 18.0, 10.0, 15.0, 13.0, 16.0, 13.0, 29.0, 35.0, 39.0, 41.0, 49.0, 101.0, 114.0, 121.0, 63.0, 53.0, 39.0, 21.0, 29.0, 24.0, 15.0, 20.0, 14.0, 7.0, 15.0, 12.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-118.04840087890625, -114.33404541015625, -110.61968231201172, -106.90532684326172, -103.19097137451172, -99.47660827636719, -95.76225280761719, -92.04789733886719, -88.33353424072266, -84.61917877197266, -80.90481567382812, -77.19046020507812, -73.47610473632812, -69.7617416381836, -66.0473861694336, -62.33302688598633, -58.61867141723633, -54.90431213378906, -51.18995666503906, -47.4755973815918, -43.76123809814453, -40.04688262939453, -36.332523345947266, -32.6181640625, -28.903806686401367, -25.189449310302734, -21.47509002685547, -17.760732650756836, -14.046374320983887, -10.332015991210938, -6.617658615112305, -2.903299331665039, 0.8110580444335938, 4.525416374206543, 8.239774703979492, 11.954132080078125, 15.668490409851074, 19.382848739624023, 23.097206115722656, 26.811565399169922, 30.525922775268555, 34.24028015136719, 37.95463943481445, 41.66899871826172, 45.38335418701172, 49.097713470458984, 52.81207275390625, 56.52642822265625, 60.240787506103516, 63.95514678955078, 67.66950225830078, 71.38386535644531, 75.09822082519531, 78.81257629394531, 82.52693176269531, 86.24129486083984, 89.95565032958984, 93.67000579833984, 97.38436889648438, 101.09872436523438, 104.81307983398438, 108.5274429321289, 112.2417984008789, 115.95616149902344, 119.67051696777344]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 9.0, 6.0, 12.0, 9.0, 18.0, 27.0, 37.0, 65.0, 103.0, 177.0, 373.0, 842.0, 1965.0, 5442.0, 22283.0, 171352.0, 1504604.0, 2192646.0, 253025.0, 29797.0, 7072.0, 2379.0, 1028.0, 465.0, 205.0, 120.0, 81.0, 48.0, 33.0, 16.0, 11.0, 11.0, 10.0, 5.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.0859375, -11.6229248046875, -11.159912109375, -10.6968994140625, -10.23388671875, -9.7708740234375, -9.307861328125, -8.8448486328125, -8.3818359375, -7.9188232421875, -7.455810546875, -6.9927978515625, -6.52978515625, -6.0667724609375, -5.603759765625, -5.1407470703125, -4.677734375, -4.2147216796875, -3.751708984375, -3.2886962890625, -2.82568359375, -2.3626708984375, -1.899658203125, -1.4366455078125, -0.9736328125, -0.5106201171875, -0.047607421875, 0.4154052734375, 0.87841796875, 1.3414306640625, 1.804443359375, 2.2674560546875, 2.73046875, 3.1934814453125, 3.656494140625, 4.1195068359375, 4.58251953125, 5.0455322265625, 5.508544921875, 5.9715576171875, 6.4345703125, 6.8975830078125, 7.360595703125, 7.8236083984375, 8.28662109375, 8.7496337890625, 9.212646484375, 9.6756591796875, 10.138671875, 10.6016845703125, 11.064697265625, 11.5277099609375, 11.99072265625, 12.4537353515625, 12.916748046875, 13.3797607421875, 13.8427734375, 14.3057861328125, 14.768798828125, 15.2318115234375, 15.69482421875, 16.1578369140625, 16.620849609375, 17.0838623046875, 17.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 10.0, 21.0, 21.0, 20.0, 40.0, 32.0, 48.0, 71.0, 53.0, 49.0, 48.0, 67.0, 53.0, 65.0, 49.0, 48.0, 49.0, 58.0, 33.0, 34.0, 24.0, 18.0, 22.0, 9.0, 6.0, 10.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.0548095703125, -8.773681640625, -8.4925537109375, -8.21142578125, -7.9302978515625, -7.649169921875, -7.3680419921875, -7.0869140625, -6.8057861328125, -6.524658203125, -6.2435302734375, -5.96240234375, -5.6812744140625, -5.400146484375, -5.1190185546875, -4.837890625, -4.5567626953125, -4.275634765625, -3.9945068359375, -3.71337890625, -3.4322509765625, -3.151123046875, -2.8699951171875, -2.5888671875, -2.3077392578125, -2.026611328125, -1.7454833984375, -1.46435546875, -1.1832275390625, -0.902099609375, -0.6209716796875, -0.33984375, -0.0587158203125, 0.222412109375, 0.5035400390625, 0.78466796875, 1.0657958984375, 1.346923828125, 1.6280517578125, 1.9091796875, 2.1903076171875, 2.471435546875, 2.7525634765625, 3.03369140625, 3.3148193359375, 3.595947265625, 3.8770751953125, 4.158203125, 4.4393310546875, 4.720458984375, 5.0015869140625, 5.28271484375, 5.5638427734375, 5.844970703125, 6.1260986328125, 6.4072265625, 6.6883544921875, 6.969482421875, 7.2506103515625, 7.53173828125, 7.8128662109375, 8.093994140625, 8.3751220703125, 8.65625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 4.0, 6.0, 7.0, 9.0, 11.0, 11.0, 26.0, 38.0, 59.0, 75.0, 97.0, 151.0, 248.0, 441.0, 805.0, 1603.0, 4211.0, 18885.0, 446685.0, 3650624.0, 57068.0, 7962.0, 2550.0, 1153.0, 565.0, 346.0, 211.0, 131.0, 78.0, 56.0, 48.0, 33.0, 21.0, 15.0, 12.0, 8.0, 2.0, 5.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-31.9375, -30.9462890625, -29.955078125, -28.9638671875, -27.97265625, -26.9814453125, -25.990234375, -24.9990234375, -24.0078125, -23.0166015625, -22.025390625, -21.0341796875, -20.04296875, -19.0517578125, -18.060546875, -17.0693359375, -16.078125, -15.0869140625, -14.095703125, -13.1044921875, -12.11328125, -11.1220703125, -10.130859375, -9.1396484375, -8.1484375, -7.1572265625, -6.166015625, -5.1748046875, -4.18359375, -3.1923828125, -2.201171875, -1.2099609375, -0.21875, 0.7724609375, 1.763671875, 2.7548828125, 3.74609375, 4.7373046875, 5.728515625, 6.7197265625, 7.7109375, 8.7021484375, 9.693359375, 10.6845703125, 11.67578125, 12.6669921875, 13.658203125, 14.6494140625, 15.640625, 16.6318359375, 17.623046875, 18.6142578125, 19.60546875, 20.5966796875, 21.587890625, 22.5791015625, 23.5703125, 24.5615234375, 25.552734375, 26.5439453125, 27.53515625, 28.5263671875, 29.517578125, 30.5087890625, 31.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 2.0, 3.0, 11.0, 8.0, 11.0, 15.0, 16.0, 35.0, 36.0, 86.0, 114.0, 176.0, 324.0, 569.0, 752.0, 627.0, 439.0, 292.0, 174.0, 109.0, 85.0, 54.0, 31.0, 32.0, 16.0, 15.0, 10.0, 8.0, 10.0, 5.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.779052734375, -23.99560546875, -23.212158203125, -22.4287109375, -21.645263671875, -20.86181640625, -20.078369140625, -19.294921875, -18.511474609375, -17.72802734375, -16.944580078125, -16.1611328125, -15.377685546875, -14.59423828125, -13.810791015625, -13.02734375, -12.243896484375, -11.46044921875, -10.677001953125, -9.8935546875, -9.110107421875, -8.32666015625, -7.543212890625, -6.759765625, -5.976318359375, -5.19287109375, -4.409423828125, -3.6259765625, -2.842529296875, -2.05908203125, -1.275634765625, -0.4921875, 0.291259765625, 1.07470703125, 1.858154296875, 2.6416015625, 3.425048828125, 4.20849609375, 4.991943359375, 5.775390625, 6.558837890625, 7.34228515625, 8.125732421875, 8.9091796875, 9.692626953125, 10.47607421875, 11.259521484375, 12.04296875, 12.826416015625, 13.60986328125, 14.393310546875, 15.1767578125, 15.960205078125, 16.74365234375, 17.527099609375, 18.310546875, 19.093994140625, 19.87744140625, 20.660888671875, 21.4443359375, 22.227783203125, 23.01123046875, 23.794677734375, 24.578125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 11.0, 9.0, 13.0, 14.0, 32.0, 56.0, 121.0, 186.0, 197.0, 143.0, 79.0, 52.0, 22.0, 14.0, 9.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-195.37460327148438, -187.87167358398438, -180.3687286376953, -172.8657989501953, -165.36285400390625, -157.85992431640625, -150.35699462890625, -142.8540496826172, -135.3511199951172, -127.84818267822266, -120.34524536132812, -112.84231567382812, -105.3393783569336, -97.83644104003906, -90.33350372314453, -82.83056640625, -75.32762908935547, -67.82469177246094, -60.32175827026367, -52.81882095336914, -45.315887451171875, -37.812950134277344, -30.310012817382812, -22.807079315185547, -15.304141998291016, -7.801206111907959, -0.29827022552490234, 7.2046661376953125, 14.707601547241211, 22.21053695678711, 29.71347427368164, 37.216407775878906, 44.71934509277344, 52.22228240966797, 59.725215911865234, 67.2281494140625, 74.73108673095703, 82.23402404785156, 89.7369613647461, 97.23989868164062, 104.74282836914062, 112.24576568603516, 119.74870300292969, 127.25163269042969, 134.75457763671875, 142.25750732421875, 149.76043701171875, 157.2633819580078, 164.76632690429688, 172.26925659179688, 179.77220153808594, 187.27513122558594, 194.778076171875, 202.281005859375, 209.783935546875, 217.28688049316406, 224.78981018066406, 232.29273986816406, 239.79568481445312, 247.29861450195312, 254.8015594482422, 262.30450439453125, 269.80743408203125, 277.31036376953125, 284.81329345703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 8.0, 6.0, 10.0, 4.0, 13.0, 18.0, 17.0, 18.0, 12.0, 29.0, 35.0, 28.0, 30.0, 41.0, 30.0, 40.0, 56.0, 50.0, 61.0, 85.0, 66.0, 43.0, 46.0, 54.0, 35.0, 28.0, 25.0, 32.0, 17.0, 13.0, 9.0, 17.0, 7.0, 5.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-147.8236846923828, -143.45022583007812, -139.07676696777344, -134.70330810546875, -130.32986450195312, -125.9563980102539, -121.58294677734375, -117.20948791503906, -112.83602905273438, -108.46257019042969, -104.089111328125, -99.71566009521484, -95.34220123291016, -90.96874237060547, -86.59529113769531, -82.22183227539062, -77.84837341308594, -73.47491455078125, -69.10145568847656, -64.7280044555664, -60.35454559326172, -55.98108673095703, -51.60763168334961, -47.23417663574219, -42.8607177734375, -38.48725891113281, -34.11380386352539, -29.740346908569336, -25.36688995361328, -20.993432998657227, -16.619976043701172, -12.246519088745117, -7.8730621337890625, -3.499605178833008, 0.8738517761230469, 5.247308731079102, 9.620765686035156, 13.994222640991211, 18.367679595947266, 22.74113655090332, 27.114593505859375, 31.48805046081543, 35.861507415771484, 40.234962463378906, 44.608421325683594, 48.98188018798828, 53.3553352355957, 57.728790283203125, 62.10224914550781, 66.4757080078125, 70.84916687011719, 75.22261810302734, 79.59607696533203, 83.96953582763672, 88.34298706054688, 92.71644592285156, 97.08990478515625, 101.46336364746094, 105.83682250976562, 110.21027374267578, 114.58373260498047, 118.95719146728516, 123.33064270019531, 127.7041015625, 132.0775604248047]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 3.0, 11.0, 13.0, 20.0, 32.0, 34.0, 56.0, 63.0, 106.0, 163.0, 265.0, 422.0, 683.0, 1280.0, 2309.0, 4740.0, 10502.0, 27111.0, 85213.0, 354054.0, 412137.0, 96642.0, 30291.0, 11477.0, 4994.0, 2593.0, 1397.0, 754.0, 441.0, 269.0, 181.0, 89.0, 71.0, 38.0, 27.0, 17.0, 12.0, 12.0, 8.0, 5.0, 10.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.381103515625, -10.03564453125, -9.690185546875, -9.3447265625, -8.999267578125, -8.65380859375, -8.308349609375, -7.962890625, -7.617431640625, -7.27197265625, -6.926513671875, -6.5810546875, -6.235595703125, -5.89013671875, -5.544677734375, -5.19921875, -4.853759765625, -4.50830078125, -4.162841796875, -3.8173828125, -3.471923828125, -3.12646484375, -2.781005859375, -2.435546875, -2.090087890625, -1.74462890625, -1.399169921875, -1.0537109375, -0.708251953125, -0.36279296875, -0.017333984375, 0.328125, 0.673583984375, 1.01904296875, 1.364501953125, 1.7099609375, 2.055419921875, 2.40087890625, 2.746337890625, 3.091796875, 3.437255859375, 3.78271484375, 4.128173828125, 4.4736328125, 4.819091796875, 5.16455078125, 5.510009765625, 5.85546875, 6.200927734375, 6.54638671875, 6.891845703125, 7.2373046875, 7.582763671875, 7.92822265625, 8.273681640625, 8.619140625, 8.964599609375, 9.31005859375, 9.655517578125, 10.0009765625, 10.346435546875, 10.69189453125, 11.037353515625, 11.3828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 10.0, 8.0, 9.0, 17.0, 25.0, 21.0, 19.0, 38.0, 50.0, 38.0, 58.0, 70.0, 57.0, 55.0, 81.0, 45.0, 49.0, 56.0, 51.0, 41.0, 39.0, 34.0, 21.0, 25.0, 17.0, 17.0, 19.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.5838623046875, -8.269287109375, -7.9547119140625, -7.64013671875, -7.3255615234375, -7.010986328125, -6.6964111328125, -6.3818359375, -6.0672607421875, -5.752685546875, -5.4381103515625, -5.12353515625, -4.8089599609375, -4.494384765625, -4.1798095703125, -3.865234375, -3.5506591796875, -3.236083984375, -2.9215087890625, -2.60693359375, -2.2923583984375, -1.977783203125, -1.6632080078125, -1.3486328125, -1.0340576171875, -0.719482421875, -0.4049072265625, -0.09033203125, 0.2242431640625, 0.538818359375, 0.8533935546875, 1.16796875, 1.4825439453125, 1.797119140625, 2.1116943359375, 2.42626953125, 2.7408447265625, 3.055419921875, 3.3699951171875, 3.6845703125, 3.9991455078125, 4.313720703125, 4.6282958984375, 4.94287109375, 5.2574462890625, 5.572021484375, 5.8865966796875, 6.201171875, 6.5157470703125, 6.830322265625, 7.1448974609375, 7.45947265625, 7.7740478515625, 8.088623046875, 8.4031982421875, 8.7177734375, 9.0323486328125, 9.346923828125, 9.6614990234375, 9.97607421875, 10.2906494140625, 10.605224609375, 10.9197998046875, 11.234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 8.0, 17.0, 17.0, 15.0, 26.0, 45.0, 39.0, 72.0, 109.0, 176.0, 244.0, 447.0, 841.0, 2094.0, 9213.0, 127827.0, 859903.0, 39420.0, 5059.0, 1431.0, 588.0, 338.0, 202.0, 135.0, 88.0, 48.0, 41.0, 28.0, 25.0, 13.0, 15.0, 12.0, 6.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.9140625, -15.3712158203125, -14.828369140625, -14.2855224609375, -13.74267578125, -13.1998291015625, -12.656982421875, -12.1141357421875, -11.5712890625, -11.0284423828125, -10.485595703125, -9.9427490234375, -9.39990234375, -8.8570556640625, -8.314208984375, -7.7713623046875, -7.228515625, -6.6856689453125, -6.142822265625, -5.5999755859375, -5.05712890625, -4.5142822265625, -3.971435546875, -3.4285888671875, -2.8857421875, -2.3428955078125, -1.800048828125, -1.2572021484375, -0.71435546875, -0.1715087890625, 0.371337890625, 0.9141845703125, 1.45703125, 1.9998779296875, 2.542724609375, 3.0855712890625, 3.62841796875, 4.1712646484375, 4.714111328125, 5.2569580078125, 5.7998046875, 6.3426513671875, 6.885498046875, 7.4283447265625, 7.97119140625, 8.5140380859375, 9.056884765625, 9.5997314453125, 10.142578125, 10.6854248046875, 11.228271484375, 11.7711181640625, 12.31396484375, 12.8568115234375, 13.399658203125, 13.9425048828125, 14.4853515625, 15.0281982421875, 15.571044921875, 16.1138916015625, 16.65673828125, 17.1995849609375, 17.742431640625, 18.2852783203125, 18.828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 1.0, 7.0, 6.0, 8.0, 9.0, 15.0, 13.0, 19.0, 11.0, 29.0, 17.0, 27.0, 41.0, 31.0, 31.0, 31.0, 54.0, 60.0, 68.0, 68.0, 55.0, 47.0, 51.0, 42.0, 29.0, 32.0, 32.0, 26.0, 22.0, 22.0, 15.0, 14.0, 11.0, 10.0, 4.0, 3.0, 7.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0, -24.143310546875, -23.28662109375, -22.429931640625, -21.5732421875, -20.716552734375, -19.85986328125, -19.003173828125, -18.146484375, -17.289794921875, -16.43310546875, -15.576416015625, -14.7197265625, -13.863037109375, -13.00634765625, -12.149658203125, -11.29296875, -10.436279296875, -9.57958984375, -8.722900390625, -7.8662109375, -7.009521484375, -6.15283203125, -5.296142578125, -4.439453125, -3.582763671875, -2.72607421875, -1.869384765625, -1.0126953125, -0.156005859375, 0.70068359375, 1.557373046875, 2.4140625, 3.270751953125, 4.12744140625, 4.984130859375, 5.8408203125, 6.697509765625, 7.55419921875, 8.410888671875, 9.267578125, 10.124267578125, 10.98095703125, 11.837646484375, 12.6943359375, 13.551025390625, 14.40771484375, 15.264404296875, 16.12109375, 16.977783203125, 17.83447265625, 18.691162109375, 19.5478515625, 20.404541015625, 21.26123046875, 22.117919921875, 22.974609375, 23.831298828125, 24.68798828125, 25.544677734375, 26.4013671875, 27.258056640625, 28.11474609375, 28.971435546875, 29.828125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 8.0, 11.0, 9.0, 20.0, 17.0, 44.0, 59.0, 82.0, 156.0, 204.0, 377.0, 725.0, 1582.0, 4013.0, 13451.0, 76381.0, 871274.0, 61597.0, 11775.0, 3667.0, 1511.0, 647.0, 313.0, 182.0, 124.0, 90.0, 60.0, 40.0, 26.0, 20.0, 20.0, 14.0, 11.0, 4.0, 3.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.412109375, -2.339996337890625, -2.26788330078125, -2.195770263671875, -2.1236572265625, -2.051544189453125, -1.97943115234375, -1.907318115234375, -1.835205078125, -1.763092041015625, -1.69097900390625, -1.618865966796875, -1.5467529296875, -1.474639892578125, -1.40252685546875, -1.330413818359375, -1.25830078125, -1.186187744140625, -1.11407470703125, -1.041961669921875, -0.9698486328125, -0.897735595703125, -0.82562255859375, -0.753509521484375, -0.681396484375, -0.609283447265625, -0.53717041015625, -0.465057373046875, -0.3929443359375, -0.320831298828125, -0.24871826171875, -0.176605224609375, -0.1044921875, -0.032379150390625, 0.03973388671875, 0.111846923828125, 0.1839599609375, 0.256072998046875, 0.32818603515625, 0.400299072265625, 0.472412109375, 0.544525146484375, 0.61663818359375, 0.688751220703125, 0.7608642578125, 0.832977294921875, 0.90509033203125, 0.977203369140625, 1.04931640625, 1.121429443359375, 1.19354248046875, 1.265655517578125, 1.3377685546875, 1.409881591796875, 1.48199462890625, 1.554107666015625, 1.626220703125, 1.698333740234375, 1.77044677734375, 1.842559814453125, 1.9146728515625, 1.986785888671875, 2.05889892578125, 2.131011962890625, 2.203125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 3.0, 8.0, 10.0, 10.0, 11.0, 16.0, 18.0, 20.0, 18.0, 47.0, 45.0, 93.0, 140.0, 152.0, 129.0, 67.0, 50.0, 31.0, 33.0, 18.0, 22.0, 4.0, 7.0, 4.0, 4.0, 5.0, 2.0, 6.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0009822845458984375, -0.0009566321969032288, -0.00093097984790802, -0.0009053274989128113, -0.0008796751499176025, -0.0008540228009223938, -0.0008283704519271851, -0.0008027181029319763, -0.0007770657539367676, -0.0007514134049415588, -0.0007257610559463501, -0.0007001087069511414, -0.0006744563579559326, -0.0006488040089607239, -0.0006231516599655151, -0.0005974993109703064, -0.0005718469619750977, -0.0005461946129798889, -0.0005205422639846802, -0.0004948899149894714, -0.0004692375659942627, -0.00044358521699905396, -0.0004179328680038452, -0.0003922805190086365, -0.00036662817001342773, -0.000340975821018219, -0.00031532347202301025, -0.0002896711230278015, -0.0002640187740325928, -0.00023836642503738403, -0.0002127140760421753, -0.00018706172704696655, -0.0001614093780517578, -0.00013575702905654907, -0.00011010468006134033, -8.445233106613159e-05, -5.879998207092285e-05, -3.314763307571411e-05, -7.495284080505371e-06, 1.815706491470337e-05, 4.380941390991211e-05, 6.946176290512085e-05, 9.511411190032959e-05, 0.00012076646089553833, 0.00014641880989074707, 0.0001720711588859558, 0.00019772350788116455, 0.0002233758568763733, 0.00024902820587158203, 0.00027468055486679077, 0.0003003329038619995, 0.00032598525285720825, 0.000351637601852417, 0.00037728995084762573, 0.00040294229984283447, 0.0004285946488380432, 0.00045424699783325195, 0.0004798993468284607, 0.0005055516958236694, 0.0005312040448188782, 0.0005568563938140869, 0.0005825087428092957, 0.0006081610918045044, 0.0006338134407997131, 0.0006594657897949219]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 10.0, 9.0, 8.0, 11.0, 16.0, 25.0, 33.0, 55.0, 71.0, 108.0, 152.0, 208.0, 421.0, 614.0, 1116.0, 2070.0, 3917.0, 8362.0, 19488.0, 57229.0, 619179.0, 261171.0, 43552.0, 16031.0, 6973.0, 3205.0, 1813.0, 996.0, 622.0, 366.0, 238.0, 147.0, 95.0, 69.0, 45.0, 28.0, 28.0, 15.0, 11.0, 11.0, 12.0, 10.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.3994140625, -1.3541107177734375, -1.308807373046875, -1.2635040283203125, -1.21820068359375, -1.1728973388671875, -1.127593994140625, -1.0822906494140625, -1.0369873046875, -0.9916839599609375, -0.946380615234375, -0.9010772705078125, -0.85577392578125, -0.8104705810546875, -0.765167236328125, -0.7198638916015625, -0.674560546875, -0.6292572021484375, -0.583953857421875, -0.5386505126953125, -0.49334716796875, -0.4480438232421875, -0.402740478515625, -0.3574371337890625, -0.3121337890625, -0.2668304443359375, -0.221527099609375, -0.1762237548828125, -0.13092041015625, -0.0856170654296875, -0.040313720703125, 0.0049896240234375, 0.05029296875, 0.0955963134765625, 0.140899658203125, 0.1862030029296875, 0.23150634765625, 0.2768096923828125, 0.322113037109375, 0.3674163818359375, 0.4127197265625, 0.4580230712890625, 0.503326416015625, 0.5486297607421875, 0.59393310546875, 0.6392364501953125, 0.684539794921875, 0.7298431396484375, 0.775146484375, 0.8204498291015625, 0.865753173828125, 0.9110565185546875, 0.95635986328125, 1.0016632080078125, 1.046966552734375, 1.0922698974609375, 1.1375732421875, 1.1828765869140625, 1.228179931640625, 1.2734832763671875, 1.31878662109375, 1.3640899658203125, 1.409393310546875, 1.4546966552734375, 1.5]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 23.0, 12.0, 17.0, 32.0, 39.0, 53.0, 70.0, 95.0, 142.0, 121.0, 84.0, 70.0, 41.0, 35.0, 38.0, 16.0, 19.0, 16.0, 8.0, 14.0, 6.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.373046875, -2.296356201171875, -2.21966552734375, -2.142974853515625, -2.0662841796875, -1.989593505859375, -1.91290283203125, -1.836212158203125, -1.759521484375, -1.682830810546875, -1.60614013671875, -1.529449462890625, -1.4527587890625, -1.376068115234375, -1.29937744140625, -1.222686767578125, -1.14599609375, -1.069305419921875, -0.99261474609375, -0.915924072265625, -0.8392333984375, -0.762542724609375, -0.68585205078125, -0.609161376953125, -0.532470703125, -0.455780029296875, -0.37908935546875, -0.302398681640625, -0.2257080078125, -0.149017333984375, -0.07232666015625, 0.004364013671875, 0.0810546875, 0.157745361328125, 0.23443603515625, 0.311126708984375, 0.3878173828125, 0.464508056640625, 0.54119873046875, 0.617889404296875, 0.694580078125, 0.771270751953125, 0.84796142578125, 0.924652099609375, 1.0013427734375, 1.078033447265625, 1.15472412109375, 1.231414794921875, 1.30810546875, 1.384796142578125, 1.46148681640625, 1.538177490234375, 1.6148681640625, 1.691558837890625, 1.76824951171875, 1.844940185546875, 1.921630859375, 1.998321533203125, 2.07501220703125, 2.151702880859375, 2.2283935546875, 2.305084228515625, 2.38177490234375, 2.458465576171875, 2.53515625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 19.0, 31.0, 43.0, 166.0, 410.0, 187.0, 58.0, 37.0, 13.0, 8.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.36531829833984, -103.95246887207031, -99.53961181640625, -95.12676239013672, -90.71391296386719, -86.30105590820312, -81.8882064819336, -77.47535705566406, -73.0625, -68.64965057373047, -64.2367935180664, -59.823944091796875, -55.411094665527344, -50.99824142456055, -46.58538818359375, -42.17253875732422, -37.75968933105469, -33.34683609008789, -28.93398666381836, -24.521133422851562, -20.1082820892334, -15.695430755615234, -11.282577514648438, -6.869726181030273, -2.4568748474121094, 1.955976963043213, 6.368828773498535, 10.781681060791016, 15.19453239440918, 19.607383728027344, 24.02023696899414, 28.433088302612305, 32.845947265625, 37.2588005065918, 41.67164993286133, 46.084503173828125, 50.497352600097656, 54.91020584106445, 59.32305908203125, 63.73590850830078, 68.14875793457031, 72.56160736083984, 76.9744644165039, 81.38731384277344, 85.80016326904297, 90.2130126953125, 94.62586975097656, 99.0387191772461, 103.45157623291016, 107.86442565917969, 112.27728271484375, 116.69013214111328, 121.10298156738281, 125.51583862304688, 129.92868041992188, 134.34153747558594, 138.75439453125, 143.16725158691406, 147.58009338378906, 151.99295043945312, 156.4058074951172, 160.8186492919922, 165.23150634765625, 169.6443634033203, 174.0572052001953]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 5.0, 7.0, 8.0, 10.0, 11.0, 12.0, 10.0, 10.0, 16.0, 15.0, 17.0, 24.0, 21.0, 25.0, 43.0, 112.0, 98.0, 57.0, 111.0, 138.0, 50.0, 23.0, 19.0, 19.0, 22.0, 7.0, 14.0, 11.0, 18.0, 12.0, 12.0, 6.0, 8.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.00067138671875, -90.29997253417969, -87.59927368164062, -84.89857482910156, -82.1978759765625, -79.49717712402344, -76.79647827148438, -74.09577941894531, -71.39508056640625, -68.69438171386719, -65.99368286132812, -63.29298400878906, -60.59228515625, -57.89158630371094, -55.190887451171875, -52.49018859863281, -49.789485931396484, -47.08878707885742, -44.38808822631836, -41.6873893737793, -38.986690521240234, -36.28599166870117, -33.585289001464844, -30.884592056274414, -28.18389320373535, -25.48319435119629, -22.782495498657227, -20.08179473876953, -17.38109588623047, -14.680397987365723, -11.979698181152344, -9.278999328613281, -6.578300476074219, -3.877601385116577, -1.1769022941589355, 1.5237970352172852, 4.224495887756348, 6.92519474029541, 9.625894546508789, 12.326593399047852, 15.027292251586914, 17.727991104125977, 20.42868995666504, 23.129390716552734, 25.830089569091797, 28.53078842163086, 31.231487274169922, 33.932186126708984, 36.63288497924805, 39.33358383178711, 42.03428268432617, 44.734981536865234, 47.4356803894043, 50.13637924194336, 52.83708190917969, 55.53778076171875, 58.23847961425781, 60.939178466796875, 63.63987731933594, 66.340576171875, 69.04127502441406, 71.74197387695312, 74.44267272949219, 77.14337158203125, 79.84407043457031]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 6.0, 3.0, 5.0, 4.0, 7.0, 11.0, 14.0, 12.0, 13.0, 15.0, 21.0, 29.0, 30.0, 27.0, 30.0, 41.0, 87.0, 252.0, 85.0, 34.0, 29.0, 25.0, 19.0, 26.0, 19.0, 28.0, 21.0, 17.0, 14.0, 10.0, 9.0, 5.0, 6.0, 5.0, 8.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.25390625, -7.03167724609375, -6.8094482421875, -6.58721923828125, -6.364990234375, -6.14276123046875, -5.9205322265625, -5.69830322265625, -5.47607421875, -5.25384521484375, -5.0316162109375, -4.80938720703125, -4.587158203125, -4.36492919921875, -4.1427001953125, -3.92047119140625, -3.6982421875, -3.47601318359375, -3.2537841796875, -3.03155517578125, -2.809326171875, -2.58709716796875, -2.3648681640625, -2.14263916015625, -1.92041015625, -1.69818115234375, -1.4759521484375, -1.25372314453125, -1.031494140625, -0.80926513671875, -0.5870361328125, -0.36480712890625, -0.142578125, 0.07965087890625, 0.3018798828125, 0.52410888671875, 0.746337890625, 0.96856689453125, 1.1907958984375, 1.41302490234375, 1.63525390625, 1.85748291015625, 2.0797119140625, 2.30194091796875, 2.524169921875, 2.74639892578125, 2.9686279296875, 3.19085693359375, 3.4130859375, 3.63531494140625, 3.8575439453125, 4.07977294921875, 4.302001953125, 4.52423095703125, 4.7464599609375, 4.96868896484375, 5.19091796875, 5.41314697265625, 5.6353759765625, 5.85760498046875, 6.079833984375, 6.30206298828125, 6.5242919921875, 6.74652099609375, 6.96875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 5.0, 0.0, 3.0, 5.0, 4.0, 2.0, 11.0, 18.0, 21.0, 25.0, 63.0, 89.0, 79.0, 214.0, 595.0, 2002.0, 9564.0, 8338266.0, 32156.0, 3777.0, 938.0, 335.0, 149.0, 78.0, 55.0, 36.0, 25.0, 12.0, 10.0, 13.0, 4.0, 7.0, 5.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-107.97128295898438, -104.94878387451172, -101.92628479003906, -98.9037857055664, -95.88128662109375, -92.8587875366211, -89.83628845214844, -86.81378173828125, -83.79129028320312, -80.76879119873047, -77.74629211425781, -74.72379302978516, -71.7012939453125, -68.67879486083984, -65.65629577636719, -62.633792877197266, -59.611289978027344, -56.58879089355469, -53.56629180908203, -50.543792724609375, -47.52129364013672, -44.49879455566406, -41.47629165649414, -38.453792572021484, -35.43129348754883, -32.40879440307617, -29.386295318603516, -26.363794326782227, -23.34129524230957, -20.318796157836914, -17.296295166015625, -14.273796081542969, -11.251296997070312, -8.228797912597656, -5.206297874450684, -2.183797836303711, 0.8387012481689453, 3.8612003326416016, 6.883701324462891, 9.906200408935547, 12.928699493408203, 15.95119857788086, 18.973697662353516, 21.996198654174805, 25.01869773864746, 28.041196823120117, 31.063697814941406, 34.08619689941406, 37.10869598388672, 40.131195068359375, 43.15369415283203, 46.17619323730469, 49.198692321777344, 52.22119140625, 55.24369430541992, 58.26619338989258, 61.288692474365234, 64.31119537353516, 67.33369445800781, 70.35619354248047, 73.37869262695312, 76.40119171142578, 79.42369079589844, 82.4461898803711, 85.46868896484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 2.0, 5.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-120.77578735351562, -116.64141082763672, -112.50702667236328, -108.37265014648438, -104.23826599121094, -100.10388946533203, -95.96951293945312, -91.83512878417969, -87.70075225830078, -83.56637573242188, -79.43199157714844, -75.29761505126953, -71.16323852539062, -67.02885437011719, -62.89447784423828, -58.76009750366211, -54.62571716308594, -50.491336822509766, -46.356956481933594, -42.22257995605469, -38.088199615478516, -33.953819274902344, -29.819440841674805, -25.685062408447266, -21.550682067871094, -17.416301727294922, -13.281923294067383, -9.147543907165527, -5.013164520263672, -0.8787841796875, 3.255594253540039, 7.389972686767578, 11.52435302734375, 15.658732414245605, 19.79311180114746, 23.927490234375, 28.061870574951172, 32.196250915527344, 36.33062744140625, 40.46500778198242, 44.599388122558594, 48.733768463134766, 52.86814880371094, 57.002525329589844, 61.136905670166016, 65.27128601074219, 69.4056625366211, 73.5400390625, 77.67442321777344, 81.80879974365234, 85.94318389892578, 90.07756042480469, 94.21194458007812, 98.34632110595703, 102.48069763183594, 106.61508178710938, 110.74945831298828, 114.88383483886719, 119.01821899414062, 123.15259552001953, 127.28697204589844, 131.42135620117188, 135.5557403564453, 139.6901092529297, 143.82449340820312]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 3.0, 3.0, 6.0, 12.0, 19.0, 19.0, 37.0, 42.0, 70.0, 110.0, 159.0, 268.0, 454.0, 846.0, 1751.0, 3570.0, 8308.0, 21293.0, 57069.0, 149801.0, 169267.0, 68736.0, 24864.0, 9665.0, 3970.0, 1801.0, 888.0, 465.0, 289.0, 145.0, 106.0, 82.0, 46.0, 31.0, 14.0, 13.0, 12.0, 4.0, 4.0, 5.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-57.0625, -55.166015625, -53.26953125, -51.373046875, -49.4765625, -47.580078125, -45.68359375, -43.787109375, -41.890625, -39.994140625, -38.09765625, -36.201171875, -34.3046875, -32.408203125, -30.51171875, -28.615234375, -26.71875, -24.822265625, -22.92578125, -21.029296875, -19.1328125, -17.236328125, -15.33984375, -13.443359375, -11.546875, -9.650390625, -7.75390625, -5.857421875, -3.9609375, -2.064453125, -0.16796875, 1.728515625, 3.625, 5.521484375, 7.41796875, 9.314453125, 11.2109375, 13.107421875, 15.00390625, 16.900390625, 18.796875, 20.693359375, 22.58984375, 24.486328125, 26.3828125, 28.279296875, 30.17578125, 32.072265625, 33.96875, 35.865234375, 37.76171875, 39.658203125, 41.5546875, 43.451171875, 45.34765625, 47.244140625, 49.140625, 51.037109375, 52.93359375, 54.830078125, 56.7265625, 58.623046875, 60.51953125, 62.416015625, 64.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 3.0, 5.0, 6.0, 8.0, 9.0, 20.0, 19.0, 17.0, 27.0, 30.0, 39.0, 42.0, 60.0, 51.0, 68.0, 63.0, 69.0, 78.0, 76.0, 50.0, 54.0, 44.0, 28.0, 33.0, 13.0, 15.0, 16.0, 14.0, 6.0, 9.0, 6.0, 6.0, 1.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.25048828125, -8.9462890625, -8.64208984375, -8.337890625, -8.03369140625, -7.7294921875, -7.42529296875, -7.12109375, -6.81689453125, -6.5126953125, -6.20849609375, -5.904296875, -5.60009765625, -5.2958984375, -4.99169921875, -4.6875, -4.38330078125, -4.0791015625, -3.77490234375, -3.470703125, -3.16650390625, -2.8623046875, -2.55810546875, -2.25390625, -1.94970703125, -1.6455078125, -1.34130859375, -1.037109375, -0.73291015625, -0.4287109375, -0.12451171875, 0.1796875, 0.48388671875, 0.7880859375, 1.09228515625, 1.396484375, 1.70068359375, 2.0048828125, 2.30908203125, 2.61328125, 2.91748046875, 3.2216796875, 3.52587890625, 3.830078125, 4.13427734375, 4.4384765625, 4.74267578125, 5.046875, 5.35107421875, 5.6552734375, 5.95947265625, 6.263671875, 6.56787109375, 6.8720703125, 7.17626953125, 7.48046875, 7.78466796875, 8.0888671875, 8.39306640625, 8.697265625, 9.00146484375, 9.3056640625, 9.60986328125, 9.9140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 17.0, 45.0, 54.0, 112.0, 86.0, 60.0, 45.0, 19.0, 13.0, 5.0, 4.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.49837875366211, -29.815095901489258, -27.131813049316406, -24.448528289794922, -21.76524543762207, -19.08196258544922, -16.398677825927734, -13.715394973754883, -11.032112121582031, -8.34882926940918, -5.665545463562012, -2.9822616577148438, -0.2989788055419922, 2.3843040466308594, 5.067588806152344, 7.750871658325195, 10.434154510498047, 13.117437362670898, 15.800721168518066, 18.484004974365234, 21.167287826538086, 23.850570678710938, 26.533855438232422, 29.217138290405273, 31.900421142578125, 34.58370590209961, 37.26698684692383, 39.95027160644531, 42.63355255126953, 45.316837310791016, 48.0001220703125, 50.68340301513672, 53.36668395996094, 56.04996871948242, 58.73324966430664, 61.416534423828125, 64.09981536865234, 66.78309631347656, 69.46638488769531, 72.14966583251953, 74.83294677734375, 77.51622772216797, 80.19951629638672, 82.88279724121094, 85.56607818603516, 88.24935913085938, 90.93264770507812, 93.61592864990234, 96.2992172241211, 98.98249816894531, 101.66578674316406, 104.34906768798828, 107.0323486328125, 109.71563720703125, 112.39891815185547, 115.08219909667969, 117.76548767089844, 120.44876861572266, 123.1320571899414, 125.81533813476562, 128.49862670898438, 131.18190002441406, 133.8651885986328, 136.54847717285156, 139.23175048828125]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 7.0, 10.0, 8.0, 15.0, 19.0, 38.0, 67.0, 79.0, 86.0, 55.0, 32.0, 16.0, 8.0, 8.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.633628845214844, -50.882179260253906, -49.130733489990234, -47.3792839050293, -45.62783432006836, -43.87638854980469, -42.12493896484375, -40.37348937988281, -38.622039794921875, -36.87059020996094, -35.119144439697266, -33.36769485473633, -31.61624526977539, -29.864797592163086, -28.11334991455078, -26.361900329589844, -24.610454559326172, -22.859006881713867, -21.10755729675293, -19.356109619140625, -17.604660034179688, -15.853212356567383, -14.101764678955078, -12.350316047668457, -10.598867416381836, -8.847418785095215, -7.095970630645752, -5.344522476196289, -3.593073844909668, -1.8416252136230469, -0.09017753601074219, 1.661271095275879, 3.4127235412597656, 5.164172172546387, 6.91562032699585, 8.667068481445312, 10.418517112731934, 12.169965744018555, 13.92141342163086, 15.67286205291748, 17.4243106842041, 19.175758361816406, 20.927207946777344, 22.67865562438965, 24.430103302001953, 26.18155288696289, 27.933000564575195, 29.6844482421875, 31.435897827148438, 33.187347412109375, 34.93879318237305, 36.690242767333984, 38.44169235229492, 40.193138122558594, 41.94458770751953, 43.69603729248047, 45.447486877441406, 47.198936462402344, 48.950382232666016, 50.70183181762695, 52.45328140258789, 54.20472717285156, 55.9561767578125, 57.70762634277344, 59.45907211303711]}, "eval/loss": 0.8383785486221313, "eval/wer": 0.1366748020715519, "eval/runtime": 1219.9567, "eval/samples_per_second": 2.166, "eval/steps_per_second": 0.271} \ No newline at end of file